|
|
|
@ -8,13 +8,13 @@ function train() {
|
|
|
|
|
use_mkldnn=$4
|
|
|
|
|
if [ $4 == "True" ]; then
|
|
|
|
|
thread=1
|
|
|
|
|
log="logs/${topology}-${layer_num}-mkldnn-${bs}.log"
|
|
|
|
|
log="logs/train-${topology}-${layer_num}-mkldnn-${bs}.log"
|
|
|
|
|
elif [ $4 == "False" ]; then
|
|
|
|
|
thread=`nproc`
|
|
|
|
|
# each trainer_count use only 1 core to avoid conflict
|
|
|
|
|
log="logs/${topology}-${layer_num}-${thread}mklml-${bs}.log"
|
|
|
|
|
log="logs/train-${topology}-${layer_num}-${thread}mklml-${bs}.log"
|
|
|
|
|
else
|
|
|
|
|
echo "Wrong input $3, use True or False."
|
|
|
|
|
echo "Wrong input $4, use True or False."
|
|
|
|
|
exit 0
|
|
|
|
|
fi
|
|
|
|
|
args="batch_size=${bs},layer_num=${layer_num}"
|
|
|
|
@ -30,13 +30,74 @@ function train() {
|
|
|
|
|
2>&1 | tee ${log}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if [ ! -d "train.list" ]; then
|
|
|
|
|
function test() {
|
|
|
|
|
unset OMP_NUM_THREADS MKL_NUM_THREADS OMP_DYNAMIC KMP_AFFINITY
|
|
|
|
|
topology=$1
|
|
|
|
|
layer_num=$2
|
|
|
|
|
bs=$3
|
|
|
|
|
use_mkldnn=$4
|
|
|
|
|
if [ $4 == "True" ]; then
|
|
|
|
|
thread=1
|
|
|
|
|
log="logs/test-${topology}-${layer_num}-mkldnn-${bs}.log"
|
|
|
|
|
elif [ $4 == "False" ]; then
|
|
|
|
|
thread=`nproc`
|
|
|
|
|
if [ $thread -gt $bs ]; then
|
|
|
|
|
thread=$bs
|
|
|
|
|
fi
|
|
|
|
|
log="logs/test-${topology}-${layer_num}-${thread}mklml-${bs}.log"
|
|
|
|
|
else
|
|
|
|
|
echo "Wrong input $4, use True or False."
|
|
|
|
|
exit 0
|
|
|
|
|
fi
|
|
|
|
|
|
|
|
|
|
models_in="models/${topology}-${layer_num}/pass-00000/"
|
|
|
|
|
if [ ! -d $models_in ]; then
|
|
|
|
|
echo "Training model ${topology}_${layer_num}"
|
|
|
|
|
paddle train --job=train \
|
|
|
|
|
--config="${topology}.py" \
|
|
|
|
|
--use_mkldnn=True \
|
|
|
|
|
--use_gpu=False \
|
|
|
|
|
--trainer_count=1 \
|
|
|
|
|
--num_passes=1 \
|
|
|
|
|
--save_dir="models/${topology}-${layer_num}" \
|
|
|
|
|
--config_args="batch_size=128,layer_num=${layer_num}" \
|
|
|
|
|
> /dev/null 2>&1
|
|
|
|
|
echo "Done"
|
|
|
|
|
fi
|
|
|
|
|
paddle train --job=test \
|
|
|
|
|
--config="${topology}.py" \
|
|
|
|
|
--use_mkldnn=$use_mkldnn \
|
|
|
|
|
--use_gpu=False \
|
|
|
|
|
--trainer_count=$thread \
|
|
|
|
|
--log_period=10 \
|
|
|
|
|
--config_args="batch_size=${bs},layer_num=${layer_num},is_test=True" \
|
|
|
|
|
--init_model_path=$models_in \
|
|
|
|
|
2>&1 | tee ${log}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if [ ! -f "train.list" ]; then
|
|
|
|
|
echo " " > train.list
|
|
|
|
|
fi
|
|
|
|
|
if [ ! -f "test.list" ]; then
|
|
|
|
|
echo " " > test.list
|
|
|
|
|
fi
|
|
|
|
|
if [ ! -d "logs" ]; then
|
|
|
|
|
mkdir logs
|
|
|
|
|
fi
|
|
|
|
|
if [ ! -d "models" ]; then
|
|
|
|
|
mkdir -p models
|
|
|
|
|
fi
|
|
|
|
|
|
|
|
|
|
# inference benchmark
|
|
|
|
|
for use_mkldnn in True False; do
|
|
|
|
|
for batchsize in 1 2 4 8 16; do
|
|
|
|
|
test googlenet v1 $batchsize $use_mkldnn
|
|
|
|
|
test resnet 50 $batchsize $use_mkldnn
|
|
|
|
|
test vgg 19 $batchsize $use_mkldnn
|
|
|
|
|
done
|
|
|
|
|
done
|
|
|
|
|
|
|
|
|
|
# training benchmark
|
|
|
|
|
for use_mkldnn in True False; do
|
|
|
|
|
for batchsize in 64 128 256; do
|
|
|
|
|
train vgg 19 $batchsize $use_mkldnn
|
|
|
|
|