mirror of
https://github.com/PaddlePaddle/PaddleClas.git
synced 2025-06-03 21:55:06 +08:00
Support specifying model_type in config,
such as norm_train and to_static_train
This commit is contained in:
parent
811b483e30
commit
2d66aeeb77
@ -90,6 +90,8 @@ line_num=`expr $line_num + 1`
|
|||||||
fp_items=$(func_parser_value "${lines[line_num]}")
|
fp_items=$(func_parser_value "${lines[line_num]}")
|
||||||
line_num=`expr $line_num + 1`
|
line_num=`expr $line_num + 1`
|
||||||
epoch=$(func_parser_value "${lines[line_num]}")
|
epoch=$(func_parser_value "${lines[line_num]}")
|
||||||
|
line_num=`expr $line_num + 1`
|
||||||
|
model_type=$(func_parser_value "${lines[line_num]}")
|
||||||
|
|
||||||
line_num=`expr $line_num + 1`
|
line_num=`expr $line_num + 1`
|
||||||
profile_option_key=$(func_parser_key "${lines[line_num]}")
|
profile_option_key=$(func_parser_key "${lines[line_num]}")
|
||||||
@ -118,6 +120,7 @@ line_gpuid=4
|
|||||||
line_precision=6
|
line_precision=6
|
||||||
line_epoch=7
|
line_epoch=7
|
||||||
line_batchsize=9
|
line_batchsize=9
|
||||||
|
line_model_type=15
|
||||||
line_profile=13
|
line_profile=13
|
||||||
line_eval_py=24
|
line_eval_py=24
|
||||||
line_export_py=30
|
line_export_py=30
|
||||||
@ -138,6 +141,7 @@ if [[ ! -n "$PARAMS" ]];then
|
|||||||
batch_size_list=(${batch_size})
|
batch_size_list=(${batch_size})
|
||||||
fp_items_list=(${fp_items})
|
fp_items_list=(${fp_items})
|
||||||
device_num_list=(N1C4)
|
device_num_list=(N1C4)
|
||||||
|
model_type_list=(${model_type})
|
||||||
run_mode="DP"
|
run_mode="DP"
|
||||||
elif [[ ${PARAMS} = "dynamicTostatic" ]];then
|
elif [[ ${PARAMS} = "dynamicTostatic" ]];then
|
||||||
IFS="|"
|
IFS="|"
|
||||||
@ -165,14 +169,13 @@ else
|
|||||||
fp_items_list=($precision)
|
fp_items_list=($precision)
|
||||||
batch_size_list=($batch_size)
|
batch_size_list=($batch_size)
|
||||||
device_num_list=($device_num)
|
device_num_list=($device_num)
|
||||||
fi
|
|
||||||
|
|
||||||
# for log name
|
# parse "to_static" options and modify trainer into "to_static_trainer"
|
||||||
to_static=""
|
if [[ ${model_type} = "dynamicTostatic" ]];then
|
||||||
# parse "to_static" options and modify trainer into "to_static_trainer"
|
model_type_list="to_static_train"
|
||||||
if [[ ${model_type} = "dynamicTostatic" ]];then
|
else
|
||||||
to_static="d2sT_"
|
model_type_list="norm_train"
|
||||||
sed -i 's/trainer:norm_train/trainer:to_static_train/g' $FILENAME
|
fi
|
||||||
fi
|
fi
|
||||||
|
|
||||||
|
|
||||||
@ -180,10 +183,20 @@ IFS="|"
|
|||||||
for batch_size in ${batch_size_list[*]}; do
|
for batch_size in ${batch_size_list[*]}; do
|
||||||
for precision in ${fp_items_list[*]}; do
|
for precision in ${fp_items_list[*]}; do
|
||||||
for device_num in ${device_num_list[*]}; do
|
for device_num in ${device_num_list[*]}; do
|
||||||
|
for model_type in ${model_type_list[*]}; do
|
||||||
# sed batchsize and precision
|
# sed batchsize and precision
|
||||||
func_sed_params "$FILENAME" "${line_precision}" "$precision"
|
func_sed_params "$FILENAME" "${line_precision}" "$precision"
|
||||||
func_sed_params "$FILENAME" "${line_batchsize}" "$batch_size"
|
func_sed_params "$FILENAME" "${line_batchsize}" "$batch_size"
|
||||||
func_sed_params "$FILENAME" "${line_epoch}" "$epoch"
|
func_sed_params "$FILENAME" "${line_epoch}" "$epoch"
|
||||||
|
func_sed_params "$FILENAME" "${line_model_type}" "$model_type"
|
||||||
|
|
||||||
|
# for log name
|
||||||
|
if [[ ${model_type} = "to_static_train" ]];then
|
||||||
|
to_static="d2sT_"
|
||||||
|
else
|
||||||
|
to_static=""
|
||||||
|
fi
|
||||||
|
|
||||||
gpu_id=$(set_gpu_id $device_num)
|
gpu_id=$(set_gpu_id $device_num)
|
||||||
|
|
||||||
# Using DALI, NHWC and 4 channels is required when training ResNet50 with AMP O2
|
# Using DALI, NHWC and 4 channels is required when training ResNet50 with AMP O2
|
||||||
@ -307,4 +320,5 @@ for batch_size in ${batch_size_list[*]}; do
|
|||||||
fi
|
fi
|
||||||
done
|
done
|
||||||
done
|
done
|
||||||
|
done
|
||||||
done
|
done
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -50,5 +50,12 @@ inference:python/predict_cls.py -c configs/inference_cls.yaml
|
|||||||
-o Global.benchmark:False
|
-o Global.benchmark:False
|
||||||
null:null
|
null:null
|
||||||
null:null
|
null:null
|
||||||
|
===========================train_benchmark_params==========================
|
||||||
|
batch_size:64
|
||||||
|
fp_items:fp32|fp16
|
||||||
|
epoch:1
|
||||||
|
model_type:norm_train|to_static_train
|
||||||
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
random_infer_input:[{float32,[3,224,224]}]
|
random_infer_input:[{float32,[3,224,224]}]
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:256
|
batch_size:256
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64
|
batch_size:64
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|128
|
batch_size:64|128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|128
|
batch_size:64|128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|128
|
batch_size:64|128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:256|640
|
batch_size:256|640
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train|to_static_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:256|640
|
batch_size:256|640
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:256|640
|
batch_size:256|640
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:256|640
|
batch_size:256|640
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:512
|
batch_size:512
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:256
|
batch_size:256
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -53,6 +53,7 @@ null:null
|
|||||||
batch_size:500
|
batch_size:500
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -50,5 +50,12 @@ inference:python/predict_cls.py -c configs/inference_cls.yaml
|
|||||||
-o Global.benchmark:False
|
-o Global.benchmark:False
|
||||||
null:null
|
null:null
|
||||||
null:null
|
null:null
|
||||||
|
===========================train_benchmark_params==========================
|
||||||
|
batch_size:64
|
||||||
|
fp_items:fp32|fp16
|
||||||
|
epoch:1
|
||||||
|
model_type:norm_train|to_static_train
|
||||||
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
random_infer_input:[{float32,[3,224,224]}]
|
random_infer_input:[{float32,[3,224,224]}]
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:32|64
|
batch_size:32|64
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,3 +54,4 @@ null:null
|
|||||||
batch_size:128|256
|
batch_size:128|256
|
||||||
fp_items:ampfp16
|
fp_items:ampfp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128|64
|
batch_size:128|64
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train|to_static_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,3 +54,4 @@ null:null
|
|||||||
batch_size:128|256
|
batch_size:128|256
|
||||||
fp_items:purefp16
|
fp_items:purefp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64
|
batch_size:64
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:256|1536
|
batch_size:256|1536
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:2
|
epoch:2
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:104|128
|
batch_size:104|128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train|to_static_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|104
|
batch_size:64|104
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|104
|
batch_size:64|104
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|104
|
batch_size:64|104
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:64|144
|
batch_size:64|144
|
||||||
fp_items:fp32
|
fp_items:fp32
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
@ -54,6 +54,7 @@ null:null
|
|||||||
batch_size:128
|
batch_size:128
|
||||||
fp_items:fp32|fp16
|
fp_items:fp32|fp16
|
||||||
epoch:1
|
epoch:1
|
||||||
|
model_type:norm_train
|
||||||
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
--profiler_options:batch_range=[10,20];state=GPU;tracer_option=Default;profile_path=model.profile
|
||||||
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
flags:FLAGS_eager_delete_tensor_gb=0.0;FLAGS_fraction_of_gpu_memory_to_use=0.98;FLAGS_conv_workspace_size_limit=4096
|
||||||
===========================infer_benchmark_params==========================
|
===========================infer_benchmark_params==========================
|
||||||
|
Loading…
x
Reference in New Issue
Block a user