feat: amp_O1 -> amp_O1_ultra, amp_O2 -> amp_O2_ultra
parent
18b25e3e86
commit
218da4ddf9
|
@ -10,9 +10,8 @@ Global:
|
||||||
epochs: 120
|
epochs: 120
|
||||||
print_batch_step: 10
|
print_batch_step: 10
|
||||||
use_visualdl: False
|
use_visualdl: False
|
||||||
image_channel: &image_channel 4
|
|
||||||
# used for static mode and model export
|
# used for static mode and model export
|
||||||
image_shape: [*image_channel, 224, 224]
|
image_shape: [3, 224, 224]
|
||||||
save_inference_dir: ./inference
|
save_inference_dir: ./inference
|
||||||
# training model under @to_static
|
# training model under @to_static
|
||||||
to_static: False
|
to_static: False
|
||||||
|
@ -29,8 +28,6 @@ AMP:
|
||||||
Arch:
|
Arch:
|
||||||
name: ResNet50
|
name: ResNet50
|
||||||
class_num: 1000
|
class_num: 1000
|
||||||
input_image_channel: *image_channel
|
|
||||||
data_format: "NHWC"
|
|
||||||
|
|
||||||
# loss function config for training/eval process
|
# loss function config for training/eval process
|
||||||
Loss:
|
Loss:
|
||||||
|
@ -76,7 +73,6 @@ DataLoader:
|
||||||
mean: [0.485, 0.456, 0.406]
|
mean: [0.485, 0.456, 0.406]
|
||||||
std: [0.229, 0.224, 0.225]
|
std: [0.229, 0.224, 0.225]
|
||||||
order: ''
|
order: ''
|
||||||
channel_num: *image_channel
|
|
||||||
|
|
||||||
sampler:
|
sampler:
|
||||||
name: DistributedBatchSampler
|
name: DistributedBatchSampler
|
||||||
|
@ -105,7 +101,6 @@ DataLoader:
|
||||||
mean: [0.485, 0.456, 0.406]
|
mean: [0.485, 0.456, 0.406]
|
||||||
std: [0.229, 0.224, 0.225]
|
std: [0.229, 0.224, 0.225]
|
||||||
order: ''
|
order: ''
|
||||||
channel_num: *image_channel
|
|
||||||
sampler:
|
sampler:
|
||||||
name: DistributedBatchSampler
|
name: DistributedBatchSampler
|
||||||
batch_size: 64
|
batch_size: 64
|
||||||
|
@ -131,7 +126,6 @@ Infer:
|
||||||
mean: [0.485, 0.456, 0.406]
|
mean: [0.485, 0.456, 0.406]
|
||||||
std: [0.229, 0.224, 0.225]
|
std: [0.229, 0.224, 0.225]
|
||||||
order: ''
|
order: ''
|
||||||
channel_num: *image_channel
|
|
||||||
- ToCHWImage:
|
- ToCHWImage:
|
||||||
PostProcess:
|
PostProcess:
|
||||||
name: Topk
|
name: Topk
|
||||||
|
|
|
@ -0,0 +1,147 @@
|
||||||
|
# global configs
|
||||||
|
Global:
|
||||||
|
checkpoints: null
|
||||||
|
pretrained_model: null
|
||||||
|
output_dir: ./output/
|
||||||
|
device: gpu
|
||||||
|
save_interval: 1
|
||||||
|
eval_during_train: True
|
||||||
|
eval_interval: 1
|
||||||
|
epochs: 120
|
||||||
|
print_batch_step: 10
|
||||||
|
use_visualdl: False
|
||||||
|
image_channel: &image_channel 4
|
||||||
|
# used for static mode and model export
|
||||||
|
image_shape: [*image_channel, 224, 224]
|
||||||
|
save_inference_dir: ./inference
|
||||||
|
# training model under @to_static
|
||||||
|
to_static: False
|
||||||
|
use_dali: True
|
||||||
|
|
||||||
|
# mixed precision training
|
||||||
|
AMP:
|
||||||
|
scale_loss: 128.0
|
||||||
|
use_dynamic_loss_scaling: True
|
||||||
|
# O1: mixed fp16
|
||||||
|
level: O1
|
||||||
|
|
||||||
|
# model architecture
|
||||||
|
Arch:
|
||||||
|
name: ResNet50
|
||||||
|
class_num: 1000
|
||||||
|
input_image_channel: *image_channel
|
||||||
|
data_format: "NHWC"
|
||||||
|
|
||||||
|
# loss function config for training/eval process
|
||||||
|
Loss:
|
||||||
|
Train:
|
||||||
|
- CELoss:
|
||||||
|
weight: 1.0
|
||||||
|
Eval:
|
||||||
|
- CELoss:
|
||||||
|
weight: 1.0
|
||||||
|
|
||||||
|
|
||||||
|
Optimizer:
|
||||||
|
name: Momentum
|
||||||
|
momentum: 0.9
|
||||||
|
multi_precision: True
|
||||||
|
lr:
|
||||||
|
name: Piecewise
|
||||||
|
learning_rate: 0.1
|
||||||
|
decay_epochs: [30, 60, 90]
|
||||||
|
values: [0.1, 0.01, 0.001, 0.0001]
|
||||||
|
regularizer:
|
||||||
|
name: 'L2'
|
||||||
|
coeff: 0.0001
|
||||||
|
|
||||||
|
|
||||||
|
# data loader for train and eval
|
||||||
|
DataLoader:
|
||||||
|
Train:
|
||||||
|
dataset:
|
||||||
|
name: ImageNetDataset
|
||||||
|
image_root: ./dataset/ILSVRC2012/
|
||||||
|
cls_label_path: ./dataset/ILSVRC2012/train_list.txt
|
||||||
|
transform_ops:
|
||||||
|
- DecodeImage:
|
||||||
|
to_rgb: True
|
||||||
|
channel_first: False
|
||||||
|
- RandCropImage:
|
||||||
|
size: 224
|
||||||
|
- RandFlipImage:
|
||||||
|
flip_code: 1
|
||||||
|
- NormalizeImage:
|
||||||
|
scale: 1.0/255.0
|
||||||
|
mean: [0.485, 0.456, 0.406]
|
||||||
|
std: [0.229, 0.224, 0.225]
|
||||||
|
order: ''
|
||||||
|
channel_num: *image_channel
|
||||||
|
|
||||||
|
sampler:
|
||||||
|
name: DistributedBatchSampler
|
||||||
|
batch_size: 64
|
||||||
|
drop_last: False
|
||||||
|
shuffle: True
|
||||||
|
loader:
|
||||||
|
num_workers: 4
|
||||||
|
use_shared_memory: True
|
||||||
|
|
||||||
|
Eval:
|
||||||
|
dataset:
|
||||||
|
name: ImageNetDataset
|
||||||
|
image_root: ./dataset/ILSVRC2012/
|
||||||
|
cls_label_path: ./dataset/ILSVRC2012/val_list.txt
|
||||||
|
transform_ops:
|
||||||
|
- DecodeImage:
|
||||||
|
to_rgb: True
|
||||||
|
channel_first: False
|
||||||
|
- ResizeImage:
|
||||||
|
resize_short: 256
|
||||||
|
- CropImage:
|
||||||
|
size: 224
|
||||||
|
- NormalizeImage:
|
||||||
|
scale: 1.0/255.0
|
||||||
|
mean: [0.485, 0.456, 0.406]
|
||||||
|
std: [0.229, 0.224, 0.225]
|
||||||
|
order: ''
|
||||||
|
channel_num: *image_channel
|
||||||
|
sampler:
|
||||||
|
name: DistributedBatchSampler
|
||||||
|
batch_size: 64
|
||||||
|
drop_last: False
|
||||||
|
shuffle: False
|
||||||
|
loader:
|
||||||
|
num_workers: 4
|
||||||
|
use_shared_memory: True
|
||||||
|
|
||||||
|
Infer:
|
||||||
|
infer_imgs: docs/images/inference_deployment/whl_demo.jpg
|
||||||
|
batch_size: 10
|
||||||
|
transforms:
|
||||||
|
- DecodeImage:
|
||||||
|
to_rgb: True
|
||||||
|
channel_first: False
|
||||||
|
- ResizeImage:
|
||||||
|
resize_short: 256
|
||||||
|
- CropImage:
|
||||||
|
size: 224
|
||||||
|
- NormalizeImage:
|
||||||
|
scale: 1.0/255.0
|
||||||
|
mean: [0.485, 0.456, 0.406]
|
||||||
|
std: [0.229, 0.224, 0.225]
|
||||||
|
order: ''
|
||||||
|
channel_num: *image_channel
|
||||||
|
- ToCHWImage:
|
||||||
|
PostProcess:
|
||||||
|
name: Topk
|
||||||
|
topk: 5
|
||||||
|
class_id_map_file: ppcls/utils/imagenet1k_label_list.txt
|
||||||
|
|
||||||
|
Metric:
|
||||||
|
Train:
|
||||||
|
- TopkAcc:
|
||||||
|
topk: [1, 5]
|
||||||
|
Eval:
|
||||||
|
- TopkAcc:
|
||||||
|
topk: [1, 5]
|
Loading…
Reference in New Issue