Merge pull request #774 from cuicheng01/develop_reg

Update MobileNetV3_large_x1_0_CIFAR100_finetune.yaml
This commit is contained in:
Walter 2021-06-03 10:33:33 +08:00 committed by GitHub
commit 0116b51f1f
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23

View File

@ -1,65 +1,103 @@
mode: 'train' # global configs
ARCHITECTURE: Global:
name: 'MobileNetV3_large_x1_0' checkpoints: null
pretrained_model: null
checkpoints: "" output_dir: "./output/"
pretrained_model: "./pretrained/MobileNetV3_large_x1_0_pretrained" device: "gpu"
model_save_dir: "./output/" class_num: 100
classes_num: 100
total_images: 50000
save_interval: 1 save_interval: 1
validate: True eval_during_train: True
valid_interval: 1 eval_interval: 1
epochs: 100 epochs: 50
topk: 5 print_batch_step: 10
use_visualdl: False
# used for static mode and model export
image_shape: [3, 32, 32] image_shape: [3, 32, 32]
use_mix: False save_inference_dir: "./inference"
LEARNING_RATE: # model architecture
function: 'Cosine' Arch:
params: name: "MobileNetV3_large_x1_0"
lr: 0.04
OPTIMIZER: # loss function config for training/eval process
function: 'Momentum' Loss:
params: Train:
- CELoss:
weight: 1.0
epsilon: 0.1
Eval:
- CELoss:
weight: 1.0
Optimizer:
name: Momentum
momentum: 0.9 momentum: 0.9
lr:
name: Cosine
learning_rate: 0.04
regularizer: regularizer:
function: 'L2' name: 'L2'
factor: 0.0001 coeff: 0.0001
TRAIN:
batch_size: 1024 # data loader for train and eval
num_workers: 4 DataLoader:
file_list: "./dataset/CIFAR100/train_list.txt" Train:
data_dir: "./dataset/CIFAR100/" dataset:
shuffle_seed: 0 name: ImageNetDataset
transforms: image_root: "./dataset/CIFAR100/"
- DecodeImage: cls_label_path: "./dataset/CIFAR100/train_list.txt"
to_rgb: True transform_ops:
channel_first: False
- RandCropImage: - RandCropImage:
size: 32 size: 32
scale: [0.5, 1]
ratio: [1, 1]
- RandFlipImage: - RandFlipImage:
flip_code: 1 flip_code: 1
- NormalizeImage: - NormalizeImage:
scale: 1./255. scale: 0.00392157
mean: [0.485, 0.456, 0.406] mean: [0.485, 0.456, 0.406]
std: [0.229, 0.224, 0.225] std: [0.229, 0.224, 0.225]
order: '' order: ''
- ToCHWImage:
mix: sampler:
- MixupOperator: name: DistributedBatchSampler
alpha: 0.2 batch_size: 1000
drop_last: False
shuffle: True
loader:
num_workers: 6
use_shared_memory: False
Eval:
# TODO: modify to the latest trainer
dataset:
name: ImageNetDataset
image_root: "./dataset/CIFAR100/"
cls_label_path: "./dataset/CIFAR100/test_list.txt"
transform_ops:
- ResizeImage:
resize_short: 36
- CropImage:
size: 32
- NormalizeImage:
scale: 0.00392157
mean: [0.485, 0.456, 0.406]
std: [0.229, 0.224, 0.225]
order: ''
sampler:
name: DistributedBatchSampler
batch_size: 1000
drop_last: False
shuffle: False
loader:
num_workers: 6
use_shared_memory: False
VALID: Infer:
batch_size: 256 infer_imgs: "docs/images/whl/demo.jpg"
num_workers: 0 batch_size: 10
file_list: "./dataset/CIFAR100/test_list.txt"
data_dir: "./dataset/CIFAR100/"
shuffle_seed: 0
transforms: transforms:
- DecodeImage: - DecodeImage:
to_rgb: True to_rgb: True
@ -74,3 +112,16 @@ VALID:
std: [0.229, 0.224, 0.225] std: [0.229, 0.224, 0.225]
order: '' order: ''
- ToCHWImage: - ToCHWImage:
PostProcess:
name: Topk
topk: 5
class_id_map_file: "ppcls/utils/imagenet1k_label_list.txt"
Metric:
Train:
- Topk:
k: [1, 5]
Eval:
- Topk:
k: [1, 5]