From 2f2aa3037c60db7255e7c378bae523e3124a7487 Mon Sep 17 00:00:00 2001 From: Ezra-Yu <1105212286@qq.com> Date: Mon, 23 May 2022 08:43:23 +0000 Subject: [PATCH] Refactor default hooks configs --- configs/_base_/default_runtime.py | 47 ++++++++++++++----- configs/_base_/schedules/cifar10_bs128.py | 1 - configs/_base_/schedules/cub_bs64.py | 2 +- .../imagenet_bs1024_adamw_conformer.py | 1 - .../schedules/imagenet_bs1024_adamw_swin.py | 1 - .../_base_/schedules/imagenet_bs1024_coslr.py | 1 - .../imagenet_bs1024_linearlr_bn_nowd.py | 1 - configs/_base_/schedules/imagenet_bs2048.py | 2 +- .../_base_/schedules/imagenet_bs2048_AdamW.py | 1 - .../_base_/schedules/imagenet_bs2048_coslr.py | 1 - .../_base_/schedules/imagenet_bs2048_rsb.py | 2 +- configs/_base_/schedules/imagenet_bs256.py | 1 - .../_base_/schedules/imagenet_bs256_140e.py | 2 +- .../imagenet_bs256_200e_coslr_warmup.py | 1 - .../_base_/schedules/imagenet_bs256_coslr.py | 2 +- .../schedules/imagenet_bs256_epochstep.py | 1 - .../_base_/schedules/imagenet_bs4096_AdamW.py | 1 - .../convmixer-1024-20_10xb64_in1k.py | 2 + .../convmixer-1536-20_10xb64_in1k.py | 2 + .../convmixer/convmixer-768-32_10xb64_in1k.py | 2 + .../convnext/convnext-base_32xb128_in1k.py | 2 + .../convnext/convnext-large_64xb64_in1k.py | 2 + .../convnext/convnext-small_32xb128_in1k.py | 2 + .../convnext/convnext-tiny_32xb128_in1k.py | 2 + .../convnext/convnext-xlarge_64xb64_in1k.py | 2 + .../deit/deit-base_ft-16xb32_in1k-384px.py | 2 + configs/deit/deit-small_pt-4xb256_in1k.py | 2 + .../resnet50_b32x8_fp16_dynamic_imagenet.py | 6 --- .../mlp-mixer-base-p16_64xb64_in1k.py | 2 + .../mlp-mixer-large-p16_64xb64_in1k.py | 2 + .../mobilenet_v2_b32x8_imagenet.py | 6 --- .../mobilenet_v3_large_imagenet.py | 6 --- .../mobilenet_v3/mobilenet_v3_small_cifar.py | 6 --- .../mobilenet_v3_small_imagenet.py | 6 --- .../poolformer/poolformer-m36_32xb128_in1k.py | 2 + .../poolformer/poolformer-m48_32xb128_in1k.py | 2 + .../poolformer/poolformer-s12_32xb128_in1k.py | 2 + .../poolformer/poolformer-s24_32xb128_in1k.py | 2 + .../poolformer/poolformer-s36_32xb128_in1k.py | 2 + .../repmlp/repmlp-base_8xb64_in1k-256px.py | 2 + configs/repmlp/repmlp-base_8xb64_in1k.py | 2 + configs/resnest/resnest101_b64x32_imagenet.py | 6 --- configs/resnest/resnest200_b32x64_imagenet.py | 6 --- configs/resnest/resnest269_b32x64_imagenet.py | 6 --- configs/resnest/resnest50_b64x32_imagenet.py | 6 --- configs/resnet/resnet101_b16x8_cifar10.py | 6 --- configs/resnet/resnet101_b32x8_imagenet.py | 6 --- configs/resnet/resnet152_b16x8_cifar10.py | 6 --- configs/resnet/resnet152_b32x8_imagenet.py | 6 --- configs/resnet/resnet18_b16x8_cifar10.py | 6 --- configs/resnet/resnet18_b32x8_imagenet.py | 6 --- configs/resnet/resnet34_b32x8_imagenet.py | 6 --- configs/resnet/resnet50_b16x8_cifar100.py | 6 --- .../resnet/resnet50_b16x8_cifar10_mixup.py | 6 --- .../resnet/resnet50_b32x8_coslr_imagenet.py | 6 --- .../resnet/resnet50_b32x8_cutmix_imagenet.py | 6 --- configs/resnet/resnet50_b32x8_imagenet.py | 6 --- .../resnet50_b32x8_label_smooth_imagenet.py | 6 --- .../resnet/resnet50_b32x8_mixup_imagenet.py | 6 --- .../resnet50_b64x32_warmup_coslr_imagenet.py | 6 --- .../resnet/resnet50_b64x32_warmup_imagenet.py | 6 --- ...t50_b64x32_warmup_label_smooth_imagenet.py | 6 --- configs/resnet/resnetv1d101_b32x8_imagenet.py | 6 --- configs/resnet/resnetv1d152_b32x8_imagenet.py | 6 --- configs/resnet/resnetv1d50_b32x8_imagenet.py | 6 --- .../resnext101_32x4d_b32x8_imagenet.py | 6 --- .../resnext101_32x8d_b32x8_imagenet.py | 6 --- .../resnext152_32x4d_b32x8_imagenet.py | 6 --- .../resnext/resnext50_32x4d_b32x8_imagenet.py | 6 --- .../seresnet/seresnet101_b32x8_imagenet.py | 6 --- configs/seresnet/seresnet50_b32x8_imagenet.py | 6 --- .../seresnext101_32x4d_b32x8_imagenet.py | 6 --- .../seresnext50_32x4d_b32x8_imagenet.py | 6 --- ..._v1_1x_b64x16_linearlr_bn_nowd_imagenet.py | 6 --- .../swin-base_16xb64_in1k-384px.py | 2 + .../swin_transformer/swin-base_16xb64_in1k.py | 2 + .../swin-large_16xb64_in1k-384px.py | 2 + .../swin-large_16xb64_in1k.py | 2 + .../swin-small_16xb64_in1k.py | 2 + .../swin_transformer/swin-tiny_16xb64_in1k.py | 2 + .../swin_base_224_b16x64_300e_imagenet.py | 6 --- .../swin_base_384_evalonly_imagenet.py | 6 --- .../swin_large_224_evalonly_imagenet.py | 6 --- .../swin_large_384_evalonly_imagenet.py | 6 --- .../swin_small_224_b16x64_300e_imagenet.py | 6 --- .../swin_tiny_224_b16x64_300e_imagenet.py | 6 --- .../tnt_s_patch16_224_evalonly_imagenet.py | 6 --- configs/twins/twins-pcpvt-base_8xb128_in1k.py | 4 +- configs/twins/twins-svt-base_8xb128_in1k.py | 5 +- configs/van/van-base_8xb128_in1k.py | 2 + configs/van/van-large_8xb128_in1k.py | 2 + configs/van/van-small_8xb128_in1k.py | 2 + configs/van/van-tiny_8xb128_in1k.py | 2 + configs/vgg/vgg11_b32x8_imagenet.py | 6 --- configs/vgg/vgg11bn_b32x8_imagenet.py | 6 --- configs/vgg/vgg13_b32x8_imagenet.py | 6 --- configs/vgg/vgg13bn_b32x8_imagenet.py | 6 --- configs/vgg/vgg16_8xb16_voc.py | 1 + configs/vgg/vgg16_b32x8_imagenet.py | 6 --- configs/vgg/vgg16bn_b32x8_imagenet.py | 6 --- configs/vgg/vgg19_b32x8_imagenet.py | 6 --- configs/vgg/vgg19bn_b32x8_imagenet.py | 6 --- .../vit-base-p16_ft-64xb64_in1k-384.py | 2 + .../vit-base-p16_pt-64xb64_in1k-224.py | 2 + .../vit-base-p32_ft-64xb64_in1k-384.py | 2 + .../vit-base-p32_pt-64xb64_in1k-224.py | 2 + .../vit-large-p16_ft-64xb64_in1k-384.py | 2 + .../vit-large-p16_pt-64xb64_in1k-224.py | 2 + .../vit-large-p32_ft-64xb64_in1k-384.py | 2 + .../vit-large-p32_pt-64xb64_in1k-224.py | 2 + 110 files changed, 120 insertions(+), 350 deletions(-) delete mode 100644 configs/fp16/resnet50_b32x8_fp16_dynamic_imagenet.py delete mode 100644 configs/mobilenet_v2/mobilenet_v2_b32x8_imagenet.py delete mode 100644 configs/mobilenet_v3/mobilenet_v3_large_imagenet.py delete mode 100644 configs/mobilenet_v3/mobilenet_v3_small_cifar.py delete mode 100644 configs/mobilenet_v3/mobilenet_v3_small_imagenet.py delete mode 100644 configs/resnest/resnest101_b64x32_imagenet.py delete mode 100644 configs/resnest/resnest200_b32x64_imagenet.py delete mode 100644 configs/resnest/resnest269_b32x64_imagenet.py delete mode 100644 configs/resnest/resnest50_b64x32_imagenet.py delete mode 100644 configs/resnet/resnet101_b16x8_cifar10.py delete mode 100644 configs/resnet/resnet101_b32x8_imagenet.py delete mode 100644 configs/resnet/resnet152_b16x8_cifar10.py delete mode 100644 configs/resnet/resnet152_b32x8_imagenet.py delete mode 100644 configs/resnet/resnet18_b16x8_cifar10.py delete mode 100644 configs/resnet/resnet18_b32x8_imagenet.py delete mode 100644 configs/resnet/resnet34_b32x8_imagenet.py delete mode 100644 configs/resnet/resnet50_b16x8_cifar100.py delete mode 100644 configs/resnet/resnet50_b16x8_cifar10_mixup.py delete mode 100644 configs/resnet/resnet50_b32x8_coslr_imagenet.py delete mode 100644 configs/resnet/resnet50_b32x8_cutmix_imagenet.py delete mode 100644 configs/resnet/resnet50_b32x8_imagenet.py delete mode 100644 configs/resnet/resnet50_b32x8_label_smooth_imagenet.py delete mode 100644 configs/resnet/resnet50_b32x8_mixup_imagenet.py delete mode 100644 configs/resnet/resnet50_b64x32_warmup_coslr_imagenet.py delete mode 100644 configs/resnet/resnet50_b64x32_warmup_imagenet.py delete mode 100644 configs/resnet/resnet50_b64x32_warmup_label_smooth_imagenet.py delete mode 100644 configs/resnet/resnetv1d101_b32x8_imagenet.py delete mode 100644 configs/resnet/resnetv1d152_b32x8_imagenet.py delete mode 100644 configs/resnet/resnetv1d50_b32x8_imagenet.py delete mode 100644 configs/resnext/resnext101_32x4d_b32x8_imagenet.py delete mode 100644 configs/resnext/resnext101_32x8d_b32x8_imagenet.py delete mode 100644 configs/resnext/resnext152_32x4d_b32x8_imagenet.py delete mode 100644 configs/resnext/resnext50_32x4d_b32x8_imagenet.py delete mode 100644 configs/seresnet/seresnet101_b32x8_imagenet.py delete mode 100644 configs/seresnet/seresnet50_b32x8_imagenet.py delete mode 100644 configs/seresnet/seresnext101_32x4d_b32x8_imagenet.py delete mode 100644 configs/seresnet/seresnext50_32x4d_b32x8_imagenet.py delete mode 100644 configs/shufflenet_v1/shufflenet_v1_1x_b64x16_linearlr_bn_nowd_imagenet.py delete mode 100644 configs/swin_transformer/swin_base_224_b16x64_300e_imagenet.py delete mode 100644 configs/swin_transformer/swin_base_384_evalonly_imagenet.py delete mode 100644 configs/swin_transformer/swin_large_224_evalonly_imagenet.py delete mode 100644 configs/swin_transformer/swin_large_384_evalonly_imagenet.py delete mode 100644 configs/swin_transformer/swin_small_224_b16x64_300e_imagenet.py delete mode 100644 configs/swin_transformer/swin_tiny_224_b16x64_300e_imagenet.py delete mode 100644 configs/tnt/tnt_s_patch16_224_evalonly_imagenet.py delete mode 100644 configs/vgg/vgg11_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg11bn_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg13_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg13bn_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg16_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg16bn_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg19_b32x8_imagenet.py delete mode 100644 configs/vgg/vgg19bn_b32x8_imagenet.py diff --git a/configs/_base_/default_runtime.py b/configs/_base_/default_runtime.py index ba965a45..f63f8797 100644 --- a/configs/_base_/default_runtime.py +++ b/configs/_base_/default_runtime.py @@ -1,16 +1,37 @@ -# checkpoint saving -checkpoint_config = dict(interval=1) -# yapf:disable -log_config = dict( - interval=100, - hooks=[ - dict(type='TextLoggerHook'), - # dict(type='TensorboardLoggerHook') - ]) -# yapf:enable +default_scope = 'mmcls' -dist_params = dict(backend='nccl') +default_hooks = dict( + # optimizer configure + optimizer=dict(type='OptimizerHook', grad_clip=None), + + # record the time to load data and the time it takes to iterate once + timer=dict(type='IterTimerHook'), + + # logger configure + logger=dict(type='LoggerHook', interval=50), + + # Parameter Scheduler + param_scheduler=dict(type='ParamSchedulerHook'), + + # checkpoint saving + checkpoint=dict(type='CheckpointHook', interval=1), + + # Sampler for distributed training + sampler_seed=dict(type='DistSamplerSeedHook'), +) + +# Environment configure +env_cfg = dict( + cudnn_benchmark=False, + mp_cfg=dict(mp_start_method='fork', opencv_num_threads=0), + dist_cfg=dict(backend='nccl'), +) + +# Log level configuration log_level = 'INFO' + +# Load from weight load_from = None -resume_from = None -workflow = [('train', 1)] + +# resume training +resume = False diff --git a/configs/_base_/schedules/cifar10_bs128.py b/configs/_base_/schedules/cifar10_bs128.py index f134dbce..67747612 100644 --- a/configs/_base_/schedules/cifar10_bs128.py +++ b/configs/_base_/schedules/cifar10_bs128.py @@ -1,6 +1,5 @@ # optimizer optimizer = dict(type='SGD', lr=0.1, momentum=0.9, weight_decay=0.0001) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict(policy='step', step=[100, 150]) runner = dict(type='EpochBasedRunner', max_epochs=200) diff --git a/configs/_base_/schedules/cub_bs64.py b/configs/_base_/schedules/cub_bs64.py index 93cce6a7..68e17cdf 100644 --- a/configs/_base_/schedules/cub_bs64.py +++ b/configs/_base_/schedules/cub_bs64.py @@ -1,7 +1,6 @@ # optimizer optimizer = dict( type='SGD', lr=0.01, momentum=0.9, weight_decay=0.0005, nesterov=True) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict( policy='CosineAnnealing', @@ -10,4 +9,5 @@ lr_config = dict( warmup_iters=5, warmup_ratio=0.01, warmup_by_epoch=True) + runner = dict(type='EpochBasedRunner', max_epochs=100) diff --git a/configs/_base_/schedules/imagenet_bs1024_adamw_conformer.py b/configs/_base_/schedules/imagenet_bs1024_adamw_conformer.py index 92f18017..d2f8dbdd 100644 --- a/configs/_base_/schedules/imagenet_bs1024_adamw_conformer.py +++ b/configs/_base_/schedules/imagenet_bs1024_adamw_conformer.py @@ -14,7 +14,6 @@ optimizer = dict( eps=1e-8, betas=(0.9, 0.999), paramwise_cfg=paramwise_cfg) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict( diff --git a/configs/_base_/schedules/imagenet_bs1024_adamw_swin.py b/configs/_base_/schedules/imagenet_bs1024_adamw_swin.py index 2ad035cb..3464f77f 100644 --- a/configs/_base_/schedules/imagenet_bs1024_adamw_swin.py +++ b/configs/_base_/schedules/imagenet_bs1024_adamw_swin.py @@ -15,7 +15,6 @@ optimizer = dict( eps=1e-8, betas=(0.9, 0.999), paramwise_cfg=paramwise_cfg) -optimizer_config = dict(grad_clip=dict(max_norm=5.0)) # learning policy lr_config = dict( diff --git a/configs/_base_/schedules/imagenet_bs1024_coslr.py b/configs/_base_/schedules/imagenet_bs1024_coslr.py index ee84e7a6..1a3ca6fe 100644 --- a/configs/_base_/schedules/imagenet_bs1024_coslr.py +++ b/configs/_base_/schedules/imagenet_bs1024_coslr.py @@ -1,6 +1,5 @@ # optimizer optimizer = dict(type='SGD', lr=0.8, momentum=0.9, weight_decay=5e-5) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict( policy='CosineAnnealing', diff --git a/configs/_base_/schedules/imagenet_bs1024_linearlr_bn_nowd.py b/configs/_base_/schedules/imagenet_bs1024_linearlr_bn_nowd.py index 99fbdda9..7825c78a 100644 --- a/configs/_base_/schedules/imagenet_bs1024_linearlr_bn_nowd.py +++ b/configs/_base_/schedules/imagenet_bs1024_linearlr_bn_nowd.py @@ -5,7 +5,6 @@ optimizer = dict( momentum=0.9, weight_decay=0.00004, paramwise_cfg=dict(norm_decay_mult=0)) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict( policy='poly', diff --git a/configs/_base_/schedules/imagenet_bs2048.py b/configs/_base_/schedules/imagenet_bs2048.py index 93fdebfd..43ed92f9 100644 --- a/configs/_base_/schedules/imagenet_bs2048.py +++ b/configs/_base_/schedules/imagenet_bs2048.py @@ -1,7 +1,7 @@ # optimizer optimizer = dict( type='SGD', lr=0.8, momentum=0.9, weight_decay=0.0001, nesterov=True) -optimizer_config = dict(grad_clip=None) + # learning policy lr_config = dict( policy='step', diff --git a/configs/_base_/schedules/imagenet_bs2048_AdamW.py b/configs/_base_/schedules/imagenet_bs2048_AdamW.py index 6d4f2081..5f09fc0a 100644 --- a/configs/_base_/schedules/imagenet_bs2048_AdamW.py +++ b/configs/_base_/schedules/imagenet_bs2048_AdamW.py @@ -2,7 +2,6 @@ # In ClassyVision, the lr is set to 0.003 for bs4096. # In this implementation(bs2048), lr = 0.003 / 4096 * (32bs * 64gpus) = 0.0015 optimizer = dict(type='AdamW', lr=0.0015, weight_decay=0.3) -optimizer_config = dict(grad_clip=dict(max_norm=1.0)) # specific to vit pretrain paramwise_cfg = dict( diff --git a/configs/_base_/schedules/imagenet_bs2048_coslr.py b/configs/_base_/schedules/imagenet_bs2048_coslr.py index b9e77f2c..2a4e5bd1 100644 --- a/configs/_base_/schedules/imagenet_bs2048_coslr.py +++ b/configs/_base_/schedules/imagenet_bs2048_coslr.py @@ -1,7 +1,6 @@ # optimizer optimizer = dict( type='SGD', lr=0.8, momentum=0.9, weight_decay=0.0001, nesterov=True) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict( policy='CosineAnnealing', diff --git a/configs/_base_/schedules/imagenet_bs2048_rsb.py b/configs/_base_/schedules/imagenet_bs2048_rsb.py index e021cb0f..78a3e393 100644 --- a/configs/_base_/schedules/imagenet_bs2048_rsb.py +++ b/configs/_base_/schedules/imagenet_bs2048_rsb.py @@ -1,6 +1,6 @@ # optimizer optimizer = dict(type='Lamb', lr=0.005, weight_decay=0.02) -optimizer_config = dict(grad_clip=None) + # learning policy lr_config = dict( policy='CosineAnnealing', diff --git a/configs/_base_/schedules/imagenet_bs256.py b/configs/_base_/schedules/imagenet_bs256.py index 3b5d1984..3450e1a5 100644 --- a/configs/_base_/schedules/imagenet_bs256.py +++ b/configs/_base_/schedules/imagenet_bs256.py @@ -1,6 +1,5 @@ # optimizer optimizer = dict(type='SGD', lr=0.1, momentum=0.9, weight_decay=0.0001) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict(policy='step', step=[30, 60, 90]) runner = dict(type='EpochBasedRunner', max_epochs=100) diff --git a/configs/_base_/schedules/imagenet_bs256_140e.py b/configs/_base_/schedules/imagenet_bs256_140e.py index caba1577..bc541e6a 100644 --- a/configs/_base_/schedules/imagenet_bs256_140e.py +++ b/configs/_base_/schedules/imagenet_bs256_140e.py @@ -1,6 +1,6 @@ # optimizer optimizer = dict(type='SGD', lr=0.1, momentum=0.9, weight_decay=0.0001) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict(policy='step', step=[40, 80, 120]) + runner = dict(type='EpochBasedRunner', max_epochs=140) diff --git a/configs/_base_/schedules/imagenet_bs256_200e_coslr_warmup.py b/configs/_base_/schedules/imagenet_bs256_200e_coslr_warmup.py index 49456b2c..7710010b 100644 --- a/configs/_base_/schedules/imagenet_bs256_200e_coslr_warmup.py +++ b/configs/_base_/schedules/imagenet_bs256_200e_coslr_warmup.py @@ -1,6 +1,5 @@ # optimizer optimizer = dict(type='SGD', lr=0.1, momentum=0.9, weight_decay=0.0001) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict( policy='CosineAnnealing', diff --git a/configs/_base_/schedules/imagenet_bs256_coslr.py b/configs/_base_/schedules/imagenet_bs256_coslr.py index 779b4792..2b413120 100644 --- a/configs/_base_/schedules/imagenet_bs256_coslr.py +++ b/configs/_base_/schedules/imagenet_bs256_coslr.py @@ -1,6 +1,6 @@ # optimizer optimizer = dict(type='SGD', lr=0.1, momentum=0.9, weight_decay=0.0001) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict(policy='CosineAnnealing', min_lr=0) + runner = dict(type='EpochBasedRunner', max_epochs=100) diff --git a/configs/_base_/schedules/imagenet_bs256_epochstep.py b/configs/_base_/schedules/imagenet_bs256_epochstep.py index 2347a043..f312dc07 100644 --- a/configs/_base_/schedules/imagenet_bs256_epochstep.py +++ b/configs/_base_/schedules/imagenet_bs256_epochstep.py @@ -1,6 +1,5 @@ # optimizer optimizer = dict(type='SGD', lr=0.045, momentum=0.9, weight_decay=0.00004) -optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict(policy='step', gamma=0.98, step=1) runner = dict(type='EpochBasedRunner', max_epochs=300) diff --git a/configs/_base_/schedules/imagenet_bs4096_AdamW.py b/configs/_base_/schedules/imagenet_bs4096_AdamW.py index 75b00d80..8c3bb326 100644 --- a/configs/_base_/schedules/imagenet_bs4096_AdamW.py +++ b/configs/_base_/schedules/imagenet_bs4096_AdamW.py @@ -11,7 +11,6 @@ optimizer = dict( weight_decay=0.3, paramwise_cfg=paramwise_cfg, ) -optimizer_config = dict(grad_clip=dict(max_norm=1.0)) # learning policy lr_config = dict( diff --git a/configs/convmixer/convmixer-1024-20_10xb64_in1k.py b/configs/convmixer/convmixer-1024-20_10xb64_in1k.py index 58694d6e..115e209e 100644 --- a/configs/convmixer/convmixer-1024-20_10xb64_in1k.py +++ b/configs/convmixer/convmixer-1024-20_10xb64_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=0.01) runner = dict(type='EpochBasedRunner', max_epochs=150) diff --git a/configs/convmixer/convmixer-1536-20_10xb64_in1k.py b/configs/convmixer/convmixer-1536-20_10xb64_in1k.py index 17a75595..d121ff13 100644 --- a/configs/convmixer/convmixer-1536-20_10xb64_in1k.py +++ b/configs/convmixer/convmixer-1536-20_10xb64_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=0.01) runner = dict(type='EpochBasedRunner', max_epochs=150) diff --git a/configs/convmixer/convmixer-768-32_10xb64_in1k.py b/configs/convmixer/convmixer-768-32_10xb64_in1k.py index fa4c0602..164205f9 100644 --- a/configs/convmixer/convmixer-768-32_10xb64_in1k.py +++ b/configs/convmixer/convmixer-768-32_10xb64_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=0.01) runner = dict(type='EpochBasedRunner', max_epochs=300) diff --git a/configs/convnext/convnext-base_32xb128_in1k.py b/configs/convnext/convnext-base_32xb128_in1k.py index 6c0450a4..d27871b9 100644 --- a/configs/convnext/convnext-base_32xb128_in1k.py +++ b/configs/convnext/convnext-base_32xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=128) optimizer = dict(lr=4e-3) diff --git a/configs/convnext/convnext-large_64xb64_in1k.py b/configs/convnext/convnext-large_64xb64_in1k.py index 1faae253..6919c65b 100644 --- a/configs/convnext/convnext-large_64xb64_in1k.py +++ b/configs/convnext/convnext-large_64xb64_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=64) optimizer = dict(lr=4e-3) diff --git a/configs/convnext/convnext-small_32xb128_in1k.py b/configs/convnext/convnext-small_32xb128_in1k.py index d820fc6c..095b9c92 100644 --- a/configs/convnext/convnext-small_32xb128_in1k.py +++ b/configs/convnext/convnext-small_32xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=128) optimizer = dict(lr=4e-3) diff --git a/configs/convnext/convnext-tiny_32xb128_in1k.py b/configs/convnext/convnext-tiny_32xb128_in1k.py index 46d0185d..ef305b75 100644 --- a/configs/convnext/convnext-tiny_32xb128_in1k.py +++ b/configs/convnext/convnext-tiny_32xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=128) optimizer = dict(lr=4e-3) diff --git a/configs/convnext/convnext-xlarge_64xb64_in1k.py b/configs/convnext/convnext-xlarge_64xb64_in1k.py index 72849013..d4d7dd81 100644 --- a/configs/convnext/convnext-xlarge_64xb64_in1k.py +++ b/configs/convnext/convnext-xlarge_64xb64_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=64) optimizer = dict(lr=4e-3) diff --git a/configs/deit/deit-base_ft-16xb32_in1k-384px.py b/configs/deit/deit-base_ft-16xb32_in1k-384px.py index db444168..4908ceec 100644 --- a/configs/deit/deit-base_ft-16xb32_in1k-384px.py +++ b/configs/deit/deit-base_ft-16xb32_in1k-384px.py @@ -4,6 +4,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + # model settings model = dict( type='ImageClassifier', diff --git a/configs/deit/deit-small_pt-4xb256_in1k.py b/configs/deit/deit-small_pt-4xb256_in1k.py index 550f0801..86a0a019 100644 --- a/configs/deit/deit-small_pt-4xb256_in1k.py +++ b/configs/deit/deit-small_pt-4xb256_in1k.py @@ -6,6 +6,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + # model settings model = dict( type='ImageClassifier', diff --git a/configs/fp16/resnet50_b32x8_fp16_dynamic_imagenet.py b/configs/fp16/resnet50_b32x8_fp16_dynamic_imagenet.py deleted file mode 100644 index 9075a894..00000000 --- a/configs/fp16/resnet50_b32x8_fp16_dynamic_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = '../resnet/resnet50_8xb32-fp16-dynamic_in1k.py' - -_deprecation_ = dict( - expected='../resnet/resnet50_8xb32-fp16-dynamic_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/mlp_mixer/mlp-mixer-base-p16_64xb64_in1k.py b/configs/mlp_mixer/mlp-mixer-base-p16_64xb64_in1k.py index e35dae55..aff28f71 100644 --- a/configs/mlp_mixer/mlp-mixer-base-p16_64xb64_in1k.py +++ b/configs/mlp_mixer/mlp-mixer-base-p16_64xb64_in1k.py @@ -4,3 +4,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs4096_AdamW.py', '../_base_/default_runtime.py', ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) diff --git a/configs/mlp_mixer/mlp-mixer-large-p16_64xb64_in1k.py b/configs/mlp_mixer/mlp-mixer-large-p16_64xb64_in1k.py index 459563c8..6d1b9b38 100644 --- a/configs/mlp_mixer/mlp-mixer-large-p16_64xb64_in1k.py +++ b/configs/mlp_mixer/mlp-mixer-large-p16_64xb64_in1k.py @@ -4,3 +4,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs4096_AdamW.py', '../_base_/default_runtime.py', ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) diff --git a/configs/mobilenet_v2/mobilenet_v2_b32x8_imagenet.py b/configs/mobilenet_v2/mobilenet_v2_b32x8_imagenet.py deleted file mode 100644 index 26c2b6de..00000000 --- a/configs/mobilenet_v2/mobilenet_v2_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'mobilenet-v2_8xb32_in1k.py' - -_deprecation_ = dict( - expected='mobilenet-v2_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/mobilenet_v3/mobilenet_v3_large_imagenet.py b/configs/mobilenet_v3/mobilenet_v3_large_imagenet.py deleted file mode 100644 index 93e89a49..00000000 --- a/configs/mobilenet_v3/mobilenet_v3_large_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'mobilenet-v3-large_8xb32_in1k.py' - -_deprecation_ = dict( - expected='mobilenet-v3-large_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/mobilenet_v3/mobilenet_v3_small_cifar.py b/configs/mobilenet_v3/mobilenet_v3_small_cifar.py deleted file mode 100644 index c09bd1cd..00000000 --- a/configs/mobilenet_v3/mobilenet_v3_small_cifar.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'mobilenet-v3-small_8xb16_cifar10.py' - -_deprecation_ = dict( - expected='mobilenet-v3-small_8xb16_cifar10.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/mobilenet_v3/mobilenet_v3_small_imagenet.py b/configs/mobilenet_v3/mobilenet_v3_small_imagenet.py deleted file mode 100644 index 15debd0f..00000000 --- a/configs/mobilenet_v3/mobilenet_v3_small_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'mobilenet-v3-small_8xb32_in1k.py' - -_deprecation_ = dict( - expected='mobilenet-v3-small_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/poolformer/poolformer-m36_32xb128_in1k.py b/configs/poolformer/poolformer-m36_32xb128_in1k.py index 1937a786..c20e6c16 100644 --- a/configs/poolformer/poolformer-m36_32xb128_in1k.py +++ b/configs/poolformer/poolformer-m36_32xb128_in1k.py @@ -5,4 +5,6 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=4e-3) diff --git a/configs/poolformer/poolformer-m48_32xb128_in1k.py b/configs/poolformer/poolformer-m48_32xb128_in1k.py index a65b76a6..dbc574ba 100644 --- a/configs/poolformer/poolformer-m48_32xb128_in1k.py +++ b/configs/poolformer/poolformer-m48_32xb128_in1k.py @@ -5,4 +5,6 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=4e-3) diff --git a/configs/poolformer/poolformer-s12_32xb128_in1k.py b/configs/poolformer/poolformer-s12_32xb128_in1k.py index 98027c07..918fa8a8 100644 --- a/configs/poolformer/poolformer-s12_32xb128_in1k.py +++ b/configs/poolformer/poolformer-s12_32xb128_in1k.py @@ -5,4 +5,6 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=4e-3) diff --git a/configs/poolformer/poolformer-s24_32xb128_in1k.py b/configs/poolformer/poolformer-s24_32xb128_in1k.py index 97742594..58405e69 100644 --- a/configs/poolformer/poolformer-s24_32xb128_in1k.py +++ b/configs/poolformer/poolformer-s24_32xb128_in1k.py @@ -5,4 +5,6 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=4e-3) diff --git a/configs/poolformer/poolformer-s36_32xb128_in1k.py b/configs/poolformer/poolformer-s36_32xb128_in1k.py index 4d742d37..e4f19d89 100644 --- a/configs/poolformer/poolformer-s36_32xb128_in1k.py +++ b/configs/poolformer/poolformer-s36_32xb128_in1k.py @@ -5,4 +5,6 @@ _base_ = [ '../_base_/default_runtime.py', ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + optimizer = dict(lr=4e-3) diff --git a/configs/repmlp/repmlp-base_8xb64_in1k-256px.py b/configs/repmlp/repmlp-base_8xb64_in1k-256px.py index 6bf61c8f..14e12638 100644 --- a/configs/repmlp/repmlp-base_8xb64_in1k-256px.py +++ b/configs/repmlp/repmlp-base_8xb64_in1k-256px.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict(backbone=dict(img_size=256)) img_norm_cfg = dict( diff --git a/configs/repmlp/repmlp-base_8xb64_in1k.py b/configs/repmlp/repmlp-base_8xb64_in1k.py index 2feecf48..11e938a7 100644 --- a/configs/repmlp/repmlp-base_8xb64_in1k.py +++ b/configs/repmlp/repmlp-base_8xb64_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + img_norm_cfg = dict( mean=[123.675, 116.28, 103.53], std=[58.395, 57.12, 57.375], to_rgb=True) test_pipeline = [ diff --git a/configs/resnest/resnest101_b64x32_imagenet.py b/configs/resnest/resnest101_b64x32_imagenet.py deleted file mode 100644 index 31c36477..00000000 --- a/configs/resnest/resnest101_b64x32_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnest101_32xb64_in1k.py' - -_deprecation_ = dict( - expected='resnest101_32xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnest/resnest200_b32x64_imagenet.py b/configs/resnest/resnest200_b32x64_imagenet.py deleted file mode 100644 index 8e62865f..00000000 --- a/configs/resnest/resnest200_b32x64_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnest200_64xb32_in1k.py' - -_deprecation_ = dict( - expected='resnest200_64xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnest/resnest269_b32x64_imagenet.py b/configs/resnest/resnest269_b32x64_imagenet.py deleted file mode 100644 index 0f8b76c5..00000000 --- a/configs/resnest/resnest269_b32x64_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnest269_64xb32_in1k.py' - -_deprecation_ = dict( - expected='resnest269_64xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnest/resnest50_b64x32_imagenet.py b/configs/resnest/resnest50_b64x32_imagenet.py deleted file mode 100644 index c0da422a..00000000 --- a/configs/resnest/resnest50_b64x32_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnest50_32xb64_in1k.py' - -_deprecation_ = dict( - expected='resnest50_32xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet101_b16x8_cifar10.py b/configs/resnet/resnet101_b16x8_cifar10.py deleted file mode 100644 index 57758f2d..00000000 --- a/configs/resnet/resnet101_b16x8_cifar10.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet101_8xb16_cifar10.py' - -_deprecation_ = dict( - expected='resnet101_8xb16_cifar10.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet101_b32x8_imagenet.py b/configs/resnet/resnet101_b32x8_imagenet.py deleted file mode 100644 index 8d45adc3..00000000 --- a/configs/resnet/resnet101_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet101_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnet101_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet152_b16x8_cifar10.py b/configs/resnet/resnet152_b16x8_cifar10.py deleted file mode 100644 index 5c76cac6..00000000 --- a/configs/resnet/resnet152_b16x8_cifar10.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet152_8xb16_cifar10.py' - -_deprecation_ = dict( - expected='resnet152_8xb16_cifar10.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet152_b32x8_imagenet.py b/configs/resnet/resnet152_b32x8_imagenet.py deleted file mode 100644 index 133638a4..00000000 --- a/configs/resnet/resnet152_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet152_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnet152_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet18_b16x8_cifar10.py b/configs/resnet/resnet18_b16x8_cifar10.py deleted file mode 100644 index 5a25a0e4..00000000 --- a/configs/resnet/resnet18_b16x8_cifar10.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet18_8xb16_cifar10.py' - -_deprecation_ = dict( - expected='resnet18_8xb16_cifar10.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet18_b32x8_imagenet.py b/configs/resnet/resnet18_b32x8_imagenet.py deleted file mode 100644 index e6d08f60..00000000 --- a/configs/resnet/resnet18_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet18_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnet18_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet34_b32x8_imagenet.py b/configs/resnet/resnet34_b32x8_imagenet.py deleted file mode 100644 index 144613a3..00000000 --- a/configs/resnet/resnet34_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet34_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnet34_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b16x8_cifar100.py b/configs/resnet/resnet50_b16x8_cifar100.py deleted file mode 100644 index b49b6f45..00000000 --- a/configs/resnet/resnet50_b16x8_cifar100.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb16_cifar100.py' - -_deprecation_ = dict( - expected='resnet50_8xb16_cifar100.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b16x8_cifar10_mixup.py b/configs/resnet/resnet50_b16x8_cifar10_mixup.py deleted file mode 100644 index 409a40e9..00000000 --- a/configs/resnet/resnet50_b16x8_cifar10_mixup.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb16-mixup_cifar10.py' - -_deprecation_ = dict( - expected='resnet50_8xb16-mixup_cifar10.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b32x8_coslr_imagenet.py b/configs/resnet/resnet50_b32x8_coslr_imagenet.py deleted file mode 100644 index 647153b4..00000000 --- a/configs/resnet/resnet50_b32x8_coslr_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb32-coslr_in1k.py' - -_deprecation_ = dict( - expected='resnet50_8xb32-coslr_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b32x8_cutmix_imagenet.py b/configs/resnet/resnet50_b32x8_cutmix_imagenet.py deleted file mode 100644 index 87b27d5a..00000000 --- a/configs/resnet/resnet50_b32x8_cutmix_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb32-cutmix_in1k.py' - -_deprecation_ = dict( - expected='resnet50_8xb32-cutmix_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b32x8_imagenet.py b/configs/resnet/resnet50_b32x8_imagenet.py deleted file mode 100644 index 7d7f69ec..00000000 --- a/configs/resnet/resnet50_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnet50_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b32x8_label_smooth_imagenet.py b/configs/resnet/resnet50_b32x8_label_smooth_imagenet.py deleted file mode 100644 index 6e874155..00000000 --- a/configs/resnet/resnet50_b32x8_label_smooth_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb32-lbs_in1k.py' - -_deprecation_ = dict( - expected='resnet50_8xb32-lbs_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b32x8_mixup_imagenet.py b/configs/resnet/resnet50_b32x8_mixup_imagenet.py deleted file mode 100644 index 3405319d..00000000 --- a/configs/resnet/resnet50_b32x8_mixup_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_8xb32-mixup_in1k.py' - -_deprecation_ = dict( - expected='resnet50_8xb32-mixup_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b64x32_warmup_coslr_imagenet.py b/configs/resnet/resnet50_b64x32_warmup_coslr_imagenet.py deleted file mode 100644 index 4724616c..00000000 --- a/configs/resnet/resnet50_b64x32_warmup_coslr_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_32xb64-warmup-coslr_in1k.py' - -_deprecation_ = dict( - expected='resnet50_32xb64-warmup-coslr_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b64x32_warmup_imagenet.py b/configs/resnet/resnet50_b64x32_warmup_imagenet.py deleted file mode 100644 index 3e350541..00000000 --- a/configs/resnet/resnet50_b64x32_warmup_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_32xb64-warmup_in1k.py' - -_deprecation_ = dict( - expected='resnet50_32xb64-warmup_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnet50_b64x32_warmup_label_smooth_imagenet.py b/configs/resnet/resnet50_b64x32_warmup_label_smooth_imagenet.py deleted file mode 100644 index 2544e33f..00000000 --- a/configs/resnet/resnet50_b64x32_warmup_label_smooth_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnet50_32xb64-warmup-lbs_in1k.py' - -_deprecation_ = dict( - expected='resnet50_32xb64-warmup-lbs_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnetv1d101_b32x8_imagenet.py b/configs/resnet/resnetv1d101_b32x8_imagenet.py deleted file mode 100644 index e736937e..00000000 --- a/configs/resnet/resnetv1d101_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnetv1d101_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnetv1d101_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnetv1d152_b32x8_imagenet.py b/configs/resnet/resnetv1d152_b32x8_imagenet.py deleted file mode 100644 index 88e5b9f0..00000000 --- a/configs/resnet/resnetv1d152_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnetv1d152_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnetv1d152_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnet/resnetv1d50_b32x8_imagenet.py b/configs/resnet/resnetv1d50_b32x8_imagenet.py deleted file mode 100644 index 5455e055..00000000 --- a/configs/resnet/resnetv1d50_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnetv1d50_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnetv1d50_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnext/resnext101_32x4d_b32x8_imagenet.py b/configs/resnext/resnext101_32x4d_b32x8_imagenet.py deleted file mode 100644 index 07d66c35..00000000 --- a/configs/resnext/resnext101_32x4d_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnext101-32x4d_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnext101-32x4d_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnext/resnext101_32x8d_b32x8_imagenet.py b/configs/resnext/resnext101_32x8d_b32x8_imagenet.py deleted file mode 100644 index 071ca60f..00000000 --- a/configs/resnext/resnext101_32x8d_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnext101-32x8d_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnext101-32x8d_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnext/resnext152_32x4d_b32x8_imagenet.py b/configs/resnext/resnext152_32x4d_b32x8_imagenet.py deleted file mode 100644 index 6d05c8b3..00000000 --- a/configs/resnext/resnext152_32x4d_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnext152-32x4d_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnext152-32x4d_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/resnext/resnext50_32x4d_b32x8_imagenet.py b/configs/resnext/resnext50_32x4d_b32x8_imagenet.py deleted file mode 100644 index 92ae0639..00000000 --- a/configs/resnext/resnext50_32x4d_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'resnext50-32x4d_8xb32_in1k.py' - -_deprecation_ = dict( - expected='resnext50-32x4d_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/seresnet/seresnet101_b32x8_imagenet.py b/configs/seresnet/seresnet101_b32x8_imagenet.py deleted file mode 100644 index 46daa09a..00000000 --- a/configs/seresnet/seresnet101_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'seresnet101_8xb32_in1k.py' - -_deprecation_ = dict( - expected='seresnet101_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/seresnet/seresnet50_b32x8_imagenet.py b/configs/seresnet/seresnet50_b32x8_imagenet.py deleted file mode 100644 index 0fb9df39..00000000 --- a/configs/seresnet/seresnet50_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'seresnet50_8xb32_in1k.py' - -_deprecation_ = dict( - expected='seresnet50_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/seresnet/seresnext101_32x4d_b32x8_imagenet.py b/configs/seresnet/seresnext101_32x4d_b32x8_imagenet.py deleted file mode 100644 index cb99ec66..00000000 --- a/configs/seresnet/seresnext101_32x4d_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'seresnext101-32x4d_8xb32_in1k.py' - -_deprecation_ = dict( - expected='seresnext101-32x4d_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/seresnet/seresnext50_32x4d_b32x8_imagenet.py b/configs/seresnet/seresnext50_32x4d_b32x8_imagenet.py deleted file mode 100644 index 49229604..00000000 --- a/configs/seresnet/seresnext50_32x4d_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'seresnext50-32x4d_8xb32_in1k.py' - -_deprecation_ = dict( - expected='seresnext50-32x4d_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/shufflenet_v1/shufflenet_v1_1x_b64x16_linearlr_bn_nowd_imagenet.py b/configs/shufflenet_v1/shufflenet_v1_1x_b64x16_linearlr_bn_nowd_imagenet.py deleted file mode 100644 index 03121979..00000000 --- a/configs/shufflenet_v1/shufflenet_v1_1x_b64x16_linearlr_bn_nowd_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'shufflenet-v1-1x_16xb64_in1k.py' - -_deprecation_ = dict( - expected='shufflenet-v1-1x_16xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/swin_transformer/swin-base_16xb64_in1k-384px.py b/configs/swin_transformer/swin-base_16xb64_in1k-384px.py index 711a0d6d..bce56957 100644 --- a/configs/swin_transformer/swin-base_16xb64_in1k-384px.py +++ b/configs/swin_transformer/swin-base_16xb64_in1k-384px.py @@ -5,3 +5,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs1024_adamw_swin.py', '../_base_/default_runtime.py' ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) diff --git a/configs/swin_transformer/swin-base_16xb64_in1k.py b/configs/swin_transformer/swin-base_16xb64_in1k.py index 2a4548af..b6f5cc33 100644 --- a/configs/swin_transformer/swin-base_16xb64_in1k.py +++ b/configs/swin_transformer/swin-base_16xb64_in1k.py @@ -4,3 +4,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs1024_adamw_swin.py', '../_base_/default_runtime.py' ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) diff --git a/configs/swin_transformer/swin-large_16xb64_in1k-384px.py b/configs/swin_transformer/swin-large_16xb64_in1k-384px.py index a7f0ad27..4e900947 100644 --- a/configs/swin_transformer/swin-large_16xb64_in1k-384px.py +++ b/configs/swin_transformer/swin-large_16xb64_in1k-384px.py @@ -5,3 +5,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs1024_adamw_swin.py', '../_base_/default_runtime.py' ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) diff --git a/configs/swin_transformer/swin-large_16xb64_in1k.py b/configs/swin_transformer/swin-large_16xb64_in1k.py index 4e875c59..ed6ebd2b 100644 --- a/configs/swin_transformer/swin-large_16xb64_in1k.py +++ b/configs/swin_transformer/swin-large_16xb64_in1k.py @@ -5,3 +5,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs1024_adamw_swin.py', '../_base_/default_runtime.py' ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) diff --git a/configs/swin_transformer/swin-small_16xb64_in1k.py b/configs/swin_transformer/swin-small_16xb64_in1k.py index aa1fa21b..fa1f6041 100644 --- a/configs/swin_transformer/swin-small_16xb64_in1k.py +++ b/configs/swin_transformer/swin-small_16xb64_in1k.py @@ -4,3 +4,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs1024_adamw_swin.py', '../_base_/default_runtime.py' ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) diff --git a/configs/swin_transformer/swin-tiny_16xb64_in1k.py b/configs/swin_transformer/swin-tiny_16xb64_in1k.py index e1ed022a..343f4c64 100644 --- a/configs/swin_transformer/swin-tiny_16xb64_in1k.py +++ b/configs/swin_transformer/swin-tiny_16xb64_in1k.py @@ -4,3 +4,5 @@ _base_ = [ '../_base_/schedules/imagenet_bs1024_adamw_swin.py', '../_base_/default_runtime.py' ] + +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) diff --git a/configs/swin_transformer/swin_base_224_b16x64_300e_imagenet.py b/configs/swin_transformer/swin_base_224_b16x64_300e_imagenet.py deleted file mode 100644 index 912c379b..00000000 --- a/configs/swin_transformer/swin_base_224_b16x64_300e_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'swin-base_16xb64_in1k.py' - -_deprecation_ = dict( - expected='swin-base_16xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/swin_transformer/swin_base_384_evalonly_imagenet.py b/configs/swin_transformer/swin_base_384_evalonly_imagenet.py deleted file mode 100644 index 9ed58889..00000000 --- a/configs/swin_transformer/swin_base_384_evalonly_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'swin-base_16xb64_in1k-384px.py' - -_deprecation_ = dict( - expected='swin-base_16xb64_in1k-384px.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/swin_transformer/swin_large_224_evalonly_imagenet.py b/configs/swin_transformer/swin_large_224_evalonly_imagenet.py deleted file mode 100644 index 5ebb54a5..00000000 --- a/configs/swin_transformer/swin_large_224_evalonly_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'swin-large_16xb64_in1k.py' - -_deprecation_ = dict( - expected='swin-large_16xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/swin_transformer/swin_large_384_evalonly_imagenet.py b/configs/swin_transformer/swin_large_384_evalonly_imagenet.py deleted file mode 100644 index 9a59f5b6..00000000 --- a/configs/swin_transformer/swin_large_384_evalonly_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'swin-large_16xb64_in1k-384px.py' - -_deprecation_ = dict( - expected='swin-large_16xb64_in1k-384px.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/swin_transformer/swin_small_224_b16x64_300e_imagenet.py b/configs/swin_transformer/swin_small_224_b16x64_300e_imagenet.py deleted file mode 100644 index a747aa4d..00000000 --- a/configs/swin_transformer/swin_small_224_b16x64_300e_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'swin-small_16xb64_in1k.py' - -_deprecation_ = dict( - expected='swin-small_16xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/swin_transformer/swin_tiny_224_b16x64_300e_imagenet.py b/configs/swin_transformer/swin_tiny_224_b16x64_300e_imagenet.py deleted file mode 100644 index 2160eb91..00000000 --- a/configs/swin_transformer/swin_tiny_224_b16x64_300e_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'swin-tiny_16xb64_in1k.py' - -_deprecation_ = dict( - expected='swin-tiny_16xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/tnt/tnt_s_patch16_224_evalonly_imagenet.py b/configs/tnt/tnt_s_patch16_224_evalonly_imagenet.py deleted file mode 100644 index 3c054d4a..00000000 --- a/configs/tnt/tnt_s_patch16_224_evalonly_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'tnt-s-p16_16xb64_in1k.py' - -_deprecation_ = dict( - expected='tnt-s-p16_16xb64_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/twins/twins-pcpvt-base_8xb128_in1k.py b/configs/twins/twins-pcpvt-base_8xb128_in1k.py index 8ea9adc3..3092bfa4 100644 --- a/configs/twins/twins-pcpvt-base_8xb128_in1k.py +++ b/configs/twins/twins-pcpvt-base_8xb128_in1k.py @@ -5,6 +5,9 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict( + optimizer=dict(_delete_=True, grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=128) paramwise_cfg = dict(_delete=True, norm_decay_mult=0.0, bias_decay_mult=0.0) @@ -18,7 +21,6 @@ optimizer = dict( eps=1e-8, betas=(0.9, 0.999), paramwise_cfg=paramwise_cfg) -optimizer_config = dict(_delete_=True, grad_clip=dict(max_norm=5.0)) # learning policy lr_config = dict( diff --git a/configs/twins/twins-svt-base_8xb128_in1k.py b/configs/twins/twins-svt-base_8xb128_in1k.py index e2db2301..3864bdea 100644 --- a/configs/twins/twins-svt-base_8xb128_in1k.py +++ b/configs/twins/twins-svt-base_8xb128_in1k.py @@ -5,6 +5,9 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict( + optimizer=dict(_delete_=True, grad_clip=dict(max_norm=5.0))) + data = dict(samples_per_gpu=128) paramwise_cfg = dict(_delete=True, norm_decay_mult=0.0, bias_decay_mult=0.0) @@ -18,9 +21,7 @@ optimizer = dict( eps=1e-8, betas=(0.9, 0.999), paramwise_cfg=paramwise_cfg) -optimizer_config = dict(_delete_=True, grad_clip=dict(max_norm=5.0)) -# learning policy lr_config = dict( policy='CosineAnnealing', by_epoch=True, diff --git a/configs/van/van-base_8xb128_in1k.py b/configs/van/van-base_8xb128_in1k.py index c98c8f3d..9a972b66 100644 --- a/configs/van/van-base_8xb128_in1k.py +++ b/configs/van/van-base_8xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + # Note that the mean and variance used here are different from other configs img_norm_cfg = dict( mean=[127.5, 127.5, 127.5], std=[127.5, 127.5, 127.5], to_rgb=True) diff --git a/configs/van/van-large_8xb128_in1k.py b/configs/van/van-large_8xb128_in1k.py index 4fbc7099..61d8fee1 100644 --- a/configs/van/van-large_8xb128_in1k.py +++ b/configs/van/van-large_8xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + # Note that the mean and variance used here are different from other configs img_norm_cfg = dict( mean=[127.5, 127.5, 127.5], std=[127.5, 127.5, 127.5], to_rgb=True) diff --git a/configs/van/van-small_8xb128_in1k.py b/configs/van/van-small_8xb128_in1k.py index 62dffcc2..9d823739 100644 --- a/configs/van/van-small_8xb128_in1k.py +++ b/configs/van/van-small_8xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + # Note that the mean and variance used here are different from other configs img_norm_cfg = dict( mean=[127.5, 127.5, 127.5], std=[127.5, 127.5, 127.5], to_rgb=True) diff --git a/configs/van/van-tiny_8xb128_in1k.py b/configs/van/van-tiny_8xb128_in1k.py index fa3fa685..7a7bf558 100644 --- a/configs/van/van-tiny_8xb128_in1k.py +++ b/configs/van/van-tiny_8xb128_in1k.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=5.0))) + # Note that the mean and variance used here are different from other configs img_norm_cfg = dict( mean=[127.5, 127.5, 127.5], std=[127.5, 127.5, 127.5], to_rgb=True) diff --git a/configs/vgg/vgg11_b32x8_imagenet.py b/configs/vgg/vgg11_b32x8_imagenet.py deleted file mode 100644 index b15396be..00000000 --- a/configs/vgg/vgg11_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg11_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg11_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg11bn_b32x8_imagenet.py b/configs/vgg/vgg11bn_b32x8_imagenet.py deleted file mode 100644 index 350c9bef..00000000 --- a/configs/vgg/vgg11bn_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg11bn_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg11bn_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg13_b32x8_imagenet.py b/configs/vgg/vgg13_b32x8_imagenet.py deleted file mode 100644 index 6198ca2c..00000000 --- a/configs/vgg/vgg13_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg13_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg13_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg13bn_b32x8_imagenet.py b/configs/vgg/vgg13bn_b32x8_imagenet.py deleted file mode 100644 index 0a715d7f..00000000 --- a/configs/vgg/vgg13bn_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg13bn_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg13bn_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg16_8xb16_voc.py b/configs/vgg/vgg16_8xb16_voc.py index d096959f..2aaaf99b 100644 --- a/configs/vgg/vgg16_8xb16_voc.py +++ b/configs/vgg/vgg16_8xb16_voc.py @@ -22,4 +22,5 @@ optimizer = dict( optimizer_config = dict(grad_clip=None) # learning policy lr_config = dict(policy='step', step=20, gamma=0.1) + runner = dict(type='EpochBasedRunner', max_epochs=40) diff --git a/configs/vgg/vgg16_b32x8_imagenet.py b/configs/vgg/vgg16_b32x8_imagenet.py deleted file mode 100644 index 2fefb949..00000000 --- a/configs/vgg/vgg16_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg16_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg16_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg16bn_b32x8_imagenet.py b/configs/vgg/vgg16bn_b32x8_imagenet.py deleted file mode 100644 index cb21917f..00000000 --- a/configs/vgg/vgg16bn_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg16bn_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg16bn_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg19_b32x8_imagenet.py b/configs/vgg/vgg19_b32x8_imagenet.py deleted file mode 100644 index e8b8b25a..00000000 --- a/configs/vgg/vgg19_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg19_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg19_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vgg/vgg19bn_b32x8_imagenet.py b/configs/vgg/vgg19bn_b32x8_imagenet.py deleted file mode 100644 index f615496c..00000000 --- a/configs/vgg/vgg19bn_b32x8_imagenet.py +++ /dev/null @@ -1,6 +0,0 @@ -_base_ = 'vgg19bn_8xb32_in1k.py' - -_deprecation_ = dict( - expected='vgg19bn_8xb32_in1k.py', - reference='https://github.com/open-mmlab/mmclassification/pull/508', -) diff --git a/configs/vision_transformer/vit-base-p16_ft-64xb64_in1k-384.py b/configs/vision_transformer/vit-base-p16_ft-64xb64_in1k-384.py index 259685e4..72c3d162 100644 --- a/configs/vision_transformer/vit-base-p16_ft-64xb64_in1k-384.py +++ b/configs/vision_transformer/vit-base-p16_ft-64xb64_in1k-384.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict(backbone=dict(img_size=384)) img_norm_cfg = dict( diff --git a/configs/vision_transformer/vit-base-p16_pt-64xb64_in1k-224.py b/configs/vision_transformer/vit-base-p16_pt-64xb64_in1k-224.py index 79c323b1..ae4a5f7e 100644 --- a/configs/vision_transformer/vit-base-p16_pt-64xb64_in1k-224.py +++ b/configs/vision_transformer/vit-base-p16_pt-64xb64_in1k-224.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict( head=dict(hidden_dim=3072), train_cfg=dict( diff --git a/configs/vision_transformer/vit-base-p32_ft-64xb64_in1k-384.py b/configs/vision_transformer/vit-base-p32_ft-64xb64_in1k-384.py index d83daa2a..be54eb6b 100644 --- a/configs/vision_transformer/vit-base-p32_ft-64xb64_in1k-384.py +++ b/configs/vision_transformer/vit-base-p32_ft-64xb64_in1k-384.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict(backbone=dict(img_size=384)) img_norm_cfg = dict( diff --git a/configs/vision_transformer/vit-base-p32_pt-64xb64_in1k-224.py b/configs/vision_transformer/vit-base-p32_pt-64xb64_in1k-224.py index a477e211..ebe18192 100644 --- a/configs/vision_transformer/vit-base-p32_pt-64xb64_in1k-224.py +++ b/configs/vision_transformer/vit-base-p32_pt-64xb64_in1k-224.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict( head=dict(hidden_dim=3072), train_cfg=dict( diff --git a/configs/vision_transformer/vit-large-p16_ft-64xb64_in1k-384.py b/configs/vision_transformer/vit-large-p16_ft-64xb64_in1k-384.py index 8032085b..0713532a 100644 --- a/configs/vision_transformer/vit-large-p16_ft-64xb64_in1k-384.py +++ b/configs/vision_transformer/vit-large-p16_ft-64xb64_in1k-384.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict(backbone=dict(img_size=384)) img_norm_cfg = dict( diff --git a/configs/vision_transformer/vit-large-p16_pt-64xb64_in1k-224.py b/configs/vision_transformer/vit-large-p16_pt-64xb64_in1k-224.py index 5cf7a7d3..8deeb2af 100644 --- a/configs/vision_transformer/vit-large-p16_pt-64xb64_in1k-224.py +++ b/configs/vision_transformer/vit-large-p16_pt-64xb64_in1k-224.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict( head=dict(hidden_dim=3072), train_cfg=dict( diff --git a/configs/vision_transformer/vit-large-p32_ft-64xb64_in1k-384.py b/configs/vision_transformer/vit-large-p32_ft-64xb64_in1k-384.py index c7889386..77d2b88d 100644 --- a/configs/vision_transformer/vit-large-p32_ft-64xb64_in1k-384.py +++ b/configs/vision_transformer/vit-large-p32_ft-64xb64_in1k-384.py @@ -6,6 +6,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict(backbone=dict(img_size=384)) img_norm_cfg = dict( diff --git a/configs/vision_transformer/vit-large-p32_pt-64xb64_in1k-224.py b/configs/vision_transformer/vit-large-p32_pt-64xb64_in1k-224.py index 773ade87..81821fd1 100644 --- a/configs/vision_transformer/vit-large-p32_pt-64xb64_in1k-224.py +++ b/configs/vision_transformer/vit-large-p32_pt-64xb64_in1k-224.py @@ -5,6 +5,8 @@ _base_ = [ '../_base_/default_runtime.py' ] +default_hooks = dict(optimizer=dict(grad_clip=dict(max_norm=1.0))) + model = dict( head=dict(hidden_dim=3072), train_cfg=dict(