From 5b41431511d3788a53e5e7fe7c31e794bb22f616 Mon Sep 17 00:00:00 2001 From: "xiexinchen.vendor" Date: Thu, 14 Jul 2022 01:49:52 +0000 Subject: [PATCH] [Fix] Fix optim wrapper configs --- .../deeplabv3_r50-d8_480x480_40k_pascal_context.py | 1 + .../deeplabv3_r50-d8_480x480_40k_pascal_context_59.py | 1 + .../deeplabv3_r50-d8_480x480_80k_pascal_context.py | 1 + .../deeplabv3_r50-d8_480x480_80k_pascal_context_59.py | 1 + .../deeplabv3plus_r50-d8_480x480_40k_pascal_context.py | 1 + .../deeplabv3plus_r50-d8_480x480_40k_pascal_context_59.py | 1 + .../deeplabv3plus_r50-d8_480x480_80k_pascal_context.py | 1 + .../deeplabv3plus_r50-d8_480x480_80k_pascal_context_59.py | 1 + configs/dnlnet/dnl_r50-d8_769x769_80k_cityscapes.py | 3 ++- configs/fastscnn/fast_scnn_lr0.12_8x4_160k_cityscapes.py | 1 + configs/fcn/fcn_r50-d8_480x480_40k_pascal_context.py | 1 + configs/fcn/fcn_r50-d8_480x480_40k_pascal_context_59.py | 1 + configs/fcn/fcn_r50-d8_480x480_80k_pascal_context.py | 1 + configs/fcn/fcn_r50-d8_480x480_80k_pascal_context_59.py | 1 + configs/hrnet/fcn_hr18_480x480_40k_pascal_context.py | 1 + configs/hrnet/fcn_hr18_480x480_40k_pascal_context_59.py | 1 + configs/hrnet/fcn_hr18_480x480_80k_pascal_context.py | 1 + configs/hrnet/fcn_hr18_480x480_80k_pascal_context_59.py | 1 + .../pspnet/pspnet_r50-d8_480x480_40k_pascal_context.py | 1 + .../pspnet/pspnet_r50-d8_480x480_40k_pascal_context_59.py | 1 + .../pspnet/pspnet_r50-d8_480x480_80k_pascal_context.py | 1 + .../pspnet/pspnet_r50-d8_480x480_80k_pascal_context_59.py | 1 + .../segmenter_vit-b_mask_8x1_512x512_160k_ade20k.py | 2 +- .../segmenter_vit-l_mask_8x1_512x512_160k_ade20k.py | 2 +- .../segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py | 2 +- .../segmenter_vit-t_mask_8x1_512x512_160k_ade20k.py | 2 +- configs/setr/setr_mla_512x512_160k_b8_ade20k.py | 8 ++++---- configs/setr/setr_naive_512x512_160k_b16_ade20k.py | 8 ++++---- configs/setr/setr_pup_512x512_160k_b16_ade20k.py | 8 ++++---- .../setr/setr_vit-large_mla_8x1_768x768_80k_cityscapes.py | 7 ++++--- .../setr_vit-large_naive_8x1_768x768_80k_cityscapes.py | 7 ++++--- .../setr/setr_vit-large_pup_8x1_768x768_80k_cityscapes.py | 6 ++++-- 32 files changed, 51 insertions(+), 25 deletions(-) diff --git a/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context.py b/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context.py index fb878a17b..3c4e753a2 100644 --- a/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context.py +++ b/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context_59.py b/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context_59.py index 844a6785b..e3b6c3690 100644 --- a/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context_59.py +++ b/configs/deeplabv3/deeplabv3_r50-d8_480x480_40k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context.py b/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context.py index 4bc3e157d..ba8c7ded9 100644 --- a/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context.py +++ b/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context_59.py b/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context_59.py index f97dd4ae6..d34bd8933 100644 --- a/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context_59.py +++ b/configs/deeplabv3/deeplabv3_r50-d8_480x480_80k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context.py b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context.py index 5e1d2fdcd..95b56d03e 100644 --- a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context.py +++ b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context_59.py b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context_59.py index 83ee53336..459c62dc5 100644 --- a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context_59.py +++ b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_40k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context.py b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context.py index 20fc61c22..5ff7fcb41 100644 --- a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context.py +++ b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context_59.py b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context_59.py index 4ed60a788..84aaf25b5 100644 --- a/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context_59.py +++ b/configs/deeplabv3plus/deeplabv3plus_r50-d8_480x480_80k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/dnlnet/dnl_r50-d8_769x769_80k_cityscapes.py b/configs/dnlnet/dnl_r50-d8_769x769_80k_cityscapes.py index f0a7ab814..cb379c1e0 100644 --- a/configs/dnlnet/dnl_r50-d8_769x769_80k_cityscapes.py +++ b/configs/dnlnet/dnl_r50-d8_769x769_80k_cityscapes.py @@ -10,6 +10,7 @@ model = dict( decode_head=dict(align_corners=True), auxiliary_head=dict(align_corners=True), test_cfg=dict(mode='slide', crop_size=(769, 769), stride=(513, 513))) -optimizer = dict( + +optim_wrapper = dict( paramwise_cfg=dict( custom_keys=dict(theta=dict(wd_mult=0.), phi=dict(wd_mult=0.)))) diff --git a/configs/fastscnn/fast_scnn_lr0.12_8x4_160k_cityscapes.py b/configs/fastscnn/fast_scnn_lr0.12_8x4_160k_cityscapes.py index 8eedbceb4..e7f68bfe7 100644 --- a/configs/fastscnn/fast_scnn_lr0.12_8x4_160k_cityscapes.py +++ b/configs/fastscnn/fast_scnn_lr0.12_8x4_160k_cityscapes.py @@ -12,3 +12,4 @@ test_dataloader = val_dataloader # Re-config the optimizer. optimizer = dict(type='SGD', lr=0.12, momentum=0.9, weight_decay=4e-5) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context.py b/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context.py index ee12a83ec..d99cb0dc3 100644 --- a/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context.py +++ b/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context.py @@ -10,3 +10,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context_59.py b/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context_59.py index cdcc3a2ce..64c941052 100644 --- a/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context_59.py +++ b/configs/fcn/fcn_r50-d8_480x480_40k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context.py b/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context.py index 38e57872a..1eeafb8a5 100644 --- a/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context.py +++ b/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context.py @@ -10,3 +10,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context_59.py b/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context_59.py index 2751974f2..c11a9bbb6 100644 --- a/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context_59.py +++ b/configs/fcn/fcn_r50-d8_480x480_80k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/hrnet/fcn_hr18_480x480_40k_pascal_context.py b/configs/hrnet/fcn_hr18_480x480_40k_pascal_context.py index 43f109ca5..f744baec7 100644 --- a/configs/hrnet/fcn_hr18_480x480_40k_pascal_context.py +++ b/configs/hrnet/fcn_hr18_480x480_40k_pascal_context.py @@ -9,3 +9,4 @@ model = dict( decode_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/hrnet/fcn_hr18_480x480_40k_pascal_context_59.py b/configs/hrnet/fcn_hr18_480x480_40k_pascal_context_59.py index 45a65c16a..0daaa35eb 100644 --- a/configs/hrnet/fcn_hr18_480x480_40k_pascal_context_59.py +++ b/configs/hrnet/fcn_hr18_480x480_40k_pascal_context_59.py @@ -9,3 +9,4 @@ model = dict( decode_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/hrnet/fcn_hr18_480x480_80k_pascal_context.py b/configs/hrnet/fcn_hr18_480x480_80k_pascal_context.py index 349c3f9a1..4f37e8ade 100644 --- a/configs/hrnet/fcn_hr18_480x480_80k_pascal_context.py +++ b/configs/hrnet/fcn_hr18_480x480_80k_pascal_context.py @@ -9,3 +9,4 @@ model = dict( decode_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/hrnet/fcn_hr18_480x480_80k_pascal_context_59.py b/configs/hrnet/fcn_hr18_480x480_80k_pascal_context_59.py index 283d71598..2c35cb9c3 100644 --- a/configs/hrnet/fcn_hr18_480x480_80k_pascal_context_59.py +++ b/configs/hrnet/fcn_hr18_480x480_80k_pascal_context_59.py @@ -9,3 +9,4 @@ model = dict( decode_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context.py b/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context.py index 8c92d85fe..08a214448 100644 --- a/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context.py +++ b/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context_59.py b/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context_59.py index a8270e9af..b65449573 100644 --- a/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context_59.py +++ b/configs/pspnet/pspnet_r50-d8_480x480_40k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context.py b/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context.py index 040784448..a7d82478c 100644 --- a/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context.py +++ b/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=60), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context_59.py b/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context_59.py index e596f8d4d..b7abc1bdd 100644 --- a/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context_59.py +++ b/configs/pspnet/pspnet_r50-d8_480x480_80k_pascal_context_59.py @@ -11,3 +11,4 @@ model = dict( auxiliary_head=dict(num_classes=59), test_cfg=dict(mode='slide', crop_size=(480, 480), stride=(320, 320))) optimizer = dict(type='SGD', lr=0.004, momentum=0.9, weight_decay=0.0001) +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) diff --git a/configs/segmenter/segmenter_vit-b_mask_8x1_512x512_160k_ade20k.py b/configs/segmenter/segmenter_vit-b_mask_8x1_512x512_160k_ade20k.py index 556b87a8a..a4bae5064 100644 --- a/configs/segmenter/segmenter_vit-b_mask_8x1_512x512_160k_ade20k.py +++ b/configs/segmenter/segmenter_vit-b_mask_8x1_512x512_160k_ade20k.py @@ -7,7 +7,7 @@ crop_size = (512, 512) data_preprocessor = dict(size=crop_size) model = dict(data_preprocessor=data_preprocessor) optimizer = dict(lr=0.001, weight_decay=0.0) - +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) train_dataloader = dict( # num_gpus: 8 -> batch_size: 8 batch_size=1) diff --git a/configs/segmenter/segmenter_vit-l_mask_8x1_512x512_160k_ade20k.py b/configs/segmenter/segmenter_vit-l_mask_8x1_512x512_160k_ade20k.py index 5fb0b417e..302acdecb 100644 --- a/configs/segmenter/segmenter_vit-l_mask_8x1_512x512_160k_ade20k.py +++ b/configs/segmenter/segmenter_vit-l_mask_8x1_512x512_160k_ade20k.py @@ -25,7 +25,7 @@ model = dict( test_cfg=dict(mode='slide', crop_size=(640, 640), stride=(608, 608))) optimizer = dict(lr=0.001, weight_decay=0.0) - +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) train_dataloader = dict( # num_gpus: 8 -> batch_size: 8 batch_size=1) diff --git a/configs/segmenter/segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py b/configs/segmenter/segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py index ac6e029a7..b19fd4140 100644 --- a/configs/segmenter/segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py +++ b/configs/segmenter/segmenter_vit-s_mask_8x1_512x512_160k_ade20k.py @@ -29,7 +29,7 @@ model = dict( type='CrossEntropyLoss', use_sigmoid=False, loss_weight=1.0))) optimizer = dict(lr=0.001, weight_decay=0.0) - +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) train_dataloader = dict( # num_gpus: 8 -> batch_size: 8 batch_size=1) diff --git a/configs/segmenter/segmenter_vit-t_mask_8x1_512x512_160k_ade20k.py b/configs/segmenter/segmenter_vit-t_mask_8x1_512x512_160k_ade20k.py index 1ca387ae3..221a9f9a6 100644 --- a/configs/segmenter/segmenter_vit-t_mask_8x1_512x512_160k_ade20k.py +++ b/configs/segmenter/segmenter_vit-t_mask_8x1_512x512_160k_ade20k.py @@ -19,7 +19,7 @@ model = dict( embed_dims=192)) optimizer = dict(lr=0.001, weight_decay=0.0) - +optim_wrapper = dict(type='OptimWrapper', optimizer=optimizer) train_dataloader = dict( # num_gpus: 8 -> batch_size: 8 batch_size=1) diff --git a/configs/setr/setr_mla_512x512_160k_b8_ade20k.py b/configs/setr/setr_mla_512x512_160k_b8_ade20k.py index a6feaa95c..1c6e2845f 100644 --- a/configs/setr/setr_mla_512x512_160k_b8_ade20k.py +++ b/configs/setr/setr_mla_512x512_160k_b8_ade20k.py @@ -79,11 +79,11 @@ model = dict( test_cfg=dict(mode='slide', crop_size=(512, 512), stride=(341, 341)), ) -optimizer = dict( - lr=0.001, - weight_decay=0.0, +optimizer = dict(lr=0.001, weight_decay=0.0) +optim_wrapper = dict( + type='OptimWrapper', + optimizer=optimizer, paramwise_cfg=dict(custom_keys={'head': dict(lr_mult=10.)})) - # num_gpus: 8 -> batch_size: 8 train_dataloader = dict(batch_size=1) val_dataloader = dict(batch_size=1) diff --git a/configs/setr/setr_naive_512x512_160k_b16_ade20k.py b/configs/setr/setr_naive_512x512_160k_b16_ade20k.py index 46cb463e7..109996c1b 100644 --- a/configs/setr/setr_naive_512x512_160k_b16_ade20k.py +++ b/configs/setr/setr_naive_512x512_160k_b16_ade20k.py @@ -61,11 +61,11 @@ model = dict( test_cfg=dict(mode='slide', crop_size=(512, 512), stride=(341, 341)), ) -optimizer = dict( - lr=0.01, - weight_decay=0.0, +optimizer = dict(lr=0.01, weight_decay=0.0) +optim_wrapper = dict( + type='OptimWrapper', + optimizer=optimizer, paramwise_cfg=dict(custom_keys={'head': dict(lr_mult=10.)})) - # num_gpus: 8 -> batch_size: 16 train_dataloader = dict(batch_size=2) val_dataloader = dict(batch_size=1) diff --git a/configs/setr/setr_pup_512x512_160k_b16_ade20k.py b/configs/setr/setr_pup_512x512_160k_b16_ade20k.py index 0bc301408..e9bfb2201 100644 --- a/configs/setr/setr_pup_512x512_160k_b16_ade20k.py +++ b/configs/setr/setr_pup_512x512_160k_b16_ade20k.py @@ -61,11 +61,11 @@ model = dict( test_cfg=dict(mode='slide', crop_size=(512, 512), stride=(341, 341)), ) -optimizer = dict( - lr=0.001, - weight_decay=0.0, +optimizer = dict(lr=0.001, weight_decay=0.0) +optim_wrapper = dict( + type='OptimWrapper', + optimizer=optimizer, paramwise_cfg=dict(custom_keys={'head': dict(lr_mult=10.)})) - # num_gpus: 8 -> batch_size: 16 train_dataloader = dict(batch_size=2) val_dataloader = dict(batch_size=1) diff --git a/configs/setr/setr_vit-large_mla_8x1_768x768_80k_cityscapes.py b/configs/setr/setr_vit-large_mla_8x1_768x768_80k_cityscapes.py index b8b933afb..026557f50 100644 --- a/configs/setr/setr_vit-large_mla_8x1_768x768_80k_cityscapes.py +++ b/configs/setr/setr_vit-large_mla_8x1_768x768_80k_cityscapes.py @@ -13,9 +13,10 @@ model = dict( type='Pretrained', checkpoint='pretrain/vit_large_p16.pth')), test_cfg=dict(mode='slide', crop_size=(768, 768), stride=(512, 512))) -optimizer = dict( - lr=0.002, - weight_decay=0.0, +optimizer = dict(lr=0.002, weight_decay=0.0) +optim_wrapper = dict( + type='OptimWrapper', + optimizer=optimizer, paramwise_cfg=dict(custom_keys={'head': dict(lr_mult=10.)})) train_dataloader = dict(batch_size=1) val_dataloader = dict(batch_size=1) diff --git a/configs/setr/setr_vit-large_naive_8x1_768x768_80k_cityscapes.py b/configs/setr/setr_vit-large_naive_8x1_768x768_80k_cityscapes.py index 040fe24fc..db4931730 100644 --- a/configs/setr/setr_vit-large_naive_8x1_768x768_80k_cityscapes.py +++ b/configs/setr/setr_vit-large_naive_8x1_768x768_80k_cityscapes.py @@ -14,10 +14,11 @@ model = dict( type='Pretrained', checkpoint='pretrain/vit_large_p16.pth')), test_cfg=dict(mode='slide', crop_size=(768, 768), stride=(512, 512))) -optimizer = dict( - weight_decay=0.0, +optimizer = dict(weight_decay=0.0) +optim_wrapper = dict( + type='OptimWrapper', + optimizer=optimizer, paramwise_cfg=dict(custom_keys={'head': dict(lr_mult=10.)})) - train_dataloader = dict(batch_size=1) val_dataloader = dict(batch_size=1) test_dataloader = val_dataloader diff --git a/configs/setr/setr_vit-large_pup_8x1_768x768_80k_cityscapes.py b/configs/setr/setr_vit-large_pup_8x1_768x768_80k_cityscapes.py index 1cfe0b39c..999ab1803 100644 --- a/configs/setr/setr_vit-large_pup_8x1_768x768_80k_cityscapes.py +++ b/configs/setr/setr_vit-large_pup_8x1_768x768_80k_cityscapes.py @@ -59,8 +59,10 @@ model = dict( ], test_cfg=dict(mode='slide', crop_size=crop_size, stride=(512, 512))) -optimizer = dict( - weight_decay=0.0, +optimizer = dict(weight_decay=0.0) +optim_wrapper = dict( + type='OptimWrapper', + optimizer=optimizer, paramwise_cfg=dict(custom_keys={'head': dict(lr_mult=10.)})) train_dataloader = dict(batch_size=1)