mmselfsup/configs/selfsup/byol/byol_resnet50_8xb256-fp16-accum2-coslr-200e_in1k.py
2022-07-18 11:06:44 +08:00

29 lines
816 B
Python

# Base config files this config builds on (model, dataset, schedule, runtime).
_base_ = [
    '../_base_/models/byol.py',
    '../_base_/datasets/imagenet_byol.py',
    '../_base_/schedules/lars_coslr-200e_in1k.py',
    '../_base_/default_runtime.py',
]

# Data: batch size given to the training dataloader.
train_dataloader = {'batch_size': 256}

# Optimization: LARS hyper-parameters, kept as a top-level name so the same
# dict object can be referenced from the optimizer wrapper below.
optimizer = {
    'type': 'LARS',
    'lr': 4.8,
    'momentum': 0.9,
    'weight_decay': 1e-6,
}

# Optimizer wrapper: AMP wrapper with a loss scale of 512 and
# `accumulative_iters=2` (the "fp16-accum2" part of the file name).
optim_wrapper = {
    'type': 'AmpOptimWrapper',
    'loss_scale': 512.0,
    'optimizer': optimizer,
    'accumulative_iters': 2,
    'paramwise_cfg': {
        # Per-key overrides: every entry sets decay_mult=0 and
        # lars_exclude=True.
        'custom_keys': {
            'bn': {'decay_mult': 0, 'lars_exclude': True},
            'bias': {'decay_mult': 0, 'lars_exclude': True},
            # 'downsample.1' is the bn layer inside the ResNet block
            # downsample module.
            'downsample.1': {'decay_mult': 0, 'lars_exclude': True},
        },
    },
}

# Runtime: checkpoint hook setting, max_keep_ckpts=3.
default_hooks = {'checkpoint': {'max_keep_ckpts': 3}}