# Model settings model = dict( type='ImageClassifier', backbone=dict( type='TinyViT', arch='5m', img_size=(224, 224), window_size=[7, 7, 14, 7], out_indices=(3, ), drop_path_rate=0.0, gap_before_final_norm=True, init_cfg=[ dict( type='TruncNormal', layer=['Conv2d', 'Linear'], std=.02, bias=0.), dict(type='Constant', layer=['LayerNorm'], val=1., bias=0.), ]), head=dict( type='LinearClsHead', num_classes=1000, in_channels=320, loss=dict(type='CrossEntropyLoss', loss_weight=1.0), ))