From 7f96538052eb411003c2c38a7013353aa31ffc62 Mon Sep 17 00:00:00 2001 From: Ross Wightman Date: Fri, 31 May 2024 11:59:51 -0700 Subject: [PATCH] Add missing lkc act for mobileclip fastvits --- timm/models/fastvit.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/timm/models/fastvit.py b/timm/models/fastvit.py index 7c918887..66142105 100644 --- a/timm/models/fastvit.py +++ b/timm/models/fastvit.py @@ -1420,7 +1420,7 @@ def _checkpoint_filter_fn(state_dict, model): return state_dict # non-original checkpoint, no remapping needed state_dict = state_dict.get('state_dict', state_dict) - if 'image_encoder.model.head.proj' in state_dict: + if 'image_encoder.model.patch_embed.0.rbr_conv.0.conv.weight' in state_dict: # remap MobileCLIP checkpoints prefix = 'image_encoder.model.' else: @@ -1598,6 +1598,7 @@ def fastvit_mci0(pretrained=False, **kwargs): se_downsamples=(False, False, True, True), pos_embs=(None, None, None, partial(RepConditionalPosEnc, spatial_shape=(7, 7))), token_mixers=("repmixer", "repmixer", "repmixer", "attention"), + lkc_use_act=True, ) return _create_fastvit('fastvit_mci0', pretrained=pretrained, **dict(model_args, **kwargs)) @@ -1612,6 +1613,7 @@ def fastvit_mci1(pretrained=False, **kwargs): se_downsamples=(False, False, True, True), pos_embs=(None, None, None, partial(RepConditionalPosEnc, spatial_shape=(7, 7))), token_mixers=("repmixer", "repmixer", "repmixer", "attention"), + lkc_use_act=True, ) return _create_fastvit('fastvit_mci1', pretrained=pretrained, **dict(model_args, **kwargs)) @@ -1626,5 +1628,6 @@ def fastvit_mci2(pretrained=False, **kwargs): se_downsamples=(False, False, True, True), pos_embs=(None, None, None, partial(RepConditionalPosEnc, spatial_shape=(7, 7))), token_mixers=("repmixer", "repmixer", "repmixer", "attention"), + lkc_use_act=True, ) - return _create_fastvit('fastvit_mci2', pretrained=pretrained, **dict(model_args, **kwargs)) \ No newline at end of file + return _create_fastvit('fastvit_mci2', pretrained=pretrained, **dict(model_args, **kwargs))