Fix bottleneck attn transpose typo; hopefully these train better now.
parent
80075b0b8a
commit
b81e79aae9
|
@ -122,7 +122,7 @@ class BottleneckAttn(nn.Module):
|
|||
attn_logits = attn_logits + self.pos_embed(q) # B, num_heads, H * W, H * W
|
||||
|
||||
attn_out = attn_logits.softmax(dim=-1)
|
||||
attn_out = (attn_out @ v).transpose(1, 2).reshape(B, self.dim_out, H, W) # B, dim_out, H, W
|
||||
attn_out = (attn_out @ v).transpose(-1, -2).reshape(B, self.dim_out, H, W) # B, dim_out, H, W
|
||||
attn_out = self.pool(attn_out)
|
||||
return attn_out
|
||||
|
||||
|
|
Loading…
Reference in New Issue