Update implementation of scaled_index_add and index_select_cat with fallback

Add a check that the inputs have the embedding size (a multiple of 256) and dtype (float16) required by the optimized xFormers scaled_index_add and index_select_cat, and fall back to a pure PyTorch implementation otherwise.
qasfb-patch-1
qasfb 2023-09-01 15:07:26 +02:00 committed by GitHub
parent 6a6261546c
commit 942cc2dee4
1 changed file with 19 additions and 1 deletion
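
For context, here is a minimal, self-contained sketch of what the pure PyTorch fallback branches in this patch compute when the optimized kernels cannot be used (input not float16, or embedding dimension not a multiple of 256). The helper names (scaled_index_add_fallback, index_select_cat_fallback) and the tensor shapes are illustrative only and are not part of the commit:

import torch

# Illustrative reproduction of the fallback branches added below; the function
# names and shapes are made up for this example and do not appear in the patch.

def scaled_index_add_fallback(input, index, source, scaling, alpha):
    # Pure PyTorch: out[index[i]] = input[index[i]] + alpha * (scaling * source[i])
    return torch.index_add(input, dim=0, source=scaling * source, index=index, alpha=alpha)

def index_select_cat_fallback(sources, indices):
    # Pure PyTorch: select the indexed rows of each 2D source and concatenate them flattened
    return torch.cat([s[i.long()].flatten() for s, i in zip(sources, indices)], dim=0)

B, N, D = 8, 16, 384               # embed dim 384 is not a multiple of 256
x = torch.randn(B, N, D)           # float32, so the optimized kernel would be skipped anyway
residual = torch.randn(4, N, D)    # one residual slice per selected batch element
index = torch.tensor([0, 2, 5, 7])
scaling = torch.ones(D)

out = scaled_index_add_fallback(x, index, residual, scaling, alpha=0.5)
print(out.shape)                   # torch.Size([8, 16, 384])

rows = index_select_cat_fallback([x.flatten(1)], [index])
print(rows.shape)                  # torch.Size([24576]) == 4 * 16 * 384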

@@ -27,8 +27,26 @@ logger = logging.getLogger("dinov2")
 XFORMERS_ENABLED = os.environ.get("XFORMERS_DISABLED") is None
 try:
     if XFORMERS_ENABLED:
-        from xformers.ops import fmha, scaled_index_add, index_select_cat
+        from xformers.ops import scaled_index_add as _scaled_index_add, index_select_cat as _index_select_cat
+
+        def scaled_index_add(input, index, source, scaling, alpha):
+            is_proper_embed_dim = input.shape[-1] % 256 == 0
+            is_float16 = input.dtype == torch.half
+            if is_proper_embed_dim and is_float16:
+                return _scaled_index_add(input, index, source, scaling, alpha)
+            else:
+                return torch.index_add(input, dim=0, source=scaling * source, index=index, alpha=alpha)
+
+        def index_select_cat(sources, indices):
+            is_proper_embed_dim = all(s.shape[-1] % 256 == 0 for s in sources)
+            is_float16 = all(s.dtype == torch.half for s in sources)
+            if is_proper_embed_dim and is_float16:
+                return _index_select_cat(sources, indices)
+            else:
+                return torch.cat([s[i.long()].flatten() for s, i in zip(sources, indices)], dim=0)
+
         XFORMERS_AVAILABLE = True
         warnings.warn("xFormers is available (Block)")
     else: