Skip to content

Commit a834a5a

Browse files
committed
fix the case of no selected kv during inference
1 parent aa359ea commit a834a5a

File tree

2 files changed

+5
-2
lines changed

2 files changed

+5
-2
lines changed

native_sparse_attention_pytorch/native_sparse_attention.py

Lines changed: 4 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -454,6 +454,8 @@ def forward_inference(
454454

455455
# select out the sparse kv segments as defined by compressed attention map as importance score
456456

457+
fmask = None
458+
457459
if has_selected_kv_for_fine_attn:
458460
if self.query_heads_share_selected_kv:
459461
importance_scores = reduce(importance_scores, 'b (h grouped_queries) ... -> b h ...', 'mean', grouped_queries = self.num_grouped_queries)
@@ -493,7 +495,8 @@ def forward_inference(
493495

494496
fsim = einsum(fq, fk, 'b h gh i d, b h j d -> b h gh i j') * scale
495497

496-
fsim = einx.where('b h i j, b h gh i j, -> b h gh i j', fmask, fsim, max_neg_value(fsim))
498+
if exists(fmask):
499+
fsim = einx.where('b h i j, b h gh i j, -> b h gh i j', fmask, fsim, max_neg_value(fsim))
497500

498501
fattn = fsim.softmax(dim = -1)
499502

pyproject.toml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
[project]
22
name = "native-sparse-attention-pytorch"
3-
version = "0.1.1"
3+
version = "0.1.2"
44
description = "Native Sparse Attention"
55
authors = [
66
{ name = "Phil Wang", email = "lucidrains@gmail.com" }

0 commit comments

Comments (0)