[fix] fix sparse attention (#397)

Lijiachen1018 · lijiachen19 · web-flow · commit 5779ce9122c2 · 2025-11-22T17:57:55.000+08:00
fix ascend attention

Co-authored-by: lijiachen19 <lijiachen19@huawei.com>
diff --git a/ucm/integration/vllm/patch/patch_funcs/v092/vllm_ascend_adapt.py b/ucm/integration/vllm/patch/patch_funcs/v092/vllm_ascend_adapt.py
@@ -112,6 +112,13 @@ def maybe_execute_sparse_attention_finished(
         ):
             if not has_ucm_sparse():
                 return
+            ucm_sparse = get_ucm_sparse()
+            attn_metadata = forward_context.attn_metadata
+            if attn_metadata is None:
+                return
+            ucm_sparse.attention_finished(
+                query, key, value, attn_output, layer_name, forward_context
+            )
 
         attention_v1.maybe_execute_sparse_attention_finished = (
             maybe_execute_sparse_attention_finished