mirror of
https://github.com/wassname/vllm.git
synced 2026-06-27 18:27:02 +08:00
[ROCM] fix native attention function call (#13650)
This commit is contained in:
@@ -717,7 +717,6 @@ class ROCmFlashAttentionImpl(AttentionImpl):
|
||||
self.num_heads,
|
||||
self.head_size,
|
||||
self.scale,
|
||||
causal_mask,
|
||||
attn_masks,
|
||||
)
|
||||
else:
|
||||
|
||||
Reference in New Issue
Block a user