Skip to content

Commit a3f6647

Browse files
fix
Signed-off-by: Lucas Wilkinson <[email protected]>
1 parent 9839db5 commit a3f6647

File tree

1 file changed

+4
-2
lines changed

1 file changed

+4
-2
lines changed

vllm/v1/attention/backends/mla/flashmla_sparse.py

Lines changed: 4 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -636,8 +636,10 @@ def __init__(
636 636
vllm_config.model_config.max_model_len
637 637
)
638 638
self.prefill_workspace_shape = (prefill_workspace_size, head_size)
639-
self.prefill_bf16_workspace = current_workspace_manager().get_simultaneous(
640-
(self.prefill_workspace_shape, torch.bfloat16)
639+
(self.prefill_bf16_workspace,) = (
640+
current_workspace_manager().get_simultaneous(
641+
(self.prefill_workspace_shape, torch.bfloat16)
642+
)
641 643
)
642 644

643 645
def _forward_bf16_kv(

0 commit comments

Comments
 (0)