diff --git a/vllm/v1/attention/backends/mla/common.py b/vllm/v1/attention/backends/mla/common.py index b920fd929e85..3efd25c03497 100755 --- a/vllm/v1/attention/backends/mla/common.py +++ b/vllm/v1/attention/backends/mla/common.py @@ -799,7 +799,7 @@ def build( dcp_local_seq_lens[:num_decodes] = seq_lens[ :num_decodes ] // self.dcp_world_size + ( - self.dcp_rank <= (seq_lens[:num_decodes] - 1) % self.dcp_world_size + self.dcp_rank < seq_lens[:num_decodes] % self.dcp_world_size ) assert num_decodes + num_prefills == num_reqs