@@ -176,16 +176,30 @@ def test_ascend_mla_metadata_default(self):
176176
177177class TestAscendMLAMetadataBuilder (TestBase ):
178178
179- def test_ascend_mla_metadata_builder_default (self ):
179+ @patch ('vllm.distributed.parallel_state.get_dcp_group' )
180+ @patch ('vllm.distributed.parallel_state._DCP' ,
181+ new_callable = lambda : MagicMock (spec = GroupCoordinator ))
182+ @patch ("vllm.distributed.get_decode_context_model_parallel_world_size" ,
183+ return_value = 1 )
184+ def test_ascend_mla_metadata_builder_default (self , mock_get_dcp_size ,
185+ mock_dcp , mock_get_dcp_group ):
180186 mock_vllm_config = MagicMock ()
181187 mock_vllm_config .model_config .max_model_len = 1024
182188 mock_vllm_config .model_config .get_head_size .return_value = 64
183189 mock_vllm_config .model_config .dtype = torch .float16
184190 mock_vllm_config .cache_config .block_size = 16
185191 mock_vllm_config .scheduler_config .max_num_seqs = 4
192+ mock_vllm_config .scheduler_config .decode_max_num_seqs = 4
186193 mock_vllm_config .scheduler_config .chunked_prefill_enabled = False
187194 mock_device = 'cpu'
188195
196+ mock_dcp .world_size = 1
197+ dcp_group = MagicMock (spec = GroupCoordinator )
198+ dcp_group .rank_in_group = 0
199+ dcp_group .world_size = 1
200+ dcp_group .device_group = MagicMock ()
201+ mock_get_dcp_group .return_value = dcp_group
202+
189203 mock_vllm_config .speculative_config = None
190204
191205 ascend_config = MagicMock ()
@@ -200,16 +214,31 @@ def test_ascend_mla_metadata_builder_default(self):
200214 builder .chunked_prefill_enabled ,
201215 mock_vllm_config .scheduler_config .chunked_prefill_enabled )
202216
203- def test_ascend_mla_metadata_builder_spec_decode (self ):
217+ @patch ('vllm.distributed.parallel_state.get_dcp_group' )
218+ @patch ('vllm.distributed.parallel_state._DCP' ,
219+ new_callable = lambda : MagicMock (spec = GroupCoordinator ))
220+ @patch ("vllm.distributed.get_decode_context_model_parallel_world_size" ,
221+ return_value = 1 )
222+ def test_ascend_mla_metadata_builder_spec_decode (self , mock_get_dcp_size ,
223+ mock_dcp ,
224+ mock_get_dcp_group ):
204225 mock_vllm_config = MagicMock ()
205226 mock_vllm_config .model_config .max_model_len = 1024
206227 mock_vllm_config .model_config .get_head_size .return_value = 64
207228 mock_vllm_config .model_config .dtype = torch .float16
208229 mock_vllm_config .cache_config .block_size = 16
209230 mock_vllm_config .scheduler_config .max_num_seqs = 4
231+ mock_vllm_config .scheduler_config .decode_max_num_seqs = 4
210232 mock_vllm_config .scheduler_config .chunked_prefill_enabled = False
211233 mock_device = 'cpu'
212234
235+ mock_dcp .world_size = 1
236+ dcp_group = MagicMock (spec = GroupCoordinator )
237+ dcp_group .rank_in_group = 0
238+ dcp_group .world_size = 1
239+ dcp_group .device_group = MagicMock ()
240+ mock_get_dcp_group .return_value = dcp_group
241+
213242 mock_spec_config = MagicMock ()
214243 mock_spec_config .num_speculative_tokens = 3
215244 mock_vllm_config .speculative_config = mock_spec_config
@@ -226,16 +255,30 @@ def test_ascend_mla_metadata_builder_spec_decode(self):
226255 builder .chunked_prefill_enabled ,
227256 mock_vllm_config .scheduler_config .chunked_prefill_enabled )
228257
229- def test_reorder_batch (self ):
258+ @patch ('vllm.distributed.parallel_state.get_dcp_group' )
259+ @patch ('vllm.distributed.parallel_state._DCP' ,
260+ new_callable = lambda : MagicMock (spec = GroupCoordinator ))
261+ @patch ("vllm.distributed.get_decode_context_model_parallel_world_size" ,
262+ return_value = 1 )
263+ def test_reorder_batch (self , mock_get_dcp_size , mock_dcp ,
264+ mock_get_dcp_group ):
230265 ascend_config = MagicMock ()
231266
232267 mock_vllm_config = MagicMock ()
233268 mock_vllm_config .model_config .max_model_len = 1024
234269 mock_vllm_config .cache_config .block_size = 16
235270 mock_vllm_config .scheduler_config .max_num_seqs = 4
271+ mock_vllm_config .scheduler_config .decode_max_num_seqs = 4
236272 mock_vllm_config .scheduler_config .chunked_prefill_enabled = False
237273 mock_device = 'cpu'
238274
275+ mock_dcp .world_size = 1
276+ dcp_group = MagicMock (spec = GroupCoordinator )
277+ dcp_group .rank_in_group = 0
278+ dcp_group .world_size = 1
279+ dcp_group .device_group = MagicMock ()
280+ mock_get_dcp_group .return_value = dcp_group
281+
239282 mock_vllm_config .speculative_config = None
240283
241284 with patch ("vllm_ascend.attention.mla_v1.get_ascend_config" ,
0 commit comments