|
1 | 1 | from unittest.mock import MagicMock, patch |
2 | 2 |
|
3 | 3 | import torch |
4 | | -from vllm.config import CacheConfig, ModelConfig, SchedulerConfig, VllmConfig |
| 4 | +from vllm.config import VllmConfig |
5 | 5 | from vllm.distributed.parallel_state import GroupCoordinator |
6 | 6 | from vllm.model_executor.layers.linear import LinearBase |
7 | 7 |
|
@@ -215,7 +215,7 @@ def test_ascend_mla_metadata_builder_default(self, mock_get_dcp_size, |
215 | 215 | mock_vllm_config.cache_config.block_size) |
216 | 216 | self.assertEqual( |
217 | 217 | builder.chunked_prefill_enabled, |
218 | | - mock_vllm_config.scheduler_config.chunked_prefill_enabled) |
| 218 | + mock_vllm_config.scheduler_config.enable_chunked_prefill) |
219 | 219 |
|
220 | 220 | @patch('vllm.distributed.parallel_state.get_dcp_group') |
221 | 221 | @patch('vllm.distributed.parallel_state._DCP', |
@@ -447,15 +447,20 @@ class TestAscendMLAMetadataBuilderBuild(TestBase): |
447 | 447 |
|
448 | 448 | def setUp(self): |
449 | 449 | self.mock_vllm_config = MagicMock(spec=VllmConfig) |
450 | | - self.mock_vllm_config.model_config = ModelConfig(max_model_len=2048) |
451 | | - self.mock_vllm_config.model_config.hf_text_config.qk_rope_head_dim = 32 |
452 | | - self.mock_vllm_config.cache_config = CacheConfig(block_size=32) |
453 | | - mock_scheduler_config = MagicMock(spec=SchedulerConfig) |
454 | | - mock_scheduler_config.max_num_seqs = 8 # 设置为整数,不是 MagicMock |
455 | | - mock_scheduler_config.chunked_prefill_enabled = True |
456 | | - self.mock_vllm_config.scheduler_config = mock_scheduler_config |
| 450 | + # NOTE: Do not build ModelConfig through its constructor here,
| 451 | + # because doing so will try to download a model.
| 452 | + mock_model_config = MagicMock() |
| 453 | + mock_model_config.max_model_len = 1024 |
| 454 | + mock_model_config.get_head_size.return_value = 64 |
| 455 | + mock_model_config.dtype = torch.float16 |
| 456 | + |
| 457 | + self.mock_vllm_config.model_config = mock_model_config |
| 458 | + self.mock_vllm_config.cache_config = MagicMock(block_size=16) |
| 459 | + self.mock_vllm_config.scheduler_config = MagicMock( |
| 460 | + max_num_seqs=4, enable_chunked_prefill=False) |
457 | 461 | self.mock_vllm_config.speculative_config = None |
458 | | - self.mock_device = torch.device("cpu") |
| 462 | + |
| 463 | + self.mock_device = torch.device('cpu') |
459 | 464 |
|
460 | 465 | self.kv_cache_spec = MagicMock() |
461 | 466 | self.kv_cache_spec.num_layers = 32 |
|
0 commit comments