Skip to content

Commit 0bb70dc

Browse files
committed
fix
Signed-off-by: Shanshan Shen <87969357+shen-shanshan@users.noreply.github.com>
1 parent e7dba89 commit 0bb70dc

File tree

2 files changed, with 4 additions and 5 deletions.

vllm_ascend/__init__.py

Lines changed: 2 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -23,8 +23,8 @@ def register():
2323

2424

2525
def register_model():
26-
from .models import register_model
27-
register_model()
26+
from vllm_ascend.torchair.utils import register_torchair_model
27+
register_torchair_model()
2828

2929

3030
def register_connector():

vllm_ascend/torchair/torchair_model_runner.py

Lines changed: 2 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -39,8 +39,8 @@
3939
from vllm_ascend.torchair.utils import (
4040
TORCHAIR_CACHE_DIR, TorchairCommonAttentionMetadata,
4141
check_torchair_cache_exist, converting_weight_acl_format,
42-
register_torchair_model, torchair_ops_patch,
43-
torchair_quant_method_register, write_kv_cache_bytes_to_file)
42+
torchair_ops_patch, torchair_quant_method_register,
43+
write_kv_cache_bytes_to_file)
4444
from vllm_ascend.utils import (ACL_FORMAT_FRACTAL_ND, ACL_FORMAT_FRACTAL_NZ,
4545
AscendDeviceType, get_ascend_device_type)
4646
from vllm_ascend.worker.model_runner_v1 import NPUModelRunner
@@ -60,7 +60,6 @@ def __init__(self, vllm_config: VllmConfig, device: torch.device):
6060
None, None, vllm_config, device)
6161
self.use_sparse = hasattr(self.model_config.hf_config, "index_topk")
6262

63-
register_torchair_model()
6463
torchair_ops_patch()
6564
torchair_quant_method_register()
6665
if self.enable_shared_expert_dp:

0 commit comments

Comments
 (0)