Skip to content

Commit ab37a7d

Browse files
authored
[main] Upgrade CANN to 8.3.RC2 (#4350)
### What this PR does / why we need it?

Upgrade CANN to 8.3.RC2.

### Does this PR introduce _any_ user-facing change?

Yes, the Docker image will use CANN 8.3.RC2.

- vLLM version: v0.11.2
- vLLM main: https://github.com/vllm-project/vllm/commit/v0.11.2

---------

Signed-off-by: MrZ20 <2609716663@qq.com>
1 parent 755b635 commit ab37a7d

23 files changed

+40
-49
lines changed

.github/Dockerfile.buildwheel

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@
1515
# This file is a part of the vllm-ascend project.
1616
#
1717
ARG PY_VERSION=3.11
18-
FROM quay.io/ascend/manylinux:8.3.rc1-910b-manylinux_2_28-py${PY_VERSION}
18+
FROM quay.io/ascend/manylinux:8.3.rc2-910b-manylinux_2_28-py${PY_VERSION}
1919

2020
ARG COMPILE_CUSTOM_KERNELS=1
2121
ARG SOC_VERSION

.github/workflows/_e2e_nightly_multi_node.yaml

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -15,7 +15,7 @@ on:
1515
required: false
1616
type: string
1717
description: base image for pods
18-
default: "swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11"
18+
default: "swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11"
1919
config_file_path:
2020
required: true
2121
type: string
@@ -69,7 +69,7 @@ jobs:
6969
# This is the runner with no NPU for k8s controller
7070
runs-on: ${{ inputs.runner }}
7171
container:
72-
image: m.daocloud.io/quay.io/ascend/cann:8.3.rc1-a3-ubuntu22.04-py3.11
72+
image: m.daocloud.io/quay.io/ascend/cann:8.3.rc2-a3-ubuntu22.04-py3.11
7373
env:
7474
KUBECONFIG: /tmp/kubeconfig
7575
KUBECTL: /root/.cache/.kube/kubectl

.github/workflows/_e2e_nightly_single_node.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@ on:
2929
image:
3030
required: false
3131
type: string
32-
default: "swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11"
32+
default: "swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11"
3333
tests:
3434
required: true
3535
type: string

.github/workflows/_e2e_nightly_single_node_models.yaml

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -59,7 +59,7 @@ jobs:
5959
name: ${{inputs.model_list}} accuracy test
6060
runs-on: ${{ inputs.runner }}
6161
container:
62-
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11
62+
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11
6363
env:
6464
VLLM_USE_MODELSCOPE: True
6565
GHA_VLLM_ASCEND_VERSION: ${{ inputs.vllm-ascend }}
@@ -108,10 +108,7 @@ jobs:
108108
if: ${{ inputs.runner == 'linux-aarch64-a2-4' && contains(inputs.model_list, 'Qwen3-Next-80B-A3B-Instruct') }}
109109
shell: bash -l {0}
110110
run: |
111-
wget -q https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/Ascend-BiSheng-toolkit_aarch64.run -O /tmp/Ascend-BiSheng-toolkit_aarch64.run
112-
chmod a+x /tmp/Ascend-BiSheng-toolkit_aarch64.run
113-
/tmp/Ascend-BiSheng-toolkit_aarch64.run --install
114-
. /usr/local/Ascend/8.3.RC1/bisheng_toolkit/set_env.sh
111+
. /usr/local/Ascend/ascend-toolkit/8.3.RC2/bisheng_toolkit/set_env.sh
115112
python3 -m pip install "https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/triton_ascend-3.2.0.dev20250914-cp311-cp311-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl"
116113
117114
- name: Resolve vllm-ascend version
@@ -225,4 +222,4 @@ jobs:
225222
path: ./benchmarks/accuracy/
226223
if-no-files-found: warn
227224
retention-days: 90
228-
overwrite: true
225+
overwrite: true

.github/workflows/_e2e_test.yaml

Lines changed: 3 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -211,7 +211,7 @@ jobs:
211211
if: ${{ needs.e2e.result == 'success' && needs.e2e-2-cards.result == 'success' && inputs.type == 'full' }}
212212
runs-on: linux-aarch64-a3-4
213213
container:
214-
image: m.daocloud.io/quay.io/ascend/cann:8.3.rc1-a3-ubuntu22.04-py3.11
214+
image: m.daocloud.io/quay.io/ascend/cann:8.3.rc2-a3-ubuntu22.04-py3.11
215215
env:
216216
VLLM_LOGGING_LEVEL: ERROR
217217
VLLM_USE_MODELSCOPE: True
@@ -274,10 +274,7 @@ jobs:
274274
- name: Install Ascend toolkit & triton_ascend (for Qwen3-Next-80B-A3B-Instruct)
275275
shell: bash -l {0}
276276
run: |
277-
wget -q https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/Ascend-BiSheng-toolkit_aarch64.run -O /tmp/Ascend-BiSheng-toolkit_aarch64.run
278-
chmod a+x /tmp/Ascend-BiSheng-toolkit_aarch64.run
279-
/tmp/Ascend-BiSheng-toolkit_aarch64.run --install
280-
. /usr/local/Ascend/8.3.RC1/bisheng_toolkit/set_env.sh
277+
. /usr/local/Ascend/ascend-toolkit/8.3.RC2/bisheng_toolkit/set_env.sh
281278
python3 -m pip install "https://vllm-ascend.obs.cn-north-4.myhuaweicloud.com/vllm-ascend/triton_ascend-3.2.0.dev20250914-cp311-cp311-manylinux_2_27_aarch64.manylinux_2_28_aarch64.whl"
282279
283280
- name: Run vllm-project/vllm-ascend Qwen3 Next test
@@ -287,5 +284,5 @@ jobs:
287284
VLLM_WORKER_MULTIPROC_METHOD: spawn
288285
VLLM_USE_MODELSCOPE: True
289286
run: |
290-
. /usr/local/Ascend/8.3.RC1/bisheng_toolkit/set_env.sh
287+
. /usr/local/Ascend/ascend-toolkit/8.3.RC2/bisheng_toolkit/set_env.sh
291288
pytest -sv tests/e2e/multicard/test_qwen3_next.py

.github/workflows/_nightly_image_build.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -45,7 +45,7 @@ jobs:
4545
--network host \
4646
--platform linux/arm64 \
4747
-f .github/Dockerfile.nightly.${TARGET} \
48-
--build-arg CANN_VERSION="8.3.rc1" \
48+
--build-arg CANN_VERSION="8.3.rc2" \
4949
--build-arg UBUNTU_VERSION="22.04" \
5050
--build-arg PYTHON_VERSION="3.11" \
5151
-t "$IMAGE_TAG" .

.github/workflows/nightly_benchmarks.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -55,7 +55,7 @@ jobs:
5555
vllm_ascend_branch: main
5656
max-parallel: 1
5757
container:
58-
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11
58+
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11
5959
volumes:
6060
- /usr/local/dcmi:/usr/local/dcmi
6161
- /usr/local/bin/npu-smi:/usr/local/bin/npu-smi

.github/workflows/vllm_ascend_test_310p.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -58,7 +58,7 @@ jobs:
5858
runs-on: ${{ matrix.os }}
5959
container:
6060
# TODO(yikun): Remove m.daocloud.io prefix when infra proxy ready
61-
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-310p-ubuntu22.04-py3.11
61+
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-310p-ubuntu22.04-py3.11
6262
env:
6363
VLLM_LOGGING_LEVEL: ERROR
6464
VLLM_USE_MODELSCOPE: True

.github/workflows/vllm_ascend_test_full_vllm_main.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -41,5 +41,5 @@ jobs:
4141
with:
4242
vllm: main
4343
runner: linux-aarch64-a2
44-
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11
44+
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11
4545
type: full

.github/workflows/vllm_ascend_test_pr_full.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -76,5 +76,5 @@ jobs:
7676
with:
7777
vllm: ${{ matrix.vllm_version }}
7878
runner: linux-aarch64-a2
79-
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11
79+
image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc2-910b-ubuntu22.04-py3.11
8080
type: full

0 commit comments

Comments
 (0)