
Commit bc69d7c

Authored by wangxiyuan, MengqingCao, hfadzxy, and leo-pony
upgrade to vllm 0.11.2 (#4400)
Bump vLLM version to v0.11.2.

What's broken and changed by vLLM:
1. structured_output is broken by vllm-project/vllm#26866
2. get_mrope_input_positions is broken by vllm-project/vllm#28399
3. graph mode is broken by vllm-project/vllm#25110; we'll upgrade torch to 2.8 later to fix this
4. embedding is broken by vllm-project/vllm#27583
5. `get_attn_backend_cls` and the attention backend are broken by vllm-project/vllm#28534
6. spec decode is broken by vllm-project/vllm#28771
7. the SP feature is broken by vllm-project/vllm#27126
8. MTP is broken by vllm-project/vllm#27922
9. LoRA is broken by vllm-project/vllm#21068
10. execute_model is broken by vllm-project/vllm#26866
11. the `VLLM_DISABLE_SHARED_EXPERTS_STREAM` env is broken by vllm-project/vllm#28159
12. KV cache is broken by vllm-project/vllm#27753
13. DP is broken by vllm-project/vllm#25110

What's broken and changed on our side:
1. Qwen VL is broken by vllm-project/vllm#28455; we'll remove the model files in the future to avoid this kind of error
2. Engine core is broken by vllm-project/vllm#23691; we'll remove the patch file in the future
3. the Ascend scheduler is broken by vllm-project/vllm#28733; we'll remove the Ascend scheduler later
4. Qwen3-Next is broken by vllm-project/vllm#28083; we'll remove the model files in the future to avoid this kind of error
5. Qwen VL is broken by vllm-project/vllm#27764; we'll remove the model files in the future

Known issues:
1. Ray doesn't work
2. the accuracy of Qwen3-Next is not correct
3. Qwen3-VL is broken
4. prefix cache + Ascend scheduler + DeepSeek-V2-Lite is broken
Co-authored-by: MengqingCao <cmq0113@163.com>
Co-authored-by: hfadzxy <starmoon_zhang@163.com>
Co-authored-by: leo-pony <nengjunma@outlook.com>
Co-authored-by: 22dimensions <waitingwind@foxmail.com>
Co-authored-by: shen-shanshan <467638484@qq.com>

- vLLM version: v0.11.2

Signed-off-by: wangxiyuan <wangxiyuan1007@gmail.com>
Signed-off-by: MengqingCao <cmq0113@163.com>
Signed-off-by: hfadzxy <starmoon_zhang@163.com>
Signed-off-by: leo-pony <nengjunma@outlook.com>
1 parent d5f77f1 commit bc69d7c


54 files changed: +744 -437 lines

.github/workflows/_e2e_nightly_multi_node.yaml

Lines changed: 1 addition & 1 deletion

@@ -32,7 +32,7 @@ on:
       description: how many pods will be pulled up via lws.yaml, indicates number of nodes we need
     vllm_version:
       required: false
-      default: "2918c1b49c88c29783c86f78d2c4221cb9622379"
+      default: "v0.11.2"
       type: string
       description: vllm version to use
     vllm_ascend_remote_url:

.github/workflows/format_pr_body.yaml

Lines changed: 1 addition & 1 deletion

@@ -36,7 +36,7 @@ jobs:
 
       - name: Get vLLM version
         run: |
-          VLLM_COMMIT=2918c1b49c88c29783c86f78d2c4221cb9622379
+          VLLM_COMMIT=v0.11.2
           echo "VLLM_COMMIT=https://github.com/vllm-project/vllm/commit/$VLLM_COMMIT" >> $GITHUB_ENV
 
       - name: Checkout repository
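The `>> $GITHUB_ENV` line above is GitHub Actions' mechanism for passing a value to later steps: the runner points `GITHUB_ENV` at a file, and every `KEY=value` line appended to it is loaded into the environment of subsequent steps. A minimal local sketch of that mechanism (the temp-file path stands in for the runner's real file):

```shell
# Simulate a step writing to $GITHUB_ENV and a later step reading it.
# The file path here is a stand-in, not the runner's actual location.
GITHUB_ENV=$(mktemp)

# "Step 1": resolve the pinned vLLM ref and export it for later steps.
VLLM_COMMIT=v0.11.2
echo "VLLM_COMMIT=https://github.com/vllm-project/vllm/commit/$VLLM_COMMIT" >> "$GITHUB_ENV"

# Between steps, the runner loads the file into the environment;
# `set -a` exports every assignment sourced from the file.
set -a
. "$GITHUB_ENV"
set +a

# "Step 2" now sees the expanded variable.
echo "$VLLM_COMMIT"
```

Because the file holds the already-expanded URL, later steps get the full link without re-running the resolution logic.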

.github/workflows/nightly_benchmarks.yaml

Lines changed: 1 addition & 1 deletion

@@ -51,7 +51,7 @@ jobs:
     strategy:
       matrix:
         include:
-          - vllm_branch: 2918c1b49c88c29783c86f78d2c4221cb9622379
+          - vllm_branch: v0.11.2
             vllm_ascend_branch: main
       max-parallel: 1
     container:

.github/workflows/vllm_ascend_test.yaml

Lines changed: 7 additions & 4 deletions

@@ -42,7 +42,7 @@ jobs:
   lint:
     uses: ./.github/workflows/pre-commit.yml
     with:
-      vllm: 2918c1b49c88c29783c86f78d2c4221cb9622379
+      vllm: v0.11.2
   changes:
     runs-on: ubuntu-latest
     outputs:
@@ -83,7 +83,7 @@ jobs:
       VLLM_USE_MODELSCOPE: True
     strategy:
       matrix:
-        vllm_version: [2918c1b49c88c29783c86f78d2c4221cb9622379]
+        vllm_version: [v0.11.2]
     steps:
       - name: Install packages
         run: |
@@ -121,7 +121,10 @@ jobs:
           export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/x86_64-linux/devlib
           pytest -sv --cov --cov-report=xml:unittests-coverage.xml tests/ut \
             --ignore tests/ut/torchair/models/test_torchair_deepseek_mtp.py \
-            --ignore tests/ut/torchair/models/test_torchair_deepseek_v2.py
+            --ignore tests/ut/torchair/models/test_torchair_deepseek_v2.py \
+            --ignore tests/ut/models/test_qwen2_vl.py \
+            --ignore tests/ut/models/test_qwen2_5_vl.py \
+            --ignore tests/ut/models/test_qwen2_5_vl_without_padding.py
 
       - name: Upload coverage to Codecov
         # only upload coverage when commits merged
@@ -138,7 +141,7 @@ jobs:
     name: e2e-light
     strategy:
       matrix:
-        vllm_version: [2918c1b49c88c29783c86f78d2c4221cb9622379]
+        vllm_version: [v0.11.2]
     # Note (yikun): If CI resource are limited we can split job into two chain jobs
     needs: [lint, changes]
     # only trigger e2e test after lint passed and the change is e2e related with pull request.

.github/workflows/vllm_ascend_test_full.yaml

Lines changed: 1 addition & 1 deletion

@@ -69,7 +69,7 @@ jobs:
     name: e2e-full
     strategy:
       matrix:
-        vllm_version: [2918c1b49c88c29783c86f78d2c4221cb9622379]
+        vllm_version: [v0.11.2]
     needs: [changes]
     if: ${{ needs.changes.outputs.e2e_tracker == 'true' }}
     uses: ./.github/workflows/_e2e_test.yaml

.github/workflows/vllm_ascend_test_nightly_a2.yaml

Lines changed: 2 additions & 2 deletions

@@ -86,7 +86,7 @@ jobs:
           tests: tests/e2e/nightly/ops
     uses: ./.github/workflows/_e2e_nightly_single_node.yaml
     with:
-      vllm: 2918c1b49c88c29783c86f78d2c4221cb9622379
+      vllm: v0.11.2
       runner: ${{ matrix.test_config.os }}
       tests: ${{ matrix.test_config.tests }}
       image: 'swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-a2'
@@ -125,7 +125,7 @@ jobs:
           - Qwen3-Next-80B-A3B-Instruct
     uses: ./.github/workflows/_e2e_nightly_single_node_models.yaml
     with:
-      vllm: 2918c1b49c88c29783c86f78d2c4221cb9622379
+      vllm: v0.11.2
       runner: ${{ matrix.test_config.os }}
       model_list: ${{ toJson(matrix.test_config.model_list) }}
       image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11

.github/workflows/vllm_ascend_test_nightly_a3.yaml

Lines changed: 1 addition & 1 deletion

@@ -136,7 +136,7 @@ jobs:
           tests: tests/e2e/nightly/models/test_deepseek_v3_2_exp_w8a8.py
     uses: ./.github/workflows/_e2e_nightly_single_node.yaml
     with:
-      vllm: 2918c1b49c88c29783c86f78d2c4221cb9622379
+      vllm: v0.11.2
       runner: ${{ matrix.test_config.os }}
       image: 'swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/vllm-ascend:nightly-a3'
       tests: ${{ matrix.test_config.tests }}

.github/workflows/vllm_ascend_test_report.yaml

Lines changed: 1 addition & 1 deletion

@@ -72,7 +72,7 @@ jobs:
           - DeepSeek-V2-Lite
     uses: ./.github/workflows/_e2e_nightly_single_node_models.yaml
     with:
-      vllm: 2918c1b49c88c29783c86f78d2c4221cb9622379
+      vllm: v0.11.2
       runner: ${{ matrix.runner }}
       image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.3.rc1-910b-ubuntu22.04-py3.11
       model_list: ${{ toJson(matrix.model_list) }}

Dockerfile

Lines changed: 2 additions & 4 deletions

@@ -46,10 +46,8 @@ RUN pip config set global.index-url ${PIP_INDEX_URL}
 
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=2918c1b49c88c29783c86f78d2c4221cb9622379
-# Revert this change once VLLM_TAG is specified to branch or tag
-# RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
-RUN git clone $VLLM_REPO /vllm-workspace/vllm && (cd /vllm-workspace/vllm && git checkout $VLLM_TAG)
+ARG VLLM_TAG=v0.11.2
+RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
 RUN VLLM_TARGET_DEVICE="empty" python3 -m pip install -v -e /vllm-workspace/vllm/[audio] --extra-index https://download.pytorch.org/whl/cpu/ && \
     python3 -m pip uninstall -y triton && \
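The Dockerfile change works because `git clone --branch` accepts tags and branch names but not bare commit SHAs, which is why pinning to a commit previously required a full clone followed by `git checkout`. A small sketch of that distinction using a throwaway local repo (the repo, tag name, and paths are illustrative only):

```shell
set -e
# Build a throwaway "origin" repo with one commit and a tag (illustrative).
tmp=$(mktemp -d)
git init -q "$tmp/origin"
git -C "$tmp/origin" -c user.email=ci@example.com -c user.name=ci \
    commit -q --allow-empty -m init
git -C "$tmp/origin" tag v0.11.2
sha=$(git -C "$tmp/origin" rev-parse HEAD)

# Shallow clone by tag: works, and HEAD lands on the tagged commit.
git clone -q --depth 1 --branch v0.11.2 "file://$tmp/origin" "$tmp/by-tag"

# Shallow clone by bare SHA: rejected, since --branch only resolves
# branches and tags. Pinning a SHA needs full clone + checkout instead.
git clone -q --depth 1 --branch "$sha" "file://$tmp/origin" "$tmp/by-sha" \
    2>/dev/null || echo "clone by SHA failed as expected"
```

Once `VLLM_TAG` is a real tag again, the shallow `--branch` form also keeps the image build faster by fetching only one commit of history.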

Dockerfile.310p

Lines changed: 2 additions & 4 deletions

@@ -37,10 +37,8 @@ RUN pip config set global.index-url ${PIP_INDEX_URL}
 
 # Install vLLM
 ARG VLLM_REPO=https://github.com/vllm-project/vllm.git
-ARG VLLM_TAG=2918c1b49c88c29783c86f78d2c4221cb9622379
-# Revert this change once VLLM_TAG is specified to branch or tag
-# RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
-RUN git clone $VLLM_REPO /vllm-workspace/vllm && (cd /vllm-workspace/vllm && git checkout $VLLM_TAG)
+ARG VLLM_TAG=v0.11.2
+RUN git clone --depth 1 $VLLM_REPO --branch $VLLM_TAG /vllm-workspace/vllm
 # In x86, triton will be installed by vllm. But in Ascend, triton doesn't work correctly. we need to uninstall it.
 RUN VLLM_TARGET_DEVICE="empty" python3 -m pip install -v -e /vllm-workspace/vllm/[audio] --extra-index https://download.pytorch.org/whl/cpu/ && \
     python3 -m pip uninstall -y triton && \
