PyPI - vllm-ascend - Versions diffs - 0.10.2rc1__tar.gz → 0.11.0rc0__tar.gz - Mend

vllm-ascend 0.10.2rc1__tar.gz → 0.11.0rc0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (578) hide show

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/ISSUE_TEMPLATE/900-release-checklist.yml RENAMED Viewed

@@ -24,6 +24,8 @@ body:
     value: >
       - [ ] Create a new issue for release feedback
+      - [ ] Upgrade vllm version to the new version for CI and Dockerfile
       - [ ] Write the release note PR.
         - [ ] Update the feedback issue link in docs/source/faqs.md

vllm_ascend-0.10.2rc1/.github/workflows/vllm_ascend_test_full.yaml → vllm_ascend-0.11.0rc0/.github/workflows/_e2e_test.yaml RENAMED Viewed

@@ -1,82 +1,27 @@
-#
-# Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# This file is a part of the vllm-ascend project.
-#
-name: 'test-full'
+name: 'e2e test'
 on:
-  pull_request:
-    branches:
-      - 'main'
-      - '*-dev'
-    types: [ labeled, synchronize ]
-# Bash shells do not use ~/.profile or ~/.bashrc so these shells need to be explicitly
-# declared as "shell: bash -el {0}" on steps that need to be properly activated.
-# It's used to activate ascend-toolkit environment variables.
-defaults:
-  run:
-    shell: bash -el {0}
-# only cancel in-progress runs of the same workflow
-# and ignore the lint / 1 card / 4 cards test type
-concurrency:
-  group: ${{ github.workflow }}-${{ github.ref }}
-  cancel-in-progress: true
+  workflow_call:
+    inputs:
+      vllm:
+        required: true
+        type: string
+      runner:
+        required: true
+        type: string
+      image:
+        required: true
+        type: string
+      type:
+        required: true
+        type: string
 jobs:
-  changes:
-    runs-on: ubuntu-latest
-    if: ${{ contains(github.event.pull_request.labels.*.name, 'ready') && contains(github.event.pull_request.labels.*.name, 'ready-for-test') }}
-    outputs:
-      e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
-      ut_tracker: ${{ steps.filter.outputs.ut_tracker }}
-    steps:
-      - uses: actions/checkout@v4
-      - uses: dorny/paths-filter@v3
-        id: filter
-        with:
-          filters: |
-            e2e_tracker:
-              - '.github/workflows/vllm_ascend_test.yaml'
-              - 'vllm_ascend/**'
-              - 'csrc/**'
-              - 'cmake/**'
-              - 'tests/e2e/**'
-              - 'CMakeLists.txt'
-              - 'setup.py'
-              - 'requirements.txt'
-              - 'requirements-dev.txt'
-              - 'requirements-lint.txt'
-              - 'packages.txt'
-            ut_tracker:
-              - 'tests/ut/**'
-  e2e-full:
-    # only trigger full test when pull request is approved
-    needs: [changes]
-    if: ${{ needs.changes.outputs.e2e_tracker == 'true' }}
-    strategy:
-      max-parallel: 2
-      matrix:
-        os: [linux-aarch64-a2-1]
-        vllm_version: [v0.10.2]
-    name: singlecard e2e test - full
-    runs-on: ${{ matrix.os }}
+  e2e:
+    name: singlecard
+    runs-on: ${{ inputs.runner }}-1
     container:
-      image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
+      image: ${{ inputs.image }}
       env:
         VLLM_LOGGING_LEVEL: ERROR
         VLLM_USE_MODELSCOPE: True
@@ -106,8 +51,9 @@ jobs:
         uses: actions/checkout@v4
         with:
           repository: vllm-project/vllm
-          ref: ${{ matrix.vllm_version }}
+          ref: ${{ inputs.vllm }}
           path: ./vllm-empty
+          fetch-depth: 1
       - name: Install vllm-project/vllm from source
         working-directory: ./vllm-empty
@@ -121,10 +67,23 @@ jobs:
           pip install -r requirements-dev.txt
           pip install -v -e .
+      - name: Run vllm-project/vllm-ascend test
+        env:
+          VLLM_WORKER_MULTIPROC_METHOD: spawn
+          VLLM_USE_MODELSCOPE: True
+          PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
+        if: ${{ inputs.type == 'light' }}
+        run: |
+          pytest -sv tests/e2e/singlecard/test_aclgraph.py
+          pytest -sv tests/e2e/singlecard/test_quantization.py
+          pytest -sv tests/e2e/singlecard/test_vlm.py::test_multimodal_vl
       - name: Run e2e test
         env:
           VLLM_WORKER_MULTIPROC_METHOD: spawn
           VLLM_USE_MODELSCOPE: True
+          PYTORCH_NPU_ALLOC_CONF: max_split_size_mb:256
+        if: ${{ inputs.type == 'full' }}
         run: |
           # We found that if running aclgraph tests in batch, it will cause AclmdlRICaptureBegin error. So we run
           # the test separately.
@@ -135,7 +94,7 @@ jobs:
           pytest -sv tests/e2e/singlecard/test_chunked.py
           pytest -sv tests/e2e/singlecard/test_embedding.py
           pytest -sv tests/e2e/singlecard/test_guided_decoding.py
-          #pytest -sv tests/e2e/singlecard/test_ilama_lora.py
+          pytest -sv tests/e2e/singlecard/test_ilama_lora.py
           pytest -sv tests/e2e/singlecard/test_profile_execute_duration.py
           pytest -sv tests/e2e/singlecard/test_quantization.py
           pytest -sv tests/e2e/singlecard/test_sampler.py
@@ -144,23 +103,16 @@ jobs:
           # ------------------------------------ v1 spec decode test ------------------------------------ #
           pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_correctness.py
           pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_mtp_torchair_correctness.py
-          pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py
+          # Fix me: OOM error
+          #pytest -sv tests/e2e/singlecard/spec_decode_v1/test_v1_spec_decode.py
           pytest -sv tests/e2e/singlecard/ops/
-  e2e-2-cards-full:
-    # only trigger full test when pull request is approved
-    needs: [changes]
-    if: ${{ needs.changes.outputs.e2e_tracker == 'true' }}
-    strategy:
-      max-parallel: 2
-      matrix:
-        os: [linux-aarch64-a2-2]
-        vllm_version: [v0.10.2]
-    name: multicard e2e test - full
-    runs-on: ${{ matrix.os }}
+  e2e-2-cards:
+    name: multicard
+    runs-on: ${{ inputs.runner }}-2
     container:
-      image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
+      image: ${{ inputs.image }}
       env:
         VLLM_LOGGING_LEVEL: ERROR
         VLLM_USE_MODELSCOPE: True
@@ -190,8 +142,9 @@ jobs:
         uses: actions/checkout@v4
         with:
           repository: vllm-project/vllm
-          ref: ${{ matrix.vllm_version }}
+          ref: ${{ inputs.vllm }}
           path: ./vllm-empty
+          fetch-depth: 1
       - name: Install vllm-project/vllm from source
         working-directory: ./vllm-empty
@@ -205,17 +158,26 @@ jobs:
           pip install -r requirements-dev.txt
           pip install -v -e .
-      - name: Run vllm-project/vllm-ascend test
+      - name: Run vllm-project/vllm-ascend test (light)
+        env:
+          VLLM_WORKER_MULTIPROC_METHOD: spawn
+          VLLM_USE_MODELSCOPE: True
+        if: ${{ inputs.type == 'light' }}
+        run: |
+          pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP
+      - name: Run vllm-project/vllm-ascend test (full)
         env:
           VLLM_WORKER_MULTIPROC_METHOD: spawn
           VLLM_USE_MODELSCOPE: True
+        if: ${{ inputs.type == 'full' }}
         run: |
           pytest -sv tests/e2e/multicard/test_data_parallel.py
           pytest -sv tests/e2e/multicard/test_expert_parallel.py
           # external_launcher test is not stable enough. Fix it later
           # pytest -sv tests/e2e/multicard/test_external_launcher.py
           pytest -sv tests/e2e/multicard/test_fused_moe_allgather_ep.py
-          #pytest -sv tests/e2e/multicard/test_ilama_lora_tp2.py
+          pytest -sv tests/e2e/multicard/test_ilama_lora_tp2.py
           # To avoid oom, we need to run the test in a single process.
           pytest -sv tests/e2e/multicard/test_offline_inference_distributed.py::test_models_distributed_QwQ

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/accuracy_test.yaml RENAMED Viewed

@@ -19,7 +19,7 @@
 # 1. PR labeled with: '*accuracy-test' (ONLY 1 label valid) & 'ready-for-test'
 # 2. workflow_dispatch with models input
 # See detail rule in strategy.matrix note
-name: Benchmarks / accuracy
+name: ascend test / accuracy
 on:
   schedule:
@@ -112,7 +112,7 @@ jobs:
         uses: actions/checkout@v4
         with:
           repository: vllm-project/vllm
-          ref: v0.10.2
+          ref: v0.11.0rc3
           path: ./vllm-empty
       - name: Install vllm-project/vllm from source

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/format_pr_body.yaml RENAMED Viewed

@@ -33,23 +33,17 @@ jobs:
     runs-on: ubuntu-latest
     steps:
-      - name: Checkout vllm-project/vllm repo
-        uses: actions/checkout@v4
-        with:
-          repository: vllm-project/vllm
-          path: ./vllm-empty
       - name: Get vLLM version
-        working-directory: ./vllm-empty
         run: |
-          VLLM_COMMIT=$(git rev-parse HEAD)
+          VLLM_COMMIT=releases/v0.11.0
           echo "VLLM_COMMIT=https://github.com/vllm-project/vllm/commit/$VLLM_COMMIT" >> $GITHUB_ENV
       - name: Checkout repository
         uses: actions/checkout@ff7abcd0c3c05ccf6adc123a8cd1fd4fb30fb493 # v4.2.2
       - name: Set up Python
-        uses: actions/setup-python@42375524e23c412d93fb67b49958b491fce71c38 # v5.4.0
+        uses: actions/setup-python@e797f83bcb11b83ae66e0230d6156d7c80228e7c # v6.0.0
       - name: Get vLLM release version
         run: |

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/label_merge_conflict.yml RENAMED Viewed

@@ -16,6 +16,5 @@ jobs:
         uses: eps1lon/actions-label-merge-conflict@v3
         with:
           dirtyLabel: "merge-conflicts"
-          removeOnDirtyLabel: "ready"
           repoToken: "${{ secrets.GITHUB_TOKEN }}"
           commentOnDirty: "This pull request has conflicts, please resolve those before we can evaluate the pull request."

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/labeler.yml RENAMED Viewed

@@ -11,7 +11,7 @@ jobs:
       pull-requests: write
     steps:
       - name: Label the PR
-        uses: actions/labeler@v5
+        uses: actions/labeler@v6
         with:
           repo-token: ${{ secrets.GITHUB_TOKEN }}
           configuration-path: .github/labeler.yml

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/nightly_benchmarks.yaml RENAMED Viewed

@@ -15,7 +15,7 @@
 # limitations under the License.
 #
-name: 'Benchmarks / Performance'
+name: 'ascend test / performance'
 # This workflow runs nightly benchmarks for vllm-ascend.
 on:
@@ -51,7 +51,7 @@ jobs:
     strategy:
       matrix:
         include:
-          - vllm_branch: v0.10.2
+          - vllm_branch: v0.11.0rc3
             vllm_ascend_branch: main
             vllm_use_v1: 1
       max-parallel: 1

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/pre-commit.yml RENAMED Viewed

@@ -2,6 +2,10 @@ name: pre-commit
 on:
     workflow_call:
+      inputs:
+        vllm:
+          required: true
+          type: string
 permissions:
   contents: read
@@ -12,7 +16,7 @@ jobs:
     steps:
     - name: Checkout vllm-project/vllm-ascend repo
       uses: actions/checkout@v4
-    - uses: actions/setup-python@42375524e23c412d93fb67b49958b491fce71c38 # v5.4.0
+    - uses: actions/setup-python@e797f83bcb11b83ae66e0230d6156d7c80228e7c # v6.0.0
       with:
         python-version: "3.11"
     - run: echo "::add-matcher::.github/workflows/matchers/actionlint.json"
@@ -22,6 +26,7 @@ jobs:
       with:
         repository: vllm-project/vllm
         path: ./vllm-empty
+        ref: ${{ inputs.vllm }}
     - name: Install vllm
       working-directory: vllm-empty
       run: |

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/release_code.yml RENAMED Viewed

@@ -50,7 +50,7 @@ jobs:
           lscpu
       - name: Set up Python ${{ matrix.python-version }}
-        uses: actions/setup-python@a26af69be951a213d495a4c3e4e4022e16d87065 # v5.6.0
+        uses: actions/setup-python@e797f83bcb11b83ae66e0230d6156d7c80228e7c # v6.0.0
         with:
           python-version: ${{ matrix.python-version }}

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/release_whl.yml RENAMED Viewed

@@ -73,7 +73,7 @@ jobs:
     - name: Set up Python ${{ matrix.python-version }}
       if: startsWith(github.ref, 'refs/tags/')
-      uses: actions/setup-python@a26af69be951a213d495a4c3e4e4022e16d87065 # v5.6.0
+      uses: actions/setup-python@e797f83bcb11b83ae66e0230d6156d7c80228e7c # v6.0.0
       with:
         python-version: ${{ matrix.python-version }}

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/vllm_ascend_dist.yaml RENAMED Viewed

@@ -43,7 +43,7 @@ jobs:
     strategy:
       matrix:
         os: [linux-aarch64-a3-8]
-        vllm_version: [v0.10.2]
+        vllm_version: [v0.11.0rc3]
     name: vLLM Ascend test
     runs-on: ${{ matrix.os }}
     container:

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/vllm_ascend_doctest.yaml RENAMED Viewed

@@ -15,7 +15,7 @@
 # This file is a part of the vllm-ascend project.
 #
-name: 'e2e test / doctest'
+name: 'ascend test / doctest'
 on:
   workflow_dispatch:

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/vllm_ascend_test.yaml RENAMED Viewed

@@ -15,7 +15,7 @@
 # This file is a part of the vllm-ascend project.
 #
-name: 'test'
+name: 'ascend test'
 on:
   push:
@@ -41,9 +41,10 @@ concurrency:
 jobs:
   lint:
     uses: ./.github/workflows/pre-commit.yml
+    with:
+      vllm: releases/v0.11.0
   changes:
-    if: github.event_name == 'pull_request'
     runs-on: ubuntu-latest
     outputs:
       e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
@@ -82,7 +83,7 @@ jobs:
         VLLM_USE_MODELSCOPE: True
     strategy:
       matrix:
-        vllm_version: [v0.10.2]
+        vllm_version: [releases/v0.11.0, v0.11.0rc3]
     steps:
       - name: Install packages
         run: |
@@ -118,10 +119,20 @@ jobs:
           TORCH_DEVICE_BACKEND_AUTOLOAD: 0
         run: |
           export LD_LIBRARY_PATH=$LD_LIBRARY_PATH:/usr/local/Ascend/ascend-toolkit/latest/x86_64-linux/devlib
-          pytest -sv --cov --cov-report=xml:unittests-coverage.xml tests/ut --ignore=tests/ut/test_platform.py --ignore=tests/ut/ops/test_vocab_parallel_embedding.py
+          pytest -sv --cov --cov-report=xml:unittests-coverage.xml tests/ut \
+          --ignore=tests/ut/test_platform.py \
+          --ignore=tests/ut/patch/worker/patch_common/test_patch_minicpm.py \
+          --ignore=tests/ut/core/test_scheduler.py \
+          --ignore=tests/ut/kv_connector/test_llmdatadist_connector.py \
+          --ignore=tests/ut/kv_connector/test_mooncake_connector.py \
+          --ignore=tests/ut/kv_connector/test_remote_decode_lifecycle.py \
+          --ignore=tests/ut/kv_connector/test_remote_prefill_lifecycle.py \
+          --ignore=tests/ut/torchair/models/test_torchair_deepseek_v2.py \
+          --ignore=tests/ut/torchair/test_utils.py
       - name: Upload coverage to Codecov
-        if: ${{ matrix.vllm_version == 'main' }}
+        # only upload coverage when commits merged
+        if: github.event_name == 'push' && github.ref == 'refs/heads/main'
         uses: codecov/codecov-action@v5
         env:
           CODECOV_TOKEN: ${{ secrets.CODECOV_TOKEN }}
@@ -131,130 +142,17 @@ jobs:
           verbose: true
   e2e-light:
+    name: e2e-light
+    strategy:
+      matrix:
+        vllm_version: [releases/v0.11.0, v0.11.0rc3]
+    # Note (yikun): If CI resource are limited we can split job into two chain jobs
     needs: [lint, changes]
     # only trigger e2e test after lint passed and the change is e2e related with pull request.
     if: ${{ github.event_name == 'pull_request' && needs.lint.result == 'success' && needs.changes.outputs.e2e_tracker == 'true' && !contains(github.event.pull_request.labels.*.name, 'ready') }}
-    strategy:
-      max-parallel: 2
-      matrix:
-        os: [linux-aarch64-a2-1]
-        vllm_version: [v0.10.2]
-    name: singlecard e2e test - light
-    runs-on: ${{ matrix.os }}
-    container:
-      image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
-      env:
-        VLLM_LOGGING_LEVEL: ERROR
-        VLLM_USE_MODELSCOPE: True
-    steps:
-      - name: Check npu and CANN info
-        run: |
-          npu-smi info
-          cat /usr/local/Ascend/ascend-toolkit/latest/"$(uname -i)"-linux/ascend_toolkit_install.info
-      - name: Config mirrors
-        run: |
-          sed -Ei 's@(ports|archive).ubuntu.com@cache-service.nginx-pypi-cache.svc.cluster.local:8081@g' /etc/apt/sources.list
-          pip config set global.index-url http://cache-service.nginx-pypi-cache.svc.cluster.local/pypi/simple
-          pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
-          apt-get update -y
-          apt install git -y
-      - name: Checkout vllm-project/vllm-ascend repo
-        uses: actions/checkout@v4
-      - name: Install system dependencies
-        run: |
-          apt-get -y install `cat packages.txt`
-          apt-get -y install gcc g++ cmake libnuma-dev
-      - name: Checkout vllm-project/vllm repo
-        uses: actions/checkout@v4
-        with:
-          repository: vllm-project/vllm
-          ref: ${{ matrix.vllm_version }}
-          path: ./vllm-empty
-      - name: Install vllm-project/vllm from source
-        working-directory: ./vllm-empty
-        run: |
-          VLLM_TARGET_DEVICE=empty pip install -e .
-      - name: Install vllm-project/vllm-ascend
-        env:
-          PIP_EXTRA_INDEX_URL: https://mirrors.huaweicloud.com/ascend/repos/pypi
-        run: |
-          pip install -r requirements-dev.txt
-          pip install -v -e .
-      - name: Run e2e test
-        env:
-          VLLM_WORKER_MULTIPROC_METHOD: spawn
-          VLLM_USE_MODELSCOPE: True
-        run: |
-          pytest -sv tests/e2e/singlecard/test_aclgraph.py
-          pytest -sv tests/e2e/singlecard/test_quantization.py
-          pytest -sv tests/e2e/singlecard/test_vlm.py::test_multimodal_vl
-  e2e-2-cards-light:
-    needs: [e2e-light]
-    if: ${{ needs.e2e-light.result == 'success' }}
-    strategy:
-      max-parallel: 2
-      matrix:
-        os: [linux-aarch64-a2-2]
-        vllm_version: [v0.10.2]
-    name: multicard e2e test - light
-    runs-on: ${{ matrix.os }}
-    container:
+    uses: ./.github/workflows/_e2e_test.yaml
+    with:
+      vllm: ${{ matrix.vllm_version }}
+      runner: linux-aarch64-a2
       image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
-      env:
-        VLLM_LOGGING_LEVEL: ERROR
-        VLLM_USE_MODELSCOPE: True
-    steps:
-      - name: Check npu and CANN info
-        run: |
-          npu-smi info
-          cat /usr/local/Ascend/ascend-toolkit/latest/"$(uname -i)"-linux/ascend_toolkit_install.info
-      - name: Config mirrors
-        run: |
-          sed -Ei 's@(ports|archive).ubuntu.com@cache-service.nginx-pypi-cache.svc.cluster.local:8081@g' /etc/apt/sources.list
-          pip config set global.index-url http://cache-service.nginx-pypi-cache.svc.cluster.local/pypi/simple
-          pip config set global.trusted-host cache-service.nginx-pypi-cache.svc.cluster.local
-          apt-get update -y
-          apt install git -y
-      - name: Checkout vllm-project/vllm-ascend repo
-        uses: actions/checkout@v4
-      - name: Install system dependencies
-        run: |
-          apt-get -y install `cat packages.txt`
-          apt-get -y install gcc g++ cmake libnuma-dev
-      - name: Checkout vllm-project/vllm repo
-        uses: actions/checkout@v4
-        with:
-          repository: vllm-project/vllm
-          ref: ${{ matrix.vllm_version }}
-          path: ./vllm-empty
-      - name: Install vllm-project/vllm from source
-        working-directory: ./vllm-empty
-        run: |
-          VLLM_TARGET_DEVICE=empty pip install -e .
-      - name: Install vllm-project/vllm-ascend
-        env:
-          PIP_EXTRA_INDEX_URL: https://mirrors.huaweicloud.com/ascend/repos/pypi
-        run: |
-          pip install -r requirements-dev.txt
-          pip install -v -e .
-      - name: Run vllm-project/vllm-ascend test
-        env:
-          VLLM_WORKER_MULTIPROC_METHOD: spawn
-          VLLM_USE_MODELSCOPE: True
-        run: |
-          pytest -sv tests/e2e/multicard/test_qwen3_moe.py::test_models_distributed_Qwen3_MOE_TP2_WITH_EP
+      type: light

{vllm_ascend-0.10.2rc1 → vllm_ascend-0.11.0rc0}/.github/workflows/vllm_ascend_test_310p.yaml RENAMED Viewed

@@ -53,7 +53,7 @@ jobs:
       max-parallel: 2
       matrix:
         os: [linux-aarch64-310p-1, linux-aarch64-310p-4]
-        vllm_version: [v0.10.2]
+        vllm_version: [v0.11.0rc3]
     name: 310p e2e test
     runs-on: ${{ matrix.os }}
     container:

vllm_ascend-0.11.0rc0/.github/workflows/vllm_ascend_test_full.yaml ADDED Viewed

@@ -0,0 +1,79 @@
+#
+# Copyright (c) 2025 Huawei Technologies Co., Ltd. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# This file is a part of the vllm-ascend project.
+#
+name: 'ascend test / full'
+on:
+  pull_request:
+    branches:
+      - 'main'
+      - '*-dev'
+    types: [ labeled, synchronize ]
+# Bash shells do not use ~/.profile or ~/.bashrc so these shells need to be explicitly
+# declared as "shell: bash -el {0}" on steps that need to be properly activated.
+# It's used to activate ascend-toolkit environment variables.
+defaults:
+  run:
+    shell: bash -el {0}
+# only cancel in-progress runs of the same workflow
+# and ignore the lint / 1 card / 4 cards test type
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}
+  cancel-in-progress: true
+jobs:
+  changes:
+    runs-on: ubuntu-latest
+    if: ${{ contains(github.event.pull_request.labels.*.name, 'ready') && contains(github.event.pull_request.labels.*.name, 'ready-for-test') }}
+    outputs:
+      e2e_tracker: ${{ steps.filter.outputs.e2e_tracker }}
+      ut_tracker: ${{ steps.filter.outputs.ut_tracker }}
+    steps:
+      - uses: actions/checkout@v4
+      - uses: dorny/paths-filter@v3
+        id: filter
+        with:
+          filters: |
+            e2e_tracker:
+              - '.github/workflows/vllm_ascend_test.yaml'
+              - 'vllm_ascend/**'
+              - 'csrc/**'
+              - 'cmake/**'
+              - 'tests/e2e/**'
+              - 'CMakeLists.txt'
+              - 'setup.py'
+              - 'requirements.txt'
+              - 'requirements-dev.txt'
+              - 'requirements-lint.txt'
+              - 'packages.txt'
+            ut_tracker:
+              - 'tests/ut/**'
+  e2e-test:
+    name: e2e-full
+    strategy:
+      matrix:
+        vllm_version: [releases/v0.11.0, v0.11.0rc3]
+    needs: [changes]
+    if: ${{ needs.changes.outputs.e2e_tracker == 'true' }}
+    uses: ./.github/workflows/_e2e_test.yaml
+    with:
+      vllm: ${{ matrix.vllm_version }}
+      runner: linux-aarch64-a2
+      image: swr.cn-southwest-2.myhuaweicloud.com/base_image/ascend-ci/cann:8.2.rc1-910b-ubuntu22.04-py3.11
+      type: full

vllm-ascend 0.10.2rc1__tar.gz → 0.11.0rc0__tar.gz

vllm-ascend 0.10.2rc1__tar.gz → 0.11.0rc0__tar.gz