diff --git a/.github/workflows/accuracy_test.yaml b/.github/workflows/accuracy_test.yaml index 4acb9f670b..b6d978e310 100644 --- a/.github/workflows/accuracy_test.yaml +++ b/.github/workflows/accuracy_test.yaml @@ -123,7 +123,7 @@ jobs: fail-fast: false name: ${{ matrix.model_name }} accuracy V${{ matrix.vllm_use_version }} container: - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 env: DATASET_SOURCE: ModelScope VLLM_USE_MODELSCOPE: True diff --git a/.github/workflows/nightly_benchmarks.yaml b/.github/workflows/nightly_benchmarks.yaml index c23cc724ef..0232972a1d 100644 --- a/.github/workflows/nightly_benchmarks.yaml +++ b/.github/workflows/nightly_benchmarks.yaml @@ -55,7 +55,7 @@ jobs: vllm_use_v1: 1 max-parallel: 1 container: - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 volumes: - /usr/local/dcmi:/usr/local/dcmi - /usr/local/bin/npu-smi:/usr/local/bin/npu-smi diff --git a/.github/workflows/vllm_ascend_test.yaml b/.github/workflows/vllm_ascend_test.yaml index b82659be21..235c705980 100644 --- a/.github/workflows/vllm_ascend_test.yaml +++ b/.github/workflows/vllm_ascend_test.yaml @@ -138,7 +138,7 @@ jobs: if: ${{ needs.lint.result == 'success' || github.event_name == 'push' }} runs-on: ubuntu-latest container: - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 env: VLLM_LOGGING_LEVEL: ERROR VLLM_USE_MODELSCOPE: True @@ -206,7 +206,7 @@ jobs: runs-on: ${{ matrix.os }} container: # TODO(yikun): Remove m.daocloud.io prefix when infra proxy ready - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 env: VLLM_LOGGING_LEVEL: ERROR VLLM_USE_MODELSCOPE: True @@ -307,7 +307,7 @@ jobs: runs-on: ${{ matrix.os }} container: # TODO(yikun): Remove m.daocloud.io prefix when infra proxy ready - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 env: VLLM_LOGGING_LEVEL: ERROR VLLM_USE_MODELSCOPE: True diff --git a/.github/workflows/vllm_ascend_test_long_term.yaml b/.github/workflows/vllm_ascend_test_long_term.yaml index bcf166941d..59866ce640 100644 --- a/.github/workflows/vllm_ascend_test_long_term.yaml +++ b/.github/workflows/vllm_ascend_test_long_term.yaml @@ -48,7 +48,7 @@ jobs: runs-on: ${{ matrix.os }} container: # TODO(yikun): Remove m.daocloud.io prefix when infra proxy ready - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 env: VLLM_LOGGING_LEVEL: ERROR VLLM_USE_MODELSCOPE: True diff --git a/.github/workflows/vllm_ascend_test_pd.yaml b/.github/workflows/vllm_ascend_test_pd.yaml index e6bb6a6988..fcb9fe1f0a 100644 --- a/.github/workflows/vllm_ascend_test_pd.yaml +++ b/.github/workflows/vllm_ascend_test_pd.yaml @@ -50,7 +50,7 @@ jobs: runs-on: linux-arm64-npu-static-8 container: - image: m.daocloud.io/quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 + image: m.daocloud.io/quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 volumes: - /usr/local/dcmi:/usr/local/dcmi - /usr/local/bin/npu-smi:/usr/local/bin/npu-smi diff --git a/Dockerfile b/Dockerfile index e6ec009d28..44e889d456 100644 --- a/Dockerfile +++ b/Dockerfile @@ -15,7 +15,7 @@ # This file is a part of the vllm-ascend project. # -FROM quay.io/ascend/cann:8.1.rc1-910b-ubuntu22.04-py3.10 +FROM quay.io/ascend/cann:8.2.rc1.alpha003-910b-ubuntu22.04-py3.11 ARG PIP_INDEX_URL="https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple" ARG COMPILE_CUSTOM_KERNELS=1 diff --git a/Dockerfile.310p b/Dockerfile.310p index fffe73eeeb..d531c8413c 100644 --- a/Dockerfile.310p +++ b/Dockerfile.310p @@ -15,7 +15,7 @@ # This file is a part of the vllm-ascend project. # -FROM quay.io/ascend/cann:8.1.rc1-310p-ubuntu22.04-py3.10 +FROM quay.io/ascend/cann:8.2.rc1.alpha003-310p-ubuntu22.04-py3.11 ARG PIP_INDEX_URL="https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple" ARG COMPILE_CUSTOM_KERNELS=1 diff --git a/Dockerfile.310p.openEuler b/Dockerfile.310p.openEuler index da4718cb29..0e3e55bded 100644 --- a/Dockerfile.310p.openEuler +++ b/Dockerfile.310p.openEuler @@ -15,7 +15,7 @@ # This file is a part of the vllm-ascend project. # -FROM quay.io/ascend/cann:8.1.rc1-310p-openeuler22.03-py3.10 +FROM quay.io/ascend/cann:8.2.rc1.alpha003-310p-openeuler22.03-py3.11 ARG PIP_INDEX_URL="https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple" ARG COMPILE_CUSTOM_KERNELS=1 diff --git a/Dockerfile.openEuler b/Dockerfile.openEuler index 4e414e04b7..62aa44d08f 100644 --- a/Dockerfile.openEuler +++ b/Dockerfile.openEuler @@ -15,7 +15,7 @@ # This file is a part of the vllm-ascend project. # -FROM quay.io/ascend/cann:8.1.rc1-910b-openeuler22.03-py3.10 +FROM quay.io/ascend/cann:8.2.rc1.alpha003-910b-openeuler22.03-py3.11 ARG PIP_INDEX_URL="https://mirrors.tuna.tsinghua.edu.cn/pypi/web/simple" ARG COMPILE_CUSTOM_KERNELS=1 diff --git a/README.md b/README.md index 7e5918c763..6afbf08a1c 100644 --- a/README.md +++ b/README.md @@ -37,7 +37,7 @@ By using vLLM Ascend plugin, popular open-source models, including Transformer-l - OS: Linux - Software: * Python >= 3.9, < 3.12 - * CANN >= 8.1.RC1 + * CANN >= 8.2.RC1.alpha003 * PyTorch >= 2.5.1, torch-npu >= 2.5.1.post1.dev20250619 * vLLM (the same version as vllm-ascend) diff --git a/README.zh.md b/README.zh.md index 55a40f5380..81763efe2a 100644 --- a/README.zh.md +++ b/README.zh.md @@ -38,7 +38,7 @@ vLLM 昇腾插件 (`vllm-ascend`) 是一个由社区维护的让vLLM在Ascend NP - 操作系统:Linux - 软件: * Python >= 3.9, < 3.12 - * CANN >= 8.1.RC1 + * CANN >= 8.2.RC1.alpha003 * PyTorch >= 2.5.1, torch-npu >= 2.5.1.post1.dev20250619 * vLLM (与vllm-ascend版本一致) diff --git a/docs/source/conf.py b/docs/source/conf.py index 9bb8a0cc8f..1689957280 100644 --- a/docs/source/conf.py +++ b/docs/source/conf.py @@ -75,7 +75,7 @@ 'pip_vllm_ascend_version': "0.9.1rc1", 'pip_vllm_version': "0.9.1", # CANN image tag - 'cann_image_tag': "8.1.rc1-910b-ubuntu22.04-py3.10", + 'cann_image_tag': "8.2.rc1.alpha003-910b-ubuntu22.04-py3.11", } # Add any paths that contain templates here, relative to this directory. diff --git a/docs/source/installation.md b/docs/source/installation.md index 8f21aa8111..3704b409d1 100644 --- a/docs/source/installation.md +++ b/docs/source/installation.md @@ -11,7 +11,7 @@ This document describes how to install vllm-ascend manually. | Software | Supported version | Note | |---------------|----------------------------------|-------------------------------------------| - | CANN | >= 8.1.RC1 | Required for vllm-ascend and torch-npu | + | CANN | >= 8.2.RC1.alpha003 | Required for vllm-ascend and torch-npu | | torch-npu | >= 2.5.1.post1.dev20250619 | Required for vllm-ascend | | torch | >= 2.5.1 | Required for torch-npu and vllm | @@ -78,19 +78,20 @@ source vllm-ascend-env/bin/activate pip3 install -i https://pypi.tuna.tsinghua.edu.cn/simple attrs 'numpy<2.0.0' decorator sympy cffi pyyaml pathlib2 psutil protobuf scipy requests absl-py wheel typing_extensions # Download and install the CANN package. -wget --header="Referer: https://www.hiascend.com/" https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/CANN/CANN%208.1.RC1/Ascend-cann-toolkit_8.1.RC1_linux-"$(uname -i)".run -chmod +x ./Ascend-cann-toolkit_8.1.RC1_linux-"$(uname -i)".run -./Ascend-cann-toolkit_8.1.RC1_linux-"$(uname -i)".run --full +wget --header="Referer: https://www.hiascend.com/" https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/Milan-ASL/Milan-ASL%20V100R001C22B800TP052/Ascend-cann-toolkit_8.2.RC1.alpha003_linux-"$(uname -i)".run +chmod +x ./Ascend-cann-toolkit_8.2.RC1.alpha003_linux-"$(uname -i)".run +./Ascend-cann-toolkit_8.2.RC1.alpha003_linux-"$(uname -i)".run --full +# https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/Milan-ASL/Milan-ASL%20V100R001C22B800TP052/Ascend-cann-kernels-910b_8.2.RC1.alpha003_linux-aarch64.run source /usr/local/Ascend/ascend-toolkit/set_env.sh -wget --header="Referer: https://www.hiascend.com/" https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/CANN/CANN%208.1.RC1/Ascend-cann-kernels-910b_8.1.RC1_linux-"$(uname -i)".run -chmod +x ./Ascend-cann-kernels-910b_8.1.RC1_linux-"$(uname -i)".run -./Ascend-cann-kernels-910b_8.1.RC1_linux-"$(uname -i)".run --install +wget --header="Referer: https://www.hiascend.com/" https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/Milan-ASL/Milan-ASL%20V100R001C22B800TP052/Ascend-cann-kernels-910b_8.2.RC1.alpha003_linux-"$(uname -i)".run +chmod +x ./Ascend-cann-kernels-910b_8.2.RC1.alpha003_linux-"$(uname -i)".run +./Ascend-cann-kernels-910b_8.2.RC1.alpha003_linux-"$(uname -i)".run --install -wget --header="Referer: https://www.hiascend.com/" https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/CANN/CANN%208.1.RC1/Ascend-cann-nnal_8.1.RC1_linux-"$(uname -i)".run -chmod +x ./Ascend-cann-nnal_8.1.RC1_linux-"$(uname -i)".run -./Ascend-cann-nnal_8.1.RC1_linux-"$(uname -i)".run --install +wget --header="Referer: https://www.hiascend.com/" https://ascend-repo.obs.cn-east-2.myhuaweicloud.com/Milan-ASL/Milan-ASL%20V100R001C22B800TP052/Ascend-cann-nnal_8.2.RC1.alpha003_linux-"$(uname -i)".run +chmod +x ./Ascend-cann-nnal_8.2.RC1.alpha003_linux-"$(uname -i)".run +./Ascend-cann-nnal_8.2.RC1.alpha003_linux-"$(uname -i)".run --install source /usr/local/Ascend/nnal/atb/set_env.sh ```