| 内容 | 版本 |
|---|---|
| 固件与驱动 | 25.0.rc1 |
| CANN | 8.3.rc1 |
| PyTorch | 2.7.1 |
| torch_npu | 2.7.1 |
| transformers | 4.57.1 |
| 镜像 | vllm-ascend:v0.11.0rc2 |
git clone https://www.modelscope.cn/BAAI/BGE-VL-large.git

镜像下载地址
docker pull quay.io/ascend/vllm-ascend:v0.11.0rc2

vim docker_start.sh
#脚本内容如下
############################################################################
# Start a detached, privileged container on the host network with the
# davinci0-7 devices, the davinci_manager/devmm_svm/hisi_hdc devices, and the
# host's Ascend driver, add-ons, sbin, NPU log directories and hccn.conf
# mounted into the container.
#
# Before running, replace the two placeholders below:
#   容器名称 - the name to give the container
#   镜像ID   - the ID of the image to start
#
# The /data mount is where the model weights and inference scripts live; a
# different host path may be mounted instead.
#
# NOTE: keep comments out of the command itself. A comment placed after a
# trailing backslash ("\ # ...") makes the backslash escape the space rather
# than the newline, which ends the command early and drops the image and
# "bash" arguments.
docker run -itd --privileged --name=容器名称 --net=host --shm-size=500g \
--device=/dev/davinci0 \
--device=/dev/davinci1 \
--device=/dev/davinci2 \
--device=/dev/davinci3 \
--device=/dev/davinci4 \
--device=/dev/davinci5 \
--device=/dev/davinci6 \
--device=/dev/davinci7 \
--device=/dev/davinci_manager \
--device=/dev/devmm_svm \
--device=/dev/hisi_hdc \
-v /usr/local/Ascend/driver:/usr/local/Ascend/driver \
-v /usr/local/Ascend/add-ons/:/usr/local/Ascend/add-ons/ \
-v /usr/local/sbin/:/usr/local/sbin/ \
-v /var/log/npu/slog/:/var/log/npu/slog \
-v /var/log/npu/profiling/:/var/log/npu/profiling \
-v /var/log/npu/dump/:/var/log/npu/dump \
-v /var/log/npu/:/usr/slog \
-v /etc/hccn.conf:/etc/hccn.conf \
-v /data:/data \
镜像ID \
bash
#########################################################
#进入容器
bash docker_start.sh
docker exec -it <容器名称> bash

git clone https://gitcode.com/Ascend-SACT/BGE-VL-large-infer.git
cd BGE-VL-large-infer

项目目录
├── infer_bge_vl.py
├── BGE-VL-large
│   ├── config.json
│   ├── pytorch_model.bin
│   └── ...
└── images
    ├── cir_query.png
    ├── cir_candi_1.png
    └── cir_candi_2.png

python3 infer_bge_vl.py --model_path ./BGE-VL-large --image_path ./images