@@ -20,13 +20,12 @@ echo "uninstall org"
2020python -m pip uninstall paddlepaddle-xpu -y
2121python -m pip uninstall fastdeploy-xpu -y
2222
23- python -m pip install paddlepaddle-xpu -i https://www.paddlepaddle.org.cn/packages/nightly/xpu-p800/
23+ python -m pip install https://paddle-qa.bj.bcebos.com/paddle-pipeline/Release-TagBuild-Training-Linux-Xpu-P800-SelfBuiltPypiUse/latest/paddlepaddle_xpu-0.0.0-cp310-cp310-linux_x86_64.whl
2424
2525echo " build whl"
26- bash custom_ops/xpu_ops/download_dependencies.sh develop
26+ bash custom_ops/xpu_ops/download_dependencies.sh stable
2727export CLANG_PATH=$( pwd) /custom_ops/xpu_ops/third_party/xtdk
2828export XVLLM_PATH=$( pwd) /custom_ops/xpu_ops/third_party/xvllm
29-
3029bash build.sh || exit 1
3130
3231echo " pip others"
@@ -54,7 +53,8 @@ python -m fastdeploy.entrypoints.openai.api_server \
5453 --num-gpu-blocks-override 16384 \
5554 --max-model-len 32768 \
5655 --max-num-seqs 128 \
57- --quantization wint4 > server.log 2>&1 &
56+ --quantization wint4 \
57+ --load-choices default > server.log 2>&1 &
5858
5959sleep 60
6060# 探活
@@ -121,7 +121,8 @@ python -m fastdeploy.entrypoints.openai.api_server \
121121 --num-gpu-blocks-override 16384 \
122122 --max-model-len 32768 \
123123 --max-num-seqs 64 \
124- --quantization " W4A8" > server.log 2>&1 &
124+ --quantization " W4A8" \
125+ --load-choices default > server.log 2>&1 &
125126
126127sleep 60
127128# 探活
@@ -191,7 +192,8 @@ python -m fastdeploy.entrypoints.openai.api_server \
191192 --enable-mm \
192193 --mm-processor-kwargs ' {"video_max_frames": 30}' \
193194 --limit-mm-per-prompt ' {"image": 10, "video": 3}' \
194- --reasoning-parser ernie-45-vl > server.log 2>&1 &
195+ --reasoning-parser ernie-45-vl \
196+ --load-choices default > server.log 2>&1 &
195197
196198sleep 60
197199# 探活
@@ -283,4 +285,4 @@ if [ ${ep_exit_code} -ne 0 ]; then
283285 cat log/workerlog.0
284286 echo " EP并行 相关测试失败,请检查pr代码"
285287 exit 1
286- fi
288+ fi
0 commit comments