File tree Expand file tree Collapse file tree 5 files changed +9
-2
lines changed
docker_compose/intel/gpu/arc Expand file tree Collapse file tree 5 files changed +9
-2
lines changed Original file line number Diff line number Diff line change @@ -34,3 +34,4 @@ export MAX_NUM_BATCHED_TOKENS=${MAX_NUM_BATCHED_TOKENS}
3434export MAX_MODEL_LEN=${MAX_MODEL_LEN}
3535export LOAD_IN_LOW_BIT=${LOAD_IN_LOW_BIT}
3636export CCL_DG2_USM=${CCL_DG2_USM}
37+ export ZE_AFFINITY_MASK=${ZE_AFFINITY_MASK}
Original file line number Diff line number Diff line change @@ -22,6 +22,9 @@ pillow>=10.4.0
2222py-cpuinfo >= 9.0.0
2323pymilvus == 2.5.10
2424python-docx == 1.1.2
25+ torch == 2.8.0+cpu
26+ torchvision == 0.23.0+cpu
2527unstructured
2628unstructured [pdf ]
2729werkzeug == 3.1.3
30+
Original file line number Diff line number Diff line change @@ -28,7 +28,6 @@ UI_UPLOAD_PATH="$WORKPATH/tests"
2828
2929HF_ENDPOINT=https://hf-mirror.com
3030
31-
3231function build_docker_images() {
3332 opea_branch=${opea_branch:- " main" }
3433 cd $WORKPATH /docker_image_build
Original file line number Diff line number Diff line change @@ -38,6 +38,7 @@ LLM_MODEL="Qwen/Qwen3-8B"
3838LLM_MODEL_PATH=" ${MODEL_PATH} /${LLM_MODEL} "
3939NGINX_CONFIG_PATH=" $WORKPATH /nginx/nginx.conf"
4040VLLM_IMAGE_TAG=" 0.8.3-b20"
41+ MAX_MODEL_LEN=8192
4142DP_NUM=1
4243
4344function build_docker_images() {
@@ -179,4 +180,5 @@ function main() {
179180
180181}
181182
183+
182184main
Original file line number Diff line number Diff line change @@ -25,14 +25,15 @@ MODEL_PATH="${HOME}/models"
2525# MODEL_PATH="$WORKPATH/models"
2626DOC_PATH=" $WORKPATH /tests"
2727UI_UPLOAD_PATH=" $WORKPATH /tests"
28-
28+ MAX_MODEL_LEN=8192
2929HF_ENDPOINT=https://hf-mirror.com
3030VLLM_SERVICE_PORT_B60=8086
3131TP=1
3232vLLM_ENDPOINT=" http://${HOST_IP} :${VLLM_SERVICE_PORT_B60} "
3333LLM_MODEL=" Qwen/Qwen3-8B"
3434VLLM_IMAGE_TAG=" 1.0"
3535DP=1
36+ ZE_AFFINITY_MASK=1
3637
3738function build_docker_images() {
3839 opea_branch=${opea_branch:- " main" }
@@ -170,4 +171,5 @@ function main() {
170171
171172}
172173
174+
173175main
You can’t perform that action at this time.
0 commit comments