File tree Expand file tree Collapse file tree 3 files changed +2
-3
lines changed
docker_compose/intel/hpu/gaudi
kubernetes/intel/hpu/gaudi/manifest Expand file tree Collapse file tree 3 files changed +2
-3
lines changed Original file line number Diff line number Diff line change @@ -97,7 +97,7 @@ services:
9797 cap_add :
9898 - SYS_NICE
9999 ipc : host
100- command : --enforce-eager -- model $LLM_MODEL_ID --tensor-parallel-size 1 --host 0.0.0.0 --port 80 --block-size 128 --max-num-seqs 256 --max-seq_len-to-capture 2048
100+ command : --model $LLM_MODEL_ID --tensor-parallel-size 1 --host 0.0.0.0 --port 80 --block-size 128 --max-num-seqs 256 --max-seq_len-to-capture 2048
101101 chatqna-gaudi-backend-server :
102102 image : ${REGISTRY:-opea}/chatqna:${TAG:-latest}
103103 container_name : chatqna-gaudi-backend-server
Original file line number Diff line number Diff line change @@ -1286,7 +1286,6 @@ spec:
12861286 type : RuntimeDefault
12871287 image : " opea/vllm-gaudi:latest"
12881288 args :
1289- - " --enforce-eager"
12901289 - " --model"
12911290 - " $(MODEL_ID)"
12921291 - " --tensor-parallel-size"
Original file line number Diff line number Diff line change @@ -39,7 +39,7 @@ function start_services() {
3939 # Start Docker Containers
4040 docker compose -f compose_vllm.yaml up -d > ${LOG_PATH} /start_services_with_compose.log
4141 n=0
42- until [[ " $n " -ge 100 ]]; do
42+ until [[ " $n " -ge 160 ]]; do
4343 echo " n=$n "
4444 docker logs vllm-gaudi-server > vllm_service_start.log
4545 if grep -q " Warmup finished" vllm_service_start.log; then
You can’t perform that action at this time.
0 commit comments