File tree Expand file tree Collapse file tree 3 files changed +2
-3
lines changed
docker_compose/intel/hpu/gaudi
kubernetes/intel/hpu/gaudi/manifest Expand file tree Collapse file tree 3 files changed +2
-3
lines changed Original file line number Diff line number Diff line change @@ -97,7 +97,7 @@ services:
97
97
cap_add :
98
98
- SYS_NICE
99
99
ipc : host
100
- command : --enforce-eager -- model $LLM_MODEL_ID --tensor-parallel-size 1 --host 0.0.0.0 --port 80 --block-size 128 --max-num-seqs 256 --max-seq_len-to-capture 2048
100
+ command : --model $LLM_MODEL_ID --tensor-parallel-size 1 --host 0.0.0.0 --port 80 --block-size 128 --max-num-seqs 256 --max-seq_len-to-capture 2048
101
101
chatqna-gaudi-backend-server :
102
102
image : ${REGISTRY:-opea}/chatqna:${TAG:-latest}
103
103
container_name : chatqna-gaudi-backend-server
Original file line number Diff line number Diff line change @@ -1286,7 +1286,6 @@ spec:
1286
1286
type : RuntimeDefault
1287
1287
image : " opea/vllm-gaudi:latest"
1288
1288
args :
1289
- - " --enforce-eager"
1290
1289
- " --model"
1291
1290
- " $(MODEL_ID)"
1292
1291
- " --tensor-parallel-size"
Original file line number Diff line number Diff line change @@ -39,7 +39,7 @@ function start_services() {
39
39
# Start Docker Containers
40
40
docker compose -f compose_vllm.yaml up -d > ${LOG_PATH} /start_services_with_compose.log
41
41
n=0
42
- until [[ " $n " -ge 100 ]]; do
42
+ until [[ " $n " -ge 160 ]]; do
43
43
echo " n=$n "
44
44
docker logs vllm-gaudi-server > vllm_service_start.log
45
45
if grep -q " Warmup finished" vllm_service_start.log; then
You can’t perform that action at this time.
0 commit comments