From a89d9b72beabf705082fe8bfe7a16d86a8e9aff8 Mon Sep 17 00:00:00 2001
From: Yannic Kilcher
Date: Sun, 19 Feb 2023 23:02:23 +0100
Subject: [PATCH] updated dockerfile for worker-full

---
 docker/inference/Dockerfile.worker-full | 1 -
 inference/worker/worker_full_main.sh    | 2 ++
 2 files changed, 2 insertions(+), 1 deletion(-)

diff --git a/docker/inference/Dockerfile.worker-full b/docker/inference/Dockerfile.worker-full
index 66ccd17a8b..948ab0fa6b 100644
--- a/docker/inference/Dockerfile.worker-full
+++ b/docker/inference/Dockerfile.worker-full
@@ -19,7 +19,6 @@ COPY ./${APP_RELATIVE_PATH}/worker_full_main.sh /entrypoint.sh
 ENV MODEL_ID="distilgpt2"
 ENV MAX_INPUT_LENGTH="850"
 ENV MAX_TOTAL_TOKENS="1024"
-ENV INFERENCE_SERVER_URL="http://localhost:80"
 ENV BACKEND_URL="ws://localhost:8000"
 ENV PARALLELISM="4"

diff --git a/inference/worker/worker_full_main.sh b/inference/worker/worker_full_main.sh
index bb8ed33c79..e81a22ddaf 100755
--- a/inference/worker/worker_full_main.sh
+++ b/inference/worker/worker_full_main.sh
@@ -5,6 +5,8 @@ PARALLELISM=${PARALLELISM:-1}

 text-generation-launcher &

+export INFERENCE_SERVER_URL="http://localhost:80"
+
 # launch PARALLELISM workers
 for i in $(seq 1 $PARALLELISM); do
     /opt/miniconda/envs/worker/bin/python /worker &