Skip to content

Commit

Permalink
updated dockerfile for worker-full
Browse files: browse the repository at this point in the history
  • Loading branch information
yk committed Feb 19, 2023
1 parent cdea29e commit a89d9b7
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 1 deletion.
1 change: 0 additions & 1 deletion docker/inference/Dockerfile.worker-full
Expand Up @@ -19,7 +19,6 @@ COPY ./${APP_RELATIVE_PATH}/worker_full_main.sh /entrypoint.sh
# Environment variables defined in the image by this Dockerfile.
ENV MODEL_ID="distilgpt2"
ENV MAX_INPUT_LENGTH="850"
ENV MAX_TOTAL_TOKENS="1024"
# NOTE(review): the same commit adds an export of this exact value to
# inference/worker/worker_full_main.sh, and this file records one deletion —
# presumably this is the removed line; confirm against the raw diff.
ENV INFERENCE_SERVER_URL="http://localhost:80"
ENV BACKEND_URL="ws://localhost:8000"
# worker_full_main.sh falls back to 1 when PARALLELISM is unset or empty.
ENV PARALLELISM="4"

Expand Down
2 changes: 2 additions & 0 deletions inference/worker/worker_full_main.sh
Expand Up @@ -5,6 +5,8 @@ PARALLELISM=${PARALLELISM:-1}

# Start text-generation-launcher as a background job so the script can go on
# to start the workers without waiting for it to exit.
text-generation-launcher &

# Exported so that every process started after this point (the workers
# launched below) inherits the URL through its environment.
export INFERENCE_SERVER_URL="http://localhost:80"

# launch PARALLELISM workers
for i in $(seq 1 $PARALLELISM); do
/opt/miniconda/envs/worker/bin/python /worker &
Expand Down

0 comments on commit a89d9b7

Please sign in to comment.