diff --git a/serving/docker/Dockerfile b/serving/docker/Dockerfile index f4b36320a..f0f6980d6 100644 --- a/serving/docker/Dockerfile +++ b/serving/docker/Dockerfile @@ -31,7 +31,6 @@ EXPOSE 8080 WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64 -ENV OMP_NUM_THREADS=1 ENV TF_NUM_INTEROP_THREADS=1 ENV TF_NUM_INTRAOP_THREADS=1 ENV TF_CPP_MIN_LOG_LEVEL=1 diff --git a/serving/docker/aarch64.Dockerfile b/serving/docker/aarch64.Dockerfile index 4b45bbbb7..130150a74 100644 --- a/serving/docker/aarch64.Dockerfile +++ b/serving/docker/aarch64.Dockerfile @@ -19,7 +19,6 @@ COPY dockerd-entrypoint.sh /usr/local/bin/dockerd-entrypoint.sh RUN chmod +x /usr/local/bin/dockerd-entrypoint.sh WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-arm64 -ENV OMP_NUM_THREADS=1 ENV JAVA_OPTS="-Xmx1g -Xms1g -XX:-UseContainerSupport -XX:+ExitOnOutOfMemoryError -Dai.djl.default_engine=PyTorch" ENV MODEL_SERVER_HOME=/opt/djl ENV HUGGINGFACE_HUB_CACHE=/tmp diff --git a/serving/docker/deepspeed.Dockerfile b/serving/docker/deepspeed.Dockerfile index f4af82929..684fd2bd9 100644 --- a/serving/docker/deepspeed.Dockerfile +++ b/serving/docker/deepspeed.Dockerfile @@ -27,6 +27,7 @@ COPY dockerd-entrypoint.sh /usr/local/bin/dockerd-entrypoint.sh RUN chmod +x /usr/local/bin/dockerd-entrypoint.sh WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64 +ENV NO_OMP_NUM_THREADS=true ENV JAVA_OPTS="-Xmx1g -Xms1g -XX:-UseContainerSupport -XX:+ExitOnOutOfMemoryError" ENV MODEL_SERVER_HOME=/opt/djl ENV MODEL_LOADING_TIMEOUT=1200 diff --git a/serving/docker/fastertransformer.Dockerfile b/serving/docker/fastertransformer.Dockerfile index b5a9d66d6..992f225bc 100644 --- a/serving/docker/fastertransformer.Dockerfile +++ b/serving/docker/fastertransformer.Dockerfile @@ -29,6 +29,7 @@ COPY dockerd-entrypoint.sh /usr/local/bin/dockerd-entrypoint.sh RUN chmod +x /usr/local/bin/dockerd-entrypoint.sh WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64 +ENV NO_OMP_NUM_THREADS=true ENV JAVA_OPTS="-Xmx1g -Xms1g -XX:-UseContainerSupport -XX:+ExitOnOutOfMemoryError" ENV MODEL_SERVER_HOME=/opt/djl ENV MODEL_LOADING_TIMEOUT=1200 diff --git a/serving/docker/pytorch-cu118.Dockerfile b/serving/docker/pytorch-cu118.Dockerfile index a7fc6f8ac..629e9c6ca 100644 --- a/serving/docker/pytorch-cu118.Dockerfile +++ b/serving/docker/pytorch-cu118.Dockerfile @@ -25,7 +25,7 @@ COPY dockerd-entrypoint.sh /usr/local/bin/dockerd-entrypoint.sh WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64 -ENV OMP_NUM_THREADS=1 +ENV NO_OMP_NUM_THREADS=true ENV MODEL_SERVER_HOME=/opt/djl ENV DJL_CACHE_DIR=/tmp/.djl.ai ENV HUGGINGFACE_HUB_CACHE=/tmp diff --git a/serving/docker/pytorch-inf1.Dockerfile b/serving/docker/pytorch-inf1.Dockerfile index a0a515e99..9bec140bb 100644 --- a/serving/docker/pytorch-inf1.Dockerfile +++ b/serving/docker/pytorch-inf1.Dockerfile @@ -21,7 +21,6 @@ COPY dockerd-entrypoint.sh /usr/local/bin/dockerd-entrypoint.sh RUN chmod +x /usr/local/bin/dockerd-entrypoint.sh WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64 -ENV OMP_NUM_THREADS=1 ENV MODEL_SERVER_HOME=/opt/djl ENV DJL_CACHE_DIR=/tmp/.djl.ai ENV HUGGINGFACE_HUB_CACHE=/tmp @@ -40,7 +39,7 @@ CMD ["serve"] COPY scripts scripts/ RUN mkdir -p /opt/djl/conf && \ mkdir -p /opt/djl/deps && \ - mkdir -p /opt/ml/model + mkdir -p /opt/ml/model COPY config.properties /opt/djl/conf/ RUN scripts/install_djl_serving.sh $djl_version && \ mkdir -p /opt/djl/bin && cp scripts/telemetry.sh /opt/djl/bin && \ diff --git a/serving/docker/pytorch-inf2.Dockerfile b/serving/docker/pytorch-inf2.Dockerfile index 0f6d9468d..178a31dc8 100644 --- a/serving/docker/pytorch-inf2.Dockerfile +++ b/serving/docker/pytorch-inf2.Dockerfile @@ -27,6 +27,7 @@ COPY dockerd-entrypoint.sh /usr/local/bin/dockerd-entrypoint.sh RUN chmod +x /usr/local/bin/dockerd-entrypoint.sh WORKDIR /opt/djl ENV JAVA_HOME=/usr/lib/jvm/java-11-openjdk-amd64 +ENV NO_OMP_NUM_THREADS=true ENV MODEL_SERVER_HOME=/opt/djl ENV DJL_CACHE_DIR=/tmp/.djl.ai ENV HUGGINGFACE_HUB_CACHE=/tmp