From 770f0794eb000216f9e34987ed0946dda6b09078 Mon Sep 17 00:00:00 2001 From: ZheyuYe Date: Thu, 20 Aug 2020 15:10:57 +0800 Subject: [PATCH] Revert "merge xingjian's" This reverts commit ea1f1aae9f7e05463900875e12ea98aae2a81827. --- LICENSE | 201 ------------------ README.md | 11 - src/gluonnlp/__init__.py | 2 +- tools/batch/README.md | 26 ++- tools/batch/docker/Dockerfile | 48 ++--- tools/batch/hello_world.py | 10 - tools/batch/submit-job.py | 24 ++- tools/docker/README.md | 21 -- tools/docker/devel_entrypoint.sh | 5 - tools/docker/start_jupyter.sh | 15 -- tools/docker/ubuntu18.04-devel-gpu.Dockerfile | 186 ---------------- 11 files changed, 53 insertions(+), 496 deletions(-) delete mode 100644 LICENSE delete mode 100644 tools/batch/hello_world.py delete mode 100644 tools/docker/README.md delete mode 100644 tools/docker/devel_entrypoint.sh delete mode 100644 tools/docker/start_jupyter.sh delete mode 100644 tools/docker/ubuntu18.04-devel-gpu.Dockerfile diff --git a/LICENSE b/LICENSE deleted file mode 100644 index 261eeb9e9f..0000000000 --- a/LICENSE +++ /dev/null @@ -1,201 +0,0 @@ - Apache License - Version 2.0, January 2004 - http://www.apache.org/licenses/ - - TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION - - 1. Definitions. - - "License" shall mean the terms and conditions for use, reproduction, - and distribution as defined by Sections 1 through 9 of this document. - - "Licensor" shall mean the copyright owner or entity authorized by - the copyright owner that is granting the License. - - "Legal Entity" shall mean the union of the acting entity and all - other entities that control, are controlled by, or are under common - control with that entity. For the purposes of this definition, - "control" means (i) the power, direct or indirect, to cause the - direction or management of such entity, whether by contract or - otherwise, or (ii) ownership of fifty percent (50%) or more of the - outstanding shares, or (iii) beneficial ownership of such entity. 
- - "You" (or "Your") shall mean an individual or Legal Entity - exercising permissions granted by this License. - - "Source" form shall mean the preferred form for making modifications, - including but not limited to software source code, documentation - source, and configuration files. - - "Object" form shall mean any form resulting from mechanical - transformation or translation of a Source form, including but - not limited to compiled object code, generated documentation, - and conversions to other media types. - - "Work" shall mean the work of authorship, whether in Source or - Object form, made available under the License, as indicated by a - copyright notice that is included in or attached to the work - (an example is provided in the Appendix below). - - "Derivative Works" shall mean any work, whether in Source or Object - form, that is based on (or derived from) the Work and for which the - editorial revisions, annotations, elaborations, or other modifications - represent, as a whole, an original work of authorship. For the purposes - of this License, Derivative Works shall not include works that remain - separable from, or merely link (or bind by name) to the interfaces of, - the Work and Derivative Works thereof. - - "Contribution" shall mean any work of authorship, including - the original version of the Work and any modifications or additions - to that Work or Derivative Works thereof, that is intentionally - submitted to Licensor for inclusion in the Work by the copyright owner - or by an individual or Legal Entity authorized to submit on behalf of - the copyright owner. 
For the purposes of this definition, "submitted" - means any form of electronic, verbal, or written communication sent - to the Licensor or its representatives, including but not limited to - communication on electronic mailing lists, source code control systems, - and issue tracking systems that are managed by, or on behalf of, the - Licensor for the purpose of discussing and improving the Work, but - excluding communication that is conspicuously marked or otherwise - designated in writing by the copyright owner as "Not a Contribution." - - "Contributor" shall mean Licensor and any individual or Legal Entity - on behalf of whom a Contribution has been received by Licensor and - subsequently incorporated within the Work. - - 2. Grant of Copyright License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - copyright license to reproduce, prepare Derivative Works of, - publicly display, publicly perform, sublicense, and distribute the - Work and such Derivative Works in Source or Object form. - - 3. Grant of Patent License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - (except as stated in this section) patent license to make, have made, - use, offer to sell, sell, import, and otherwise transfer the Work, - where such license applies only to those patent claims licensable - by such Contributor that are necessarily infringed by their - Contribution(s) alone or by combination of their Contribution(s) - with the Work to which such Contribution(s) was submitted. 
If You - institute patent litigation against any entity (including a - cross-claim or counterclaim in a lawsuit) alleging that the Work - or a Contribution incorporated within the Work constitutes direct - or contributory patent infringement, then any patent licenses - granted to You under this License for that Work shall terminate - as of the date such litigation is filed. - - 4. Redistribution. You may reproduce and distribute copies of the - Work or Derivative Works thereof in any medium, with or without - modifications, and in Source or Object form, provided that You - meet the following conditions: - - (a) You must give any other recipients of the Work or - Derivative Works a copy of this License; and - - (b) You must cause any modified files to carry prominent notices - stating that You changed the files; and - - (c) You must retain, in the Source form of any Derivative Works - that You distribute, all copyright, patent, trademark, and - attribution notices from the Source form of the Work, - excluding those notices that do not pertain to any part of - the Derivative Works; and - - (d) If the Work includes a "NOTICE" text file as part of its - distribution, then any Derivative Works that You distribute must - include a readable copy of the attribution notices contained - within such NOTICE file, excluding those notices that do not - pertain to any part of the Derivative Works, in at least one - of the following places: within a NOTICE text file distributed - as part of the Derivative Works; within the Source form or - documentation, if provided along with the Derivative Works; or, - within a display generated by the Derivative Works, if and - wherever such third-party notices normally appear. The contents - of the NOTICE file are for informational purposes only and - do not modify the License. 
You may add Your own attribution - notices within Derivative Works that You distribute, alongside - or as an addendum to the NOTICE text from the Work, provided - that such additional attribution notices cannot be construed - as modifying the License. - - You may add Your own copyright statement to Your modifications and - may provide additional or different license terms and conditions - for use, reproduction, or distribution of Your modifications, or - for any such Derivative Works as a whole, provided Your use, - reproduction, and distribution of the Work otherwise complies with - the conditions stated in this License. - - 5. Submission of Contributions. Unless You explicitly state otherwise, - any Contribution intentionally submitted for inclusion in the Work - by You to the Licensor shall be under the terms and conditions of - this License, without any additional terms or conditions. - Notwithstanding the above, nothing herein shall supersede or modify - the terms of any separate license agreement you may have executed - with Licensor regarding such Contributions. - - 6. Trademarks. This License does not grant permission to use the trade - names, trademarks, service marks, or product names of the Licensor, - except as required for reasonable and customary use in describing the - origin of the Work and reproducing the content of the NOTICE file. - - 7. Disclaimer of Warranty. Unless required by applicable law or - agreed to in writing, Licensor provides the Work (and each - Contributor provides its Contributions) on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or - implied, including, without limitation, any warranties or conditions - of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A - PARTICULAR PURPOSE. You are solely responsible for determining the - appropriateness of using or redistributing the Work and assume any - risks associated with Your exercise of permissions under this License. - - 8. 
Limitation of Liability. In no event and under no legal theory, - whether in tort (including negligence), contract, or otherwise, - unless required by applicable law (such as deliberate and grossly - negligent acts) or agreed to in writing, shall any Contributor be - liable to You for damages, including any direct, indirect, special, - incidental, or consequential damages of any character arising as a - result of this License or out of the use or inability to use the - Work (including but not limited to damages for loss of goodwill, - work stoppage, computer failure or malfunction, or any and all - other commercial damages or losses), even if such Contributor - has been advised of the possibility of such damages. - - 9. Accepting Warranty or Additional Liability. While redistributing - the Work or Derivative Works thereof, You may choose to offer, - and charge a fee for, acceptance of support, warranty, indemnity, - or other liability obligations and/or rights consistent with this - License. However, in accepting such obligations, You may act only - on Your own behalf and on Your sole responsibility, not on behalf - of any other Contributor, and only if You agree to indemnify, - defend, and hold each Contributor harmless for any liability - incurred by, or claims asserted against, such Contributor by reason - of your accepting any such warranty or additional liability. - - END OF TERMS AND CONDITIONS - - APPENDIX: How to apply the Apache License to your work. - - To apply the Apache License to your work, attach the following - boilerplate notice, with the fields enclosed by brackets "[]" - replaced with your own identifying information. (Don't include - the brackets!) The text should be enclosed in the appropriate - comment syntax for the file format. We also recommend that a - file or class name and description of purpose be included on the - same "printed page" as the copyright notice for easier - identification within third-party archives. 
- - Copyright [yyyy] [name of copyright owner] - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. diff --git a/README.md b/README.md index 768495f9f6..2b1aae9fc8 100644 --- a/README.md +++ b/README.md @@ -72,14 +72,3 @@ python3 -m gluonnlp.cli.preprocess help # Run Unittests You may go to [tests](tests) to see all how to run the unittests. - - -# Use Docker -You can use Docker to launch a JupyterLab development environment with GluonNLP installed. - -``` -docker pull gluonai/gluon-nlp:v1.0.0 -docker run --gpus all --rm -it -p 8888:8888 -p 8787:8787 -p 8786:8786 gluonai/gluon-nlp:v1.0.0 -``` - -For more details, you can refer to the guidance in [tools/docker]. diff --git a/src/gluonnlp/__init__.py b/src/gluonnlp/__init__.py index a11355a405..31e7e08557 100644 --- a/src/gluonnlp/__init__.py +++ b/src/gluonnlp/__init__.py @@ -1,4 +1,4 @@ -__version__ = '1.0.0' +__version__ = '1.0.0.dev0' from . import base from . import data from . import models diff --git a/tools/batch/README.md b/tools/batch/README.md index ad47df8de0..955d4da53d 100644 --- a/tools/batch/README.md +++ b/tools/batch/README.md @@ -1,20 +1,18 @@ -# Launch AWS Jobs -For contributors of GluonNLP, you can try to launch jobs via AWS Batch. -Once you've correctly configured the AWS CLI, you may use the following command -to submit a dummy example in which `remote` and `source-ref` denote the repository - url and branch name respectively. 
+# Batch Job Examples +Based on AWS Batch, we provide a quick way to submit jobs for tasks including Conversion, Question Answering, Machine Translation, Text Translation and Pre-trained Model Training, which can be used for regular inspections or for rapid deployment of experiments. -``` +See the dummy submission below for an example, in which `remote` and `source-ref` denote the repository URL and branch name, respectively. + +```bash python3 submit-job.py \ ---region us-east-1 \ ---source-ref master \ ---job-type p3.2x \ ---work-dir tools/batch \ ---remote https://github.com/dmlc/gluon-nlp \ ---command "python3 hello_world.py" \ ---wait + --region us-east-1 \ + --source-ref master \ + --job-type g4dn.12x \ + --name dummy_example \ + --work-dir scripts/preprocess \ + --remote https://github.com/dmlc/gluon-nlp/ \ + --command 'git rev-parse HEAD | tee stdout.log' ``` - ## Conversion Toolkits Following the instruction of [converting scripts](../../scripts/conversion_toolkits), several pre-trained models could be converted through the corresponding conversion tool as below command where `${MODEL_TYPE}` could be selected from `[albert, bert, electra, mobilebert, bart, robert, xmlr]`. 
```bash diff --git a/tools/batch/docker/Dockerfile b/tools/batch/docker/Dockerfile index c0b8592ca7..a9ef4aaad4 100644 --- a/tools/batch/docker/Dockerfile +++ b/tools/batch/docker/Dockerfile @@ -1,27 +1,27 @@ FROM nvidia/cuda:10.2-cudnn7-devel-ubuntu18.04 -RUN apt-get update && apt-get install -y --no-install-recommends \ - build-essential \ - locales \ - cmake \ - wget \ - subversion \ - git \ - curl \ - vim \ - unzip \ - sudo \ - ca-certificates \ - libjpeg-dev \ - libpng-dev \ - libfreetype6-dev \ - python3-dev \ - python3-pip \ - python3-setuptools \ - libxft-dev &&\ - rm -rf /var/lib/apt/lists/* + RUN apt-get update && apt-get install -y --no-install-recommends \ + build-essential \ + locales \ + cmake \ + wget \ + subversion \ + git \ + curl \ + vim \ + unzip \ + sudo \ + ca-certificates \ + libjpeg-dev \ + libpng-dev \ + libfreetype6-dev \ + python3-dev \ + python3-pip \ + python3-setuptools \ + libxft-dev &&\ + rm -rf /var/lib/apt/lists/* -RUN pip3 install --upgrade pip && pip3 install awscli && pip3 install --pre 'mxnet-cu102' -f https://dist.mxnet.io/python -RUN git clone https://github.com/dmlc/gluon-nlp -WORKDIR gluon-nlp -ADD gluon_nlp_job.sh . + RUN pip3 install --upgrade pip && pip3 install awscli && pip3 install --pre 'mxnet-cu102' -f https://dist.mxnet.io/python + RUN git clone https://github.com/dmlc/gluon-nlp + WORKDIR gluon-nlp + ADD gluon_nlp_job.sh . 
diff --git a/tools/batch/hello_world.py b/tools/batch/hello_world.py deleted file mode 100644 index f84e06d6b9..0000000000 --- a/tools/batch/hello_world.py +++ /dev/null @@ -1,10 +0,0 @@ -from gluonnlp.data.vocab import Vocab -import mxnet as mx - - -if __name__ == '__main__': - vocab = Vocab(['Hello', 'World!'], unk_token=None) - print(vocab) - num_gpus = mx.context.num_gpus() - print('Number of GPUS:', num_gpus) - diff --git a/tools/batch/submit-job.py b/tools/batch/submit-job.py index f11fd50b64..451bd0fb3b 100644 --- a/tools/batch/submit-job.py +++ b/tools/batch/submit-job.py @@ -47,7 +47,6 @@ session = boto3.Session(profile_name=args.profile, region_name=args.region) batch, cloudwatch = [session.client(service_name=sn) for sn in ['batch', 'logs']] - def printLogs(logGroupName, logStreamName, startTime): kwargs = {'logGroupName': logGroupName, 'logStreamName': logStreamName, @@ -71,17 +70,27 @@ def printLogs(logGroupName, logStreamName, startTime): return lastTimestamp +def getLogStream(logGroupName, jobName, jobId): + response = cloudwatch.describe_log_streams( + logGroupName=logGroupName, + logStreamNamePrefix=jobName + '/' + jobId + ) + logStreams = response['logStreams'] + if not logStreams: + return '' + else: + return logStreams[0]['logStreamName'] + def nowInMillis(): endTime = long(total_seconds(datetime.utcnow() - datetime(1970, 1, 1))) * 1000 return endTime - job_definitions = { 'g4dn.4x': 'gluon-nlp-1-jobs:5', 'g4dn.8x': 'gluon-nlp-1-jobs:4', 'g4dn.12x': 'gluon-nlp-1-4gpu-jobs:1', 'g4dn.16x': 'gluon-nlp-1-jobs:3', - 'p3.2x': 'gluon-nlp-1-jobs:11', + 'p3.2x': 'gluon-nlp-1-jobs:5', 'p3.8x': 'gluon-nlp-1-4gpu-jobs:2', 'p3.16x': 'gluon-nlp-1-8gpu-jobs:1', 'p3dn.24x': 'gluon-nlp-1-8gpu-jobs:2', @@ -100,7 +109,6 @@ def nowInMillis(): 'c5n.18x': 'c5n', } - def main(): spin = ['-', '/', '|', '\\', '-', '/', '|', '\\'] logGroupName = '/aws/batch/job' @@ -112,7 +120,7 @@ def main(): command = args.command.split() wait = args.wait - parameters = { + 
parameters={ 'SOURCE_REF': args.source_ref, 'WORK_DIR': args.work_dir, 'SAVED_OUTPUT': args.saved_output, @@ -137,6 +145,7 @@ def main(): running = False status_set = set() startTime = 0 + while wait: time.sleep(random.randint(5, 10)) describeJobsResponse = batch.describe_jobs(jobs=[jobId]) @@ -148,10 +157,10 @@ def main(): sys.exit(status == 'FAILED') elif status == 'RUNNING': - logStreamName = describeJobsResponse['jobs'][0]['container']['logStreamName'] + logStreamName = getLogStream(logGroupName, jobName, jobId) if not running: running = True - print('\rJob [{}, {}] is RUNNING.'.format(jobName, jobId)) + print('\rJob [{} - {}] is RUNNING.'.format(jobName, jobId)) if logStreamName: print('Output [{}]:\n {}'.format(logStreamName, '=' * 80)) if logStreamName: @@ -162,6 +171,5 @@ def main(): sys.stdout.flush() spinner += 1 - if __name__ == '__main__': main() diff --git a/tools/docker/README.md b/tools/docker/README.md deleted file mode 100644 index 2b38c9730c..0000000000 --- a/tools/docker/README.md +++ /dev/null @@ -1,21 +0,0 @@ -# Docker Support in GluonNLP -We provide the [Docker](https://www.docker.com/) container with everything set up to run GluonNLP. -With the prebuilt docker image, there is no need to worry about the operating systems or system dependencies. -You can launch a [JupyterLab](https://jupyterlab.readthedocs.io/en/stable/) development environment -and try out to use GluonNLP to solve your problem. - -## Run Docker -You can run the docker with the following command: - -``` -docker pull gluonai/gluon-nlp:v1.0.0 -docker run --gpus all --rm -it -p 8888:8888 -p 8787:8787 -p 8786:8786 gluonai/gluon-nlp:v1.0.0 -``` - - -## Build your own Docker Image -To build a docker image fom the dockerfile, you may use the following command: - -``` -docker build -f ubuntu18.04-devel-gpu.Dockerfile -t gluonai/gluon-nlp . 
-``` diff --git a/tools/docker/devel_entrypoint.sh b/tools/docker/devel_entrypoint.sh deleted file mode 100644 index 6a91eb26a3..0000000000 --- a/tools/docker/devel_entrypoint.sh +++ /dev/null @@ -1,5 +0,0 @@ -#!/bin/bash - -source /start_jupyter.sh - -exec "$@" diff --git a/tools/docker/start_jupyter.sh b/tools/docker/start_jupyter.sh deleted file mode 100644 index 695ad45d88..0000000000 --- a/tools/docker/start_jupyter.sh +++ /dev/null @@ -1,15 +0,0 @@ -#!/bin/bash - -# Run Jupyter in foreground if $JUPYTER_FG is set -if [[ "${JUPYTER_FG}" == "true" ]]; then - jupyter-lab --allow-root --ip=0.0.0.0 --no-browser --NotebookApp.token='' - exit 0 -else - nohup jupyter-lab --allow-root --ip=0.0.0.0 --no-browser --NotebookApp.token='' > /dev/null 2>&1 & - - echo "Notebook server successfully started, a JupyterLab instance has been executed!" - echo "Make local folders visible by volume mounting to /workspace/notebook" - echo "To access visit http://localhost:8888 on your host machine." - echo 'Ensure the following arguments to "docker run" are added to expose the server ports to your host machine: - -p 8888:8888 -p 8787:8787 -p 8786:8786' -fi diff --git a/tools/docker/ubuntu18.04-devel-gpu.Dockerfile b/tools/docker/ubuntu18.04-devel-gpu.Dockerfile deleted file mode 100644 index 644b54cbae..0000000000 --- a/tools/docker/ubuntu18.04-devel-gpu.Dockerfile +++ /dev/null @@ -1,186 +0,0 @@ -FROM nvidia/cuda:10.2-cudnn7-devel-ubuntu18.04 - -LABEL maintainer="GluonNLP Team" - -ARG PYTHON=python3 -ARG PIP=pip3 -ARG PYTHON_VERSION=3.7.8 -ARG MX_URL=https://repo.mxnet.io/dist/python/cu102/mxnet_cu102-2.0.0b20200816-py2.py3-none-manylinux2014_x86_64.whl - -ARG OPENSSL_VERSION=1.1.1g -ARG TINI_VERSION=v0.19.0 - -# Update for tzdata -ARG DEBIAN_FRONTEND=noninteractive -ENV TZ=US -RUN ln -fs /usr/share/zoneinfo/America/New_York /etc/localtime - -ENV PYTHONDONTWRITEBYTECODE=1 \ - PYTHONUNBUFFERED=1 \ - LD_LIBRARY_PATH="${LD_LIBRARY_PATH}:/usr/local/lib" \ - PYTHONIOENCODING=UTF-8 \ - 
LANG=C.UTF-8 \ - LC_ALL=C.UTF-8 - -ENV WORKDIR=/workspace - -RUN apt-get update \ - && apt-get install -y --no-install-recommends \ - software-properties-common \ - build-essential \ - ca-certificates \ - tzdata \ - curl \ - emacs \ - subversion \ - locales \ - cmake \ - git \ - libopencv-dev \ - openssh-client \ - openssh-server \ - htop \ - vim \ - wget \ - unzip \ - sudo \ - python3-dev \ - python3-pip \ - python3-setuptools \ - libxft-dev \ - zlib1g-dev \ - && apt-get clean \ - && rm -rf /var/lib/apt/lists/* - -########################################################################### -# Horovod dependencies -########################################################################### - -# Install Open MPI -RUN mkdir /tmp/openmpi \ - && cd /tmp/openmpi \ - && curl -fSsL -O https://download.open-mpi.org/release/open-mpi/v4.0/openmpi-4.0.1.tar.gz \ - && tar zxf openmpi-4.0.1.tar.gz \ - && cd openmpi-4.0.1 \ - && ./configure --enable-orterun-prefix-by-default \ - && make -j $(nproc) all \ - && make install \ - && ldconfig \ - && rm -rf /tmp/openmpi - -# Create a wrapper for OpenMPI to allow running as root by default -RUN mv /usr/local/bin/mpirun /usr/local/bin/mpirun.real \ - && echo '#!/bin/bash' > /usr/local/bin/mpirun \ - && echo 'mpirun.real --allow-run-as-root "$@"' >> /usr/local/bin/mpirun \ - && chmod a+x /usr/local/bin/mpirun - -RUN echo "hwloc_base_binding_policy = none" >> /usr/local/etc/openmpi-mca-params.conf \ - && echo "rmaps_base_mapping_policy = slot" >> /usr/local/etc/openmpi-mca-params.conf - -ENV LD_LIBRARY_PATH=/usr/local/openmpi/lib:$LD_LIBRARY_PATH -ENV PATH=/usr/local/openmpi/bin/:/root/.local/bin:$PATH - -RUN wget -c https://www.openssl.org/source/openssl-${OPENSSL_VERSION}.tar.gz \ - && apt-get update \ - && apt remove -y --purge openssl \ - && rm -rf /usr/include/openssl \ - && apt-get install -y \ - ca-certificates \ - && tar -xzvf openssl-${OPENSSL_VERSION}.tar.gz \ - && cd openssl-${OPENSSL_VERSION} \ - && ./config && make -j $(nproc) 
&& make test \ - && make install \ - && ldconfig \ - && cd .. && rm -rf openssl-* - -# when we remove previous openssl, the ca-certificates pkgs and its symlinks gets deleted -# causing sslcertverificationerror the below steps are to fix that -RUN ln -s /etc/ssl/certs/*.* /usr/local/ssl/certs/ - -RUN wget https://www.python.org/ftp/python/$PYTHON_VERSION/Python-$PYTHON_VERSION.tgz \ - && tar -xvf Python-$PYTHON_VERSION.tgz \ - && cd Python-$PYTHON_VERSION \ - && apt-get update \ - && apt-get install -y --no-install-recommends \ - libreadline-gplv2-dev \ - libncursesw5-dev \ - libssl-dev \ - libsqlite3-dev \ - libgdbm-dev \ - libc6-dev \ - libffi-dev \ - libbz2-dev \ - tk-dev \ - && apt-get clean \ - && ./configure \ - && make -j $(nproc) \ - && make install \ - && rm -rf /var/lib/apt/lists/* \ - && cd .. \ - && rm -rf Python-$PYTHON_VERSION* \ - && ln -s /usr/local/bin/pip3 /usr/bin/pip \ - && ln -s $(which ${PYTHON}) /usr/local/bin/python - -RUN mkdir -p ${WORKDIR}/notebook - -# install PyYAML==5.1.2 to avoid conflict with latest awscli -# python-dateutil==2.8.0 to satisfy botocore associated with latest awscli -RUN ${PIP} install --no-cache --upgrade \ - wheel \ - numpy==1.19.1 \ - pandas==0.25.1 \ - Pillow \ - requests==2.22.0 \ - scikit-learn==0.20.4 \ - scipy==1.2.2 \ - urllib3==1.25.8 \ - python-dateutil==2.8.0 \ - sagemaker-experiments==0.* \ - PyYAML==5.3.1 \ - mpi4py==3.0.2 \ - jupyterlab==2.2.4 \ - ${MX_URL} \ - awscli - -# Allow OpenSSH to talk to containers without asking for confirmation -RUN cat /etc/ssh/ssh_config | grep -v StrictHostKeyChecking > /etc/ssh/ssh_config.new \ - && echo " StrictHostKeyChecking no" >> /etc/ssh/ssh_config.new \ - && mv /etc/ssh/ssh_config.new /etc/ssh/ssh_config - -# OpenSSH config for MPI communication -RUN mkdir -p /var/run/sshd && \ - sed 's@session\s*required\s*pam_loginuid.so@session optional pam_loginuid.so@g' -i /etc/pam.d/sshd - -RUN rm -rf /root/.ssh/ && \ - mkdir -p /root/.ssh/ && \ - ssh-keygen -q -t rsa -N '' 
-f /root/.ssh/id_rsa && \ - cp /root/.ssh/id_rsa.pub /root/.ssh/authorized_keys \ - && printf "Host *\n StrictHostKeyChecking no\n" >> /root/.ssh/config - - -RUN mkdir -p /.init -RUN cd ${WORKDIR} \ - && git clone https://github.com/dmlc/gluon-nlp \ - && cd gluon-nlp \ - && git checkout master \ - && python3 -m pip install -U -e ."[extras]" --user - -COPY start_jupyter.sh /start_jupyter.sh -COPY devel_entrypoint.sh /devel_entrypoint.sh -RUN chmod +x /devel_entrypoint.sh - -EXPOSE 8888 -EXPOSE 8787 -EXPOSE 8786 - -WORKDIR ${WORKDIR} - -# Revise default shell to /bin/bash -RUN jupyter notebook --generate-config \ - && echo "c.NotebookApp.terminado_settings = { 'shell_command': ['/bin/bash'] }" >> /root/.jupyter/jupyter_notebook_config.py - -# Add Tini -ADD https://github.com/krallin/tini/releases/download/${TINI_VERSION}/tini /tini -RUN chmod +x /tini -ENTRYPOINT [ "/tini", "--", "/devel_entrypoint.sh" ] -CMD ["/bin/bash"]