|
| 1 | +# Copyright (c) 2020 NVIDIA CORPORATION. All rights reserved. |
| 2 | +# Licensed under the Apache License, Version 2.0 (the "License"); |
| 3 | +# you may not use this file except in compliance with the License. |
| 4 | +# You may obtain a copy of the License at |
| 5 | +# |
| 6 | +# http://www.apache.org/licenses/LICENSE-2.0 |
| 7 | +# |
| 8 | +# Unless required by applicable law or agreed to in writing, software |
| 9 | +# distributed under the License is distributed on an "AS IS" BASIS, |
| 10 | +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 11 | +# See the License for the specific language governing permissions and |
| 12 | +# limitations under the License. |
| 13 | + |
| 14 | +# Base image; override at build time with --build-arg FROM_IMAGE_NAME=<image>. |
| 15 | +# NOTE(review): "nvcr.io/nvidian" looks like an internal registry namespace (the |
| 16 | +# public one is "nvcr.io/nvidia") - confirm before publishing. |
| 17 | +ARG FROM_IMAGE_NAME=nvcr.io/nvidian/tensorflow:20.06-tf2-py3 |
| 18 | +#FROM gitlab-master.nvidia.com:5005/dl/dgx/tensorrtserver:master-py3.1164446-client as trt |
| 19 | +#FROM nvcr.io/nvidia/tensorrtserver:20.03-py3-clientsdk as trt |
| 20 | +FROM ${FROM_IMAGE_NAME} |
| 21 | + |
| 22 | +# Install all OS packages in ONE layer: "apt-get update" and "apt-get install" |
| 23 | +# must run together so the install never uses a stale cached package index, and |
| 24 | +# the apt lists are removed in the same layer so they do not bloat the image. |
| 25 | +RUN apt-get update \ |
| 26 | +    && apt-get install -y --no-install-recommends \ |
| 27 | +        bzip2 \ |
| 28 | +        cabextract \ |
| 29 | +        iputils-ping \ |
| 30 | +        pbzip2 \ |
| 31 | +        pv \ |
| 32 | +    && rm -rf /var/lib/apt/lists/* |
| 33 | + |
| 34 | +# Exported into the image environment; not read by this Dockerfile itself. |
| 35 | +ENV DATA_PREP_WORKING_DIR=/workspace/electra/data |
| 36 | + |
| 37 | +WORKDIR /workspace |
| 38 | +# Both repositories are cloned unpinned, i.e. whatever the default branch holds at build time. |
| 39 | +RUN git clone https://github.com/attardi/wikiextractor.git |
| 40 | +RUN git clone https://github.com/soskek/bookcorpus.git |
| 41 | + |
| 42 | +# Copy the perf_client over (currently disabled) |
| 43 | +#COPY --from=trt /workspace/install/ /workspace/install/ |
| 44 | +#ENV LD_LIBRARY_PATH /workspace/install/lib:${LD_LIBRARY_PATH} |
| 45 | + |
| 46 | +# Install trt python api (currently disabled) |
| 47 | +#RUN pip install /workspace/install/python/tensorrtserver-1.*-py3-none-linux_x86_64.whl |
| 48 | + |
| 49 | +WORKDIR /workspace/electra |
| 50 | +# Python dependencies; --no-cache-dir keeps pip's download cache out of the layer. |
| 51 | +RUN pip install --upgrade --no-cache-dir pip \ |
| 52 | +    && pip install --no-cache-dir \ |
| 53 | +        boto3 \ |
| 54 | +        filelock \ |
| 55 | +        h5py \ |
| 56 | +        html2text \ |
| 57 | +        ipdb \ |
| 58 | +        nltk \ |
| 59 | +        progressbar \ |
| 60 | +        requests \ |
| 61 | +        six \ |
| 62 | +        tokenizers==0.7.0 \ |
| 63 | +        tqdm \ |
| 64 | +        git+https://github.com/NVIDIA/dllogger |
| 65 | + |
| 66 | +# Copy the build context last so source edits do not invalidate the dependency layers above. |
| 67 | +COPY . . |
0 commit comments