# Dockerfile for the /workspace/bert image, built on top of an NVIDIA TensorFlow container.
# The base image can be swapped at build time with
#   --build-arg FROM_IMAGE_NAME=<image>
# The default is the nvcr.io/nvidia/tensorflow image, tag 20.06-tf1-py3.
ARG FROM_IMAGE_NAME=nvcr.io/nvidia/tensorflow:20.06-tf1-py3

FROM ${FROM_IMAGE_NAME}
# OS-level packages: bzip2/pbzip2 and pv command-line tools, curl, and the
# libcurl4 / libb64-dev libraries.
# --no-install-recommends keeps optional "recommended" packages out of the
# image, and the apt package lists are removed in the same RUN so they are
# never stored in the layer.
RUN apt-get update \
 && apt-get install -y --no-install-recommends \
        bzip2 \
        curl \
        libb64-dev \
        libcurl4 \
        pbzip2 \
        pv \
 && rm -rf /var/lib/apt/lists/*
# Upgrade pip itself before any Python packages are installed.
# --no-cache-dir prevents pip's download cache from being saved in the layer.
RUN pip install --no-cache-dir --upgrade pip
# Python packages installed from the package index (versions are not pinned,
# so the resolved versions depend on when the image is built).
# One package per line, sorted, to keep diffs small; --no-cache-dir keeps
# pip's download cache out of the layer.
RUN pip install --no-cache-dir \
        html2text \
        networkx \
        nltk \
        progressbar \
        pytest \
        toposort \
        tqdm
# Install NVIDIA's dllogger straight from its GitHub repository, plus the
# "wget" pip requirement (a pip package here, not the apt command-line tool).
# The cache option is given once, after the subcommand, matching the other
# pip invocations; the original passed it twice (--no-cache-dir --no-cache).
RUN pip install --no-cache-dir \
        git+https://github.com/NVIDIA/dllogger \
        wget
# Third-party repositories are checked out underneath /workspace.
WORKDIR /workspace

# No commit is pinned for this clone, so the checked-out revision depends on
# when the image is built.
RUN git clone https://github.com/openai/gradient-checkpointing.git gradient-checkpointing
# Clone wikiextractor and pin it to a fixed commit.
# `git -C <dir>` runs the checkout inside the clone without changing the
# shell's directory, replacing the original `cd wikiextractor && ... && cd ..`
# (the trailing `cd ..` had no effect: each RUN starts from WORKDIR again).
RUN git clone https://github.com/attardi/wikiextractor.git wikiextractor \
 && git -C wikiextractor checkout 6408a430fc504a38b04d37ce5e7fc740191dee16
# Two more repositories, each cloned in its own layer into a directory named
# after the repository. Neither is pinned to a commit.
RUN git clone https://github.com/soskek/bookcorpus.git bookcorpus

RUN git clone https://github.com/titipata/pubmed_parser pubmed_parser
# Install pubmed_parser as a Python package from its local checkout at
# /workspace/pubmed_parser.
# --no-cache-dir keeps pip's cache out of the image layer.
RUN pip3 install --no-cache-dir /workspace/pubmed_parser
# Download the Triton Inference Server v2.0.0 client bundle and unpack it into
# /workspace/install (per the original comment, this is where perf_client
# comes from). Override the source with --build-arg TRTIS_CLIENTS_URL=<url>.
ARG TRTIS_CLIENTS_URL=https://github.com/NVIDIA/triton-inference-server/releases/download/v2.0.0/v2.0.0_ubuntu1804.clients.tar.gz

# The archive is saved to a file first instead of being piped into tar: in a
# `curl | tar` pipeline only tar's exit status is checked, so a failed
# download is not reported by curl itself. `curl -f` additionally turns HTTP
# error responses into a non-zero exit, so the build stops at the download.
# The temporary archive is deleted in the same layer.
RUN mkdir -p /workspace/install \
 && curl -fsSL -o /tmp/triton_clients.tar.gz "${TRTIS_CLIENTS_URL}" \
 && tar -xzf /tmp/triton_clients.tar.gz -C /workspace/install \
 && rm -f /tmp/triton_clients.tar.gz
# Install the Triton Python client wheel from the files unpacked under
# /workspace/install/python. The glob is expanded by the shell, so it matches
# whatever triton*.whl file names are present there.
# --no-cache-dir keeps pip's cache out of the image layer.
RUN pip install --no-cache-dir /workspace/install/python/triton*.whl
# Switch to /workspace/bert and copy the whole build context into it.
# Everything in the context that is not excluded by a .dockerignore file
# ends up in the image.
WORKDIR /workspace/bert
COPY . ./
# Runtime environment for the image:
#   PYTHONPATH            - makes modules under /workspace/bert importable.
#   BERT_PREP_WORKING_DIR - points at /workspace/bert/data.
#   PATH, LD_LIBRARY_PATH - prepend the bin/ and lib/ directories under
#                           /workspace/install to the values already set.
# Written in key=value form (the space-separated `ENV key value` form is
# legacy), and the stray leading double slash in the PATH entry is removed.
ENV PYTHONPATH=/workspace/bert \
    BERT_PREP_WORKING_DIR=/workspace/bert/data \
    PATH=/workspace/install/bin:${PATH} \
    LD_LIBRARY_PATH=/workspace/install/lib:${LD_LIBRARY_PATH}