2020-07-27 22:02:39 +02:00
|
|
|
# syntax=docker/dockerfile:experimental
|
|
|
|
|
|
|
|
# Copyright (c) 2019, NVIDIA CORPORATION. All rights reserved.
|
|
|
|
#
|
|
|
|
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
# you may not use this file except in compliance with the License.
|
|
|
|
# You may obtain a copy of the License at
|
|
|
|
#
|
|
|
|
# http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
#
|
|
|
|
# Unless required by applicable law or agreed to in writing, software
|
|
|
|
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
# See the License for the specific language governing permissions and
|
|
|
|
# limitations under the License.
|
|
|
|
|
2021-10-21 05:06:37 +02:00
|
|
|
ARG BASE_IMAGE=nvcr.io/nvidia/pytorch:21.10-py3
|
2020-09-04 07:12:03 +02:00
|
|
|
|
2020-07-27 22:02:39 +02:00
|
|
|
|
|
|
|
# build an image that includes only the nemo dependencies, ensures that dependencies
|
|
|
|
# are included first for optimal caching, and useful for building a development
|
|
|
|
# image (by specifying build target as `nemo-deps`)
|
|
|
|
FROM ${BASE_IMAGE} as nemo-deps
|
|
|
|
|
|
|
|
# Ensure apt-get won't prompt for selecting options
|
|
|
|
ENV DEBIAN_FRONTEND=noninteractive
|
|
|
|
RUN apt-get update && \
|
|
|
|
apt-get install -y \
|
|
|
|
libsndfile1 sox \
|
2020-11-17 01:00:50 +01:00
|
|
|
libfreetype6 \
|
2020-10-23 00:54:20 +02:00
|
|
|
python-setuptools swig \
|
2020-07-27 22:02:39 +02:00
|
|
|
python-dev ffmpeg && \
|
|
|
|
rm -rf /var/lib/apt/lists/*
|
|
|
|
|
2021-04-02 03:14:53 +02:00
|
|
|
# uninstall stuff from base container
|
|
|
|
RUN pip uninstall -y sacrebleu torchtext
|
|
|
|
|
2020-09-25 08:47:06 +02:00
|
|
|
# build torchaudio (change latest release version to match pytorch)
|
|
|
|
WORKDIR /tmp/torchaudio_build
|
2021-09-11 21:18:06 +02:00
|
|
|
RUN git clone --depth 1 --branch release/0.9 https://github.com/pytorch/audio.git && \
|
2020-09-25 08:47:06 +02:00
|
|
|
cd audio && \
|
2021-09-11 21:18:06 +02:00
|
|
|
git submodule update --init --recursive && \
|
2020-09-25 08:47:06 +02:00
|
|
|
BUILD_SOX=1 python setup.py install && \
|
|
|
|
cd .. && rm -r audio
|
|
|
|
|
2021-04-02 03:14:53 +02:00
|
|
|
# TODO: remove when 21.04 container is released
|
|
|
|
# build torchtext
|
|
|
|
WORKDIR /tmp/torchtext_build
|
|
|
|
RUN git clone --branch v0.8.1 https://github.com/pytorch/text.git && \
|
|
|
|
cd text && \
|
|
|
|
git submodule update --init --recursive && \
|
|
|
|
python setup.py clean install && \
|
2021-04-02 03:43:16 +02:00
|
|
|
cd .. && rm -r text
|
2021-04-02 03:14:53 +02:00
|
|
|
|
2021-01-18 09:50:41 +01:00
|
|
|
#install TRT tools: PT quantization support and ONNX graph optimizer
|
|
|
|
WORKDIR /tmp/trt_build
|
2020-12-04 02:21:07 +01:00
|
|
|
RUN git clone https://github.com/NVIDIA/TensorRT.git && \
|
2021-01-26 09:00:44 +01:00
|
|
|
cd TensorRT/tools/onnx-graphsurgeon && python setup.py install && \
|
2021-01-18 09:50:41 +01:00
|
|
|
cd ../pytorch-quantization && \
|
2020-12-04 02:21:07 +01:00
|
|
|
python setup.py install && \
|
2021-01-18 09:50:41 +01:00
|
|
|
rm -fr /tmp/trt_build
|
2020-12-04 02:21:07 +01:00
|
|
|
|
2021-04-13 06:31:28 +02:00
|
|
|
# install nemo dependencies
|
|
|
|
WORKDIR /tmp/nemo
|
|
|
|
COPY requirements .
|
|
|
|
RUN for f in $(ls requirements*.txt); do pip install --disable-pip-version-check --no-cache-dir -r $f; done
|
|
|
|
|
|
|
|
# install nemo_text_processing dependencies
|
|
|
|
COPY nemo_text_processing /tmp/nemo/nemo_text_processing/
|
|
|
|
RUN /bin/bash /tmp/nemo/nemo_text_processing/setup.sh
|
|
|
|
|
2020-07-27 22:02:39 +02:00
|
|
|
# copy nemo source into a scratch image
|
|
|
|
FROM scratch as nemo-src
|
|
|
|
COPY . .
|
|
|
|
|
|
|
|
# start building the final container
|
|
|
|
FROM nemo-deps as nemo
|
2021-09-11 21:18:06 +02:00
|
|
|
ARG NEMO_VERSION=1.4.0
|
2020-07-27 22:02:39 +02:00
|
|
|
|
|
|
|
# Check that NEMO_VERSION is set. Build will fail without this. Expose NEMO and base container
|
|
|
|
# version information as runtime environment variable for introspection purposes
|
|
|
|
RUN /usr/bin/test -n "$NEMO_VERSION" && \
|
|
|
|
/bin/echo "export NEMO_VERSION=${NEMO_VERSION}" >> /root/.bashrc && \
|
|
|
|
/bin/echo "export BASE_IMAGE=${BASE_IMAGE}" >> /root/.bashrc
|
2021-03-31 19:20:26 +02:00
|
|
|
RUN --mount=from=nemo-src,target=/tmp/nemo cd /tmp/nemo && pip install ".[all]" && \
|
|
|
|
python -c "import nemo.collections.asr as nemo_asr" && \
|
|
|
|
python -c "import nemo.collections.nlp as nemo_nlp" && \
|
2021-04-10 00:19:16 +02:00
|
|
|
python -c "import nemo.collections.tts as nemo_tts" && \
|
2021-04-10 03:11:40 +02:00
|
|
|
python -c "import nemo_text_processing.text_normalization as text_normalization"
|
|
|
|
|
2021-07-22 17:31:38 +02:00
|
|
|
# TODO: Try to remove once 21.07 container is the base container
|
|
|
|
# install pinned numba version
|
|
|
|
RUN conda install -c numba numba=0.53.1
|
2020-07-27 22:02:39 +02:00
|
|
|
|
|
|
|
# copy scripts/examples/tests into container for end user
|
|
|
|
WORKDIR /workspace/nemo
|
|
|
|
COPY scripts /workspace/nemo/scripts
|
|
|
|
COPY examples /workspace/nemo/examples
|
|
|
|
COPY tests /workspace/nemo/tests
|
2020-10-07 00:34:14 +02:00
|
|
|
COPY tutorials /workspace/nemo/tutorials
|
2020-07-27 22:02:39 +02:00
|
|
|
# COPY README.rst LICENSE /workspace/nemo/
|
|
|
|
|
|
|
|
RUN printf "#!/bin/bash\njupyter lab --no-browser --allow-root --ip=0.0.0.0" >> start-jupyter.sh && \
|
|
|
|
chmod +x start-jupyter.sh
|
|
|
|
|