| ARG RELEASE |
| ARG LAUNCHPAD_BUILD_ARCH |
| LABEL org.opencontainers.image.ref.name=ubuntu |
| LABEL org.opencontainers.image.version=24.04 |
| ADD file:6df775300d76441aa33f31b22c1afce8dfe35c8ffbc14ef27c27009235b12a95 in / |
| CMD ["/bin/bash"] |
| ARG JETPACK_HOST_MOUNTS= |
| ENV NVIDIA_REQUIRE_JETPACK_HOST_MOUNTS= |
| RUN |1 JETPACK_HOST_MOUNTS= /bin/sh -c if [ -n "${JETPACK_HOST_MOUNTS}" ]; then echo "/usr/lib/aarch64-linux-gnu/tegra" > /etc/ld.so.conf.d/nvidia-tegra.conf && echo "/usr/lib/aarch64-linux-gnu/tegra-egl" >> /etc/ld.so.conf.d/nvidia-tegra.conf; fi # buildkit |
| RUN |1 JETPACK_HOST_MOUNTS= /bin/sh -c export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends apt-utils build-essential ca-certificates curl libncurses6 libncursesw6 patch wget unzip jq gnupg libtcmalloc-minimal4 && rm -rf /var/lib/apt/lists/* && echo "hsts=0" > /root/.wgetrc # buildkit |
| ARG GDRCOPY_VERSION=2.4.1 |
| ARG HPCX_VERSION=2.22.1 |
| ARG RDMACORE_VERSION=50.0 |
| ARG MOFED_VERSION=5.4-rdmacore50.0 |
| ARG OPENUCX_VERSION=1.18.0 |
| ARG OPENMPI_VERSION=4.1.7 |
| ARG EFA_VERSION=1.34.0 |
| ARG AWS_OFI_NCCL_VERSION=1.12.1 |
| ENV GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 RDMACORE_VERSION=50.0 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 |
| ARG TARGETARCH=amd64 |
| RUN |10 JETPACK_HOST_MOUNTS= GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 RDMACORE_VERSION=50.0 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 TARGETARCH=amd64 /bin/sh -c cd /nvidia && ( export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends libibverbs1 libibverbs-dev librdmacm1 librdmacm-dev libibumad3 libibumad-dev ibverbs-utils ibverbs-providers && rm -rf /var/lib/apt/lists/* && rm $(dpkg-query -L libibverbs-dev librdmacm-dev libibumad-dev | grep "\(\.so\|\.a\)$") ) && ( cd opt/gdrcopy/ && dpkg -i libgdrapi_*.deb ) && ( cp -r opt/hpcx /opt/ && cp etc/ld.so.conf.d/hpcx.conf /etc/ld.so.conf.d/ && ln -sf /opt/hpcx/ompi /usr/local/mpi && ln -sf /opt/hpcx/ucx /usr/local/ucx && sed -i 's/^\(hwloc_base_binding_policy\) = core$/\1 = none/' /opt/hpcx/ompi/etc/openmpi-mca-params.conf && sed -i 's/^\(btl = self\)$/#\1/' /opt/hpcx/ompi/etc/openmpi-mca-params.conf ) && ( if [ ! -f /etc/ld.so.conf.d/nvidia-tegra.conf ]; then cd opt/amazon/efa/ && dpkg -i libfabric*.deb && rm /opt/amazon/efa/lib/libfabric.a && echo "/opt/amazon/efa/lib" > /etc/ld.so.conf.d/efa.conf; fi ) && ldconfig # buildkit |
| ENV OPAL_PREFIX=/opt/hpcx/ompi PATH=/usr/local/mpi/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin:/opt/amazon/efa/bin |
| ENV OMPI_MCA_coll_hcoll_enable=0 |
| ARG CUDA_VERSION=12.8.1.012 |
| ARG CUDA_DRIVER_VERSION=570.124.06 |
| ENV CUDA_VERSION=12.8.1.012 CUDA_DRIVER_VERSION=570.124.06 CUDA_CACHE_DISABLE=1 |
| RUN |12 JETPACK_HOST_MOUNTS= GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 RDMACORE_VERSION=50.0 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 TARGETARCH=amd64 CUDA_VERSION=12.8.1.012 CUDA_DRIVER_VERSION=570.124.06 /bin/sh -c /nvidia/build-scripts/installCUDA.sh # buildkit |
| RUN |12 JETPACK_HOST_MOUNTS= GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 RDMACORE_VERSION=50.0 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 TARGETARCH=amd64 CUDA_VERSION=12.8.1.012 CUDA_DRIVER_VERSION=570.124.06 /bin/sh -c cp -vprd /nvidia/. / && patch -p0 < /etc/startup_scripts.patch && rm -f /etc/startup_scripts.patch # buildkit |
| ENV _CUDA_COMPAT_PATH=/usr/local/cuda/compat ENV=/etc/shinit_v2 BASH_ENV=/etc/bash.bashrc SHELL=/bin/bash NVIDIA_REQUIRE_CUDA=cuda>=9.0 |
| LABEL com.nvidia.volumes.needed=nvidia_driver com.nvidia.cuda.version=9.0 |
| ARG NCCL_VERSION=2.25.1 |
| ARG CUBLAS_VERSION=12.8.4.1 |
| ARG CUFFT_VERSION=11.3.3.83 |
| ARG CURAND_VERSION=10.3.9.90 |
| ARG CUSPARSE_VERSION=12.5.8.93 |
| ARG CUSOLVER_VERSION=11.7.3.90 |
| ARG NPP_VERSION=12.3.3.100 |
| ARG NVJPEG_VERSION=12.3.5.92 |
| ARG CUFILE_VERSION=1.13.1.3 |
| ARG NVJITLINK_VERSION=12.8.93 |
| ARG CUBLASMP_VERSION=0.4.0.789 |
| ARG CAL_VERSION=0.4.4.50 |
| ARG NVSHMEM_VERSION=3.2.5 |
| ARG CUDNN_VERSION=9.8.0.87 |
| ARG CUDNN_FRONTEND_VERSION=1.10.0 |
| ARG TRT_VERSION=10.9.0.34 |
| ARG TRTOSS_VERSION= |
| ARG NSIGHT_SYSTEMS_VERSION=2025.1.1.110 |
| ARG NSIGHT_COMPUTE_VERSION=2025.1.1.2 |
| ARG CUSPARSELT_VERSION=0.7.1.0 |
| ENV NCCL_VERSION=2.25.1 CUBLAS_VERSION=12.8.4.1 CUFFT_VERSION=11.3.3.83 CURAND_VERSION=10.3.9.90 CUSPARSE_VERSION=12.5.8.93 CUSPARSELT_VERSION=0.7.1.0 CUSOLVER_VERSION=11.7.3.90 NPP_VERSION=12.3.3.100 NVJPEG_VERSION=12.3.5.92 CUFILE_VERSION=1.13.1.3 NVJITLINK_VERSION=12.8.93 CUBLASMP_VERSION=0.4.0.789 CAL_VERSION=0.4.4.50 NVSHMEM_VERSION=3.2.5 CUDNN_VERSION=9.8.0.87 CUDNN_FRONTEND_VERSION=1.10.0 TRT_VERSION=10.9.0.34 TRTOSS_VERSION= NSIGHT_SYSTEMS_VERSION=2025.1.1.110 NSIGHT_COMPUTE_VERSION=2025.1.1.2 |
| RUN |32 JETPACK_HOST_MOUNTS= GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 RDMACORE_VERSION=50.0 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 TARGETARCH=amd64 CUDA_VERSION=12.8.1.012 CUDA_DRIVER_VERSION=570.124.06 NCCL_VERSION=2.25.1 CUBLAS_VERSION=12.8.4.1 CUFFT_VERSION=11.3.3.83 CURAND_VERSION=10.3.9.90 CUSPARSE_VERSION=12.5.8.93 CUSOLVER_VERSION=11.7.3.90 NPP_VERSION=12.3.3.100 NVJPEG_VERSION=12.3.5.92 CUFILE_VERSION=1.13.1.3 NVJITLINK_VERSION=12.8.93 CUBLASMP_VERSION=0.4.0.789 CAL_VERSION=0.4.4.50 NVSHMEM_VERSION=3.2.5 CUDNN_VERSION=9.8.0.87 CUDNN_FRONTEND_VERSION=1.10.0 TRT_VERSION=10.9.0.34 TRTOSS_VERSION= NSIGHT_SYSTEMS_VERSION=2025.1.1.110 NSIGHT_COMPUTE_VERSION=2025.1.1.2 CUSPARSELT_VERSION=0.7.1.0 /bin/sh -c /nvidia/build-scripts/installLIBS.sh && /nvidia/build-scripts/installCUDNN.sh && /nvidia/build-scripts/installTRT.sh && /nvidia/build-scripts/installNSYS.sh && /nvidia/build-scripts/installNCU.sh && /nvidia/build-scripts/installCUSPARSELT.sh && if [ -z "${JETPACK_HOST_MOUNTS}" ]; then /nvidia/build-scripts/installNCCL.sh; fi; # buildkit |
| LABEL com.nvidia.nccl.version=2.25.1 com.nvidia.cublas.version=12.8.4.1 com.nvidia.cufft.version=11.3.3.83 com.nvidia.curand.version=10.3.9.90 com.nvidia.cusparse.version=12.5.8.93 com.nvidia.cusparselt.version=0.7.1.0 com.nvidia.cusolver.version=11.7.3.90 com.nvidia.npp.version=12.3.3.100 com.nvidia.nvjpeg.version=12.3.5.92 com.nvidia.cublasmp.version=0.4.0.789 com.nvidia.cal.version=0.4.4.50 com.nvidia.cudnn.version=9.8.0.87 com.nvidia.tensorrt.version=10.9.0.34 com.nvidia.tensorrtoss.version= com.nvidia.nsightsystems.version=2025.1.1.110 com.nvidia.nsightcompute.version=2025.1.1.2 |
| ARG DALI_VERSION=1.47.0 |
| ARG DALI_BUILD= |
| ARG DALI_URL_SUFFIX=120 |
| ARG POLYGRAPHY_VERSION=0.49.18 |
| ARG TRANSFORMER_ENGINE_VERSION=2.1 |
| ARG MODEL_OPT_VERSION=0.25.0 |
| ENV DALI_VERSION=1.47.0 DALI_BUILD= DALI_URL_SUFFIX=120 POLYGRAPHY_VERSION=0.49.18 TRANSFORMER_ENGINE_VERSION=2.1 MODEL_OPT_VERSION=0.25.0 |
| ADD docs.tgz / # buildkit |
| RUN |38 JETPACK_HOST_MOUNTS= GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 RDMACORE_VERSION=50.0 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 TARGETARCH=amd64 CUDA_VERSION=12.8.1.012 CUDA_DRIVER_VERSION=570.124.06 NCCL_VERSION=2.25.1 CUBLAS_VERSION=12.8.4.1 CUFFT_VERSION=11.3.3.83 CURAND_VERSION=10.3.9.90 CUSPARSE_VERSION=12.5.8.93 CUSOLVER_VERSION=11.7.3.90 NPP_VERSION=12.3.3.100 NVJPEG_VERSION=12.3.5.92 CUFILE_VERSION=1.13.1.3 NVJITLINK_VERSION=12.8.93 CUBLASMP_VERSION=0.4.0.789 CAL_VERSION=0.4.4.50 NVSHMEM_VERSION=3.2.5 CUDNN_VERSION=9.8.0.87 CUDNN_FRONTEND_VERSION=1.10.0 TRT_VERSION=10.9.0.34 TRTOSS_VERSION= NSIGHT_SYSTEMS_VERSION=2025.1.1.110 NSIGHT_COMPUTE_VERSION=2025.1.1.2 CUSPARSELT_VERSION=0.7.1.0 DALI_VERSION=1.47.0 DALI_BUILD= DALI_URL_SUFFIX=120 POLYGRAPHY_VERSION=0.49.18 TRANSFORMER_ENGINE_VERSION=2.1 MODEL_OPT_VERSION=0.25.0 /bin/sh -c echo "/usr/local/nvidia/lib" >> /etc/ld.so.conf.d/nvidia.conf && echo "/usr/local/nvidia/lib64" >> /etc/ld.so.conf.d/nvidia.conf # buildkit |
| ARG _LIBPATH_SUFFIX= |
| ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/mpi/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin:/opt/amazon/efa/bin LD_LIBRARY_PATH=/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64 NVIDIA_VISIBLE_DEVICES=all NVIDIA_DRIVER_CAPABILITIES=compute,utility,video |
| COPY entrypoint/ /opt/nvidia/ # buildkit |
| ENV NVIDIA_PRODUCT_NAME=CUDA |
| ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"] |
| RUN |39 JETPACK_HOST_MOUNTS= GDRCOPY_VERSION=2.4.1 HPCX_VERSION=2.22.1 RDMACORE_VERSION=50.0 MOFED_VERSION=5.4-rdmacore50.0 OPENUCX_VERSION=1.18.0 OPENMPI_VERSION=4.1.7 EFA_VERSION=1.34.0 AWS_OFI_NCCL_VERSION=1.12.1 TARGETARCH=amd64 CUDA_VERSION=12.8.1.012 CUDA_DRIVER_VERSION=570.124.06 NCCL_VERSION=2.25.1 CUBLAS_VERSION=12.8.4.1 CUFFT_VERSION=11.3.3.83 CURAND_VERSION=10.3.9.90 CUSPARSE_VERSION=12.5.8.93 CUSOLVER_VERSION=11.7.3.90 NPP_VERSION=12.3.3.100 NVJPEG_VERSION=12.3.5.92 CUFILE_VERSION=1.13.1.3 NVJITLINK_VERSION=12.8.93 CUBLASMP_VERSION=0.4.0.789 CAL_VERSION=0.4.4.50 NVSHMEM_VERSION=3.2.5 CUDNN_VERSION=9.8.0.87 CUDNN_FRONTEND_VERSION=1.10.0 TRT_VERSION=10.9.0.34 TRTOSS_VERSION= NSIGHT_SYSTEMS_VERSION=2025.1.1.110 NSIGHT_COMPUTE_VERSION=2025.1.1.2 CUSPARSELT_VERSION=0.7.1.0 DALI_VERSION=1.47.0 DALI_BUILD= DALI_URL_SUFFIX=120 POLYGRAPHY_VERSION=0.49.18 TRANSFORMER_ENGINE_VERSION=2.1 MODEL_OPT_VERSION=0.25.0 _LIBPATH_SUFFIX= /bin/sh -c mkdir -p /workspace && cp -f -p /opt/nvidia/entrypoint.d/30-container-license.txt /workspace/license.txt # buildkit |
| RUN /bin/sh -c export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends build-essential git libglib2.0-0 less libhwloc15 libnl-route-3-200 libnl-3-dev libnl-route-3-dev libnuma-dev libnuma1 libpmi2-0-dev nano numactl openssh-client vim wget && rm -rf /var/lib/apt/lists/* # buildkit |
| COPY cuda-*.patch /tmp # buildkit |
| RUN /bin/sh -c export DEVEL=1 BASE=0 && /nvidia/build-scripts/installNCU.sh && /nvidia/build-scripts/installCUDA.sh && /nvidia/build-scripts/installLIBS.sh && if [ ! -f /etc/ld.so.conf.d/nvidia-tegra.conf ]; then /nvidia/build-scripts/installNCCL.sh; fi && /nvidia/build-scripts/installCUDNN.sh && /nvidia/build-scripts/installTRT.sh && /nvidia/build-scripts/installNSYS.sh && /nvidia/build-scripts/installCUSPARSELT.sh && if [ -f "/tmp/cuda-${_CUDA_VERSION_MAJMIN}.patch" ]; then patch -p0 < /tmp/cuda-${_CUDA_VERSION_MAJMIN}.patch; fi && rm -f /tmp/cuda-*.patch # buildkit |
| ENV LIBRARY_PATH=/usr/local/cuda/lib64/stubs: |
| COPY /opt/amazon/aws-ofi-nccl /opt/amazon/aws-ofi-nccl # buildkit |
| RUN /bin/sh -c if [ ! -f /etc/ld.so.conf.d/nvidia-tegra.conf ]; then echo "/opt/amazon/aws-ofi-nccl/lib" > /etc/ld.so.conf.d/aws-ofi-nccl.conf && ldconfig; fi # buildkit |
| ENV NVIDIA_PRODUCT_NAME=PyTorch |
| ARG NVIDIA_PYTORCH_VERSION=25.03 |
| ARG PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 |
| ARG NVFUSER_BUILD_VERSION=c5e1555 |
| ENV PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 PYTORCH_VERSION=2.7.0a0+7c8ec84 PYTORCH_BUILD_NUMBER=0 NVIDIA_PYTORCH_VERSION=25.03 |
| ENV NVFUSER_BUILD_VERSION=c5e1555 NVFUSER_VERSION=c5e1555 |
| LABEL com.nvidia.pytorch.version=2.7.0a0+7c8ec84 |
| ARG TARGETARCH=amd64 |
| ARG PYVER=3.12 |
| ARG PYVER_MAJMIN=312 |
| ENV PIP_BREAK_SYSTEM_PACKAGES=1 |
| ARG L4T=0 |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c export PYSFX=`echo "${PYVER}" | cut -c1-1` && export DEBIAN_FRONTEND=noninteractive && apt-get update && apt-get install -y --no-install-recommends python$PYVER-dev python$PYSFX python$PYSFX-dev python$PYSFX-venv python-is-python$PYSFX autoconf automake libatlas-base-dev libgoogle-glog-dev libbz2-dev libc-ares2 libre2-dev libleveldb-dev liblmdb-dev libprotobuf-dev libsnappy-dev libtool nasm protobuf-compiler pkg-config unzip sox libsndfile1 libpng-dev libhdf5-dev gfortran rapidjson-dev ninja-build libedit-dev build-essential patchelf && rm -rf /var/lib/apt/lists/* # buildkit |
| ENV PROTOCOL_BUFFERS_PYTHON_IMPLEMENTATION=python |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c DEBIAN_FRONTEND=noninteractive apt remove -y --force-yes python3-pip && curl -O https://bootstrap.pypa.io/get-pip.py && python get-pip.py && rm get-pip.py # buildkit |
| ENV PIP_CONSTRAINT=/etc/pip/constraint.txt |
| COPY constraint.txt /etc/pip/constraint.txt # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c pip install pip setuptools && pip install cmake # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c curl "https://gitlab-master.nvidia.com/api/v4/projects/105799/packages/generic/OpenBLAS/0.3.24-$(uname -m)/OpenBLAS-0.3.24-$(uname -m).tar.gz" --output OpenBLAS.tar.gz && tar -xf OpenBLAS.tar.gz -C /usr/local/ && rm OpenBLAS.tar.gz # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c if [ $TARGETARCH = "arm64" ]; then cd /opt && curl "https://gitlab-master.nvidia.com/api/v4/projects/105799/packages/generic/nvpl_slim_24.04/sbsa/nvpl_slim_24.04.tar" --output nvpl_slim_24.04.tar && tar -xf nvpl_slim_24.04.tar && cp -r nvpl_slim_24.04/lib/* /usr/local/lib && cp -r nvpl_slim_24.04/include/* /usr/local/include && rm -rf nvpl_slim_24.04.tar nvpl_slim_24.04 ; fi # buildkit |
| ENV NVPL_LAPACK_MATH_MODE=PEDANTIC |
| WORKDIR /opt/pytorch |
| COPY . . # buildkit |
| ENV PYTHONIOENCODING=utf-8 |
| ENV LC_ALL=C.UTF-8 |
| ENV PIP_DEFAULT_TIMEOUT=100 |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c pip install numpy scipy PyYAML astunparse typing_extensions cffi spacy mock tqdm librosa expecttest hypothesis xdoctest pytest pytest-xdist pytest-rerunfailures pytest-shard pytest-flakefinder pybind11 Cython regex protobuf six && if [[ $TARGETARCH = "amd64" ]] ; then pip install --no-cache-dir mkl mkl-include mkl-devel ; find /usr/local/lib -maxdepth 1 -type f -regex '.*\/lib\(tbb\|mkl\).*\.so\($\|\.[0-9]*\.[0-9]*\)' -exec rm -v {} + ; fi # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c git config --global url."https://github".insteadOf git://github && pip install jupyterlab notebook tensorboard jupyterlab_code_formatter python-hostlist # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c PATCHED_FILE=$(python -c "from tensorboard.plugins.core import core_plugin as _; print(_.__file__)") && sed -i 's/^\( *"--bind_all",\)$/\1 default=True,/' "$PATCHED_FILE" && test $(grep '^ *"--bind_all", default=True,$' "$PATCHED_FILE" | wc -l) -eq 1 # buildkit |
| WORKDIR /opt/pytorch |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c pip install --no-cache-dir /builder/*.whl jupytext black isort && mkdir -p /root/.jupyter/lab/user-settings/@jupyterlab/completer-extension/ && jupyter lab clean # buildkit |
| COPY jupyter_config/jupyter_notebook_config.py /usr/local/etc/jupyter/ # buildkit |
| COPY jupyter_config/manager.jupyterlab-settings /root/.jupyter/lab/user-settings/@jupyterlab/completer-extension/ # buildkit |
| COPY jupyter_config/settings.jupyterlab-settings /root/.jupyter/lab/user-settings/@jupyterlab/completer-extension/ # buildkit |
| ENV JUPYTER_PORT=8888 |
| ENV TENSORBOARD_PORT=6006 |
| EXPOSE map[8888/tcp:{}] |
| EXPOSE map[6006/tcp:{}] |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c OPENCV_VERSION=4.10.0 && cd / && wget -q -O - https://github.com/opencv/opencv/archive/${OPENCV_VERSION}.tar.gz | tar -xzf - && cd /opencv-${OPENCV_VERSION} && cmake -GNinja -Bbuild -H. -DWITH_CUDA=OFF -DWITH_1394=OFF -DPYTHON3_PACKAGES_PATH="/usr/local/lib/python${PYVER}/dist-packages" -DBUILD_opencv_cudalegacy=OFF -DBUILD_opencv_stitching=OFF -DWITH_IPP=OFF -DWITH_PROTOBUF=OFF && cmake --build build --target install && cd modules/python/package && pip install -v . && rm -rf /opencv-${OPENCV_VERSION} # buildkit |
| ENV UCC_CL_BASIC_TLS=^sharp |
| ENV TORCH_CUDA_ARCH_LIST=7.5 8.0 8.6 9.0 10.0 12.0+PTX |
| ENV PYTORCH_HOME=/opt/pytorch/pytorch |
| ENV CUDA_HOME=/usr/local/cuda |
| ENV TORCH_ALLOW_TF32_CUBLAS_OVERRIDE=1 |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c pip install /opt/transfer/torch*.whl && patchelf --set-rpath '/usr/local/lib' /usr/local/lib/python${PYVER}/dist-packages/torch/lib/libtorch_global_deps.so # buildkit |
| COPY /usr/local/share/cmake/TorchVision/ /usr/local/share/cmake/TorchVision/ # buildkit |
| COPY /usr/local/include/torchvision/ /usr/local/include/torchvision/ # buildkit |
| COPY /usr/local/lib64/libtorchvision.so /usr/local/lib/libtorchvision.so.1.0 # buildkit |
| COPY /usr/local/lib64/libjpeg* /usr/local/lib/ # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c patchelf --set-rpath '$ORIGIN:/usr/local/lib/python3.12/dist-packages/torch/lib:/usr/local/lib/python3.12/dist-packages/torchvision/' /usr/local/lib/libtorchvision.so.1.0 && patchelf --set-soname libtorchvision.so.1 --output /usr/local/lib/libtorchvision.so.1.0 /usr/local/lib/libtorchvision.so.1.0 && ldconfig && pushd /usr/local/lib && ln -s libtorchvision.so.1 /usr/local/lib/libtorchvision.so && popd && patchelf --set-soname libjpeg.so.62 --output /usr/local/lib/libjpeg.so.62 $(readlink -f $(ldd /usr/local/lib/python3.12/dist-packages/torchvision/image.so | grep libjpeg | awk '{print $3}')) # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c cd pytorch && pip install -v -r /opt/pytorch/pytorch/requirements.txt # buildkit |
| RUN |7 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 /bin/sh -c pip install --no-cache-dir /tmp/dist/*.whl # buildkit |
| ARG DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c if [ -z "${DALI_VERSION}" ] ; then echo "Not Installing DALI for L4T Build." ; exit 0; fi && export CUDA_VERSION_MAJOR=$(ls /usr/local/cuda/lib64/libcudart.so.*.*.* | cut -d . -f 3) && export DALI_PKG_SUFFIX="cuda${CUDA_VERSION_MAJOR}0" && if [ -z "${DALI_URL_SUFFIX}" ] ; then export DALI_EXTRA_INDEX_URL="${DALI_EXTRA_INDEX_URL}-qa"; fi && pip install --extra-index-url https://developer.download.nvidia.com/compute/redist --extra-index-url "${DALI_EXTRA_INDEX_URL}" --trusted-host sqrl nvidia-dali-${DALI_PKG_SUFFIX}==${DALI_VERSION} # buildkit |
| ENV COCOAPI_VERSION=2.0+nv0.8.1 |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c export COCOAPI_TAG=$(echo ${COCOAPI_VERSION} | sed 's/^.*+n//') && pip install git+https://github.com/nvidia/cocoapi.git@${COCOAPI_TAG}#subdirectory=PythonAPI # buildkit |
| COPY singularity/ /.singularity.d/ # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c ( cd fuser && pip install -r requirements.txt && python setup.py -version-tag=a0+${NVFUSER_VERSION} install && python setup.py clean && cp $(find /usr/local/lib/python${PYVER}/dist-packages/ -name libnvfuser_codegen.so) /usr/local/lib/python${PYVER}/dist-packages/torch/lib/ ) && ( cd lightning-thunder && python setup.py install && rm -rf build *.egg-info) && ( cd lightning-thunder && mkdir tmp && cd tmp && git clone -b v${CUDNN_FRONTEND_VERSION} --recursive --single-branch https://github.com/NVIDIA/cudnn-frontend.git cudnn_frontend && cd cudnn_frontend && pip install --no-build-isolation . && cd ../../ && rm -rf tmp ) && ( cd pytorch/third_party/onnx && pip uninstall typing -y && CMAKE_ARGS="-DONNX_USE_PROTOBUF_SHARED_LIBS=ON" pip install --no-build-isolation . ) # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c pip install tabulate # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c if [ "${L4T}" = "1" ]; then echo "Not installing rapids for L4T build."; exit 0; fi && find /rapids -name "*-Linux.tar.gz" -exec tar -C /usr --exclude="*.a" --exclude="bin/xgboost" --strip-components=1 -xvf {} \; && find /rapids -name "*.whl" ! -name "tornado-*" ! -name "Pillow-*" ! -name "certifi-*" ! -name "protobuf-*" ! -name "six-*" -exec pip install --no-cache-dir {} + # buildkit |
| WORKDIR /workspace |
| COPY NVREADME.md README.md # buildkit |
| COPY docker-examples docker-examples # buildkit |
| COPY tutorials tutorials # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c chmod -R a+w . # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c set -x && WHEELS=1 /nvidia/build-scripts/installTRT.sh # buildkit |
| ENV PATH=/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/mpi/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin:/opt/amazon/efa/bin:/opt/tensorrt/bin |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c pip --version && python -c 'import sys; print(sys.platform)' && pip install --extra-index-url https://urm.nvidia.com/artifactory/api/pypi/sw-tensorrt-pypi/simple --no-cache-dir "polygraphy==${POLYGRAPHY_VERSION}" && pip install --index-url https://gitlab-master.nvidia.com/api/v4/projects/95421/packages/pypi/simple --extra-index-url https://pypi.nvidia.com "nvidia-modelopt[torch]==${MODEL_OPT_VERSION}" # buildkit |
| COPY torch_tensorrt/ /opt/pytorch/torch_tensorrt/ # buildkit |
| ARG PYVER=3.12 |
| ENV LD_LIBRARY_PATH=/usr/local/lib/python3.12/dist-packages/torch/lib:/usr/local/lib/python3.12/dist-packages/torch_tensorrt/lib:/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64 |
| ENV PATH=/usr/local/lib/python3.12/dist-packages/torch_tensorrt/bin:/usr/local/nvidia/bin:/usr/local/cuda/bin:/usr/local/mpi/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/sbin:/bin:/usr/local/ucx/bin:/opt/amazon/efa/bin:/opt/tensorrt/bin |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c pip install --no-cache-dir /opt/pytorch/apex/dist/*.whl # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c pip install --no-cache-dir /opt/pytorch/torch_tensorrt/dist/*.whl # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c if [ "${L4T}" = "1" ]; then echo "Not installing Flash Attention wheel in iGPU as it is a requirement for Transformer Engine"; else pip install --no-cache-dir /opt/pytorch/flash_attn*.whl; fi # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c if [ "${L4T}" = "1" ]; then echo "Not installing Transformer Engine in iGPU container until Version variable is set"; else /nvidia/build-scripts/installCAL.sh && /nvidia/build-scripts/installCUBLASMP.sh && /nvidia/build-scripts/installNVSHMEM.sh && CI_JOB_TOKEN=$(cat /run/secrets/CI_JOB_TOKEN) && echo $CI_JOB_TOKEN && git clone -b release_v${TRANSFORMER_ENGINE_VERSION} --single-branch --recursive https://gitlab-ci-token:${CI_JOB_TOKEN}@gitlab-master.nvidia.com/dl/transformerengine/transformerengine.git && env NVTE_CUDA_ARCHS="70;80;89;90;100;120" NVTE_BUILD_THREADS_PER_JOB=8 pip install --no-cache-dir --no-build-isolation ./transformerengine && rm -rf transformerengine; fi # buildkit |
| ENV CUDA_MODULE_LOADING=LAZY |
| ENV TORCH_NCCL_USE_COMM_NONBLOCKING=0 |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c ln -sf ${_CUDA_COMPAT_PATH}/lib.real ${_CUDA_COMPAT_PATH}/lib && echo ${_CUDA_COMPAT_PATH}/lib > /etc/ld.so.conf.d/00-cuda-compat.conf && ldconfig && rm -f ${_CUDA_COMPAT_PATH}/lib # buildkit |
| COPY entrypoint.d/ /opt/nvidia/entrypoint.d/ # buildkit |
| COPY gloo.patch /gloo.patch # buildkit |
| RUN |8 NVIDIA_PYTORCH_VERSION=25.03 PYTORCH_BUILD_VERSION=2.7.0a0+7c8ec84 NVFUSER_BUILD_VERSION=c5e1555 TARGETARCH=amd64 PYVER=3.12 PYVER_MAJMIN=312 L4T=0 DALI_EXTRA_INDEX_URL=http://sqrl/nvdl/datasets/dali/pip-dali /bin/sh -c cd /opt/pytorch/pytorch/third_party/gloo && patch -p1 < /gloo.patch && cd - && rm /gloo.patch # buildkit |
| ARG NVIDIA_BUILD_ID=148941828 |
| ENV NVIDIA_BUILD_ID=148941828 |
| LABEL com.nvidia.build.id=148941828 |
| ARG NVIDIA_BUILD_REF=84f446f5c7204f47f7769a5a5f759c7622b828eb |
| LABEL com.nvidia.build.ref=84f446f5c7204f47f7769a5a5f759c7622b828eb |
| ENV NVIDIA_PRODUCT_NAME=NeMo Framework |
| ENV PIP_NO_CACHE_DIR=1 |
| ARG NVIDIA_BIGNLP_VERSION |
| ENV NVIDIA_BIGNLP_VERSION= |
| LABEL com.nvidia.bignlp.version= |
| ENV DEBIAN_FRONTEND=noninteractive |
| RUN |1 NVIDIA_BIGNLP_VERSION= /bin/sh -c apt-get update && apt-get install -y --no-install-recommends libsndfile1 sox swig libb64-dev openssh-server && rm -rf /var/lib/apt/lists/* && apt-get clean && pip install virtualenv && virtualenv /opt/venv # buildkit |
| RUN |1 NVIDIA_BIGNLP_VERSION= /bin/sh -c apt-get remove --purge -y libslurm* && apt-get -y autoremove && pip uninstall -y onnx && rm -rf /opt/pytorch/pytorch/third_party/onnx # buildkit |
| RUN |1 NVIDIA_BIGNLP_VERSION= /bin/sh -c cp /dev/null /etc/pip/constraint.txt # buildkit |
| WORKDIR /opt |
| RUN |1 NVIDIA_BIGNLP_VERSION= /bin/sh -c bash tensorrt_llm/docker/common/install_base.sh && bash tensorrt_llm/docker/common/install_cmake.sh && bash tensorrt_llm/docker/common/install_ccache.sh # buildkit |
| ARG TRT_VER=10.9.0.34 |
| ARG CUDA_VER=12.8 |
| ARG CUDNN_VER=9.8.0.87-1 |
| ARG NCCL_VER=2.25.1-1+cuda12.8 |
| ARG CUBLAS_VER=12.8.4.1-1 |
| ARG NVRTC_VER=12.8.93-1 |
| ARG TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 |
| ARG TRT_LLM_VERSION=0.18.0 |
| ENV TRT_VER=10.9.0.34 |
| ENV NEMO_FW_TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 |
| ENV NEMO_FW_TRT_LLM_VERSION=0.18.0 |
| RUN |9 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 /bin/sh -c bash tensorrt_llm/docker/common/install_tensorrt.sh --TRT_VER=${TRT_VER} --CUDA_VER=${CUDA_VER} --CUDNN_VER=${CUDNN_VER} --NCCL_VER=${NCCL_VER} --CUBLAS_VER=${CUBLAS_VER} --NVRTC_VER=${NVRTC_VER} bash tensorrt_llm/docker/common/install_polygraphy.sh && bash tensorrt_llm/docker/common/install_mpi4py.sh # buildkit |
| ARG REINSTALL_NSYS=False |
| ARG NSYS_VERSION=2025.1.1.65 |
| ENV NSIGHT_SYSTEMS_VERSION=2025.1.1.65 |
| RUN |11 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 /bin/sh -c if [ $REINSTALL_NSYS = "True" ]; then /nvidia/build-scripts/installNSYS.sh; fi # buildkit |
| ARG TARGET_ARCH=x86 |
| ARG DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 |
| ARG GDR_COPY_VERSION=v2.4.1 |
| ENV CPATH=/usr/local/mpi/include: |
| ENV LD_LIBRARY_PATH=/usr/local/mpi/lib:/usr/local/lib/python3.12/dist-packages/torch/lib:/usr/local/lib/python3.12/dist-packages/torch_tensorrt/lib:/usr/local/cuda/compat/lib:/usr/local/nvidia/lib:/usr/local/nvidia/lib64 |
| ENV GDRCOPY_HOME=/usr/src/gdrdrv-2.4.1/ |
| RUN |14 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 /bin/sh -c apt-get update && apt-get install -y --no-install-recommends nvidia-dkms-535 devscripts debhelper fakeroot dkms check libsubunit0 libsubunit-dev libfabric-dev && if [ $TARGET_ARCH = "x86" ]; then ln -s /usr/lib/x86_64-linux-gnu/libmlx5.so.1 /usr/lib/x86_64-linux-gnu/libmlx5.so; else ln -s /usr/lib/aarch64-linux-gnu/libmlx5.so.1 /usr/lib/aarch64-linux-gnu/libmlx5.so; fi && rm -rf /var/lib/apt/lists/* && apt-get clean && git clone https://github.com/NVIDIA/gdrcopy.git && cd /opt/gdrcopy && git checkout $GDR_COPY_VERSION && CUDA=/usr/local/cuda packages/build-deb-packages.sh && dpkg -i gdrdrv-dkms_*.deb && dpkg -i libgdrapi_*.deb && dpkg -i gdrcopy-tests_*.deb && dpkg -i gdrcopy_*.deb && cd /opt && git clone https://github.com/deepseek-ai/DeepEP.git && cd DeepEP && git fetch origin $DEEPEP_COMMIT && git checkout FETCH_HEAD && cd /opt && wget https://developer.nvidia.com/downloads/assets/secure/nvshmem/nvshmem_src_3.2.5-1.txz && mkdir -p /opt/nvshmem_src && tar xf nvshmem_src_3.2.5-1.txz -C /opt && rm nvshmem_src_3.2.5-1.txz && cd /opt/nvshmem_src && git apply /opt/DeepEP/third-party/nvshmem.patch && CUDA_HOME=/usr/local/cuda NVSHMEM_SHMEM_SUPPORT=0 NVSHMEM_UCX_SUPPORT=0 NVSHMEM_USE_NCCL=0 NVSHMEM_IBGDA_SUPPORT=1 NVSHMEM_PMIX_SUPPORT=0 NVSHMEM_TIMEOUT_DEVICE_POLLING=0 NVSHMEM_USE_GDRCOPY=1 cmake -S . -B build/ -DCMAKE_INSTALL_PREFIX=/opt/nvshmem_src/install -DCMAKE_CUDA_ARCHITECTURES=90 && cd build && make install -j && rm -rf /opt/nvshmem_src/build && cd /opt/DeepEP && NVSHMEM_DIR=/opt/nvshmem_src/install python setup.py develop && NVSHMEM_DIR=/opt/nvshmem_src/install python setup.py install && apt-get remove --purge -y devscripts debhelper man-db && apt-get -y autoremove && apt-get clean # buildkit |
| ARG REINSTALL_APEX=False |
| ARG APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a |
| RUN |16 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a /bin/sh -c pip install packaging # buildkit |
| RUN |16 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a /bin/sh -c if [ $REINSTALL_APEX = "True" ]; then pip uninstall -y apex && git clone https://github.com/NVIDIA/apex && cd apex && if [ ! -z $APEX_COMMIT ]; then git fetch origin $APEX_COMMIT && git checkout FETCH_HEAD; fi && HEAD_APEX_COMMIT=$(git rev-parse HEAD) && echo "Container built with Apex commit hash: $HEAD_APEX_COMMIT" && pip install -e . -v --no-build-isolation --disable-pip-version-check --no-cache-dir --config-settings "--build-option=--cpp_ext --cuda_ext --fast_layer_norm --distributed_adam --deprecated_fused_adam --group_norm --nccl_allocator"; fi # buildkit |
| RUN |16 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a /bin/sh -c if [ -d /tmp/TransformerEngine ]; then pip install --no-cache-dir --no-build-isolation /tmp/TransformerEngine/dist/transformer_engine*; fi # buildkit |
| ARG MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 |
| ARG MCORE_VERSION=0.12.1 |
| ENV NEMO_FW_MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 |
| ENV NEMO_FW_MCORE_VERSION=0.12.1 |
| RUN |18 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 /bin/sh -c CI_JOB_TOKEN=$(cat /run/secrets/CI_JOB_TOKEN) && git clone https://gitlab-ci-token:${CI_JOB_TOKEN}@gitlab-master.nvidia.com/ADLR/megatron-lm.git && cd megatron-lm && git pull && if [ ! -z $MCORE_COMMIT ]; then git fetch origin $MCORE_COMMIT && git checkout FETCH_HEAD; fi && HEAD_MCORE_COMMIT=$(git rev-parse HEAD) && echo "Container built with megatron-lm commit hash: $HEAD_MCORE_COMMIT" && sed -i "/triton/d" requirements/pytorch_24.10/requirements.txt && sed -i "/nvidia-resiliency-ext/d" requirements/pytorch_24.10/requirements.txt && pip install -e . && rm -rf .git && cd megatron/core/datasets && make && rm -rf /root/.cache/bazel # buildkit |
| ENV PYTHONPATH=:/opt/megatron-lm |
| WORKDIR /opt/tensorrt_llm |
| RUN |18 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 /bin/sh -c pip install /src/tensorrt_llm/build/tensorrt_llm*.whl --extra-index-url https://pypi.nvidia.com --extra-index-url https://gitlab-master.nvidia.com/api/v4/projects/95421/packages/pypi/simple # buildkit |
| RUN |18 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 /bin/sh -c ln -sv $(python3 -c 'import site; print(f"{site.getsitepackages()[0]}/tensorrt_llm/libs")') lib && test -f lib/libnvinfer_plugin_tensorrt_llm.so && ln -sv lib/libnvinfer_plugin_tensorrt_llm.so lib/libnvinfer_plugin_tensorrt_llm.so.9 && echo "/opt/tensorrt_llm/lib" > /etc/ld.so.conf.d/tensorrt_llm.conf && ldconfig # buildkit |
| ARG SRC_DIR=/src/tensorrt_llm |
| COPY /src/tensorrt_llm/benchmarks benchmarks # buildkit |
| ARG CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build |
| COPY /src/tensorrt_llm/cpp/build/benchmarks/bertBenchmark /src/tensorrt_llm/cpp/build/benchmarks/gptManagerBenchmark /src/tensorrt_llm/cpp/build/benchmarks/gptSessionBenchmark benchmarks/cpp/ # buildkit |
| RUN |20 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build /bin/sh -c rm -v benchmarks/cpp/bertBenchmark.cpp benchmarks/cpp/gptManagerBenchmark.cpp benchmarks/cpp/gptSessionBenchmark.cpp benchmarks/cpp/CMakeLists.txt && apt-get remove --purge -y gdb && apt-get -y autoremove && apt-get clean # buildkit |
| ARG TARGET_ARCH=x86 |
| ARG INSTALL_VLLM=True |
| WORKDIR /opt |
| COPY /opt/tinycudann*.whl ./ # buildkit |
| RUN |21 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True /bin/sh -c pip install --no-cache-dir /tmp/build_mamba_dep/causal-conv1d/causal_conv1d*.whl /tmp/build_grouped_gemm/grouped_gemm*.whl /tmp/build_nvdiffrast/nvdiffrast*.whl /tmp/build_stable_dreamfusion/raymarching*.whl /tmp/build_stable_dreamfusion/shencoder*.whl /tmp/build_stable_dreamfusion/freqencoder*.whl /tmp/build_stable_dreamfusion/gridencoder*.whl && if [ -f /tmp/build_mamba_dep/mamba/mamba*.whl ]; then pip install --no-cache-dir /tmp/build_mamba_dep/mamba/mamba*.whl; fi && if [ -f /tmp/build_bitsandbytes/bitsandbytes/dist/bitsandbytes*.whl ]; then pip install --no-cache-dir /tmp/build_bitsandbytes/bitsandbytes/dist/bitsandbytes*.whl; fi # buildkit |
| ARG ALIGNER_COMMIT=dev |
| ARG ALIGNER_VERSION=0.6.0rc0.dev0 |
| ARG LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 |
| ENV NEMO_FW_LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 |
| RUN |24 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 /bin/sh -c git clone https://github.com/NVIDIA/NeMo-Framework-Launcher.git && cd NeMo-Framework-Launcher && git pull && if [ ! -z $LAUNCHER_COMMIT ]; then git fetch origin $LAUNCHER_COMMIT && git checkout FETCH_HEAD; fi && HEAD_LAUNCHER_COMMIT=$(git rev-parse HEAD) && echo "Container built with NeMo-Framework-Launcher commit hash: $HEAD_LAUNCHER_COMMIT" && pip install --no-cache-dir -r requirements.txt # buildkit |
| ENV LAUNCHER_SCRIPTS_PATH=/opt/NeMo-Framework-Launcher/launcher_scripts |
| ENV PYTHONPATH=/opt/NeMo-Framework-Launcher/launcher_scripts::/opt/megatron-lm |
| ARG CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 |
| ARG INSTALL_CURATOR=True |
| ARG CURATOR_VERSION=0.8.0rc4.dev0 |
| ENV NEMO_FW_CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 |
| ENV NEMO_FW_CURATOR_VERSION=0.8.0rc4.dev0 |
| RUN |27 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 /bin/sh -c if [ $INSTALL_CURATOR = "True" ]; then pip install mpi4py --no-build-isolation && if [ $TARGET_ARCH = "arm" ]; then pip install git+https://github.com/aboSamoor/pycld2.git; fi && git clone https://github.com/NVIDIA/NeMo-Curator.git && cd NeMo-Curator && git pull && if [ ! -z $CURATOR_COMMIT ]; then git fetch origin $CURATOR_COMMIT && git checkout FETCH_HEAD; fi && HEAD_CURATOR_COMMIT=$(git rev-parse HEAD) && echo "Container built with Curator commit hash: $HEAD_CURATOR_COMMIT" && sed -i "/nemo_toolkit/d" pyproject.toml && sed -i "/cudf-cu12/d" pyproject.toml && sed -i "/cugraph-cu12/d" pyproject.toml && sed -i "/cuml-cu12/d" pyproject.toml && sed -i "/dask-cuda/d" pyproject.toml && sed -i "/dask-cudf-cu12/d" pyproject.toml && cd ../ && pip install --extra-index-url=https://pypi.nvidia.com -e "./NeMo-Curator[all]" && pip install protobuf==4.24.4; fi # extra-index-url pypi could cause dependencies conflicts (later on) # buildkit |
| ARG TARGET_ARCH=x86 |
| ARG INSTALL_VLLM=True |
| RUN |27 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 /bin/sh -c echo " UserKnownHostsFile /dev/null" >> /etc/ssh/ssh_config && sed -i 's/#\(StrictModes \).*/\1no/g' /etc/ssh/sshd_config && sed -i 's/# StrictHostKeyChecking ask/ StrictHostKeyChecking no/' /etc/ssh/ssh_config && mkdir -p /var/run/sshd # buildkit |
| ARG NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 |
| ARG NEMO_VERSION=2.3.1 |
| ENV NEMO_FW_NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 |
| ENV NEMO_FW_NEMO_VERSION=2.3.1 |
| RUN |29 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 /bin/sh -c git clone https://github.com/NVIDIA/NeMo.git && cd NeMo && git pull && if [ ! -z $NEMO_COMMIT ]; then git fetch origin $NEMO_COMMIT && git checkout FETCH_HEAD; fi && HEAD_NEMO_COMMIT=$(git rev-parse HEAD) && echo "Container built with NeMo commit hash: $HEAD_NEMO_COMMIT" && pip uninstall -y nemo_toolkit sacrebleu && sed -i "/mamba-ssm/d" requirements/requirements_nlp.txt && if [ $TARGET_ARCH = "arm" ]; then sed -i "/torch/d" requirements/requirements.txt && sed -i "/decord/d" requirements/requirements_multimodal.txt && sed -i "/megatron_core/d" requirements/requirements_nlp.txt; fi && pip install -e ".[all]" && cd nemo/collections/nlp/data/language_modeling/megatron && make # buildkit |
| ARG INSTALL_RESIL=False |
| ARG RESIL_COMMIT=not_installed |
| ARG RESIL_VERSION=not_installed |
| ENV NEMO_FW_RESIL_COMMIT=not_installed |
| ENV NEMO_FW_RESIL_VERSION=not_installed |
| RUN |32 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed /bin/sh -c if [ $INSTALL_RESIL = "True" ] && [ $TARGET_ARCH = "x86" ]; then pip install --no-cache-dir "git+https://github.com/NVIDIA/nvidia-resiliency-ext.git@${RESIL_COMMIT}"; fi # buildkit |
| ARG INSTALL_MODELOPT=True |
| ARG MODELOPT_VERSION=0.27.1 |
| RUN |34 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 /bin/sh -c if [ $INSTALL_MODELOPT = "True" ]; then pip install --no-cache-dir nvidia-modelopt[torch]==$MODELOPT_VERSION; fi # buildkit |
| RUN |34 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 /bin/sh -c if [ $INSTALL_VLLM = "True" ]; then /opt/venv/bin/pip install -r /opt/NeMo/requirements/requirements_vllm.txt -r /opt/NeMo/requirements/requirements_deploy.txt; fi # buildkit |
| ARG NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f |
| ENV NEMO_FW_NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c git clone https://github.com/NVIDIA/NeMo-Run && cd NeMo-Run && git pull && if [ ! -z $NEMO_RUN_COMMIT ]; then git fetch origin $NEMO_RUN_COMMIT && git checkout FETCH_HEAD; fi && pip install -e . # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c pip install --no-deps --no-cache-dir "liger-kernel==0.5.8; (platform_machine == 'x86_64' and platform_system != 'Darwin')" && pip install --no-deps "cut-cross-entropy @ git+https://github.com/apple/ml-cross-entropy.git@87a86aba72cfd2f0d8abecaf81c13c4528ea07d8; (platform_machine == 'x86_64' and platform_system != 'Darwin')" # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c pip uninstall -y webdataset && pip install --no-cache-dir "webdataset==0.2.86" "pandas==2.2.3" "ctc_segmentation==1.7.1" "transformers==4.51.3" # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c if [ $INSTALL_VLLM = "True" ]; then /opt/venv/bin/pip install "transformers==4.51.3"; fi # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c pip uninstall -y tornado onnx h11 pytest-coverage levenshtein && pip install --no-cache-dir "tornado==6.5.0" "onnx==1.17.0" "h11==0.16.0" "setuptools==78.1.1" && sed -i '57d' /usr/local/lib/python3.12/dist-packages/torch_tensorrt/dynamo/conversion/custom_ops_converters.py # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c apt-get remove --purge -y gdb libffi-dev ccache fakeroot libfakeroot libdebuginfod-common && apt-get -y autoremove && apt-get clean # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c <<"EOF" python
from transformers import AutoTokenizer, Qwen2Tokenizer, CLIPImageProcessor
_=AutoTokenizer.from_pretrained('gpt2')
_=AutoTokenizer.from_pretrained('bert-base-cased')
_=AutoTokenizer.from_pretrained('bert-large-cased')
_=AutoTokenizer.from_pretrained('bert-large-uncased')
_=AutoTokenizer.from_pretrained('bigcode/starcoder2-tokenizer')
_=AutoTokenizer.from_pretrained("EleutherAI/gpt-neox-20b")
_=AutoTokenizer.from_pretrained("nvidia/Nemotron-H-8B-Base-8K")
_=AutoTokenizer.from_pretrained("nvidia/Nemotron-H-47B-Base-8K")
_=AutoTokenizer.from_pretrained("nvidia/Nemotron-H-56B-Base-8K")
_=AutoTokenizer.from_pretrained('THUDM/chatglm2-6b',trust_remote_code=True)
_=AutoTokenizer.from_pretrained('THUDM/chatglm3-6b',trust_remote_code=True)
_=Qwen2Tokenizer.from_pretrained('qwen/Qwen1.5-7B',trust_remote_code=True)
_=Qwen2Tokenizer.from_pretrained('qwen/Qwen1.5-14B',trust_remote_code=True)
_=AutoTokenizer.from_pretrained('openai/clip-vit-large-patch14')
_=CLIPImageProcessor.from_pretrained('openai/clip-vit-large-patch14')
_=CLIPImageProcessor.from_pretrained('openai/clip-vit-large-patch14-336')
EOF # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c URM_API_TOKEN=$(cat /run/secrets/URM_API_TOKEN) && wget --http-user donghyukc --http-password ${URM_API_TOKEN} "https://urm.nvidia.com/artifactory/nemo-fw-generic-local/llama3_70b_tokenizer.tar.gz" && wget --http-user donghyukc --http-password ${URM_API_TOKEN} "https://urm.nvidia.com/artifactory/nemo-fw-generic-local/llama3_8b_tokenizer.tar.gz" && mkdir -p /tmp_assets && tar -xzvf llama3_8b_tokenizer.tar.gz -C /tmp_assets && tar -xzvf llama3_70b_tokenizer.tar.gz -C /tmp_assets && cp -rf /tmp_assets/hub ~/.cache/huggingface && rm -rf /tmp_assets && rm llama3_8b_tokenizer.tar.gz llama3_70b_tokenizer.tar.gz # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c <<"EOF" python
from transformers import AutoTokenizer
_=AutoTokenizer.from_pretrained('meta-llama/Meta-Llama-3-8B')
_=AutoTokenizer.from_pretrained('meta-llama/Meta-Llama-3-70B')
_=AutoTokenizer.from_pretrained('meta-llama/Meta-Llama-3-8B-instruct')
_=AutoTokenizer.from_pretrained('meta-llama/Meta-Llama-3-70B-instruct')
EOF # buildkit |
| RUN |35 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f /bin/sh -c sed -i '/^LayerId/s/^/#/' /usr/local/lib/python3.12/dist-packages/cv2/typing/__init__.py # buildkit |
| ARG PRE_COMPILE_QUANT_KERNELS=True |
| RUN |36 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f PRE_COMPILE_QUANT_KERNELS=True /bin/sh -c if [ $PRE_COMPILE_QUANT_KERNELS = "True" ]; then python -c "import modelopt.torch.quantization.extensions as ext; ext.precompile()"; fi # buildkit |
| COPY nemo2/patches/triton-lang_triton_6570_lazy_init.patch /opt/ # buildkit |
| RUN |36 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f PRE_COMPILE_QUANT_KERNELS=True /bin/sh -c cd /usr/local/lib/python3.12/dist-packages && patch -p1 < /opt/triton-lang_triton_6570_lazy_init.patch && rm /opt/triton-lang_triton_6570_lazy_init.patch # buildkit |
| WORKDIR /workspace |
| RUN |36 NVIDIA_BIGNLP_VERSION= TRT_VER=10.9.0.34 CUDA_VER=12.8 CUDNN_VER=9.8.0.87-1 NCCL_VER=2.25.1-1+cuda12.8 CUBLAS_VER=12.8.4.1-1 NVRTC_VER=12.8.93-1 TRT_LLM_COMMIT=3c5fe5eb86077f67febc42070be11f11de17c1e2 TRT_LLM_VERSION=0.18.0 REINSTALL_NSYS=False NSYS_VERSION=2025.1.1.65 TARGET_ARCH=x86 DEEPEP_COMMIT=a84a24808fb0ea732f49b874cc456a69dde69076 GDR_COPY_VERSION=v2.4.1 REINSTALL_APEX=False APEX_COMMIT=e74a67bba3ee679f778670e17edc21639008ae0a MCORE_COMMIT=a845aa7e12b3a117e24c2352b9e3e60bad2e3a17 MCORE_VERSION=0.12.1 SRC_DIR=/src/tensorrt_llm CPP_BUILD_DIR=/src/tensorrt_llm/cpp/build INSTALL_VLLM=True ALIGNER_COMMIT=dev ALIGNER_VERSION=0.6.0rc0.dev0 LAUNCHER_COMMIT=26e42fa91d9e608897ce485b4911c263a4b57008 CURATOR_COMMIT=33db56e304a3cb2d72d2038d393474905737a3e1 INSTALL_CURATOR=True CURATOR_VERSION=0.8.0rc4.dev0 NEMO_COMMIT=5ac3335a3dc2a76eb96889312f79904ba2cdcf70 NEMO_VERSION=2.3.1 INSTALL_RESIL=False RESIL_COMMIT=not_installed RESIL_VERSION=not_installed INSTALL_MODELOPT=True MODELOPT_VERSION=0.27.1 NEMO_RUN_COMMIT=bc412ee5584ed3072717af59f54565ec0d265a6f PRE_COMPILE_QUANT_KERNELS=True /bin/sh -c chmod -R a+w /workspace # buildkit |
| ARG NEMO_FW_PIPELINE_ID=28827164 |
| ENV NEMO_FW_PIPELINE_ID=28827164 |
| ARG NVIDIA_BUILD_ID |
| ENV NVIDIA_BUILD_ID=148941828 |
| LABEL com.nvidia.build.id=148941828 |
| ARG NVIDIA_BUILD_REF |
| LABEL com.nvidia.build.ref= |