Fold nvbandwidth into the default `cuda` third-party build target.

The `cuda` target in third_party/Makefile gains `nvbandwidth` as a
prerequisite, and the combined `cuda_with_msccl_and_nvbandwidth` target is
removed. The CUDA 12.4 image switches to `cuda_with_msccl`, which depends on
`cuda` and therefore still pulls in `nvbandwidth`. The CUDA 11.1.1 image
passes `-o nvbandwidth` to make, which tells make to treat that target as
old and not remake it (presumably because nvbandwidth is not meant to be
built on that image; confirm with the change author).

diff --git a/dockerfile/cuda11.1.1.dockerfile b/dockerfile/cuda11.1.1.dockerfile
index 54577fdad..69044c440 100644
--- a/dockerfile/cuda11.1.1.dockerfile
+++ b/dockerfile/cuda11.1.1.dockerfile
@@ -149,7 +149,7 @@ ADD dockerfile/etc /opt/microsoft/
 WORKDIR ${SB_HOME}
 
 ADD third_party third_party
-RUN make -C third_party cuda
+RUN make -C third_party cuda -o nvbandwidth
 
 ADD . .
 RUN python3 -m pip install --upgrade setuptools==65.7 && \
diff --git a/dockerfile/cuda12.4.dockerfile b/dockerfile/cuda12.4.dockerfile
index 3cd70da13..560f0908a 100644
--- a/dockerfile/cuda12.4.dockerfile
+++ b/dockerfile/cuda12.4.dockerfile
@@ -156,7 +156,7 @@ ADD dockerfile/etc /opt/microsoft/
 WORKDIR ${SB_HOME}
 
 ADD third_party third_party
-RUN make -C third_party cuda_with_msccl_and_nvbandwidth
+RUN make -C third_party cuda_with_msccl
 
 ADD . .
 RUN python3 -m pip install --upgrade setuptools==65.7 && \
diff --git a/third_party/Makefile b/third_party/Makefile
index 7f76b293c..8117fc10b 100755
--- a/third_party/Makefile
+++ b/third_party/Makefile
@@ -20,9 +20,8 @@ NUM_MAKE_JOBS ?= $(shell nproc --ignore=2)
 
 # Build targets.
 all: cuda rocm
-cuda_with_msccl_and_nvbandwidth: cuda cuda_msccl nvbandwidth
 cuda_with_msccl: cuda cuda_msccl
-cuda: common cuda_cutlass cuda_bandwidthTest cuda_nccl_tests cuda_perftest gpcnet cuda_gpuburn megatron_lm megatron_deepspeed
+cuda: common cuda_cutlass cuda_bandwidthTest cuda_nccl_tests cuda_perftest gpcnet cuda_gpuburn megatron_lm megatron_deepspeed nvbandwidth
 rocm: common rocm_perftest rocm_rccl_tests rocm_rocblas rocm_bandwidthTest rocm_hipblaslt megatron_deepspeed apex_rocm
 cpu: common cpu_perftest cpu_stream
 common: fio