triton-inference-server · Sunidhi-Gaonkar1 · Nov 20, 2025 · mc-nv · Dec 2, 2025 · alhad-deshpande
diff --git a/build.py b/build.py
@@ -1509,8 +1509,9 @@ def dockerfile_prepare_container_linux(argmap, backends, enable_gpu, target_mach
 """
 
     if target_platform() not in ["igpu", "windows", "rhel"]:
-        repo_arch = "sbsa" if target_machine == "aarch64" else "x86_64"
-        df += f"""
+        if FLAGS.triton_wheels_dependencies_group != "cpu" :
+           repo_arch = "sbsa" if target_machine == "aarch64" else "x86_64"
+           df += f"""
 RUN curl -o /tmp/cuda-keyring.deb \\
         https://developer.download.nvidia.com/compute/cuda/repos/ubuntu2404/{repo_arch}/cuda-keyring_1.1-1_all.deb \\
       && apt install /tmp/cuda-keyring.deb \\