Skip to content

Commit

Permalink
Merge pull request #217619 from ConnorBaker/feat/nccl-use-cudaPackages
Browse files Browse the repository at this point in the history
cudaPackages.nccl: refactor to fix #220340 and #221895
  • Loading branch information
ConnorBaker committed Aug 22, 2023
2 parents a2eca34 + 8208602 commit eeefcf7
Showing 1 changed file with 19 additions and 21 deletions.
40 changes: 19 additions & 21 deletions pkgs/development/libraries/science/math/nccl/default.nix
Original file line number Diff line number Diff line change
Expand Up @@ -2,38 +2,44 @@
, backendStdenv
, fetchFromGitHub
, which
, cudaPackages ? { }
, addOpenGLRunpath
, autoAddOpenGLRunpathHook
, cuda_cccl
, cuda_cudart
, cuda_nvcc
, cudaFlags
, cudaVersion
}:

with cudaPackages;

let
# Output looks like "-gencode=arch=compute_86,code=sm_86 -gencode=arch=compute_86,code=compute_86"
gencode = lib.concatStringsSep " " cudaFlags.gencode;
in
backendStdenv.mkDerivation rec {
name = "nccl-${version}-cuda-${cudaPackages.cudaMajorVersion}";
backendStdenv.mkDerivation (finalAttrs: {
name = "nccl-${finalAttrs.version}-cuda-${cudaVersion}";
version = "2.16.5-1";

src = fetchFromGitHub {
owner = "NVIDIA";
repo = "nccl";
rev = "v${version}";
rev = "v${finalAttrs.version}";
hash = "sha256-JyhhYKSVIqUKIbC1rCJozPT1IrIyRLGrTjdPjJqsYaU=";
};

outputs = [ "out" "dev" ];

nativeBuildInputs = [
which
addOpenGLRunpath
autoAddOpenGLRunpathHook
cuda_nvcc
];

buildInputs = [
cuda_cudart
] ++ lib.optionals (lib.versionAtLeast cudaVersion "12.0.0") [
]
# NOTE: CUDA versions in Nixpkgs only use a major and minor version. When we compare them
# against other versions, as below, it's important that both sides use the same format;
# otherwise, we'll get incorrect results.
# For example, lib.versionAtLeast "12.0" "12.0.0" == false.
++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [
cuda_cccl
];

Expand All @@ -46,32 +52,24 @@ backendStdenv.mkDerivation rec {

makeFlags = [
"CUDA_HOME=${cuda_nvcc}"
"CUDA_LIB=${cuda_cudart}/lib64"
"CUDA_INC=${cuda_cudart}/include"
"CUDA_LIB=${lib.getLib cuda_cudart}/lib"
"CUDA_INC=${lib.getDev cuda_cudart}/include"
"PREFIX=$(out)"
];

postFixup = ''
moveToOutput lib/libnccl_static.a $dev
# Set RUNPATH so that libnvidia-ml in /run/opengl-driver(-32)/lib can be found.
# See the explanation in addOpenGLRunpath.
addOpenGLRunpath $out/lib/lib*.so
'';

env.NIX_CFLAGS_COMPILE = toString [ "-Wno-unused-function" ];

enableParallelBuilding = true;

passthru = {
inherit cudaPackages;
};

meta = with lib; {
description = "Multi-GPU and multi-node collective communication primitives for NVIDIA GPUs";
homepage = "https://developer.nvidia.com/nccl";
license = licenses.bsd3;
platforms = [ "x86_64-linux" ];
maintainers = with maintainers; [ mdaiter orivej ];
};
}
})

0 comments on commit eeefcf7

Please sign in to comment.