210 lines
6.7 KiB
Nix
210 lines
6.7 KiB
Nix
|
{cudaVersion, lib, addDriverRunpath}:
|
||
|
let
|
||
|
inherit (lib) attrsets lists strings;
|
||
|
# cudaVersionOlder : Version -> Boolean
|
||
|
cudaVersionOlder = strings.versionOlder cudaVersion;
|
||
|
# cudaVersionAtLeast : Version -> Boolean
|
||
|
cudaVersionAtLeast = strings.versionAtLeast cudaVersion;
|
||
|
|
||
|
addBuildInputs =
|
||
|
drv: buildInputs:
|
||
|
drv.overrideAttrs (prevAttrs: {buildInputs = prevAttrs.buildInputs ++ buildInputs;});
|
||
|
in
|
||
|
# NOTE: Filter out attributes that are not present in the previous version of
|
||
|
# the package set. This is necessary to prevent the appearance of attributes
|
||
|
# like `cuda_nvcc` in `cudaPackages_10_0, which predates redistributables.
|
||
|
final: prev:
|
||
|
attrsets.filterAttrs (attr: _: (builtins.hasAttr attr prev)) {
|
||
|
libcufile = prev.libcufile.overrideAttrs (
|
||
|
prevAttrs: {
|
||
|
buildInputs = prevAttrs.buildInputs ++ [
|
||
|
final.libcublas.lib
|
||
|
final.pkgs.numactl
|
||
|
final.pkgs.rdma-core
|
||
|
];
|
||
|
# Before 11.7 libcufile depends on itself for some reason.
|
||
|
env.autoPatchelfIgnoreMissingDeps =
|
||
|
prevAttrs.env.autoPatchelfIgnoreMissingDeps
|
||
|
+ strings.optionalString (cudaVersionOlder "11.7") " libcufile.so.0";
|
||
|
}
|
||
|
);
|
||
|
|
||
|
libcusolver = addBuildInputs prev.libcusolver (
|
||
|
# Always depends on this
|
||
|
[final.libcublas.lib]
|
||
|
# Dependency from 12.0 and on
|
||
|
++ lists.optionals (cudaVersionAtLeast "12.0") [final.libnvjitlink.lib]
|
||
|
# Dependency from 12.1 and on
|
||
|
++ lists.optionals (cudaVersionAtLeast "12.1") [final.libcusparse.lib]
|
||
|
);
|
||
|
|
||
|
libcusparse = addBuildInputs prev.libcusparse (
|
||
|
lists.optionals (cudaVersionAtLeast "12.0") [final.libnvjitlink.lib]
|
||
|
);
|
||
|
|
||
|
cuda_cudart = prev.cuda_cudart.overrideAttrs (
|
||
|
prevAttrs: {
|
||
|
allowFHSReferences = false;
|
||
|
|
||
|
# The libcuda stub's pkg-config doesn't follow the general pattern:
|
||
|
postPatch =
|
||
|
prevAttrs.postPatch or ""
|
||
|
+ ''
|
||
|
while IFS= read -r -d $'\0' path ; do
|
||
|
sed -i \
|
||
|
-e "s|^libdir\s*=.*/lib\$|libdir=''${!outputLib}/lib/stubs|" \
|
||
|
-e "s|^Libs\s*:\(.*\)\$|Libs: \1 -Wl,-rpath,${addDriverRunpath.driverLink}/lib|" \
|
||
|
"$path"
|
||
|
done < <(find -iname 'cuda-*.pc' -print0)
|
||
|
''
|
||
|
+ ''
|
||
|
# Namelink may not be enough, add a soname.
|
||
|
# Cf. https://gitlab.kitware.com/cmake/cmake/-/issues/25536
|
||
|
if [[ -f lib/stubs/libcuda.so && ! -f lib/stubs/libcuda.so.1 ]] ; then
|
||
|
ln -s libcuda.so lib/stubs/libcuda.so.1
|
||
|
fi
|
||
|
'';
|
||
|
}
|
||
|
);
|
||
|
|
||
|
cuda_compat = prev.cuda_compat.overrideAttrs (
|
||
|
prevAttrs: {
|
||
|
env.autoPatchelfIgnoreMissingDeps =
|
||
|
prevAttrs.env.autoPatchelfIgnoreMissingDeps + " libnvrm_gpu.so libnvrm_mem.so libnvdla_runtime.so";
|
||
|
# `cuda_compat` only works on aarch64-linux, and only when building for Jetson devices.
|
||
|
brokenConditions = prevAttrs.brokenConditions // {
|
||
|
"Trying to use cuda_compat on aarch64-linux targeting non-Jetson devices" =
|
||
|
!final.flags.isJetsonBuild;
|
||
|
};
|
||
|
}
|
||
|
);
|
||
|
|
||
|
cuda_gdb = addBuildInputs prev.cuda_gdb (
|
||
|
# x86_64 only needs gmp from 12.0 and on
|
||
|
lists.optionals (cudaVersionAtLeast "12.0") [final.pkgs.gmp]
|
||
|
);
|
||
|
|
||
|
cuda_nvcc = prev.cuda_nvcc.overrideAttrs (
|
||
|
oldAttrs: {
|
||
|
|
||
|
outputs = oldAttrs.outputs ++ lists.optionals (!(builtins.elem "lib" oldAttrs.outputs)) [ "lib" ];
|
||
|
|
||
|
# Patch the nvcc.profile.
|
||
|
# Syntax:
|
||
|
# - `=` for assignment,
|
||
|
# - `?=` for conditional assignment,
|
||
|
# - `+=` to "prepend",
|
||
|
# - `=+` to "append".
|
||
|
|
||
|
# Cf. https://web.archive.org/web/20230308044351/https://arcb.csc.ncsu.edu/~mueller/cluster/nvidia/2.0/nvcc_2.0.pdf
|
||
|
|
||
|
# We set all variables with the lowest priority (=+), but we do force
|
||
|
# nvcc to use the fixed backend toolchain. Cf. comments in
|
||
|
# backend-stdenv.nix
|
||
|
|
||
|
postPatch =
|
||
|
(oldAttrs.postPatch or "")
|
||
|
+ ''
|
||
|
substituteInPlace bin/nvcc.profile \
|
||
|
--replace \
|
||
|
'$(TOP)/lib' \
|
||
|
"''${!outputLib}/lib" \
|
||
|
--replace \
|
||
|
'$(TOP)/$(_NVVM_BRANCH_)' \
|
||
|
"''${!outputBin}/nvvm" \
|
||
|
--replace \
|
||
|
'$(TOP)/$(_TARGET_DIR_)/include' \
|
||
|
"''${!outputDev}/include"
|
||
|
|
||
|
cat << EOF >> bin/nvcc.profile
|
||
|
|
||
|
# Fix a compatible backend compiler
|
||
|
PATH += ${lib.getBin final.backendStdenv.cc}/bin:
|
||
|
LIBRARIES += "-L${lib.getLib final.backendStdenv.nixpkgsCompatibleLibstdcxx}/lib"
|
||
|
|
||
|
# Expose the split-out nvvm
|
||
|
LIBRARIES =+ -L''${!outputBin}/nvvm/lib
|
||
|
INCLUDES =+ -I''${!outputBin}/nvvm/include
|
||
|
|
||
|
# Expose cudart and the libcuda stubs
|
||
|
LIBRARIES =+ -L$static/lib" "-L${final.cuda_cudart.lib}/lib -L${final.cuda_cudart.lib}/lib/stubs
|
||
|
INCLUDES =+ -I${final.cuda_cudart.dev}/include
|
||
|
EOF
|
||
|
'';
|
||
|
|
||
|
propagatedBuildInputs = [ final.setupCudaHook ];
|
||
|
|
||
|
postInstall =
|
||
|
(oldAttrs.postInstall or "")
|
||
|
+ ''
|
||
|
moveToOutput "nvvm" "''${!outputBin}"
|
||
|
'';
|
||
|
|
||
|
# The nvcc and cicc binaries contain hard-coded references to /usr
|
||
|
allowFHSReferences = true;
|
||
|
|
||
|
meta = (oldAttrs.meta or { }) // {
|
||
|
mainProgram = "nvcc";
|
||
|
};
|
||
|
}
|
||
|
);
|
||
|
|
||
|
cuda_nvprof = prev.cuda_nvprof.overrideAttrs (
|
||
|
prevAttrs: {buildInputs = prevAttrs.buildInputs ++ [final.cuda_cupti.lib];}
|
||
|
);
|
||
|
|
||
|
cuda_demo_suite = addBuildInputs prev.cuda_demo_suite [
|
||
|
final.pkgs.freeglut
|
||
|
final.pkgs.libGLU
|
||
|
final.pkgs.libglvnd
|
||
|
final.pkgs.mesa
|
||
|
final.libcufft.lib
|
||
|
final.libcurand.lib
|
||
|
];
|
||
|
|
||
|
nsight_compute = prev.nsight_compute.overrideAttrs (
|
||
|
prevAttrs: {
|
||
|
nativeBuildInputs =
|
||
|
prevAttrs.nativeBuildInputs
|
||
|
++ (
|
||
|
if (strings.versionOlder prev.nsight_compute.version "2022.2.0") then
|
||
|
[final.pkgs.qt5.wrapQtAppsHook]
|
||
|
else
|
||
|
[final.pkgs.qt6.wrapQtAppsHook]
|
||
|
);
|
||
|
buildInputs =
|
||
|
prevAttrs.buildInputs
|
||
|
++ (
|
||
|
if (strings.versionOlder prev.nsight_compute.version "2022.2.0") then
|
||
|
[final.pkgs.qt5.qtwebview]
|
||
|
else
|
||
|
[final.pkgs.qt6.qtwebview]
|
||
|
);
|
||
|
}
|
||
|
);
|
||
|
|
||
|
nsight_systems = prev.nsight_systems.overrideAttrs (
|
||
|
prevAttrs: {
|
||
|
nativeBuildInputs = prevAttrs.nativeBuildInputs ++ [final.pkgs.qt5.wrapQtAppsHook];
|
||
|
buildInputs = prevAttrs.buildInputs ++ [
|
||
|
final.pkgs.alsa-lib
|
||
|
final.pkgs.e2fsprogs
|
||
|
final.pkgs.nss
|
||
|
final.pkgs.numactl
|
||
|
final.pkgs.pulseaudio
|
||
|
final.pkgs.wayland
|
||
|
final.pkgs.xorg.libXcursor
|
||
|
final.pkgs.xorg.libXdamage
|
||
|
final.pkgs.xorg.libXrandr
|
||
|
final.pkgs.xorg.libXtst
|
||
|
];
|
||
|
}
|
||
|
);
|
||
|
|
||
|
nvidia_driver = prev.nvidia_driver.overrideAttrs {
|
||
|
# No need to support this package as we have drivers already
|
||
|
# in linuxPackages.
|
||
|
meta.broken = true;
|
||
|
};
|
||
|
}
|