371 lines
11 KiB
Nix
371 lines
11 KiB
Nix
|
let
|
||
|
filterAndCreateOverrides =
|
||
|
createOverrideAttrs: final: prev:
|
||
|
let
|
||
|
# It is imperative that we use `final.callPackage` to perform overrides,
|
||
|
# so the final package set is available to the override functions.
|
||
|
inherit (final) callPackage;
|
||
|
|
||
|
# NOTE(@connorbaker): We MUST use `lib` from `prev` because the attribute
|
||
|
# names CAN NOT depend on `final`.
|
||
|
inherit (prev.lib.attrsets) filterAttrs mapAttrs;
|
||
|
inherit (prev.lib.trivial) pipe;
|
||
|
|
||
|
# NOTE: Filter out attributes that are not present in the previous version of
|
||
|
# the package set. This is necessary to prevent the appearance of attributes
|
||
|
# like `cuda_nvcc` in `cudaPackages_10_0, which predates redistributables.
|
||
|
filterOutNewAttrs = filterAttrs (name: _: prev ? ${name});
|
||
|
|
||
|
# Apply callPackage to each attribute value, yielding a value to be passed
|
||
|
# to overrideAttrs.
|
||
|
callPackageThenOverrideAttrs = mapAttrs (
|
||
|
name: value: prev.${name}.overrideAttrs (callPackage value { })
|
||
|
);
|
||
|
in
|
||
|
pipe createOverrideAttrs [
|
||
|
filterOutNewAttrs
|
||
|
callPackageThenOverrideAttrs
|
||
|
];
|
||
|
in
|
||
|
# Each attribute name is the name of an existing package in the previous version
|
||
|
# of the package set.
|
||
|
# The value is a function (to be provided to callPackage), which yields a value
|
||
|
# to be provided to overrideAttrs. This allows us to override the attributes of
|
||
|
# a package without losing access to the fixed point of the package set --
|
||
|
# especially useful given that some packages may depend on each other!
|
||
|
filterAndCreateOverrides {
|
||
|
libcufile =
|
||
|
{
|
||
|
cudaOlder,
|
||
|
lib,
|
||
|
libcublas,
|
||
|
numactl,
|
||
|
rdma-core,
|
||
|
}:
|
||
|
prevAttrs: {
|
||
|
buildInputs = prevAttrs.buildInputs ++ [
|
||
|
libcublas
|
||
|
numactl
|
||
|
rdma-core
|
||
|
];
|
||
|
# Before 11.7 libcufile depends on itself for some reason.
|
||
|
autoPatchelfIgnoreMissingDeps =
|
||
|
prevAttrs.autoPatchelfIgnoreMissingDeps
|
||
|
++ lib.lists.optionals (cudaOlder "11.7") [ "libcufile.so.0" ];
|
||
|
};
|
||
|
|
||
|
libcusolver =
|
||
|
{
|
||
|
cudaAtLeast,
|
||
|
lib,
|
||
|
libcublas,
|
||
|
libcusparse ? null,
|
||
|
libnvjitlink ? null,
|
||
|
}:
|
||
|
prevAttrs: {
|
||
|
buildInputs =
|
||
|
prevAttrs.buildInputs
|
||
|
# Always depends on this
|
||
|
++ [ libcublas ]
|
||
|
# Dependency from 12.0 and on
|
||
|
++ lib.lists.optionals (cudaAtLeast "12.0") [ libnvjitlink ]
|
||
|
# Dependency from 12.1 and on
|
||
|
++ lib.lists.optionals (cudaAtLeast "12.1") [ libcusparse ];
|
||
|
|
||
|
brokenConditions = prevAttrs.brokenConditions // {
|
||
|
"libnvjitlink missing (CUDA >= 12.0)" =
|
||
|
!(cudaAtLeast "12.0" -> (libnvjitlink != null && libnvjitlink != null));
|
||
|
"libcusparse missing (CUDA >= 12.1)" =
|
||
|
!(cudaAtLeast "12.1" -> (libcusparse != null && libcusparse != null));
|
||
|
};
|
||
|
};
|
||
|
|
||
|
libcusparse =
|
||
|
{
|
||
|
cudaAtLeast,
|
||
|
lib,
|
||
|
libnvjitlink ? null,
|
||
|
}:
|
||
|
prevAttrs: {
|
||
|
buildInputs =
|
||
|
prevAttrs.buildInputs
|
||
|
# Dependency from 12.0 and on
|
||
|
++ lib.lists.optionals (cudaAtLeast "12.0") [ libnvjitlink ];
|
||
|
|
||
|
brokenConditions = prevAttrs.brokenConditions // {
|
||
|
"libnvjitlink missing (CUDA >= 12.0)" =
|
||
|
!(cudaAtLeast "12.0" -> (libnvjitlink != null && libnvjitlink != null));
|
||
|
};
|
||
|
};
|
||
|
|
||
|
# TODO(@connorbaker): cuda_cudart.dev depends on crt/host_config.h, which is from
|
||
|
# (getDev cuda_nvcc). It would be nice to be able to encode that.
|
||
|
cuda_cudart =
|
||
|
{ addDriverRunpath, lib }:
|
||
|
prevAttrs: {
|
||
|
# Remove once cuda-find-redist-features has a special case for libcuda
|
||
|
outputs =
|
||
|
prevAttrs.outputs
|
||
|
++ lib.lists.optionals (!(builtins.elem "stubs" prevAttrs.outputs)) [ "stubs" ];
|
||
|
|
||
|
allowFHSReferences = false;
|
||
|
|
||
|
# The libcuda stub's pkg-config doesn't follow the general pattern:
|
||
|
postPatch =
|
||
|
prevAttrs.postPatch or ""
|
||
|
+ ''
|
||
|
while IFS= read -r -d $'\0' path; do
|
||
|
sed -i \
|
||
|
-e "s|^libdir\s*=.*/lib\$|libdir=''${!outputLib}/lib/stubs|" \
|
||
|
-e "s|^Libs\s*:\(.*\)\$|Libs: \1 -Wl,-rpath,${addDriverRunpath.driverLink}/lib|" \
|
||
|
"$path"
|
||
|
done < <(find -iname 'cuda-*.pc' -print0)
|
||
|
''
|
||
|
# Namelink may not be enough, add a soname.
|
||
|
# Cf. https://gitlab.kitware.com/cmake/cmake/-/issues/25536
|
||
|
+ ''
|
||
|
if [[ -f lib/stubs/libcuda.so && ! -f lib/stubs/libcuda.so.1 ]]; then
|
||
|
ln -s libcuda.so lib/stubs/libcuda.so.1
|
||
|
fi
|
||
|
'';
|
||
|
|
||
|
postFixup =
|
||
|
prevAttrs.postFixup or ""
|
||
|
+ ''
|
||
|
moveToOutput lib/stubs "$stubs"
|
||
|
ln -s "$stubs"/lib/stubs/* "$stubs"/lib/
|
||
|
ln -s "$stubs"/lib/stubs "''${!outputLib}/lib/stubs"
|
||
|
'';
|
||
|
};
|
||
|
|
||
|
cuda_compat =
|
||
|
{ flags, lib }:
|
||
|
prevAttrs: {
|
||
|
autoPatchelfIgnoreMissingDeps = prevAttrs.autoPatchelfIgnoreMissingDeps ++ [
|
||
|
"libnvrm_gpu.so"
|
||
|
"libnvrm_mem.so"
|
||
|
"libnvdla_runtime.so"
|
||
|
];
|
||
|
# `cuda_compat` only works on aarch64-linux, and only when building for Jetson devices.
|
||
|
badPlatformsConditions = prevAttrs.badPlatformsConditions // {
|
||
|
"Trying to use cuda_compat on aarch64-linux targeting non-Jetson devices" = !flags.isJetsonBuild;
|
||
|
};
|
||
|
};
|
||
|
|
||
|
cuda_gdb =
|
||
|
{
|
||
|
cudaAtLeast,
|
||
|
gmp,
|
||
|
expat,
|
||
|
stdenv,
|
||
|
lib,
|
||
|
}:
|
||
|
prevAttrs: {
|
||
|
buildInputs =
|
||
|
prevAttrs.buildInputs
|
||
|
# x86_64 only needs gmp from 12.0 and on
|
||
|
++ lib.lists.optionals (cudaAtLeast "12.0") [ gmp ]
|
||
|
# aarch64,sbsa needs expat
|
||
|
++ lib.lists.optionals (stdenv.hostPlatform.isAarch64) [ expat ];
|
||
|
};
|
||
|
|
||
|
cuda_nvcc =
|
||
|
{ backendStdenv, setupCudaHook }:
|
||
|
prevAttrs: {
|
||
|
# Merge "bin" and "dev" into "out" to avoid circular references
|
||
|
outputs = builtins.filter (
|
||
|
x:
|
||
|
!(builtins.elem x [
|
||
|
"dev"
|
||
|
"bin"
|
||
|
])
|
||
|
) prevAttrs.outputs;
|
||
|
|
||
|
# Patch the nvcc.profile.
|
||
|
# Syntax:
|
||
|
# - `=` for assignment,
|
||
|
# - `?=` for conditional assignment,
|
||
|
# - `+=` to "prepend",
|
||
|
# - `=+` to "append".
|
||
|
|
||
|
# Cf. https://web.archive.org/web/20230308044351/https://arcb.csc.ncsu.edu/~mueller/cluster/nvidia/2.0/nvcc_2.0.pdf
|
||
|
|
||
|
# We set all variables with the lowest priority (=+), but we do force
|
||
|
# nvcc to use the fixed backend toolchain. Cf. comments in
|
||
|
# backend-stdenv.nix
|
||
|
|
||
|
postPatch =
|
||
|
(prevAttrs.postPatch or "")
|
||
|
+ ''
|
||
|
substituteInPlace bin/nvcc.profile \
|
||
|
--replace-fail \
|
||
|
'$(TOP)/$(_NVVM_BRANCH_)' \
|
||
|
"''${!outputBin}/nvvm" \
|
||
|
--replace-fail \
|
||
|
'$(TOP)/$(_TARGET_DIR_)/include' \
|
||
|
"''${!outputDev}/include"
|
||
|
|
||
|
cat << EOF >> bin/nvcc.profile
|
||
|
|
||
|
# Fix a compatible backend compiler
|
||
|
PATH += "${backendStdenv.cc}/bin":
|
||
|
|
||
|
# Expose the split-out nvvm
|
||
|
LIBRARIES =+ "-L''${!outputBin}/nvvm/lib"
|
||
|
INCLUDES =+ "-I''${!outputBin}/nvvm/include"
|
||
|
EOF
|
||
|
'';
|
||
|
|
||
|
# NOTE(@connorbaker):
|
||
|
# Though it might seem odd or counter-intuitive to add the setup hook to `propagatedBuildInputs` instead of
|
||
|
# `propagatedNativeBuildInputs`, it is necessary! If you move the setup hook from `propagatedBuildInputs` to
|
||
|
# `propagatedNativeBuildInputs`, it stops being propagated to downstream packages during their build because
|
||
|
# setup hooks in `propagatedNativeBuildInputs` are not designed to affect the runtime or build environment of
|
||
|
# dependencies; they are only meant to affect the build environment of the package that directly includes them.
|
||
|
propagatedBuildInputs = (prevAttrs.propagatedBuildInputs or [ ]) ++ [ setupCudaHook ];
|
||
|
|
||
|
postInstall =
|
||
|
(prevAttrs.postInstall or "")
|
||
|
+ ''
|
||
|
moveToOutput "nvvm" "''${!outputBin}"
|
||
|
'';
|
||
|
|
||
|
# The nvcc and cicc binaries contain hard-coded references to /usr
|
||
|
allowFHSReferences = true;
|
||
|
|
||
|
meta = (prevAttrs.meta or { }) // {
|
||
|
mainProgram = "nvcc";
|
||
|
};
|
||
|
};
|
||
|
|
||
|
cuda_nvprof = { cuda_cupti }: prevAttrs: { buildInputs = prevAttrs.buildInputs ++ [ cuda_cupti ]; };
|
||
|
|
||
|
cuda_demo_suite =
|
||
|
{
|
||
|
libglut,
|
||
|
libcufft,
|
||
|
libcurand,
|
||
|
libGLU,
|
||
|
libglvnd,
|
||
|
mesa,
|
||
|
}:
|
||
|
prevAttrs: {
|
||
|
buildInputs = prevAttrs.buildInputs ++ [
|
||
|
libglut
|
||
|
libcufft
|
||
|
libcurand
|
||
|
libGLU
|
||
|
libglvnd
|
||
|
mesa
|
||
|
];
|
||
|
};
|
||
|
|
||
|
nsight_compute =
|
||
|
{
|
||
|
lib,
|
||
|
qt5 ? null,
|
||
|
qt6 ? null,
|
||
|
}:
|
||
|
prevAttrs:
|
||
|
let
|
||
|
inherit (lib.strings) versionOlder versionAtLeast;
|
||
|
inherit (prevAttrs) version;
|
||
|
qt = if versionOlder version "2022.2.0" then qt5 else qt6;
|
||
|
inherit (qt) wrapQtAppsHook qtwebview;
|
||
|
in
|
||
|
{
|
||
|
nativeBuildInputs = prevAttrs.nativeBuildInputs ++ [ wrapQtAppsHook ];
|
||
|
buildInputs = prevAttrs.buildInputs ++ [ qtwebview ];
|
||
|
brokenConditions = prevAttrs.brokenConditions // {
|
||
|
"Qt 5 missing (<2022.2.0)" = !(versionOlder version "2022.2.0" -> qt5 != null);
|
||
|
"Qt 6 missing (>=2022.2.0)" = !(versionAtLeast version "2022.2.0" -> qt6 != null);
|
||
|
};
|
||
|
};
|
||
|
|
||
|
nsight_systems =
|
||
|
{
|
||
|
cuda_cudart,
|
||
|
cudaOlder,
|
||
|
gst_all_1,
|
||
|
lib,
|
||
|
nss,
|
||
|
numactl,
|
||
|
pulseaudio,
|
||
|
qt5 ? null,
|
||
|
qt6 ? null,
|
||
|
rdma-core,
|
||
|
ucx,
|
||
|
wayland,
|
||
|
xorg,
|
||
|
}:
|
||
|
prevAttrs:
|
||
|
let
|
||
|
inherit (lib.strings) versionOlder versionAtLeast;
|
||
|
inherit (prevAttrs) version;
|
||
|
qt = if lib.strings.versionOlder prevAttrs.version "2022.4.2.1" then qt5 else qt6;
|
||
|
qtwayland =
|
||
|
if lib.versions.major qt.qtbase.version == "5" then
|
||
|
lib.getBin qt.qtwayland
|
||
|
else
|
||
|
lib.getLib qt.qtwayland;
|
||
|
qtWaylandPlugins = "${qtwayland}/${qt.qtbase.qtPluginPrefix}";
|
||
|
in
|
||
|
{
|
||
|
# An ad hoc replacement for
|
||
|
# https://github.com/ConnorBaker/cuda-redist-find-features/issues/11
|
||
|
env.rmPatterns = toString [
|
||
|
"nsight-systems/*/*/lib{arrow,jpeg}*"
|
||
|
"nsight-systems/*/*/lib{ssl,ssh,crypto}*"
|
||
|
"nsight-systems/*/*/libboost*"
|
||
|
"nsight-systems/*/*/libexec"
|
||
|
"nsight-systems/*/*/libQt*"
|
||
|
"nsight-systems/*/*/libstdc*"
|
||
|
"nsight-systems/*/*/Mesa"
|
||
|
"nsight-systems/*/*/Plugins"
|
||
|
"nsight-systems/*/*/python/bin/python"
|
||
|
];
|
||
|
postPatch =
|
||
|
prevAttrs.postPatch or ""
|
||
|
+ ''
|
||
|
for path in $rmPatterns; do
|
||
|
rm -r "$path"
|
||
|
done
|
||
|
'';
|
||
|
nativeBuildInputs = prevAttrs.nativeBuildInputs ++ [ qt.wrapQtAppsHook ];
|
||
|
buildInputs = prevAttrs.buildInputs ++ [
|
||
|
(qt.qtdeclarative or qt.full)
|
||
|
(qt.qtsvg or qt.full)
|
||
|
cuda_cudart.stubs
|
||
|
gst_all_1.gst-plugins-base
|
||
|
gst_all_1.gstreamer
|
||
|
nss
|
||
|
numactl
|
||
|
pulseaudio
|
||
|
qt.qtbase
|
||
|
qtWaylandPlugins
|
||
|
rdma-core
|
||
|
ucx
|
||
|
wayland
|
||
|
xorg.libXcursor
|
||
|
xorg.libXdamage
|
||
|
xorg.libXrandr
|
||
|
xorg.libXtst
|
||
|
];
|
||
|
|
||
|
brokenConditions = prevAttrs.brokenConditions // {
|
||
|
# Older releases require boost 1.70, which is deprecated in Nixpkgs
|
||
|
"CUDA too old (<11.8)" = cudaOlder "11.8";
|
||
|
"Qt 5 missing (<2022.4.2.1)" = !(versionOlder version "2022.4.2.1" -> qt5 != null);
|
||
|
"Qt 6 missing (>=2022.4.2.1)" = !(versionAtLeast version "2022.4.2.1" -> qt6 != null);
|
||
|
};
|
||
|
};
|
||
|
|
||
|
nvidia_driver =
|
||
|
{ }:
|
||
|
prevAttrs: {
|
||
|
brokenConditions = prevAttrs.brokenConditions // {
|
||
|
"Package is not supported; use drivers from linuxPackages" = true;
|
||
|
};
|
||
|
};
|
||
|
}
|