f34ce41345
GitOrigin-RevId: b73c2221a46c13557b1b3be9c2070cc42cf01eb3
124 lines
2.8 KiB
Nix
124 lines
2.8 KiB
Nix
{
  # nixpkgs library and generic helpers
  lib,
  fetchFromGitHub,
  fetchpatch,
  symlinkJoin,
  addOpenGLRunpath,

  # Python packaging infrastructure
  buildPythonPackage,
  pythonOlder,
  setuptools,
  wheel,
  cython_0,

  # Python dependencies listed in propagatedBuildInputs
  fastrlock,
  numpy,

  # Check inputs (the check phase itself is disabled in the derivation)
  pytestCheckHook,
  mock,

  # CUDA package set that the individual toolkit components are taken from
  cudaPackages
}:
|
|
|
|
let
  inherit (cudaPackages) cudnn cutensor nccl;

  # CUDA components that get merged into the single tree built below.
  outpaths = with cudaPackages; [
    cuda_cccl # <nv/target>
    cuda_cudart
    cuda_nvcc # <crt/host_defines.h>
    cuda_nvprof
    cuda_nvrtc
    cuda_nvtx
    cuda_profiler_api
    libcublas
    libcufft
    libcurand
    libcusolver
    libcusparse

    # Missing:
    # cusparselt
  ];

  # Output selectors applied to every entry of `outpaths`, in this order.
  outputGetters = [
    lib.getLib
    lib.getDev
    (lib.getOutput "static")
    (lib.getOutput "stubs")
  ];

  # One symlink tree holding each component itself followed by the outputs
  # picked by `outputGetters` (all "lib" outputs first, then all "dev", ...).
  cudatoolkit-joined = symlinkJoin {
    name = "cudatoolkit-joined-${cudaPackages.cudaVersion}";
    paths = outpaths ++ lib.concatMap (getter: map getter outpaths) outputGetters;
  };
in
|
|
# CuPy built from the upstream GitHub sources against the joined CUDA tree.
buildPythonPackage rec {
  pname = "cupy";
  version = "13.2.0";
  format = "setuptools";

  # NOTE(review): upstream CuPy 13.x may require a newer Python than 3.7 —
  # confirm against upstream's python_requires before tightening this bound.
  disabled = pythonOlder "3.7";

  src = fetchFromGitHub {
    owner = "cupy";
    repo = "cupy";
    # Derived from `version` so a version bump cannot leave a stale tag behind.
    rev = "v${version}";
    hash = "sha256-vZAtpIZztmsYeJeuq7yl7kgZse2azrIM3efHDmUswJI=";
    fetchSubmodules = true;
  };

  patches = [
    # NOTE(review): this commit comes from a personal fork and its purpose is
    # not recorded here — document it (or drop it) on the next version bump.
    (fetchpatch {
      url = "https://github.com/cfhammill/cupy/commit/67526c756e4a0a70f0420bf0e7f081b8a35a8ee5.patch";
      hash = "sha256-WZgexBdM9J0ep5s+9CGZriVq0ZidCRccox+g0iDDywQ=";
    })
  ];

  # See https://docs.cupy.dev/en/stable/reference/environment.html. Setting both
  # CUPY_NUM_BUILD_JOBS and CUPY_NUM_NVCC_THREADS to NIX_BUILD_CORES results in
  # a small amount of thrashing but it turns out there are a large number of
  # very short builds and a few extremely long ones, so setting both ends up
  # working nicely in practice.
  preConfigure = ''
    export CUPY_NUM_BUILD_JOBS="$NIX_BUILD_CORES"
    export CUPY_NUM_NVCC_THREADS="$NIX_BUILD_CORES"
  '';

  nativeBuildInputs = [
    setuptools
    wheel
    addOpenGLRunpath
    cython_0
    cudaPackages.cuda_nvcc
  ];

  buildInputs = [
    cudatoolkit-joined
    cudnn
    cutensor
    nccl
  ];

  # Environment variables handed to the build: the nvcc executable and the
  # root of the joined CUDA tree.
  NVCC = lib.getExe cudaPackages.cuda_nvcc; # FIXME: splicing/buildPackages
  CUDA_PATH = "${cudatoolkit-joined}";

  propagatedBuildInputs = [
    fastrlock
    numpy
  ];

  nativeCheckInputs = [
    pytestCheckHook
    mock
  ];

  # Won't work with the GPU, whose drivers won't be accessible from the build
  # sandbox
  doCheck = false;

  # Run addOpenGLRunpath on every shared object in the output. `$out` is
  # quoted and `IFS= read -r` is used so that file names containing
  # whitespace or backslashes are passed through unmodified.
  postFixup = ''
    find "$out" -type f \( -name '*.so' -or -name '*.so.*' \) | while IFS= read -r lib; do
      addOpenGLRunpath "$lib"
    done
  '';

  enableParallelBuilding = true;

  meta = {
    description = "NumPy-compatible matrix library accelerated by CUDA";
    homepage = "https://cupy.chainer.org/";
    changelog = "https://github.com/cupy/cupy/releases/tag/v${version}";
    license = lib.licenses.mit;
    platforms = [ "x86_64-linux" ];
    maintainers = with lib.maintainers; [ hyphon81 ];
  };
}
|