bcb2f287e1
GitOrigin-RevId: d603719ec6e294f034936c0d0dc06f689d91b6c3
113 lines
2.5 KiB
Nix
113 lines
2.5 KiB
Nix
# Function arguments for this package expression (conventionally filled in by
# `callPackage`). Names are grouped by the role they play further down in the
# file; the order inside a set pattern has no effect on evaluation.
{
  # General nixpkgs helpers
  lib,
  symlinkJoin,
  addOpenGLRunpath,

  # Python packaging infrastructure and build-time tools
  buildPythonPackage,
  fetchPypi,
  pythonOlder,
  setuptools,
  wheel,
  cython,

  # Propagated Python dependencies
  fastrlock,
  numpy,

  # Check-phase inputs
  pytestCheckHook,
  mock,

  # CUDA package set from which the individual components are taken
  cudaPackages,
}:

let
  # Individual CUDA components that are merged into one tree below. The
  # trailing comments appear to name the header each entry is needed for.
  cudaToolkitComponents = with cudaPackages; [
    cuda_cccl # <nv/target>
    cuda_cccl.dev
    cuda_cudart
    cuda_nvcc.dev # <crt/host_defines.h>
    cuda_nvprof
    cuda_nvrtc
    cuda_nvtx
    cuda_profiler_api
    libcublas
    libcufft
    libcurand
    libcusolver
    libcusparse

    # Missing:
    # cusparselt
  ];

  # Single symlink tree containing every component listed above; its name
  # embeds the CUDA version of the package set in use.
  cudatoolkit-joined = symlinkJoin {
    name = "cudatoolkit-joined-${cudaPackages.cudaVersion}";
    paths = cudaToolkitComponents;
  };

  # Libraries taken from the same CUDA package set but kept out of the
  # joined tree.
  inherit (cudaPackages)
    cudnn
    cutensor
    nccl
    ;
in
# cupy, built with setuptools from the PyPI source archive against the joined
# CUDA toolkit tree plus cudnn, cutensor and nccl.
buildPythonPackage rec {
  pname = "cupy";
  version = "13.0.0";
  format = "setuptools";

  # NOTE(review): upstream may require a newer Python than 3.7 for this
  # release — confirm against the project's python_requires before tightening.
  disabled = pythonOlder "3.7";

  src = fetchPypi {
    inherit pname version;
    hash = "sha256-LwTnhX9pKnEzYNycOwZwmAarhAT8o5ta+XIcBKKXmq4=";
  };

  # See https://docs.cupy.dev/en/v10.2.0/reference/environment.html. Setting both
  # CUPY_NUM_BUILD_JOBS and CUPY_NUM_NVCC_THREADS to NIX_BUILD_CORES results in
  # a small amount of thrashing but it turns out there are a large number of
  # very short builds and a few extremely long ones, so setting both ends up
  # working nicely in practice.
  preConfigure = ''
    export CUPY_NUM_BUILD_JOBS="$NIX_BUILD_CORES"
    export CUPY_NUM_NVCC_THREADS="$NIX_BUILD_CORES"
  '';

  nativeBuildInputs = [
    setuptools
    wheel
    addOpenGLRunpath
    cython
    cudaPackages.cuda_nvcc
  ];

  buildInputs = [
    cudatoolkit-joined
    cudnn
    cutensor
    nccl
  ];

  # Build-environment variables: the nvcc executable to use, the root of the
  # joined CUDA tree, and cuda_cudart's lib/stubs directory on the linker
  # search path.
  NVCC = "${lib.getExe cudaPackages.cuda_nvcc}"; # FIXME: splicing/buildPackages
  CUDA_PATH = "${cudatoolkit-joined}";
  LDFLAGS = "-L${cudaPackages.cuda_cudart}/lib/stubs";

  propagatedBuildInputs = [
    fastrlock
    numpy
  ];

  nativeCheckInputs = [
    pytestCheckHook
    mock
  ];

  # Won't work with the GPU, whose drivers won't be accessible from the build
  # sandbox
  doCheck = false;

  # Run addOpenGLRunpath on every shared object installed under $out.
  # `IFS= read -r` hands each path to the loop verbatim: without it, `read`
  # would interpret backslashes and trim surrounding whitespace.
  postFixup = ''
    find "$out" -type f \( -name '*.so' -or -name '*.so.*' \) | while IFS= read -r lib; do
      addOpenGLRunpath "$lib"
    done
  '';

  enableParallelBuilding = true;

  meta = with lib; {
    description = "NumPy-compatible matrix library accelerated by CUDA";
    homepage = "https://cupy.chainer.org/";
    changelog = "https://github.com/cupy/cupy/releases/tag/v${version}";
    license = licenses.mit;
    platforms = [ "x86_64-linux" ];
    maintainers = with maintainers; [ hyphon81 ];
  };
}