2022-04-15 01:41:22 +00:00
|
|
|
|
{ stdenv
, lib
, fetchFromGitHub
, fetchpatch
, buildPythonPackage
, python

  # Feature toggles
, cudaSupport ? false
, cudaPackages
, magma
, mklDnnSupport ? true
, useSystemNccl ? true
, MPISupport ? false
, mpi
, buildDocs ? false

  # Native build inputs
, cmake
, util-linux
, linkFarm
, symlinkJoin
, which
, pybind11
, removeReferencesTo

  # Build inputs
, numactl
, CoreServices
, libobjc

  # Propagated build inputs
, numpy
, pyyaml
, cffi
, click
, typing-extensions

  # Unit tests
, hypothesis
, psutil

  # virtual pkg that consistently instantiates blas across nixpkgs
  # See https://github.com/NixOS/nixpkgs/pull/83888
, blas

  # ninja (https://ninja-build.org) must be available to run C++ extensions tests
, ninja

, linuxHeaders_5_19

  # dependencies for torch.utils.tensorboard
, pillow
, six
, future
, tensorboard
, protobuf

, isPy3k
, pythonOlder
}:
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
2022-04-15 01:41:22 +00:00
|
|
|
|
let
  # Pull the individual CUDA components out of the selected cudaPackages set.
  inherit (cudaPackages) cudatoolkit cudaFlags cudnn nccl;
in

# assert that everything needed for cuda is present and that the correct cuda versions are used
assert cudaSupport -> builtins.elem (lib.versions.major cudatoolkit.version) [ "9" "10" "11" ];

# confirm that cudatoolkits are sync'd across dependencies
assert (MPISupport && cudaSupport) -> mpi.cudatoolkit == cudatoolkit;
assert cudaSupport -> magma.cudatoolkit == cudatoolkit;
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
|
|
let
|
2021-04-12 18:23:04 +00:00
|
|
|
|
# Render a Nix boolean as the string "1" (true) or "0" (false).
setBool = flag: if flag then "1" else "0";
|
2020-04-24 23:36:52 +00:00
|
|
|
|
# One symlinked tree combining the cudatoolkit `out` and `lib` outputs with nccl.
cudatoolkit_joined = symlinkJoin {
  name = "${cudatoolkit.name}-unsplit";
  # nccl is here purely for semantic grouping; it could be moved to nativeBuildInputs
  paths = [
    cudatoolkit.out
    cudatoolkit.lib
    nccl.dev
    nccl.out
  ];
};
|
|
|
|
|
|
|
|
|
|
# Normally libcuda.so.1 is provided at runtime by nvidia-x11 via
# LD_LIBRARY_PATH=/run/opengl-driver/lib. We only use the stub
# libcuda.so from cudatoolkit for running tests, so that we don't have
# to recompile pytorch on every update to nvidia-x11 or the kernel.
cudaStub = linkFarm "cuda-stub" [
  { name = "libcuda.so.1"; path = "${cudatoolkit}/lib/stubs/libcuda.so"; }
];
|
|
|
|
|
# Shell variable-assignment prefix that puts the stub directory first on
# LD_LIBRARY_PATH; it is the empty string when CUDA support is disabled.
cudaStubEnv =
  if cudaSupport
  then "LD_LIBRARY_PATH=${cudaStub}\${LD_LIBRARY_PATH:+:}$LD_LIBRARY_PATH "
  else "";
|
|
|
|
|
|
|
|
|
|
in buildPythonPackage rec {
|
2022-09-09 14:08:57 +00:00
|
|
|
|
pname = "torch";
# Don't forget to update torch-bin to the same version.
version = "1.13.0";
format = "setuptools";

# Not built for Python interpreters older than 3.7.0.
disabled = pythonOlder "3.7.0";
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
|
|
# out: output standard python package
# dev: output libtorch headers
# lib: output libtorch libraries
outputs = [ "out" "dev" "lib" ];
|
|
|
|
|
|
|
|
|
|
# Upstream sources at the release tag, fetched together with their git submodules.
src = fetchFromGitHub {
  owner = "pytorch";
  repo = "pytorch";
  rev = "refs/tags/v${version}";
  hash = "sha256-jlXd+9fYWePDevXRxsjtL4oEdTWirv1ObH0B4A6o6Q4=";
  fetchSubmodules = true;
};
|
|
|
|
|
|
2022-09-09 14:08:57 +00:00
|
|
|
|
# pthreadpool added support for Grand Central Dispatch in April
# 2020. However, this relies on functionality (DISPATCH_APPLY_AUTO)
# that is available starting with macOS 10.13. However, our current
# base is 10.12. Until we upgrade, we can fall back on the older
# pthread support.
patches =
  lib.optional (stdenv.isDarwin && stdenv.isx86_64) ./pthreadpool-disable-gcd.diff;
|
|
|
|
|
|
2020-04-24 23:36:52 +00:00
|
|
|
|
# CUDA builds only: export the target GPU architectures and the compiler
# shipped with cudatoolkit, plus the cuDNN include directory when cudnn is set.
preConfigure = lib.optionalString cudaSupport (''
  export TORCH_CUDA_ARCH_LIST="${cudaFlags.cudaCapabilitiesSemiColonString}"
  export CC=${cudatoolkit.cc}/bin/gcc CXX=${cudatoolkit.cc}/bin/g++
'' + lib.optionalString (cudnn != null) ''
  export CUDNN_INCLUDE_DIR=${cudnn}/include
'');
|
|
|
|
|
|
2020-05-15 21:57:56 +00:00
|
|
|
|
# Use pytorch's custom configurations
dontUseCmakeConfigure = true;

# Build switches exported to the builder as "1"/"0" environment variables.
BUILD_NAMEDTENSOR = setBool true;
BUILD_DOCS = setBool buildDocs;

# We only do an imports check, so do not build tests either.
BUILD_TEST = setBool false;

# Unlike MKL, oneDNN (née MKLDNN) is FOSS, so we enable support for
# it by default. PyTorch currently uses its own vendored version
# of oneDNN through Intel iDeep.
USE_MKLDNN = setBool mklDnnSupport;
USE_MKLDNN_CBLAS = setBool mklDnnSupport;

# Avoid using pybind11 from git submodule
# Also avoids pytorch exporting the headers of pybind11
USE_SYSTEM_BIND11 = true;
|
|
|
|
|
|
2020-05-15 21:57:56 +00:00
|
|
|
|
preBuild = ''
  # Let the build use as many jobs as Nix grants this derivation.
  export MAX_JOBS=$NIX_BUILD_CORES

  # Run setup.py in cmake-only mode, then invoke cmake on the resulting build directory.
  ${python.interpreter} setup.py build --cmake-only
  ${cmake}/bin/cmake build
'';
|
|
|
|
|
|
2020-04-24 23:36:52 +00:00
|
|
|
|
preFixup = ''
  # Join all remaining arguments using the first argument as separator.
  function join_by { local IFS="$1"; shift; echo "$*"; }

  # Rewrite the RPATH of the ELF file "$1": drop its first two entries and
  # put $ORIGIN in front of whatever remains.
  function strip2 {
    # Keep IFS local: assigning the global IFS here would leave it modified
    # for every command that runs later in the fixup phase.
    local IFS=':'
    local -a RP
    local RP_NEW
    read -ra RP <<< "$(patchelf --print-rpath "$1")"
    RP_NEW=$(join_by : "''${RP[@]:2}")
    patchelf --set-rpath \$ORIGIN:"''${RP_NEW}" "$1"
  }

  # NUL-delimited iteration so that file names are never word-split or globbed.
  while IFS= read -r -d "" f; do
    strip2 "$f"
  done < <(find "$out" -name 'libcaffe2*.so' -print0)
'';
|
|
|
|
|
|
|
|
|
|
# Override the (weirdly) wrong version set by default. See
# https://github.com/NixOS/nixpkgs/pull/52437#issuecomment-449718038
# https://github.com/pytorch/pytorch/blob/v1.0.0/setup.py#L267
PYTORCH_BUILD_VERSION = version;
PYTORCH_BUILD_NUMBER = 0;

# don't build pytorch's third_party NCCL
USE_SYSTEM_NCCL = setBool useSystemNccl;
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
|
|
# Suppress a weird warning in mkl-dnn, part of ideep in pytorch
# (upstream seems to have fixed this in the wrong place?)
# https://github.com/intel/mkl-dnn/commit/8134d346cdb7fe1695a2aa55771071d455fae0bc
# https://github.com/pytorch/pytorch/issues/22346
#
# Also of interest: pytorch ignores CXXFLAGS and uses CFLAGS for both C and C++:
# https://github.com/pytorch/pytorch/blob/v1.11.0/setup.py#L17
NIX_CFLAGS_COMPILE =
  lib.optional (blas.implementation == "mkl") "-Wno-error=array-bounds";
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
|
|
# Build-time tools; the joined CUDA toolkit tree is added for CUDA builds.
nativeBuildInputs =
  [ cmake util-linux which ninja pybind11 removeReferencesTo ]
  ++ lib.optional cudaSupport cudatoolkit_joined;
|
|
|
|
|
|
2022-06-26 10:26:21 +00:00
|
|
|
|
# Libraries linked into the build.
buildInputs = [ blas blas.provider pybind11 ]
  ++ lib.optionals cudaSupport [ cudnn magma nccl ]
  # Linux-only inputs. The kernel headers must not be pulled in on Darwin,
  # which this package also lists in meta.platforms.
  ++ lib.optionals stdenv.isLinux [
    linuxHeaders_5_19 # TMP: avoid "flexible array member" errors for now
    numactl
  ]
  ++ lib.optionals stdenv.isDarwin [ CoreServices libobjc ];
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
|
|
|
|
# Python runtime dependencies; mpi is added when MPISupport is enabled.
propagatedBuildInputs =
  [ cffi click numpy pyyaml typing-extensions ]
  # the following are required for tensorboard support
  ++ [ pillow six future tensorboard protobuf ]
  ++ lib.optional MPISupport mpi;
|
2020-04-24 23:36:52 +00:00
|
|
|
|
|
2020-05-15 21:57:56 +00:00
|
|
|
|
# Tests take a long time and may be flaky, so just sanity-check imports
doCheck = false;
pythonImportsCheck = [ "torch" ];

# Extra packages made available to the test phase.
checkInputs = [
  hypothesis
  ninja
  psutil
];
|
|
|
|
|
|
2020-05-15 21:57:56 +00:00
|
|
|
|
# Runs upstream's test/run_test.py with a few suites excluded.
#
# The hooks and the test command each need their own shell line: joined with
# spaces they form one `runHook preCheck ...` invocation, so the test runner
# is passed to the hook as arguments and never executed, and postCheck never
# runs at all.
checkPhase =
  let
    excludedTests = [
      "utils" # utils requires git, which is not allowed in the check phase

      # "dataloader" # psutils correctly finds and triggers multiprocessing, but is too sandboxed to run -- resulting in numerous errors
      # ^^^^^^^^^^^^ NOTE: while test_dataloader does return errors, these are acceptable errors and do not interfere with the build
    ]
    # tensorboard has acceptable failures for pytorch 1.3.x due to dependencies on tensorboard-plugins
    ++ lib.optional (lib.versions.majorMinor version == "1.3") "tensorboard";
  in
  ''
    runHook preCheck

    ${cudaStubEnv}${python.interpreter} test/run_test.py --exclude ${lib.concatStringsSep " " excludedTests}

    runHook postCheck
  '';
|
2022-09-09 14:08:57 +00:00
|
|
|
|
|
2020-04-24 23:36:52 +00:00
|
|
|
|
postInstall = ''
  # Scrub references to the compiler from installed headers and libraries.
  find \
    "$out/${python.sitePackages}/torch/include" \
    "$out/${python.sitePackages}/torch/lib" \
    -type f -exec remove-references-to -t ${stdenv.cc} '{}' +

  # Copy headers and cmake files into the dev output.
  mkdir "$dev"
  cp -r "$out/${python.sitePackages}/torch/include" "$dev/include"
  cp -r "$out/${python.sitePackages}/torch/share" "$dev/share"

  # Fix up library paths for split outputs
  substituteInPlace "$dev/share/cmake/Torch/TorchConfig.cmake" \
    --replace \''${TORCH_INSTALL_PREFIX}/lib "$lib/lib"

  substituteInPlace "$dev/share/cmake/Caffe2/Caffe2Targets-release.cmake" \
    --replace \''${_IMPORT_PREFIX}/lib "$lib/lib"

  # Move the shared libraries to the lib output and leave a symlink behind.
  mkdir "$lib"
  mv "$out/${python.sitePackages}/torch/lib" "$lib/lib"
  ln -s "$lib/lib" "$out/${python.sitePackages}/torch/lib"
'';
|
|
|
|
|
|
2021-02-05 17:12:51 +00:00
|
|
|
|
# Darwin only: give every dylib an absolute install name inside the lib
# output and rewrite the @rpath references between the torch libraries.
postFixup = lib.optionalString stdenv.isDarwin ''
  # Iterate with a quoted glob instead of parsing the output of ls.
  for f in "$lib"/lib/*.dylib; do
      install_name_tool -id "$lib/lib/$(basename "$f")" "$f" || true
  done

  install_name_tool -change @rpath/libshm.dylib $lib/lib/libshm.dylib $lib/lib/libtorch_python.dylib
  install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libtorch_python.dylib
  install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libtorch_python.dylib

  install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libtorch.dylib

  install_name_tool -change @rpath/libtorch.dylib $lib/lib/libtorch.dylib $lib/lib/libshm.dylib
  install_name_tool -change @rpath/libc10.dylib $lib/lib/libc10.dylib $lib/lib/libshm.dylib
'';
|
|
|
|
|
|
2021-04-26 19:14:03 +00:00
|
|
|
|
# Builds in 2+h with 2 cores, and ~15m with a big-parallel builder.
requiredSystemFeatures = [
  "big-parallel"
];
|
|
|
|
|
|
2021-08-08 23:34:03 +00:00
|
|
|
|
# Extra attributes exposed on the resulting package.
passthru = {
  inherit cudaSupport cudaPackages;

  # At least for 1.10.2 `torch.fft` is unavailable unless BLAS provider is MKL.
  # This attribute allows for easy detection of its availability.
  blasProvider = blas.provider;
};
|
|
|
|
|
|
2021-03-12 07:09:13 +00:00
|
|
|
|
meta = {
  changelog = "https://github.com/pytorch/pytorch/releases/tag/v${version}";
  # keep PyTorch in the description so the package can be found under that name on search.nixos.org
  description = "PyTorch: Tensors and Dynamic neural networks in Python with strong GPU acceleration";
  homepage = "https://pytorch.org/";
  license = lib.licenses.bsd3;
  # tscholak esp. for darwin-related builds
  maintainers = with lib.maintainers; [ teh thoughtpolice tscholak ];
  # Darwin is only offered for builds without CUDA support.
  platforms = lib.platforms.linux ++ lib.optionals (!cudaSupport) lib.platforms.darwin;
};
|
|
|
|
|
}
|