2023-04-29 16:46:19 +00:00
|
|
|
{ config, stdenv, lib, fetchFromGitHub, cmake, gtest, doCheck ? true
|
2023-10-19 13:55:26 +00:00
|
|
|
, cudaSupport ? config.cudaSupport or false, openclSupport ? false
|
|
|
|
, mpiSupport ? false, javaWrapper ? false, hdfsSupport ? false, pythonLibrary ? false
|
|
|
|
, rLibrary ? false, cudaPackages, opencl-headers, ocl-icd, boost
|
|
|
|
, llvmPackages, openmpi, openjdk, swig, hadoop, R, rPackages, pandoc }:
|
2023-04-29 16:46:19 +00:00
|
|
|
|
2024-09-19 14:19:46 +00:00
|
|
|
assert doCheck -> !mpiSupport;
|
|
|
|
assert openclSupport -> !cudaSupport;
|
|
|
|
assert cudaSupport -> !openclSupport;
|
2023-04-29 16:46:19 +00:00
|
|
|
|
|
|
|
stdenv.mkDerivation rec {
|
|
|
|
pnameBase = "lightgbm";
|
|
|
|
# prefix with r when building the R library
|
|
|
|
# The R package build results in a special binary file
|
|
|
|
# that contains a subset of the .so file use for the CLI
|
|
|
|
# and python version. In general, the CRAN version from
|
|
|
|
# nixpkgs's r-modules should be used, but this non-standard
|
|
|
|
# build allows for enabling CUDA support and other features
|
|
|
|
# which aren't included in the CRAN release. Build with:
|
|
|
|
# nix-build -E "with (import $NIXPKGS{}); \
|
|
|
|
# let \
|
|
|
|
# lgbm = lightgbm.override{rLibrary = true; doCheck = false;}; \
|
|
|
|
# in \
|
|
|
|
# rWrapper.override{ packages = [ lgbm ]; }"
|
|
|
|
pname = lib.optionalString rLibrary "r-" + pnameBase;
|
2024-09-19 14:19:46 +00:00
|
|
|
version = "4.5.0";
|
2023-04-29 16:46:19 +00:00
|
|
|
|
|
|
|
src = fetchFromGitHub {
|
|
|
|
owner = "microsoft";
|
|
|
|
repo = pnameBase;
|
|
|
|
rev = "v${version}";
|
|
|
|
fetchSubmodules = true;
|
2024-09-19 14:19:46 +00:00
|
|
|
hash = "sha256-nST6+/c3Y4/hqwgEUhx03gWtjxhlmUu1XKDCy2pSsvU=";
|
2023-04-29 16:46:19 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
nativeBuildInputs = [ cmake ]
|
2024-09-26 11:04:55 +00:00
|
|
|
++ lib.optionals stdenv.hostPlatform.isDarwin [ llvmPackages.openmp ]
|
2023-04-29 16:46:19 +00:00
|
|
|
++ lib.optionals openclSupport [ opencl-headers ocl-icd boost ]
|
|
|
|
++ lib.optionals mpiSupport [ openmpi ]
|
|
|
|
++ lib.optionals hdfsSupport [ hadoop ]
|
|
|
|
++ lib.optionals (hdfsSupport || javaWrapper) [ openjdk ]
|
|
|
|
++ lib.optionals javaWrapper [ swig ]
|
2023-10-19 13:55:26 +00:00
|
|
|
++ lib.optionals rLibrary [ R pandoc ];
|
2023-04-29 16:46:19 +00:00
|
|
|
|
|
|
|
buildInputs = [ gtest ]
|
|
|
|
++ lib.optional cudaSupport cudaPackages.cudatoolkit;
|
|
|
|
|
|
|
|
propagatedBuildInputs = lib.optionals rLibrary [
|
|
|
|
rPackages.data_table
|
2024-02-29 20:09:43 +00:00
|
|
|
rPackages.markdown
|
2023-10-19 13:55:26 +00:00
|
|
|
rPackages.rmarkdown
|
2023-04-29 16:46:19 +00:00
|
|
|
rPackages.jsonlite
|
|
|
|
rPackages.Matrix
|
|
|
|
rPackages.R6
|
|
|
|
];
|
|
|
|
|
|
|
|
# Skip APPLE in favor of linux build for .so files
|
|
|
|
postPatch = ''
|
|
|
|
export PROJECT_SOURCE_DIR=./
|
|
|
|
substituteInPlace CMakeLists.txt \
|
|
|
|
--replace "find_package(GTest CONFIG)" "find_package(GTest REQUIRED)" \
|
|
|
|
--replace "OpenCL_INCLUDE_DIRS}" "OpenCL_INCLUDE_DIRS}" \
|
|
|
|
--replace "elseif(APPLE)" "elseif(APPLESKIP)"
|
|
|
|
substituteInPlace \
|
|
|
|
external_libs/compute/include/boost/compute/cl.hpp \
|
|
|
|
external_libs/compute/include/boost/compute/cl_ext.hpp \
|
|
|
|
--replace "include <OpenCL/" "include <CL/"
|
|
|
|
substituteInPlace build_r.R \
|
2023-10-19 13:55:26 +00:00
|
|
|
--replace "shQuote(normalizePath" "shQuote(type = 'cmd', string = normalizePath" \
|
2023-04-29 16:46:19 +00:00
|
|
|
--replace "file.path(getwd(), \"lightgbm_r\")" "'$out/tmp'" \
|
|
|
|
--replace \
|
|
|
|
"install_args <- c(\"CMD\", \"INSTALL\", \"--no-multiarch\", \"--with-keep.source\", tarball)" \
|
|
|
|
"install_args <- c(\"CMD\", \"INSTALL\", \"--no-multiarch\", \"--with-keep.source\", \"-l $out/library\", tarball)"
|
2024-02-29 20:09:43 +00:00
|
|
|
|
|
|
|
# Retry this test in next release. Something fails in the setup, so GTEST_FILTER is not enough
|
|
|
|
rm tests/cpp_tests/test_arrow.cpp
|
2023-04-29 16:46:19 +00:00
|
|
|
'';
|
|
|
|
|
|
|
|
cmakeFlags = lib.optionals doCheck [ "-DBUILD_CPP_TEST=ON" ]
|
2024-04-21 15:54:59 +00:00
|
|
|
++ lib.optionals cudaSupport [ "-DUSE_CUDA=1" "-DCMAKE_CXX_COMPILER=${cudaPackages.backendStdenv.cc}/bin/cc" ]
|
2023-04-29 16:46:19 +00:00
|
|
|
++ lib.optionals openclSupport [ "-DUSE_GPU=ON" ]
|
|
|
|
++ lib.optionals mpiSupport [ "-DUSE_MPI=ON" ]
|
|
|
|
++ lib.optionals hdfsSupport [
|
|
|
|
"-DUSE_HDFS=ON"
|
2023-10-19 13:55:26 +00:00
|
|
|
"-DHDFS_LIB=${hadoop}/lib/hadoop-${hadoop.version}/lib/native/libhdfs.so"
|
|
|
|
"-DHDFS_INCLUDE_DIR=${hadoop}/lib/hadoop-${hadoop.version}/include" ]
|
|
|
|
++ lib.optionals javaWrapper [
|
|
|
|
"-DUSE_SWIG=ON"
|
|
|
|
# RPATH of binary /nix/store/.../bin/... contains a forbidden reference to /build/
|
|
|
|
"-DCMAKE_SKIP_BUILD_RPATH=ON" ]
|
|
|
|
++ lib.optionals rLibrary [ "-D__BUILD_FOR_R=ON" ]
|
|
|
|
++ lib.optionals pythonLibrary [ "-D__BUILD_FOR_PYTHON=ON" ];
|
2023-04-29 16:46:19 +00:00
|
|
|
|
|
|
|
configurePhase = lib.optionals rLibrary ''
|
|
|
|
export R_LIBS_SITE="$out/library:$R_LIBS_SITE''${R_LIBS_SITE:+:}"
|
|
|
|
'';
|
|
|
|
|
|
|
|
# set the R package buildPhase to null because lightgbm has a
|
|
|
|
# custom builder script that builds and installs in one step
|
|
|
|
buildPhase = lib.optionals rLibrary ''
|
|
|
|
'';
|
|
|
|
|
|
|
|
inherit doCheck;
|
|
|
|
|
|
|
|
installPhase = ''
|
|
|
|
runHook preInstall
|
|
|
|
'' + lib.optionalString (!rLibrary) ''
|
|
|
|
mkdir -p $out
|
|
|
|
mkdir -p $out/lib
|
|
|
|
mkdir -p $out/bin
|
|
|
|
cp -r ../include $out
|
2024-09-19 14:19:46 +00:00
|
|
|
install -Dm755 ../lib_lightgbm${stdenv.hostPlatform.extensions.sharedLibrary} $out/lib/lib_lightgbm${stdenv.hostPlatform.extensions.sharedLibrary}
|
2023-10-19 13:55:26 +00:00
|
|
|
'' + lib.optionalString (!rLibrary && !pythonLibrary) ''
|
2023-04-29 16:46:19 +00:00
|
|
|
install -Dm755 ../lightgbm $out/bin/lightgbm
|
|
|
|
'' + lib.optionalString javaWrapper ''
|
|
|
|
cp -r java $out
|
|
|
|
cp -r com $out
|
|
|
|
cp -r lightgbmlib.jar $out
|
|
|
|
'' + ''
|
|
|
|
'' + lib.optionalString rLibrary ''
|
|
|
|
mkdir $out
|
|
|
|
mkdir $out/tmp
|
|
|
|
mkdir $out/library
|
|
|
|
mkdir $out/library/lightgbm
|
|
|
|
'' + lib.optionalString (rLibrary && (!openclSupport)) ''
|
2023-10-19 13:55:26 +00:00
|
|
|
Rscript build_r.R \
|
|
|
|
-j$NIX_BUILD_CORES
|
2023-04-29 16:46:19 +00:00
|
|
|
rm -rf $out/tmp
|
|
|
|
'' + lib.optionalString (rLibrary && openclSupport) ''
|
|
|
|
Rscript build_r.R --use-gpu \
|
|
|
|
--opencl-library=${ocl-icd}/lib/libOpenCL.so \
|
2023-10-19 13:55:26 +00:00
|
|
|
--opencl-include-dir=${opencl-headers}/include \
|
|
|
|
--boost-librarydir=${boost} \
|
|
|
|
-j$NIX_BUILD_CORES
|
2023-04-29 16:46:19 +00:00
|
|
|
rm -rf $out/tmp
|
|
|
|
'' + ''
|
|
|
|
runHook postInstall
|
|
|
|
'';
|
|
|
|
|
|
|
|
postFixup = lib.optionalString rLibrary ''
|
|
|
|
if test -e $out/nix-support/propagated-build-inputs; then
|
|
|
|
ln -s $out/nix-support/propagated-build-inputs $out/nix-support/propagated-user-env-packages
|
|
|
|
fi
|
|
|
|
'';
|
|
|
|
|
|
|
|
meta = with lib; {
|
|
|
|
description =
|
|
|
|
"LightGBM is a gradient boosting framework that uses tree based learning algorithms.";
|
2024-04-21 15:54:59 +00:00
|
|
|
mainProgram = "lightgbm";
|
2023-04-29 16:46:19 +00:00
|
|
|
homepage = "https://github.com/microsoft/LightGBM";
|
|
|
|
license = licenses.mit;
|
|
|
|
platforms = platforms.unix;
|
|
|
|
maintainers = with maintainers; [ nviets ];
|
|
|
|
};
|
|
|
|
}
|