2022-12-02 08:20:57 +00:00
|
|
|
{
  # Core nixpkgs helpers
  lib,
  stdenv,
  fetchFromGitHub,
  rocmUpdateScript,

  # Build tooling and ROCm dependencies
  cmake,
  rocm-cmake,
  hip,
  openmp,
  gtest,
  rocblas,

  # Documentation toolchain (only referenced when buildDocs is true)
  texlive,
  doxygen,
  sphinx,
  python3Packages,

  # Feature toggles; each one gates extra outputs, inputs and/or CMake flags
  buildDocs ? true,
  buildTests ? false,
  buildExtendedTests ? false,
  buildBenchmarks ? false,
  buildSamples ? false,

  # Passed to CMake as a ";"-separated GPU_TARGETS list when non-empty, e.g.
  # gpuTargets = [ "gfx908:xnack-" "gfx90a:xnack-" "gfx90a:xnack+" ... ]
  gpuTargets ? [ ],
}:
|
|
|
|
|
|
|
|
let
|
|
|
|
# TeX Live environment added to buildInputs for the documentation build.
#
# The `texlive.combine { ... }` call is parenthesised on purpose: function
# application is left-associative, so without the parentheses the expression
# reads `(lib.optionalAttrs buildDocs texlive.combine) { ... }`, which would
# try to call `{ }` as a function whenever buildDocs is false and `latex`
# is forced. With the parentheses, `latex` is the combined environment when
# buildDocs is true and an empty attribute set otherwise.
latex = lib.optionalAttrs buildDocs (texlive.combine {
  inherit (texlive)
    scheme-small
    latexmk
    tex-gyre
    fncychap
    wrapfig
    capt-of
    framed
    needspace
    tabulary
    varwidth
    titlesec
    ;
});
|
|
|
|
in stdenv.mkDerivation (finalAttrs: {
|
|
|
|
# Package identity. `version` is also interpolated into the `rocm-<version>`
# tag fetched by `src` and compared against hip's version in `meta.broken`.
pname = "rocwmma";
version = "5.4.3";
|
2022-12-02 08:20:57 +00:00
|
|
|
|
|
|
|
# "out" is always produced; every other output exists only when the
# matching build option is enabled. Benchmarks also enable the "test"
# output, mirroring the condition used for ROCWMMA_BUILD_TESTS.
outputs =
  [ "out" ]
  ++ lib.optional buildDocs "doc"
  ++ lib.optional (buildTests || buildBenchmarks) "test"
  ++ lib.optional buildBenchmarks "benchmark"
  ++ lib.optional buildSamples "sample";
|
|
|
|
|
|
|
|
# Upstream sources, pinned to the `rocm-<version>` tag of the release
# named by `version`. `owner` and `repo` are read back by
# `passthru.updateScript` through `finalAttrs.src`.
src = fetchFromGitHub {
  owner = "ROCmSoftwarePlatform";
  repo = "rocWMMA";
  rev = "rocm-${finalAttrs.version}";
  hash = "sha256-HUJPb6IahBgl/v+W4kXludBTNAjRm8k6v0jxKAX+qZM=";
};
|
|
|
|
|
2023-01-20 10:41:00 +00:00
|
|
|
# Applied only when the test suite is configured (tests or benchmarks).
# NOTE(review): judging by its file name the patch stops the build from
# downloading googletest; the patch itself is not visible from this file.
patches =
  lib.optional (buildTests || buildBenchmarks) ./0000-dont-fetch-googletest.patch;
|
|
|
|
|
|
|
|
# Tools run at build time. `hip` is listed here, presumably because it
# provides the `hipcc` compiler named in cmakeFlags (confirm against the
# hip package).
nativeBuildInputs = [ cmake rocm-cmake hip ];
|
|
|
|
|
|
|
|
# openmp is always required. gtest and rocblas are pulled in only when
# tests or benchmarks are built, and the documentation toolchain only when
# buildDocs is true.
buildInputs =
  [ openmp ]
  ++ lib.optionals (buildTests || buildBenchmarks) [ gtest rocblas ]
  ++ lib.optionals buildDocs [
    latex
    doxygen
    sphinx
    python3Packages.sphinx-rtd-theme
    python3Packages.breathe
  ];
|
|
|
|
|
|
|
|
# CMake configuration. The base list is fixed; the GPU target list,
# extended tests and benchmark flags are appended only when requested.
cmakeFlags =
  let
    # Render a Nix boolean as the ON/OFF spelling used in the flags below.
    onOff = enabled: if enabled then "ON" else "OFF";
  in
  [
    "-DCMAKE_CXX_COMPILER=hipcc"
    # Benchmarks also switch the test build on.
    "-DROCWMMA_BUILD_TESTS=${onOff (buildTests || buildBenchmarks)}"
    "-DROCWMMA_BUILD_VALIDATION_TESTS=ON"
    "-DROCWMMA_BUILD_SAMPLES=${onOff buildSamples}"
    "-DROCWMMA_VALIDATE_WITH_ROCBLAS=ON"
    # Manually define CMAKE_INSTALL_<DIR>
    # See: https://github.com/NixOS/nixpkgs/pull/197838
    "-DCMAKE_INSTALL_BINDIR=bin"
    "-DCMAKE_INSTALL_LIBDIR=lib"
    "-DCMAKE_INSTALL_INCLUDEDIR=include"
  ]
  ++ lib.optional (gpuTargets != [ ]) "-DGPU_TARGETS=${lib.concatStringsSep ";" gpuTargets}"
  ++ lib.optional buildExtendedTests "-DROCWMMA_BUILD_EXTENDED_TESTS=ON"
  ++ lib.optionals buildBenchmarks [
    "-DROCWMMA_BUILD_BENCHMARK_TESTS=ON"
    "-DROCWMMA_BENCHMARK_WITH_ROCBLAS=ON"
  ];
|
|
|
|
|
|
|
|
# The documentation build runs shell scripts from docs/, so their shebangs
# are patched, but only when the docs are actually built.
postPatch = lib.optionalString buildDocs ''
  patchShebangs docs/*.sh
'';
|
|
|
|
|
|
|
|
# Unfortunately, the documentation has to be built by hand here:
# -DROCWMMA_BUILD_DOCS=ON is rejected as invalid even though the upstream
# README lists it.
# HOME points at a fresh temporary directory, presumably because the
# documentation tooling wants a writable home directory.
postBuild = lib.optionalString buildDocs ''
  export HOME=$(mktemp -d)
  ../docs/run_doc.sh
'';
|
|
|
|
|
|
|
|
# Distribute the installed files over the optional outputs. Each fragment
# is included only when its build option is enabled; the fragments are
# concatenated in order into a single shell script.
postInstall = lib.concatStrings [
  # Generated HTML and PDF documentation.
  (lib.optionalString buildDocs ''
    mv ../docs/source/_build/html $out/share/doc/rocwmma
    mv ../docs/source/_build/latex/rocWMMA.pdf $out/share/doc/rocwmma
  '')
  # Test and validation binaries go to the "test" output.
  (lib.optionalString (buildTests || buildBenchmarks) ''
    mkdir -p $test/bin
    mv $out/bin/{*_test,*-validate} $test/bin
  '')
  # Benchmark binaries go to the "benchmark" output.
  (lib.optionalString buildBenchmarks ''
    mkdir -p $benchmark/bin
    mv $out/bin/*-bench $benchmark/bin
  '')
  # Sample programs go to the "sample" output.
  (lib.optionalString buildSamples ''
    mkdir -p $sample/bin
    mv $out/bin/sgemmv $sample/bin
    mv $out/bin/simple_gemm $sample/bin
    mv $out/bin/simple_dlrm $sample/bin
  '')
  # Once the binaries have been moved out, drop $out/bin entirely.
  (lib.optionalString (buildTests || buildBenchmarks || buildSamples) ''
    rm -rf $out/bin
  '')
];
|
|
|
|
|
2022-12-17 10:02:37 +00:00
|
|
|
# Update script built from this package's own name and the GitHub
# owner/repo already declared on `src`.
passthru.updateScript = rocmUpdateScript {
  name = finalAttrs.pname;
  inherit (finalAttrs.src) owner repo;
};
|
2022-12-02 08:20:57 +00:00
|
|
|
|
|
|
|
# Package metadata.
meta = {
  description = "Mixed precision matrix multiplication and accumulation";
  homepage = "https://github.com/ROCmSoftwarePlatform/rocWMMA";
  license = [ lib.licenses.mit ];
  maintainers = lib.teams.rocm.members;
  platforms = lib.platforms.linux;
  # Marked broken whenever this package's minor version differs from hip's.
  broken = lib.versions.minor finalAttrs.version != lib.versions.minor hip.version;
};
|
|
|
|
})
|