{ lib , stdenv , fetchFromGitHub , fetchpatch , cmake , rocm-cmake , rocm-runtime , rocm-device-libs , rocm-comgr , hip , python3 , tensile ? null , msgpack ? null , libxml2 ? null , llvm ? null , python3Packages ? null , gtest ? null , gfortran ? null , buildTensile ? true , buildTests ? false , buildBenchmarks ? false , tensileLogic ? "asm_full" , tensileCOVersion ? "V3" , tensileSepArch ? true , tensileLazyLib ? true , tensileLibFormat ? "msgpack" , gpuTargets ? [ "all" ] }: assert buildTensile -> tensile != null; assert buildTensile -> msgpack != null; assert buildTensile -> libxml2 != null; assert buildTensile -> llvm != null; assert buildTensile -> python3Packages != null; assert buildTests -> gtest != null; assert buildTests -> gfortran != null; # Tests and benchmarks are a can of worms that I will tackle in a different PR # It involves completely rewriting the amd-blis derivation assert buildTests == false; assert buildBenchmarks == false; stdenv.mkDerivation rec { pname = "rocblas"; rocmVersion = "5.3.1"; version = "2.45.0-${rocmVersion}"; src = fetchFromGitHub { owner = "ROCmSoftwarePlatform"; repo = "rocBLAS"; rev = "rocm-${rocmVersion}"; hash = "sha256-GeeICEI1dNE6D+nUUlBtUncLkPowAa5n+bsy160EtaU="; }; # We currently need this patch due to faulty toolchain includes # See: https://github.com/ROCmSoftwarePlatform/rocBLAS/issues/1277 patches = [ (fetchpatch { name = "only-std_norm-from-rocblas_complex.patch"; url = "https://github.com/ROCmSoftwarePlatform/rocBLAS/commit/44b99c6df26002139ca9ec68ee1fc8899c7b001f.patch"; hash = "sha256-vSZkVYY951fqfOThKFqnYBasWMblS6peEJZ6sFMCk9k="; }) ]; nativeBuildInputs = [ cmake rocm-cmake hip ]; buildInputs = [ rocm-runtime rocm-device-libs rocm-comgr python3 ] ++ lib.optionals buildTensile [ msgpack libxml2 llvm python3Packages.pyyaml python3Packages.msgpack ] ++ lib.optionals buildTests [ gtest gfortran ]; cmakeFlags = [ "-DCMAKE_C_COMPILER=hipcc" "-DCMAKE_CXX_COMPILER=hipcc" "-Dpython=python3" "-DAMDGPU_TARGETS=${lib.strings.concatStringsSep ";" gpuTargets}" "-DBUILD_WITH_TENSILE=${if buildTensile then "ON" else "OFF"}" # Manually define CMAKE_INSTALL_ # See: https://github.com/NixOS/nixpkgs/pull/197838 "-DCMAKE_INSTALL_BINDIR=bin" "-DCMAKE_INSTALL_LIBDIR=lib" "-DCMAKE_INSTALL_INCLUDEDIR=include" ] ++ lib.optionals buildTensile [ "-DVIRTUALENV_HOME_DIR=/build/source/tensile" "-DTensile_TEST_LOCAL_PATH=/build/source/tensile" "-DTensile_ROOT=/build/source/tensile/lib/python${python3.pythonVersion}/site-packages/Tensile" "-DTensile_LOGIC=${tensileLogic}" "-DTensile_CODE_OBJECT_VERSION=${tensileCOVersion}" "-DTensile_SEPARATE_ARCHITECTURES=${if tensileSepArch then "ON" else "OFF"}" "-DTensile_LAZY_LIBRARY_LOADING=${if tensileLazyLib then "ON" else "OFF"}" "-DTensile_LIBRARY_FORMAT=${tensileLibFormat}" ] ++ lib.optionals buildTests [ "-DBUILD_CLIENTS_TESTS=ON" ] ++ lib.optionals buildBenchmarks [ "-DBUILD_CLIENTS_BENCHMARKS=ON" ]; # Tensile REALLY wants to write to the nix directory if we include it normally # We need to manually fixup the path so tensile will generate .co and .dat files postPatch = lib.optionalString buildTensile '' export PATH=${llvm}/bin:$PATH cp -a ${tensile} tensile chmod +w -R tensile # Rewrap Tensile substituteInPlace tensile/bin/{.t*,.T*,*} \ --replace "${tensile}" "/build/source/tensile" substituteInPlace CMakeLists.txt \ --replace "include(virtualenv)" "" \ --replace "virtualenv_install(\''${Tensile_TEST_LOCAL_PATH})" "" ''; meta = with lib; { description = "BLAS implementation for ROCm platform"; homepage = "https://github.com/ROCmSoftwarePlatform/rocBLAS"; license = with licenses; [ mit ]; maintainers = with maintainers; [ Madouura ]; broken = rocmVersion != hip.version; }; }