{ lib , stdenv , fetchFromGitHub , fetchpatch , cmake , rocm-cmake , rocm-runtime , rocm-device-libs , rocm-comgr , hip , python3 , tensile ? null , msgpack ? null , libxml2 ? null , llvm ? null , python3Packages ? null , gtest ? null , gfortran ? null , buildTensile ? true , buildTests ? false , buildBenchmarks ? false , tensileLogic ? "asm_full" , tensileCOVersion ? "V3" , tensileSepArch ? true , tensileLazyLib ? true , tensileLibFormat ? "msgpack" , gpuTargets ? [ "all" ] }: assert buildTensile -> tensile != null; assert buildTensile -> msgpack != null; assert buildTensile -> libxml2 != null; assert buildTensile -> llvm != null; assert buildTensile -> python3Packages != null; assert buildTests -> gtest != null; assert buildTests -> gfortran != null; # Tests and benchmarks are a can of worms that I will tackle in a different PR # It involves completely rewriting the amd-blis derivation assert buildTests == false; assert buildBenchmarks == false; stdenv.mkDerivation rec { pname = "rocblas"; rocmVersion = "5.3.1"; version = "2.45.0-${rocmVersion}"; src = fetchFromGitHub { owner = "ROCmSoftwarePlatform"; repo = "rocBLAS"; rev = "rocm-${rocmVersion}"; hash = "sha256-GeeICEI1dNE6D+nUUlBtUncLkPowAa5n+bsy160EtaU="; }; # We currently need this patch due to faulty toolchain includes # See: https://github.com/ROCmSoftwarePlatform/rocBLAS/issues/1277 patches = [ (fetchpatch { name = "only-std_norm-from-rocblas_complex.patch"; url = "https://github.com/ROCmSoftwarePlatform/rocBLAS/commit/44b99c6df26002139ca9ec68ee1fc8899c7b001f.patch"; hash = "sha256-vSZkVYY951fqfOThKFqnYBasWMblS6peEJZ6sFMCk9k="; }) ]; nativeBuildInputs = [ cmake rocm-cmake hip ]; buildInputs = [ rocm-runtime rocm-device-libs rocm-comgr python3 ] ++ lib.optionals buildTensile [ msgpack libxml2 llvm python3Packages.pyyaml python3Packages.msgpack ] ++ lib.optionals buildTests [ gtest gfortran ]; cmakeFlags = [ "-DCMAKE_C_COMPILER=hipcc" "-DCMAKE_CXX_COMPILER=hipcc" "-Dpython=python3" "-DAMDGPU_TARGETS=${lib.strings.concatStringsSep ";" gpuTargets}" "-DBUILD_WITH_TENSILE=${if buildTensile then "ON" else "OFF"}" # Manually define CMAKE_INSTALL_