{ lib, stdenv, fetchFromGitHub, fetchpatch, rocmUpdateScript, cmake, rocm-cmake, clr, gfortran, hipblas-common, rocblas, rocsolver, rocsparse, rocprim, gtest, lapack-reference, buildTests ? false, buildBenchmarks ? false, buildSamples ? false, # for passthru.tests hipblas, }: # Can also use cuBLAS stdenv.mkDerivation (finalAttrs: { pname = "hipblas"; version = "6.4.3"; outputs = [ "out" ] ++ lib.optionals buildTests [ "test" ] ++ lib.optionals buildBenchmarks [ "benchmark" ] ++ lib.optionals buildSamples [ "sample" ]; src = fetchFromGitHub { owner = "ROCm"; repo = "hipBLAS"; rev = "rocm-${finalAttrs.version}"; hash = "sha256-lQv8Ik6+0ldqyeJ05CSGB0309nIpzlRL3CRYeQxVfd0="; }; patches = [ (fetchpatch { # Subject: [PATCH] Add gfx1150, gfx1150, gfx1200, gfx1201 support (#1055) # This was merged to release/rocm-rel-6.4 but AMD forgot to tag it for 6.4.3 name = "release-6.4-arch-extra.patch"; url = "https://github.com/ROCm/hipBLAS/commit/0100b32ccff9a0f12134694315b4e44884e25a8e.patch"; hash = "sha256-BmktlLJpYaTcogHzEKpZdCnksIIysEO47WMezXoxvCs="; }) ]; postPatch = '' substituteInPlace library/CMakeLists.txt \ --replace-fail "find_package(Git REQUIRED)" "" ''; nativeBuildInputs = [ cmake rocm-cmake clr gfortran ]; propagatedBuildInputs = [ hipblas-common ]; buildInputs = [ rocblas rocprim rocsparse rocsolver ] ++ lib.optionals buildTests [ gtest ] ++ lib.optionals (buildTests || buildBenchmarks) [ lapack-reference ]; cmakeFlags = [ "-DCMAKE_CXX_COMPILER=${lib.getExe' clr "amdclang++"}" # Manually define CMAKE_INSTALL_