summary refs log tree commit diff
diff options
context:
space:
mode:
author Patrick Lauer <patrick@gentoo.org> 2025-02-07 19:46:17 +0000
committer Patrick Lauer <patrick@gentoo.org> 2025-02-08 10:07:08 +0000
commit f940816e90c7662103a3c2d8e39b4eb18fc919ad (patch)
tree e7b16775a4cd3e09de367070c14eaa2a3ef48498 /sci-libs/rocBLAS
parent dev-util/Tensile: add 6.3.2 (diff)
download gentoo-f940816e90c7662103a3c2d8e39b4eb18fc919ad.tar.gz
gentoo-f940816e90c7662103a3c2d8e39b4eb18fc919ad.tar.bz2
gentoo-f940816e90c7662103a3c2d8e39b4eb18fc919ad.zip
sci-libs/rocBLAS: add 6.3.2
Signed-off-by: Patrick Lauer <patrick@gentoo.org>
Diffstat (limited to 'sci-libs/rocBLAS')
-rw-r--r-- sci-libs/rocBLAS/Manifest 1
-rw-r--r-- sci-libs/rocBLAS/rocBLAS-6.3.2.ebuild 127
2 files changed, 128 insertions, 0 deletions
diff --git a/sci-libs/rocBLAS/Manifest b/sci-libs/rocBLAS/Manifest
index 466aa900e4c0..0dd6206be001 100644
--- a/sci-libs/rocBLAS/Manifest
+++ b/sci-libs/rocBLAS/Manifest
@@ -5,3 +5,4 @@ DIST rocm-rocBLAS-5.4.2.tar.gz 15938434 BLAKE2B 14ebafa944fdac443800bb7f9b16f8ec
DIST rocm-rocBLAS-5.7.1.tar.gz 55389700 BLAKE2B 9e58b1d29c8a04aa58ce17fdd9b0c2504934261851619dc5b696a04e8c6a79e7c44d86a6db7a9c76a434d76593de8c191cba6f163cf398d01cfc001e5fa32b5a SHA512 cfc73f6c490595a3c153c2ac2a3cb5926c48c2c19baa07ff3dcdf3a7ccaed82cfdff64ed5a3be64c349cb43d654d4b104d9090e2ec9f2061049d6a4921c07722
DIST rocm-rocBLAS-6.1.1.tar.gz 100103895 BLAKE2B df89a21e47730714b80c62717a86d65ac0d819c2d33b2a3c6252b60b8d7cc9eb5f8f1db27159b0a8dfc87aba7ccad97e2f832bc0044e92d0b69c526d382c745a SHA512 74e847c4ddee16cae7f41e268a815ea03875519c365abe7dfce313a9545df245baa73301b432f64a36cc988281fec7530629a0d72583e9ea287c98ec8a0b3907
DIST rocm-rocBLAS-6.3.0.tar.gz 57907324 BLAKE2B a3cce68e0cc06e8df56e1622889254c75744b0f85c9fe66cb94bbc158f7ce45e40a5798d30e6a10430092490c1e347f19f38b36db767ccb784c5757581b0bccb SHA512 45a524d680f1f0760fd37d49b9bd7c6257731ad5d840d832a8e40c121f7f1045a8d5b57ca8ef0943fdf333c55bccb341b529d2ca24664694203b906e510ecab5
+DIST rocm-rocBLAS-6.3.2.tar.gz 57909504 BLAKE2B 0ed000a10c9e71465f83fb9abdb9a745c82bf32552e3d86c61bf0c802f3728f7fd4c47fbf677d01aa35c457dc5281c916ca80fdc033b2752afd6733aefa4653f SHA512 ecfb6c68b0a44ddae0e4e6cf5c41c0c33a9685c590004ffe48fdb163bd059d534181d3faed2a23142078c5f621b1955c91725357c3e8e0f9307b139b19af46fd
diff --git a/sci-libs/rocBLAS/rocBLAS-6.3.2.ebuild b/sci-libs/rocBLAS/rocBLAS-6.3.2.ebuild
new file mode 100644
index 000000000000..f35ee735d2fb
--- /dev/null
+++ b/sci-libs/rocBLAS/rocBLAS-6.3.2.ebuild
@@ -0,0 +1,127 @@
+# Copyright 1999-2025 Gentoo Authors
+# Distributed under the terms of the GNU General Public License v2
+
+EAPI=8
+
+DOCS_BUILDER="doxygen" # docs.eclass input: documentation is built with doxygen
+DOCS_DIR="docs/.doxygen" # docs.eclass input: directory holding the doxygen configuration
+DOCS_DEPEND="media-gfx/graphviz" # docs.eclass input: extra dependency for the documentation build
+LLVM_COMPAT=( 19 ) # llvm-r1.eclass input: supported LLVM slot(s)
+ROCM_VERSION=${PV} # rocm.eclass input: ROCm version, tied to this package's version
+
+inherit cmake docs edo flag-o-matic multiprocessing rocm llvm-r1 # the variables above are set first so the eclasses can read them
+
+DESCRIPTION="AMD's library for BLAS on ROCm"
+HOMEPAGE="https://github.com/ROCm/rocBLAS"
+SRC_URI="https://github.com/ROCm/rocBLAS/archive/rocm-${PV}.tar.gz -> rocm-${P}.tar.gz" # fetched file is renamed to rocm-${P}.tar.gz
+S="${WORKDIR}/${PN}-rocm-${PV}" # source directory name used inside WORKDIR
+
+LICENSE="BSD"
+SLOT="0/$(ver_cut 1-2)" # subslot is the first two components of the package version
+KEYWORDS="~amd64"
+IUSE="benchmark hipblaslt test video_cards_amdgpu"
+RESTRICT="!test? ( test )" # tests are restricted unless USE=test is enabled
+REQUIRED_USE="${ROCM_REQUIRED_USE}" # USE constraint taken verbatim from ROCM_REQUIRED_USE
+
+BDEPEND="
+ >=dev-build/rocm-cmake-5.3
+ video_cards_amdgpu? (
+ dev-util/Tensile:${SLOT}
+ )
+ hipblaslt? ( sci-libs/hipBLASLt:${SLOT} )
+ test? ( dev-cpp/gtest )
+" # build-time tools; Tensile and hipBLASLt are pinned to this package's SLOT value
+
+DEPEND="
+ >=dev-cpp/msgpack-cxx-6.0.0
+ dev-util/hip:${SLOT}
+ test? (
+ virtual/blas
+ dev-cpp/gtest
+ llvm-runtimes/openmp
+ )
+ benchmark? (
+ virtual/blas
+ llvm-runtimes/openmp
+ )
+" # NOTE(review): this ebuild declares no RDEPEND; confirm none of the above (e.g. dev-util/hip) is needed at runtime
+
+QA_FLAGS_IGNORED="/usr/lib64/rocblas/library/.*" # QA exemption for files under rocblas/library; NOTE(review): hard-codes lib64 while src_install uses $(get_libdir)
+
+PATCHES=( # patch list shipped in FILESDIR; several are carried over from older versions (see file names)
+ "${FILESDIR}"/${PN}-5.4.2-add-missing-header.patch
+ "${FILESDIR}"/${PN}-5.4.2-link-cblas.patch
+ "${FILESDIR}"/${PN}-6.0.2-expand-isa-compatibility.patch
+ "${FILESDIR}"/${PN}-6.3.0-no-git.patch
+ "${FILESDIR}"/${PN}-6.3.0-find-cblas.patch
+)
+
+src_prepare() { # run the cmake eclass prepare step, then edit the clients build file
+ cmake_src_prepare
+ sed -e "s:,-rpath=.*\":\":" -i clients/CMakeLists.txt || die # replace ',-rpath=...' through the last double quote on the line with just the quote
+}
+
+src_configure() { # configure the CMake build; Tensile options are added only with USE=video_cards_amdgpu
+ rocm_use_hipcc
+
+ # the sources trigger too many of these warnings, so silence that one category
+ append-cxxflags -Wno-explicit-specialization-storage-class
+
+ local mycmakeargs=(
+ -DCMAKE_SKIP_RPATH=ON
+ -DBUILD_FILE_REORG_BACKWARD_COMPATIBILITY=OFF
+ -DROCM_SYMLINK_LIBS=OFF
+ -DAMDGPU_TARGETS="$(get_amdgpu_flags)"
+ -DBUILD_WITH_TENSILE="$(usex video_cards_amdgpu ON OFF)"
+ -DCMAKE_INSTALL_INCLUDEDIR="include/rocblas"
+ -DBUILD_CLIENTS_SAMPLES=OFF
+ -DBUILD_CLIENTS_TESTS="$(usex test ON OFF)"
+ -DBUILD_CLIENTS_BENCHMARKS="$(usex benchmark ON OFF)"
+ -DBUILD_WITH_PIP=OFF
+ -DBUILD_WITH_HIPBLASLT="$(usex hipblaslt ON OFF)"
+ -DLINK_BLIS=OFF
+ -Wno-dev
+ )
+
+ if use video_cards_amdgpu; then # must be 'use': 'usex' only prints yes/no and always returns success
+ mycmakeargs+=(
+ -DTensile_LOGIC="asm_full"
+ -DTensile_COMPILER="hipcc"
+ -DTensile_LIBRARY_FORMAT="msgpack"
+ -DTensile_CODE_OBJECT_VERSION="default"
+ -DTensile_ROOT="${EPREFIX}/usr/share/Tensile"
+ -DTensile_CPU_THREADS="$(makeopts_jobs)"
+ )
+ fi
+
+ cmake_src_configure
+}
+
+src_compile() { # run the docs eclass compile step, then the CMake build
+ docs_compile
+ cmake_src_compile
+}
+
+src_test() { # run the rocblas-test smoke suite from the build tree
+ check_amdgpu # rocm.eclass helper; presumably verifies the GPU device is accessible — confirm against the eclass docs
+ cd "${BUILD_DIR}"/clients/staging || die
+ export ROCBLAS_TEST_TIMEOUT=3600 ROCBLAS_TENSILE_LIBPATH="${BUILD_DIR}/Tensile/library" # Tensile library path inside the build tree
+ export LD_LIBRARY_PATH="${BUILD_DIR}/clients:${BUILD_DIR}/library/src" # resolve shared libraries from the build tree
+
+ # `--gtest_filter=*quick*:*pre_checkin*-*known_bug*` is >1h on 7900XTX, so only the smoke YAML is run
+ edob ./rocblas-test --yaml rocblas_smoke.yaml
+}
+
+src_install() { # install the CMake targets, plus the benchmark client files with USE=benchmark
+ cmake_src_install
+
+ if use benchmark; then
+ cd "${BUILD_DIR}" || die # the paths below are relative to the build directory
+ dolib.a clients/librocblas_fortran_client.a
+ dobin clients/staging/rocblas-bench
+ fi
+
+ # Stop llvm-strip from removing .strtab section from *.hsaco files,
+ # otherwise rocclr/elf/elf.cpp complains with "failed: null sections(STRTAB)" and crashes
+ dostrip -x "/usr/$(get_libdir)/rocblas/library/"
+}