diff options
Diffstat (limited to 'sci-libs/rocBLAS')
7 files changed, 0 insertions, 395 deletions
diff --git a/sci-libs/rocBLAS/Manifest b/sci-libs/rocBLAS/Manifest index ca44e7ca5686..8e328c26a78e 100644 --- a/sci-libs/rocBLAS/Manifest +++ b/sci-libs/rocBLAS/Manifest @@ -1,5 +1,3 @@ DIST rocBLAS-5.0.2-Tensile-asm_full-navi22.tar.gz 1110323 BLAKE2B 80fab97c6f89fccf1f8829ad41baf15ad31bbbb313b48825841834c7ec1b9f8ece794aebdf9fda42b54a38f642beb1bc1e374f2f3b4e43d8ba9dfd1eb6e3ece5 SHA512 8f6946cf9d68afd195640ae7e0da8dc33341c67f28813813b5361a56531fa2af4453d075703ea52c66d93a1936cf74688b86aa2fa62b52a7ed5f03272290c232 -DIST rocm-Tensile-4.3.0.tar.gz 14250149 BLAKE2B 030138eaca2a0aadd96801e6dbd72e510716dd90553ef3795c5e04e00a34a05ecae82b24f755e4033a4acfcdb1cf26291da1e7902bb090f89a010d403e832beb SHA512 126db0b413c716fba8d5be9bff7a44fd1badacbf32f3db8d0db649819177db37ebd56fd22dd3c809655f5d29675be115e698cd10bc3d0b4b23878ae3726fce47 -DIST rocm-rocBLAS-4.3.0.tar.gz 11569970 BLAKE2B f11b0acf2bbd5737b036142d3b2cc1e18c38e088a8b7db58156d478dd6718befbb82bb7fd43a38fe64a5427124c5ad5241fa37977f094e6efd195d168d3e5f65 SHA512 490ab1c1e98a8b311ad5630515c448d9bb0a2bf588a08bcbebee345e2954d616b4ffe7c2e03dadca82c590438c42afccb98fe8ba00856aece101b5ffe62ef1e0 DIST rocm-rocBLAS-5.0.2.tar.gz 13295178 BLAKE2B e1abfa06b9ac1545732465857839dae3f3708af49439a306a2b5b1b1b392101c38c95815f2c05a0d9ed29d41b154bc2e16a4f9203a37f5e2f68ee12cc4b44a06 SHA512 2f4a74f49350ede0debcf32229a6b6b95505615723c3f2bee16e4c169a3bb966dfb1971819028f47c525f571bea5662b892e63f655b0d1d2b8f20746bc5fe770 DIST rocm-rocBLAS-5.1.3.tar.gz 13741546 BLAKE2B af10d8cb69bee44ef5aab2dc350e1d9f3b6fddb3a840c17230c4b55b2649a4724c9f2e58c1eafdb3e2716eea016a72a35c3ddb498881b1ce682d780baa8d8b07 SHA512 5ab71838fdd0e9c5848cbf28a19d113353b619a878d8c7d05f64feb32faae2054169c95ed6e9dd6b05a2e807b57229dd2c361c4d289b6e6f17c196558640890f diff --git a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-change-default-Tensile-library-dir.patch b/sci-libs/rocBLAS/files/rocBLAS-4.3.0-change-default-Tensile-library-dir.patch deleted file mode 100644 index 1841424c6e56..000000000000 --- a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-change-default-Tensile-library-dir.patch +++ /dev/null @@ -1,39 +0,0 @@ -change the default rocm tensile library search path ---- orig/library/src/tensile_host.cpp 2021-08-21 17:56:47.040481580 +0800 -+++ rocBLAS-rocm-4.3.0/library/src/tensile_host.cpp 2021-08-21 17:58:46.360482372 +0800 -@@ -489,34 +489,7 @@ namespace - } - else - { --#ifndef ROCBLAS_STATIC_LIB -- Dl_info info; -- -- // Find the location of librocblas.so -- // Fall back on hard-coded path if static library or not found -- // [Use a C API (rocblas_sccal) *not* defined in this file to -- // avoid compile-time resolution of the function pointer; cf. -- // https://man7.org/linux/man-pages/man3/dladdr.3.html "BUGS"] -- -- if(dladdr((void*)rocblas_sscal, &info)) -- { -- path = info.dli_fname; -- path = std::string{dirname(&path[0])}; -- } -- else --#endif -- { -- path = "/opt/rocm/rocblas/lib"; -- } -- -- // Find the location of the libraries -- if(TestPath(path + "/../../Tensile/library")) -- path += "/../../Tensile/library"; -- else -- path += "/library"; -- -- if(TestPath(path + "/" + processor)) -- path += "/" + processor; -+ path="@GENTOO_PORTAGE_EPREFIX@/usr/lib64/rocblas/library"; - } - - // only load modules for the current architecture diff --git a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-link-system-blas.patch b/sci-libs/rocBLAS/files/rocBLAS-4.3.0-link-system-blas.patch deleted file mode 100644 index 184b76d7ef38..000000000000 --- a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-link-system-blas.patch +++ /dev/null @@ -1,24 +0,0 @@ -Link system blas libraries rather than the downloaded libraries (in install.sh) - ---- orig/clients/benchmarks/CMakeLists.txt -+++ rocBLAS-rocm-4.2.0/clients/benchmarks/CMakeLists.txt -@@ -49,7 +49,7 @@ target_include_directories( rocblas-benc - $<BUILD_INTERFACE:${BLIS_INCLUDE_DIR}> - ) - --target_link_libraries( rocblas-bench PRIVATE rocblas_fortran_client roc::rocblas lapack cblas ) -+target_link_libraries( rocblas-bench PRIVATE rocblas_fortran_client roc::rocblas lapack cblas -lblas ) - if(LINK_BLIS) - target_link_libraries( rocblas-bench PRIVATE ${BLIS_LIBRARY} ) - endif() ---- orig/clients/gtest/CMakeLists.txt -+++ rocBLAS-rocm-4.2.0/clients/gtest/CMakeLists.txt -@@ -129,7 +129,7 @@ target_include_directories( rocblas-test - $<BUILD_INTERFACE:${BLIS_INCLUDE_DIR}> - ) - --target_link_libraries( rocblas-test PRIVATE rocblas_fortran_client roc::rocblas lapack cblas ${GTEST_LIBRARIES} ) -+target_link_libraries( rocblas-test PRIVATE rocblas_fortran_client roc::rocblas lapack cblas -lblas ${GTEST_LIBRARIES} ) - if(LINK_BLIS) - target_link_libraries( rocblas-test PRIVATE ${BLIS_LIBRARY} ) - endif() diff --git a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-remove-problematic-test-suites.patch b/sci-libs/rocBLAS/files/rocBLAS-4.3.0-remove-problematic-test-suites.patch deleted file mode 100644 index 4265e999f322..000000000000 --- a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-remove-problematic-test-suites.patch +++ /dev/null @@ -1,22 +0,0 @@ -Those tests will fail comparing rocblas vs openblas, because the testing program is so strict that it cannot tolerate the numerical differences which is actually OK. - -https://github.com/ROCmSoftwarePlatform/rocBLAS/issues/1202 ---- orig/clients/gtest/known_bugs.yaml -+++ rocBLAS-rocm-4.3.0/clients/gtest/known_bugs.yaml -@@ -7,6 +7,16 @@ Known bugs: - - { function: gemm_ex, a_type: i8_r, b_type: i8_r, c_type: i32_r, d_type: i32_r, compute_type: i32_r, flags: 0, known_bug_platforms: "gfx900,gfx906,gfx1010,gfx1011,gfx1012,gfx1030" } - - { function: gemm_batched_ex, a_type: i8_r, b_type: i8_r, c_type: i32_r, d_type: i32_r, compute_type: i32_r, flags: 0, known_bug_platforms: "gfx900,gfx906,gfx90a,gfx1010,gfx1011,gfx1012,gfx1030" } - - { function: gemm_strided_batched_ex, a_type: i8_r, b_type: i8_r, c_type: i32_r, d_type: i32_r, compute_type: i32_r, flags: 0, known_bug_platforms: "gfx900,gfx906,gfx1010,gfx1011,gfx1012,gfx1030" } -+# gemv openblas reference differences due to summation order dependent roundoff accumulation with large M float complex -+# 8th significant digit difference vs CPU on single precision float math, leads to expected equality test failure -+# code needs to be changed to a tolerance test or reduce M for float complex type if using equality vs. CPU reference -+- { function: gemv, a_type: f32_c, transA: T, M: 131071 } -+- { function: gemv, a_type: f32_c, transA: C, M: 131071 } -+- { function: gemv_batched, a_type: f32_c, transA: T, M: 131071 } -+- { function: gemv_batched, a_type: f32_c, transA: C, M: 131071 } -+- { function: gemv_strided_batched, a_type: f32_c, transA: T, M: 131071 } -+- { function: gemv_strided_batched, a_type: f32_c, transA: C, M: 131071 } -+ - - #- { function: gemm_ex, a_type: bf16_r, b_type: bf16_r, c_type: bf16_r, d_type: bf16_r, compute_type: f32_r, transA: C, transB: N, M: 512, N: 512, K: 512, lda: 512, ldb: 512, ldc: 512, ldd: 512, alpha: 5.0, alphai: 0.0, beta: 0.0, betai: 0.0, known_bug_platforms: gfx908 } - #- { function: gemm_ex, a_type: bf16_r, b_type: bf16_r, c_type: bf16_r, d_type: bf16_r, compute_type: f32_r, transA: C, transB: N, M: 512, N: 512, K: 512, lda: 512, ldb: 512, ldc: 512, ldd: 512, alpha: 0.0, alphai: 0.0, beta: 3.0, betai: 0.0, known_bug_platforms: gfx908 } diff --git a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-unbundle-Tensile.patch b/sci-libs/rocBLAS/files/rocBLAS-4.3.0-unbundle-Tensile.patch deleted file mode 100644 index c8d99c851b00..000000000000 --- a/sci-libs/rocBLAS/files/rocBLAS-4.3.0-unbundle-Tensile.patch +++ /dev/null @@ -1,22 +0,0 @@ -diff --git a/cmake/virtualenv.cmake b/cmake/virtualenv.cmake -index 4c29c94..f9838c2 100644 ---- a/cmake/virtualenv.cmake -+++ b/cmake/virtualenv.cmake -@@ -11,7 +11,7 @@ set(VIRTUALENV_HOME_DIR ${CMAKE_BINARY_DIR}/virtualenv CACHE PATH "Path to virtu - function(virtualenv_create) - message("${VIRTUALENV_PYTHON_EXE} -m venv ${VIRTUALENV_HOME_DIR} --system-site-packages --clear") - execute_process( -- COMMAND ${VIRTUALENV_PYTHON_EXE} -m venv ${VIRTUALENV_HOME_DIR} --system-site-packages --clear -+ COMMAND true - ) - endfunction() - -@@ -21,7 +21,7 @@ function(virtualenv_install) - message("${VIRTUALENV_HOME_DIR}/bin/python -m pip install ${ARGN}") - execute_process( - RESULT_VARIABLE rc -- COMMAND ${VIRTUALENV_HOME_DIR}/bin/python -m pip install ${ARGN} -+ COMMAND true - ) - if(rc) - message(FATAL_ERROR ${rc}) diff --git a/sci-libs/rocBLAS/rocBLAS-4.3.0-r1.ebuild b/sci-libs/rocBLAS/rocBLAS-4.3.0-r1.ebuild deleted file mode 100644 index 63704e613e53..000000000000 --- a/sci-libs/rocBLAS/rocBLAS-4.3.0-r1.ebuild +++ /dev/null @@ -1,146 +0,0 @@ -# Copyright 1999-2022 Gentoo Authors -# Distributed under the terms of the GNU General Public License v2 - -EAPI=8 - -PYTHON_COMPAT=( python3_{8..10} ) -DOCS_BUILDER="doxygen" -DOCS_DIR="docs" -DOCS_DEPEND="media-gfx/graphviz" -inherit cmake docs prefix python-any-r1 - -DESCRIPTION="AMD's library for BLAS on ROCm" -HOMEPAGE="https://github.com/ROCmSoftwarePlatform/rocBLAS" -SRC_URI="https://github.com/ROCmSoftwarePlatform/rocBLAS/archive/rocm-${PV}.tar.gz -> rocm-${P}.tar.gz" -S="${WORKDIR}/${PN}-rocm-${PV}" - -LICENSE="BSD" -KEYWORDS="~amd64" -SLOT="0/$(ver_cut 1-2)" -IUSE="benchmark test" -RESTRICT="!test? ( test )" - -BDEPEND="${PYTHON_DEPS} - dev-util/rocm-cmake:${SLOT} - $(python_gen_any_dep ' - dev-util/Tensile[${PYTHON_USEDEP}] - ') - dev-util/Tensile:${SLOT} -" - -DEPEND=" - dev-util/hip:${SLOT} - dev-libs/msgpack - test? ( - virtual/blas - dev-cpp/gtest - sys-libs/libomp - ) - benchmark? ( - virtual/blas - sys-libs/libomp - ) -" - -PATCHES=( - "${FILESDIR}"/${PN}-4.3.0-fix-glibc-2.32-and-above.patch - "${FILESDIR}"/${PN}-4.3.0-change-default-Tensile-library-dir.patch - "${FILESDIR}"/${PN}-4.3.0-link-system-blas.patch - "${FILESDIR}"/${PN}-4.3.0-remove-problematic-test-suites.patch - "${FILESDIR}"/${PN}-4.3.0-unbundle-Tensile.patch -) - -python_check_deps() { - python_has_version "dev-util/Tensile[${PYTHON_USEDEP}]" -} - -src_prepare() { - cmake_src_prepare - # Fit for Gentoo FHS rule - sed -e "/PREFIX rocblas/d" \ - -e "/<INSTALL_INTERFACE/s:include:include/rocblas:" \ - -e "s:rocblas/include:include/rocblas:" \ - -e "s:\\\\\${CPACK_PACKAGING_INSTALL_PREFIX}rocblas/lib:${EPREFIX}/usr/$(get_libdir)/rocblas:" \ - -e "s:share/doc/rocBLAS:share/doc/${P}:" \ - -e "/rocm_install_symlink_subdir( rocblas )/d" -i library/src/CMakeLists.txt || die - - sed -e "s:,-rpath=.*\":\":" -i clients/CMakeLists.txt || die - - eprefixify library/src/tensile_host.cpp -} - -src_configure() { - # allow acces to hardware - addpredict /dev/kfd - addpredict /dev/dri/ - addpredict /dev/random - - export PATH="${EPREFIX}/usr/lib/llvm/roc/bin:${PATH}" - - local mycmakeargs=( - -DTensile_LOGIC="asm_full" - -DTensile_COMPILER="hipcc" - -DTensile_LIBRARY_FORMAT="msgpack" - -DTensile_CODE_OBJECT_VERSION="V3" - -DTensile_TEST_LOCAL_PATH="${EPREFIX}/usr/share/Tensile" - -DTensile_ROOT="${EPREFIX}/usr/share/Tensile" - -DBUILD_WITH_TENSILE=ON - -DBUILD_WITH_TENSILE_HOST=ON - -DCMAKE_INSTALL_PREFIX="${EPREFIX}/usr" - -DCMAKE_INSTALL_INCLUDEDIR="include/rocblas" - -DCMAKE_SKIP_RPATH=TRUE - -DBUILD_TESTING=OFF - -DBUILD_CLIENTS_SAMPLES=OFF - -DBUILD_CLIENTS_TESTS=$(usex test ON OFF) - -DBUILD_CLIENTS_BENCHMARKS=$(usex benchmark ON OFF) - ${AMDGPU_TARGETS+-DAMDGPU_TARGETS="${AMDGPU_TARGETS}"} - ) - - CXX="hipcc" cmake_src_configure - - # do not rerun cmake and the build process in src_install - sed -e '/RERUN/,+1d' -i "${BUILD_DIR}"/build.ninja || die -} - -src_compile() { - docs_compile - cmake_src_compile -} - -check_rw_permission() { - local cmd="[ -r $1 ] && [ -w $1 ]" - local error=0 user - if has sandbox ${FEATURES}; then - user="portage" - su portage -c "${cmd}" || error=1 - else - user="$(whoami)" - ${cmd} || error=1 - fi - if [[ "${error}" == 1 ]]; then - die "${user} do not have read and write permissions on $1! \n Make sure ${user} is in render group and check the permissions." - fi -} - -src_test() { - # check permissions on /dev/kfd and /dev/dri/render* - check_rw_permission /dev/kfd - check_rw_permission /dev/dri/render* - addwrite /dev/kfd - addwrite /dev/dri/ - cd "${BUILD_DIR}/clients/staging" || die - LD_LIBRARY_PATH="${BUILD_DIR}/clients:${BUILD_DIR}/library/src" ROCBLAS_TENSILE_LIBPATH="${BUILD_DIR}/Tensile/library" ./rocblas-test || die "Tests failed" -} - -src_install() { - cmake_src_install - - if use benchmark; then - cd "${BUILD_DIR}" || die - dolib.so clients/librocblas_fortran_client.so - dobin clients/staging/rocblas-bench - fi - - # Don't install the License (it is installed into the wrong dir) - rm "${ED}/usr/share/doc/${P}/LICENSE"* || die -} diff --git a/sci-libs/rocBLAS/rocBLAS-4.3.0.ebuild b/sci-libs/rocBLAS/rocBLAS-4.3.0.ebuild deleted file mode 100644 index a32ba82060c7..000000000000 --- a/sci-libs/rocBLAS/rocBLAS-4.3.0.ebuild +++ /dev/null @@ -1,140 +0,0 @@ -# Copyright 1999-2022 Gentoo Authors -# Distributed under the terms of the GNU General Public License v2 - -EAPI=7 - -PYTHON_COMPAT=( python3_{6..9} ) - -inherit cmake multiprocessing prefix python-any-r1 - -DESCRIPTION="AMD's library for BLAS on ROCm" -HOMEPAGE="https://github.com/ROCmSoftwarePlatform/rocBLAS" -SRC_URI="https://github.com/ROCmSoftwarePlatform/rocBLAS/archive/rocm-${PV}.tar.gz -> rocm-${P}.tar.gz - https://github.com/ROCmSoftwarePlatform/Tensile/archive/rocm-${PV}.tar.gz -> rocm-Tensile-${PV}.tar.gz" - -LICENSE="BSD" -KEYWORDS="~amd64" -IUSE="benchmark test" -SLOT="0/$(ver_cut 1-2)" - -BDEPEND=" - dev-util/rocm-cmake - !dev-util/Tensile - $(python_gen_any_dep ' - dev-python/msgpack[${PYTHON_USEDEP}] - dev-python/pyyaml[${PYTHON_USEDEP}] - ') -" - -DEPEND=" - dev-util/hip:${SLOT} - dev-libs/msgpack - test? ( virtual/blas - dev-cpp/gtest - sys-libs/libomp ) - benchmark? ( virtual/blas - sys-libs/libomp ) -" -RESTRICT="!test? ( test )" - -python_check_deps() { - python_has_version "dev-python/pyyaml[${PYTHON_USEDEP}]" && - python_has_version "dev-python/msgpack[${PYTHON_USEDEP}]" -} - -S="${WORKDIR}"/${PN}-rocm-${PV} - -PATCHES=("${FILESDIR}"/${PN}-4.3.0-fix-glibc-2.32-and-above.patch - "${FILESDIR}"/${PN}-4.3.0-change-default-Tensile-library-dir.patch - "${FILESDIR}"/${PN}-4.3.0-link-system-blas.patch - "${FILESDIR}"/${PN}-4.3.0-remove-problematic-test-suites.patch ) - -src_prepare() { - eapply_user - - pushd "${WORKDIR}"/Tensile-rocm-${PV} || die - eapply "${FILESDIR}/Tensile-${PV}-hsaco-compile-specified-arch.patch" # backported from upstream, should remove after 4.3.0 - eapply "${FILESDIR}/Tensile-4.3.0-output-commands.patch" - sed -e "/Number of parallel jobs to launch/s:default=-1:default=$(makeopts_jobs):" -i Tensile/TensileCreateLibrary.py || die - popd || die - - # Fit for Gentoo FHS rule - sed -e "/PREFIX rocblas/d" \ - -e "/<INSTALL_INTERFACE/s:include:include/rocblas:" \ - -e "s:rocblas/include:include/rocblas:" \ - -e "s:\\\\\${CPACK_PACKAGING_INSTALL_PREFIX}rocblas/lib:${EPREFIX}/usr/$(get_libdir)/rocblas:" \ - -e "s:share/doc/rocBLAS:share/doc/${P}:" \ - -e "/rocm_install_symlink_subdir( rocblas )/d" -i library/src/CMakeLists.txt || die - - # Use setup.py to install Tensile rather than pip - sed -r -e "/pip install/s:([^ \"\(]*python) -m pip install ([^ \"\)]*):\1 setup.py install --single-version-externally-managed --root / WORKING_DIRECTORY \2:g" -i cmake/virtualenv.cmake - - sed -e "s:,-rpath=.*\":\":" -i clients/CMakeLists.txt || die - - cmake_src_prepare - eprefixify library/src/tensile_host.cpp -} - -src_configure() { - # allow acces to hardware - addpredict /dev/kfd - addpredict /dev/dri/ - addpredict /dev/random - - export PATH="${EPREFIX}/usr/lib/llvm/roc/bin:${PATH}" - - local mycmakeargs=( - -DTensile_LOGIC="asm_full" - -DTensile_COMPILER="hipcc" - -DTensile_LIBRARY_FORMAT="msgpack" - -DTensile_CODE_OBJECT_VERSION="V3" - -DTensile_TEST_LOCAL_PATH="${WORKDIR}/Tensile-rocm-${PV}" - -DBUILD_WITH_TENSILE=ON - -DBUILD_WITH_TENSILE_HOST=ON - -DCMAKE_INSTALL_PREFIX="${EPREFIX}/usr" - -DCMAKE_INSTALL_INCLUDEDIR="include/rocblas" - -DCMAKE_SKIP_RPATH=TRUE - -DBUILD_TESTING=OFF - -DBUILD_CLIENTS_SAMPLES=OFF - -DBUILD_CLIENTS_TESTS=$(usex test ON OFF) - -DBUILD_CLIENTS_BENCHMARKS=$(usex benchmark ON OFF) - ${AMDGPU_TARGETS+-DAMDGPU_TARGETS="${AMDGPU_TARGETS}"} - ) - - CXX="hipcc" cmake_src_configure - - # do not rerun cmake and the build process in src_install - sed -e '/RERUN/,+1d' -i "${BUILD_DIR}"/build.ninja || die -} - -check_rw_permission() { - cmd="[ -r $1 ] && [ -w $1 ]" - errormsg="${user} do not have read and write permissions on $1! \n Make sure ${user} is in render group and check the permissions." - if has sandbox ${FEATURES}; then - user=portage - su portage -c "${cmd}" || die ${errormsg} - else - user=`whoami` - ${cmd} || die ${errormsg} - fi -} - -src_test() { - # check permissions on /dev/kfd and /dev/dri/render* - check_rw_permission /dev/kfd - check_rw_permission /dev/dri/render* - addwrite /dev/kfd - addwrite /dev/dri/ - cd "${BUILD_DIR}/clients/staging" || die - ROCBLAS_TENSILE_LIBPATH="${BUILD_DIR}/Tensile/library" ./rocblas-test -} - -src_install() { - cmake_src_install - - if use benchmark; then - cd "${BUILD_DIR}" || die - dolib.so clients/librocblas_fortran_client.so - dobin clients/staging/rocblas-bench - fi -} |