mirror of
https://github.com/gentoo-mirror/gentoo.git
synced 2025-12-08 00:05:33 +03:00
75 lines
1.7 KiB
Bash
75 lines
1.7 KiB
Bash
# Copyright 1999-2025 Gentoo Authors
# Distributed under the terms of the GNU General Public License v2
|
|
|
|
EAPI=8

# Must be assigned before `inherit` so that rocm.eclass sees it.
# NOTE(review): presumably this stops the eclass from defining its own
# amdgpu_targets_* IUSE/REQUIRED_USE globals, which is why they are built
# by hand below -- confirm against rocm.eclass.
ROCM_SKIP_GLOBALS=1

inherit cmake rocm

DESCRIPTION="library for accelerating mixed precision matrix multiply-accumulate operations"
HOMEPAGE="https://github.com/ROCm/rocWMMA"
SRC_URI="https://github.com/ROCm/rocWMMA/archive/rocm-${PV}.tar.gz -> rocWMMA-${PV}.tar.gz"
S="${WORKDIR}/rocWMMA-rocm-${PV}"

LICENSE="MIT"
# The subslot is the first two version components, so the ROCm dependencies
# below (which reuse ${SLOT}) are pinned to the same release series.
SLOT="0/$(ver_cut 1-2)"
KEYWORDS="~amd64"

# GPU architectures offered as USE flags by this package.
IUSE_TARGETS=( gfx908 gfx90a gfx942 gfx950 gfx1100 gfx1101 gfx1102 gfx1151 gfx1200 gfx1201 )
# Prefix every entry with the USE_EXPAND name: gfx908 -> amdgpu_targets_gfx908.
IUSE_TARGETS=( "${IUSE_TARGETS[@]/#/amdgpu_targets_}" )
# At least one of the listed targets has to be selected.
ROCM_REQUIRED_USE=" || ( ${IUSE_TARGETS[*]} )"

# Every target flag gets a leading "+", i.e. it is enabled by default.
IUSE="${IUSE_TARGETS[*]/#/+} test"
# A target selection is only enforced when the tests are going to be built.
REQUIRED_USE="test? ( ${ROCM_REQUIRED_USE} )"

RESTRICT="!test? ( test )"

DEPEND="
	dev-util/hip:${SLOT}
	dev-util/rocm-smi:${SLOT}
"
# interface dependencies of header library
RDEPEND="${DEPEND}"

BDEPEND="
	test? (
		dev-cpp/gtest
		sci-libs/rocBLAS:${SLOT}
	)
	dev-build/rocm-cmake
"

PATCHES=(
	"${FILESDIR}"/${PN}-6.1.1-no-test-install.patch
)
|
|
|
|
# Prepare the unpacked sources: remove compiler flags from the top-level
# CMakeLists.txt, then run the regular cmake eclass preparation.
src_prepare() {
	# unknown arguments for hipcc
	local strip_flags=(
		-e "s/ -parallel-jobs=4//"
		-e "s/ -Xclang -fallow-half-arguments-and-returns//"
	)
	# Each flag is matched together with its leading space so that no
	# double blank is left behind; abort the build if sed itself fails.
	sed "${strip_flags[@]}" -i CMakeLists.txt || die

	cmake_src_prepare
}
|
|
|
|
# Configure the CMake build: select the ROCm clang toolchain, pass the GPU
# targets reported by get_amdgpu_flags, never build the samples, and build
# the test suite only when USE=test is enabled.
src_configure() {
	rocm_use_clang

	local mycmakeargs=(
		-DGPU_TARGETS="$(get_amdgpu_flags)"
		-DROCWMMA_BUILD_SAMPLES=OFF
		-DROCWMMA_BUILD_TESTS="$(usex test)"
	)

	# Only relevant when tests are built: use the GoogleTest already on the
	# system (dev-cpp/gtest) instead of whatever the build would pick itself.
	if use test; then
		mycmakeargs+=( -DROCWMMA_USE_SYSTEM_GOOGLETEST=ON )
	fi

	cmake_src_configure
}
|
|
|
|
# Run the test suite through the cmake eclass after check_amdgpu has been
# called, with HIP restricted to a single device.
src_test() {
	check_amdgpu

	# Expected time on gfx1100 is 1260s (-j1) or 936s (-j32)
	# Visible devices are limited to the first one to exclude APU (if not disabled in the BIOS)
	# The assignment is scoped to this one call and does not persist afterwards.
	HIP_VISIBLE_DEVICES=0 cmake_src_test
}
|