blob: b9dcb25f7acd2001223a24b3d10f1f21cb865fe0 (
plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
|
# Copyright 1999-2022 Gentoo Authors
# Distributed under the terms of the GNU General Public License v2
EAPI=7
PYTHON_COMPAT=( python3_{7..10} )
inherit cmake check-reqs multiprocessing python-any-r1
DESCRIPTION="Next generation FFT implementation for ROCm"
HOMEPAGE="https://github.com/ROCmSoftwarePlatform/rocFFT"
SRC_URI="https://github.com/ROCmSoftwarePlatform/rocFFT/archive/rocm-${PV}.tar.gz -> rocFFT-${PV}.tar.gz"
LICENSE="MIT"
KEYWORDS="~amd64"
SLOT="0/$(ver_cut 1-2)"
RDEPEND="dev-util/hip:${SLOT}"
DEPEND="${RDEPEND}
${PYTHON_DEPS}"
BDEPEND="
test? ( dev-cpp/gtest dev-libs/boost
>=sci-libs/fftw-3 sys-libs/libomp )
>=dev-util/cmake-3.22
"
CHECKREQS_DISK_BUILD="7G"
IUSE="test"
RESTRICT="!test? ( test )"
S="${WORKDIR}/rocFFT-rocm-${PV}"
PATCHES=("${FILESDIR}/${PN}-4.2.0-add-functional-header.patch")
required_mem() {
if use test; then
echo "52G"
else
if [[ -n "${AMDGPU_TARGETS}" ]]; then
local NARCH=$(($(awk -F";" '{print NF-1}' <<< "${AMDGPU_TARGETS}" || die)+1)) # count how many archs user specified in ${AMDGPU_TARGETS}
else
local NARCH=7 # The default number of AMDGPU_TARGETS for rocFFT-4.3.0. May change in the future.
fi
echo "$(($(makeopts_jobs)*${NARCH}*25+2200))M" # A linear function estimating how much memory required
fi
}
pkg_pretend() {
return # leave the disk space check to pkg_setup phase
}
pkg_setup() {
export CHECKREQS_MEMORY=$(required_mem)
check-reqs_pkg_setup
python_setup
}
src_prepare() {
sed -e "s/PREFIX rocfft//" \
-e "/rocm_install_symlink_subdir/d" \
-e "/<INSTALL_INTERFACE/s,include,include/rocFFT," \
-i library/src/CMakeLists.txt || die
sed -e "/rocm_install_symlink_subdir/d" \
-e "$!N;s:PREFIX\n[ ]*rocfft:# PREFIX rocfft\n:;P;D" \
-i library/src/device/CMakeLists.txt || die
eapply_user
cmake_src_prepare
}
src_configure() {
# Grant access to the device
addwrite /dev/kfd
addpredict /dev/dri/
# Compiler to use
export CXX=hipcc
local mycmakeargs=(
-Wno-dev
-DCMAKE_INSTALL_INCLUDEDIR="include/rocFFT/"
-DCMAKE_SKIP_RPATH=ON
-DBUILD_CLIENTS_TESTS=$(usex test ON OFF)
-DBUILD_CLIENTS_SELFTEST=OFF # rocFFT-4.3.0 self test fails. See https://github.com/ROCmSoftwarePlatform/rocFFT/issues/324. Enable it for rocFFT-4.4
${AMDGPU_TARGETS+-DAMDGPU_TARGETS="${AMDGPU_TARGETS}"}
)
cmake_src_configure
}
src_test() {
addwrite /dev/kfd
addpredict /dev/dri
cd "${BUILD_DIR}/clients/staging" || die
einfo "Running rocfft-test"
LD_LIBRARY_PATH=${BUILD_DIR}/library/src/:${BUILD_DIR}/library/src/device ./rocfft-test || die
# rocFFT-4.3.0 self test fails. See https://github.com/ROCmSoftwarePlatform/rocFFT/issues/324. Enable it for rocFFT-4.4
# einfo "Running rocfft-selftest"
# LD_LIBRARY_PATH=${BUILD_DIR}/library/src/:${BUILD_DIR}/library/src/device ./rocfft-selftest || die
}
|