1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
|
# Copyright 1999-2022 Gentoo Authors
# Distributed under the terms of the GNU General Public License v2
EAPI=8
PYTHON_COMPAT=( python3_{8..10} )
inherit cmake check-reqs multiprocessing python-r1
DESCRIPTION="Next generation FFT implementation for ROCm"
HOMEPAGE="https://github.com/ROCmSoftwarePlatform/rocFFT"
SRC_URI="https://github.com/ROCmSoftwarePlatform/rocFFT/archive/rocm-${PV}.tar.gz -> rocFFT-${PV}.tar.gz"
LICENSE="MIT"
KEYWORDS="~amd64"
SLOT="0/$(ver_cut 1-2)"
# RDEPEND: perfscripts? dev-python/plotly[${PYTHON_USEDEP}] # currently masked by arch/amd64/x32/package.mask
RDEPEND="
perfscripts? (
>=media-gfx/asymptote-2.61
dev-texlive/texlive-latex
dev-tex/latexmk
sys-apps/texinfo
dev-python/sympy[${PYTHON_USEDEP}]
dev-python/numpy[${PYTHON_USEDEP}]
dev-python/scipy[${PYTHON_USEDEP}]
dev-python/pandas[${PYTHON_USEDEP}] )
${PYTHON_DEPS}"
DEPEND="dev-util/hip:=
${PYTHON_DEPS}"
BDEPEND="
test? ( dev-cpp/gtest dev-libs/boost
>=sci-libs/fftw-3 sys-libs/libomp )
>=dev-util/cmake-3.22
>=dev-util/rocm-cmake-${PV}-r1:${SLOT}
"
CHECKREQS_DISK_BUILD="7G"
IUSE="benchmark perfscripts test"
REQUIRED_USE="perfscripts? ( benchmark ) ${PYTHON_REQUIRED_USE}"
RESTRICT="!test? ( test )"
S="${WORKDIR}/rocFFT-rocm-${PV}"
PATCHES=(
"${FILESDIR}/${PN}-4.2.0-add-functional-header.patch"
"${FILESDIR}/${PN}-5.0.2-unbundle-sqlite.patch"
"${FILESDIR}/${PN}-5.0.2-add-math-header.patch" )
required_mem() {
if use test; then
echo "52G"
else
if [[ -n "${AMDGPU_TARGETS}" ]]; then
local NARCH=$(($(awk -F";" '{print NF-1}' <<< "${AMDGPU_TARGETS}" || die)+1)) # count how many archs user specified in ${AMDGPU_TARGETS}
else
local NARCH=7 # The default number of AMDGPU_TARGETS for rocFFT-4.3.0. May change in the future.
fi
echo "$(($(makeopts_jobs)*${NARCH}*25+2200))M" # A linear function estimating how much memory required
fi
}
pkg_pretend() {
return # leave the disk space check to pkg_setup phase
}
pkg_setup() {
export CHECKREQS_MEMORY=$(required_mem)
check-reqs_pkg_setup
python_setup
}
src_prepare() {
sed -e "s/PREFIX rocfft//" \
-e "/rocm_install_symlink_subdir/d" \
-e "/<INSTALL_INTERFACE/s,include,include/rocFFT," \
-i library/src/CMakeLists.txt || die
sed -e "/rocm_install_symlink_subdir/d" \
-e "$!N;s:PREFIX\n[ ]*rocfft:# PREFIX rocfft\n:;P;D" \
-i library/src/device/CMakeLists.txt || die
if use perfscripts; then
pushd scripts/perf || die
sed -e "/\/opt\/rocm/d" -e "/rocmversion/s,rocm_info.strip(),\"${PV}\"," -i perflib/specs.py || dir
sed -e "/^top/,+1d" -i rocfft-perf suites.py || die
sed -e "s,perflib,${PN}_perflib,g" -i rocfft-perf suites.py perflib/*.py || die
sed -e "/^top = /s,__file__).*$,\"${EPREFIX}/usr/share/${PN}-perflib\")," -i perflib/pdf.py perflib/generators.py || die
popd
fi
cmake_src_prepare
}
src_configure() {
# Grant access to the device
addwrite /dev/kfd
addpredict /dev/dri/
# Compiler to use
export CXX=hipcc
local mycmakeargs=(
-Wno-dev
-DCMAKE_INSTALL_INCLUDEDIR="include/rocFFT/"
-DCMAKE_SKIP_RPATH=ON
-DBUILD_CLIENTS_TESTS=$(usex test ON OFF)
-DBUILD_CLIENTS_SELFTEST=$(usex test ON OFF)
-DBUILD_CLIENTS_RIDER=$(usex benchmark ON OFF)
${AMDGPU_TARGETS+-DAMDGPU_TARGETS="${AMDGPU_TARGETS}"}
)
cmake_src_configure
}
src_test() {
addwrite /dev/kfd
addpredict /dev/dri
cd "${BUILD_DIR}/clients/staging" || die
einfo "Running rocfft-test"
LD_LIBRARY_PATH=${BUILD_DIR}/library/src/:${BUILD_DIR}/library/src/device ./rocfft-test || die
einfo "Running rocfft-selftest"
LD_LIBRARY_PATH=${BUILD_DIR}/library/src/:${BUILD_DIR}/library/src/device ./rocfft-selftest || die
}
src_install() {
cmake_src_install
if use benchmark; then
cd "${BUILD_DIR}"/clients/staging || die
dobin *rider
fi
if use perfscripts; then
cd "${S}"/scripts/perf || die
python_foreach_impl python_doexe rocfft-perf
python_moduleinto ${PN}_perflib
python_foreach_impl python_domodule perflib/*.py
insinto /usr/share/${PN}-perflib
doins *.asy suites.py
fi
}
|