summaryrefslogtreecommitdiff
path: root/dev-util/Tensile
diff options
context:
space:
mode:
author V3n3RiX <venerix@koprulu.sector> 2025-02-09 00:12:01 +0000
committer V3n3RiX <venerix@koprulu.sector> 2025-02-09 00:12:01 +0000
commit b95a6fd4a7b591baa7cfc689f8ce5643592d07be (patch)
tree 6a7c4722b40bdb6c409879ce253d8b42817fec14 /dev-util/Tensile
parent 8b3c41ecef8a1cdd270ce3aabcfdfb991839699c (diff)
gentoo auto-resync : 09:02:2025 - 00:12:00
Diffstat (limited to 'dev-util/Tensile')
-rw-r--r-- dev-util/Tensile/Manifest 2
-rw-r--r-- dev-util/Tensile/Tensile-6.3.2.ebuild 140
2 files changed, 142 insertions, 0 deletions
diff --git a/dev-util/Tensile/Manifest b/dev-util/Tensile/Manifest
index 64bdf7f875a0..64ba88f4b941 100644
--- a/dev-util/Tensile/Manifest
+++ b/dev-util/Tensile/Manifest
@@ -21,10 +21,12 @@ DIST rocm-Tensile-5.4.2.tar.gz 14413805 BLAKE2B ca1c13785164439f6fe83f16b36b7a0b
DIST rocm-Tensile-5.7.1.tar.gz 12396002 BLAKE2B ec2c2bc3f07fe22abd800b642c998ea80b9e4e2d0d28c4763d574dbd2fcb14c735223ddc7571d4ab3a48f0bd819cc835c16df9882049c5bf56f25ef729e6d654 SHA512 8f356f36cfec74ee9b000d1180cf52077dc5c595e5c5a40792fc3eb13f3139980c7440f9bc912218f946cf8137e2481d23fe39f110511c1bb55fe85a933ffd36
DIST rocm-Tensile-6.1.1.tar.gz 12675289 BLAKE2B dfe3698d7dda14d5b20a6fe1ef6535ac9737ac330b71678a3a94e939adc2350e2dcf33e58c711ee90dae543efba59fe210bfa39fc69b63910ec4537db3f209bf SHA512 cf8b014b1ff7cd5d45236b8a9a6f5604b02e34a9245a163c672847b535d565151bf7e3a5127601681e80e6fe26964a0e544594044efe2fe68e39b0f1128f96e2
DIST rocm-Tensile-6.3.0.tar.gz 12724004 BLAKE2B 83887efe8ab4102b9d33bae1f97a245d40bcc186635760de509079218628fd4d57072c6c2c1726fec6d8603d40e760e37fa1a443eead290d121cac099ae779ff SHA512 4c80a269236690545d8bc9090b799c5b4095ed9152a1e19ff8b2e5decd588545641ccdf3c6c469b12f4de29b3f4c2821a6e4714460771250b05339ac32f57c13
+DIST rocm-Tensile-6.3.2.tar.gz 12723907 BLAKE2B aaabae87664340f3e044ac5fdc68331084cd597466f294d60f8ed3d523c0f1ebc0c6e3e353585d4bb85f4fe30c644b1a70f2123b6f62d67a6b7a1904f3d820bb SHA512 df8888d7250f9e3dc6818590c82a3e1dc3ff787e0eac29e45969ef408db92261d39faca29f5ac7a6bae5e5b614365ff6e37d087956697c25c65d9d7e4c1ba74d
EBUILD Tensile-5.1.3-r3.ebuild 2812 BLAKE2B 4c005cc1fcdcc45e74d97b463b1c7aff059a953fb951f2833ac3439e20138ce5d0cd15d20f47db6640a164def7e66c268289d6d1634f9b29ef1930665c77cc47 SHA512 3f1377286dc82e2a0a0797feb5f1223dcefa8367817cd97559c1ef78159ee9854d5be4b0eb0078ef3687702bf67ee708725c76d08dd9ae40e999b3b3aafc61ae
EBUILD Tensile-5.4.2-r2.ebuild 3348 BLAKE2B 45125cb1fcf233eaa847f3f5b565e1aa7e5fb7504ae37de9f16f9755f4bcb1b8bbd97a6cafe54a0a2a3253e21fea1a31b6d1ca6412b34994561eacd996f23088 SHA512 59a34c46a1372a071cc2df45cade4d4183cfb1f13f867cd380a193c1d1525b7ea4d1d4570c64101886787abd6880865432ea8577a241cebdb97807fd6b4ddb79
EBUILD Tensile-5.7.1-r2.ebuild 3534 BLAKE2B 508198211e41ae0e519a0c358e8b6d2b35384da585b947b1c29457ec4a8d91a941fd53e51da44dc5db56fec9749a101dd2598a0189a3953dddf29aced4832263 SHA512 6e41dd66afc8236aaf096eec8f445f59ad152c4b5846edda1b4a583695756dc7fe1743a530454a439d72469984f8038ae20e0fedfad102867c9ce049133aa1fc
EBUILD Tensile-6.1.1-r1.ebuild 3613 BLAKE2B bc993857e81720270ccdb3aa68c6a36a07ec32f46a45a8edbdf01af05c069ef58a5ba9349fe9be51fe3204ea8fd894595cc16304708c5d7d0eda76dde84dd1a6 SHA512 2f381562ba1ed3fd38435e519dd58ffe0198428b382d6114b18aadf6f6090e6b477aec1009744413e6e9cfcbb759f569b8a6a6b62c149dab613d449d8615ff0c
EBUILD Tensile-6.1.1.ebuild 3561 BLAKE2B cd1cc973261db88e42b84bdfb977bdfe5f3d8053a3cbd564dbb960e7730c6028e984499b7fea9bb091773b4ff5fa1775bd253cba2898d896f4d5e17a67820ee2 SHA512 680cc2e82ad2d393316224c119ec0b04d67f6e4729e412987c1fd449b68cffe570d0389904182020c03330ebd7a12a6bc7467b98c498c57159da21587a7d6550
EBUILD Tensile-6.3.0.ebuild 3539 BLAKE2B 189cfd03790ebd16ba082bf8d0b0a9df9cb8f31db8600f86c2fb327c4c5a79585a86382f025330399b0350bc020bee6b2c281638df38daf775145a7e7ca42173 SHA512 970317d58bfad0c22081868d18ed2b572802a8d0cd8375564468f34a5d674ead6b10a964ff79f570925f90d197a07a72a7ecc783c12f15abb100fee9e773247e
+EBUILD Tensile-6.3.2.ebuild 3539 BLAKE2B ce26a7042b3ec35815b0f9f3aaa796140717688023c66817bea1843793d9a68f5d6bde9cf31358de16c4ad4056a8f220277a5b2ba0ae4c6a56f3082100703e23 SHA512 2152eaf4e9932d9eaa3c271f5e716d81e2b8d647a466142a8a448d021820abbc95b8000dd269a96358f479c2a2df6a5138810ba5dcb9c669cda3e1dc27cadfdb
MISC metadata.xml 462 BLAKE2B 5ce10e79977a750f19569a4b78dfea8443364c8aa5540648cdcad85895c6bd3144b0e949a0dec2928c13eafa4700808b80a6a12d864cee3d17f5cad1d7fb0c41 SHA512 97db6599f4efc77421cc1c5f0a5733fd1e58b2a82236082b621f4b750638d68b4727fa129729e2f87e37fd28813d860a7eb00f056f252bbf3f5747200d4bcdd6
diff --git a/dev-util/Tensile/Tensile-6.3.2.ebuild b/dev-util/Tensile/Tensile-6.3.2.ebuild
new file mode 100644
index 000000000000..2b811c879756
--- /dev/null
+++ b/dev-util/Tensile/Tensile-6.3.2.ebuild
@@ -0,0 +1,140 @@
+# Copyright 1999-2025 Gentoo Authors
+# Distributed under the terms of the GNU General Public License v2
+
+EAPI=8
+
+PYTHON_COMPAT=( python3_{10..13} )
+DISTUTILS_USE_PEP517=setuptools
+ROCM_VERSION=${PV}
+LLVM_COMPAT=( 19 )
+
+inherit cmake distutils-r1 llvm-r1 prefix rocm
+
+DESCRIPTION="Stretching GPU performance for GEMMs and tensor contractions"
+HOMEPAGE="https://github.com/ROCm/Tensile"
+SRC_URI="https://github.com/ROCm/Tensile/archive/rocm-${PV}.tar.gz -> rocm-Tensile-${PV}.tar.gz"
+S="${WORKDIR}/${PN}-rocm-${PV}"
+
+LICENSE="MIT"
+SLOT="0/$(ver_cut 1-2)"
+KEYWORDS="~amd64"
+IUSE="client test"
+REQUIRED_USE="client? ( ${ROCM_REQUIRED_USE} )"
+
+# Tests can freeze the machine, depending on the GPU/kernel
+RESTRICT="test"
+
+RDEPEND="${PYTHON_DEPS}
+ client? ( dev-libs/boost )
+ >=dev-cpp/msgpack-cxx-6.0.0
+ dev-python/pyyaml[${PYTHON_USEDEP}]
+ dev-python/msgpack[${PYTHON_USEDEP}]
+ dev-python/joblib[${PYTHON_USEDEP}]
+ dev-util/hip:${SLOT}
+ dev-util/rocm-smi:${SLOT}
+ $(llvm_gen_dep '
+ llvm-core/clang:${LLVM_SLOT}
+ ')
+"
+DEPEND="${RDEPEND}"
+BDEPEND="
+ test? (
+ dev-python/pytest-forked[${PYTHON_USEDEP}]
+ dev-python/pytest-xdist[${PYTHON_USEDEP}]
+ dev-python/filelock[${PYTHON_USEDEP}]
+ dev-python/joblib[${PYTHON_USEDEP}]
+ )
+"
+
+distutils_enable_tests pytest
+
+PATCHES=(
+ "${FILESDIR}"/${PN}-5.4.2-fix-arch-parse.patch
+ "${FILESDIR}"/${PN}-6.3.0-use-ninja.patch
+ "${FILESDIR}"/${PN}-6.1.1-fix-msgpack-dependency.patch
+ "${FILESDIR}"/${PN}-6.0.2-expand-isa-compatibility.patch
+)
+
+CMAKE_USE_DIR="${S}/${PN}/Source" # same Source/ directory whose CMakeLists.txt src_prepare edits
+
+src_prepare() {
+ distutils-r1_src_prepare
+ sed -e "s,\@LLVM_PATH\@,$(get_llvm_prefix),g" \
+ "${FILESDIR}"/${PN}-5.7.1-gentoopath.patch > "${S}"/gentoopath.patch || die # write a copy of the patch with @LLVM_PATH@ filled in
+ eapply $(prefixify_ro "${S}"/gentoopath.patch) # apply that copy after passing it through prefixify_ro
+
+ pushd ${PN} || die # relative paths below are inside ${PN}/ until the popd
+
+ sed -e "/ROCM_SMI_ROOT/s,lib,$(get_libdir)," \
+ -i Source/cmake/FindROCmSMI.cmake || die
+ sed -r -e "/TENSILE_USE_LLVM/s/ON/OFF/" \
+ -i Source/CMakeLists.txt || die
+
+ # ${Tensile_ROOT}/bin does not exist; call the command directly
+ sed -e "s,\${Tensile_ROOT}/bin/,,g" -i cmake/TensileConfig.cmake || die
+
+ local Tensile_share_dir="\"${EPREFIX}/usr/share/${PN}\"" # value carries literal double quotes; spliced into the .py files below
+ sed -e "/HipClangVersion/s/0.0.0/$(hipconfig -v)/" -i Common.py || die # substitute the output of `hipconfig -v` on HipClangVersion lines
+
+ sed -e "s,os.path.dirname(os.path.realpath(__file__)),${Tensile_share_dir},g" \
+ -i ReplacementKernels.py Common.py ${PN}.py || die
+
+ sed -e "s|os\.path\.dirname.*$|\"${EPREFIX}/usr/share/Tensile/Source\", end='')|" -i __init__.py || die
+
+ popd || die
+
+ sed -e "/package_data/d" -e "/data_files/d" -i setup.py || die # delete setup.py lines mentioning package_data or data_files
+ use client && PATCHES= cmake_src_prepare # PATCHES is emptied for this call only, so cmake_src_prepare does not apply the patches again
+}
+
+src_configure() {
+ rocm_use_hipcc
+
+ distutils-r1_src_configure
+ if use client; then # the CMake part is configured only with USE=client
+ local mycmakeargs=(
+ -DCMAKE_SKIP_RPATH=ON
+ -DTENSILE_USE_MSGPACK=ON
+ -DTENSILE_USE_LLVM=ON # set explicitly; src_prepare rewrites ON to OFF on the TENSILE_USE_LLVM line of Source/CMakeLists.txt
+ -DTensile_LIBRARY_FORMAT=msgpack
+ -DAMDGPU_TARGETS="$(get_amdgpu_flags)"
+ )
+ cmake_src_configure
+ fi
+}
+
+src_compile() {
+ distutils-r1_src_compile
+ use client && cmake_src_compile # the CMake build runs only with USE=client
+}
+
+python_install() {
+ distutils-r1_python_install
+
+ python_moduleinto Tensile
+ pushd Tensile || die # NOTE(review): no matching popd in this function, unlike the pushd/popd pair in src_prepare
+ python_domodule Components # these three are installed on top of what distutils-r1_python_install did
+ python_domodule Utilities
+ python_domodule TensileCreateLib
+}
+
+src_install() {
+ distutils-r1_src_install
+
+ pushd ${PN} || die # NOTE(review): neither pushd in this function has a matching popd
+ insinto /usr/share/${PN} # same /usr/share/${PN} path that src_prepare writes into the .py files
+ doins -r Configs Perf Source CustomKernels
+ insinto /usr/$(get_libdir)/cmake/${PN}
+ doins cmake/*.cmake
+
+ if use client; then
+ pushd "${BUILD_DIR}" || die
+ dobin client/tensile_client # path is relative to ${BUILD_DIR}
+ fi
+}
+
+# Test suite fails to start without this
+python_test() {
+ export ROCM_PATH="${EPREFIX}/usr" # exported so the epytest run below sees it
+ epytest # NOTE(review): RESTRICT="test" is set earlier in this ebuild
+}