From c387a20abbfd15a6fdbe44fdac6df6a415096d55 Mon Sep 17 00:00:00 2001 From: saundersp Date: Sun, 9 Mar 2025 22:37:00 +0100 Subject: [PATCH] Added dev-util/nvidia-cuda-toolkit-12.8.1 --- dev-util/nvidia-cuda-toolkit/Manifest | 7 + .../nvidia-cuda-toolkit/files/cuda-config.in | 28 ++ .../nvidia-cuda-toolkit-glibc-2.41-r1.patch | 72 ++++ .../files/parse_manifest.py | 223 +++++++++++ dev-util/nvidia-cuda-toolkit/metadata.xml | 16 + .../nvidia-cuda-toolkit-12.8.1.ebuild | 372 ++++++++++++++++++ .../dev-util/nvidia-cuda-toolkit-12.8.1 | 16 + 7 files changed, 734 insertions(+) create mode 100644 dev-util/nvidia-cuda-toolkit/Manifest create mode 100644 dev-util/nvidia-cuda-toolkit/files/cuda-config.in create mode 100644 dev-util/nvidia-cuda-toolkit/files/nvidia-cuda-toolkit-glibc-2.41-r1.patch create mode 100644 dev-util/nvidia-cuda-toolkit/files/parse_manifest.py create mode 100644 dev-util/nvidia-cuda-toolkit/metadata.xml create mode 100644 dev-util/nvidia-cuda-toolkit/nvidia-cuda-toolkit-12.8.1.ebuild create mode 100644 metadata/md5-cache/dev-util/nvidia-cuda-toolkit-12.8.1 diff --git a/dev-util/nvidia-cuda-toolkit/Manifest b/dev-util/nvidia-cuda-toolkit/Manifest new file mode 100644 index 0000000..0ab11ae --- /dev/null +++ b/dev-util/nvidia-cuda-toolkit/Manifest @@ -0,0 +1,7 @@ +AUX cuda-config.in 407 BLAKE2B 5f7a0d50d774db58c180b767f00bead7c7dbf5f6b3b4a2f960dfc3b8450f7abf5c2b67c6620c5318f1331646dd2003d61c70a4c31359efd16ff418ecc9d0b446 SHA512 363903b999c43a47a48c52e8898c6044fadcc66d259338ee22863e859c2bc9873a2f1392aa83c9182486d3aa4eaeb5f164cf8ccf29cc74fd8ad56245f76a039a +AUX nvidia-cuda-toolkit-glibc-2.41-r1.patch 3163 BLAKE2B a3d5dbc50898b1502a342c3c70997864bc0e49ccf035b32a76a4ca1b282d236609b5ebc5d094ac0489abcb835456231a90428a758471af59464198b0dcf79999 SHA512 e0fb0018273416df4c1c40e5f74f6d0261a93bb9c4471c12732306b40903c1df8a509a9fd9060d968ac5484b791b6dd86a6db80b6993b979b22a41f44d6bf456 +AUX parse_manifest.py 8488 BLAKE2B fe4748e41727e717d99b3b7f294d7c8e67b44e3f352f27a76c386502870e6134217ead3d93714755f50b0393d514b9e317748aed89637c660e354d53354d1485 SHA512 ab90e614bfd729a0a90a7373d58fcf2f6e7ba3beb8a00841b87e8240c9386a678daf551f4fcc89040f10d46d159e316442978c60b1a8960070576cfb7a11d52c +DIST cuda_12.8.1_570.124.06_linux.run 5382238770 BLAKE2B 6dff4eb32e97f960bdb2bd57d0dbf0920a9f85c19c26199adcac64eb9d30d7b6f6e2691c7a7a0b5b8249c7860cc685931080a3775c804f6e4e3294c43380e94f SHA512 2ac14ba054bf01924e1953053850f679ebdbc2b9150715398365464eae9d686cde2b82abb8f385b74e4eafa8d68421a9ea216c7647c08956ccba8b2299b50a6e +DIST cuda_12.8.1_570.124.06_linux_sbsa.run 4606631442 BLAKE2B 142c3a231f2a621c4d6a74059b72125baca83d2653ba95c726e3e3c12cf8a0a6b75ced7c0bdaa98450c3d2c2224e88886598191b594ac69be52ba5765bb30592 SHA512 108a75e0ca098b0fd514b3380d42b4752669201dcd68c41f2c1ecf9f29c216ac5937fa33d60e11be06e8a2ad8ae73aa49e6685a363ea77af943e1a1b936b8349 +EBUILD nvidia-cuda-toolkit-12.8.1.ebuild 10532 BLAKE2B b8da053e6d0c0d0dc42e1681182ab18319ce55881b6201a6a2ad0370ca0eeed89505347d6538c3fc8b6e22b6a943269821282a99361fc314a16e39761a90948e SHA512 d7de00fc0f20249b0e8ae60bcde6d3090d2dc26656a4fa5ab8f73aafacc15d99c329506b9eb5e46ec4a6f93f14c008ba624762ab44d10f5f3f455deec4c38a1f +MISC metadata.xml 761 BLAKE2B a6ae653c6206cbc05349297499b6dde91bce6d543e10bd5ea915cfe9729dfa6f1eb954ae09c2e4d3997f51315ae090b38606c21b5099e750596ea66fdd93e817 SHA512 9133517d805201d25b651e48abed90394c88ef33a2571ab20b3b19d365f85a90478486c7c087c9150d7d9f6e4026873c5236c64ed649fd3bfc8f9b81479dcc59 diff --git a/dev-util/nvidia-cuda-toolkit/files/cuda-config.in b/dev-util/nvidia-cuda-toolkit/files/cuda-config.in new file mode 100644 index 0000000..10db7dd --- /dev/null +++ b/dev-util/nvidia-cuda-toolkit/files/cuda-config.in @@ -0,0 +1,28 @@ +#!/bin/bash + +SUPPORT_GCC_VERSIONS_BY_CUDA="CUDA_SUPPORTED_GCC" + +_print_help() { + cat <<- EOF + Usage: + $(basename $0) [options] + + -s | --supported Returns by current CUDA supported gcc versions + -h | --help Shows this help + EOF +} + +case ${1} in + -s|--supported) + echo "${SUPPORT_GCC_VERSIONS_BY_CUDA}" + exit 0 + ;; + -h|--help) + _print_help + exit 255 + ;; + *) + _print_help + exit 1 + ;; +esac diff --git a/dev-util/nvidia-cuda-toolkit/files/nvidia-cuda-toolkit-glibc-2.41-r1.patch b/dev-util/nvidia-cuda-toolkit/files/nvidia-cuda-toolkit-glibc-2.41-r1.patch new file mode 100644 index 0000000..3156302 --- /dev/null +++ b/dev-util/nvidia-cuda-toolkit/files/nvidia-cuda-toolkit-glibc-2.41-r1.patch @@ -0,0 +1,72 @@ +From cae8ab12c9f981f110bb2e1318d9c5306e3a2d81 Mon Sep 17 00:00:00 2001 +From: Paul Zander +Date: Sat, 8 Feb 2025 16:34:42 +0100 +Subject: [PATCH] Updates headers for glibc-2.41 + +Match the extern definitions in cuda-crt headers with the changes in glibc-2.41. + +/usr/include/bits/mathcalls.h(79): error: exception specification is +incompatible with that of previous function "cospi" (declared at line 2601 +of +/opt/cuda-12.8.0/bin/../targets/x86_64-linux/include/crt/math_functions.h) + + extern double cospi (double __x) noexcept (true); extern double __cospi (double __x) noexcept (true); + +See-Also: https://sourceware.org/git/?p=glibc.git;a=commit;h=0ae0af68d8fa3bf6cbe1e4f1de5929ff71de67b3 +Signed-off-by: Paul Zander + +diff --git a/builds/cuda_nvcc/targets/x86_64-linux/include/crt/math_functions.h b/builds/cuda_nvcc/targets/x86_64-linux/include/crt/math_functions.h +index d8201f9..a9b19d4 100644 +--- a/builds/cuda_nvcc/targets/x86_64-linux/include/crt/math_functions.h ++++ b/builds/cuda_nvcc/targets/x86_64-linux/include/crt/math_functions.h +@@ -2553,7 +2553,11 @@ extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ float rcbrt + * + * \note_accuracy_double + */ ++#if defined(__GLIBC__) && __GLIBC__ == 2 && __GLIBC_MINOR__ >= 41 ++extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ double sinpi(double x) noexcept (true); ++#else + extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ double sinpi(double x); ++#endif + /** + * \ingroup CUDA_MATH_SINGLE + * \brief Calculate the sine of the input argument +@@ -2576,7 +2580,11 @@ extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ double sinpi + * + * \note_accuracy_single + */ ++#if defined(__GLIBC__) && __GLIBC__ == 2 && __GLIBC_MINOR__ >= 41 ++extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ float sinpif(float x) noexcept (true); ++#else + extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ float sinpif(float x); ++#endif + /** + * \ingroup CUDA_MATH_DOUBLE + * \brief Calculate the cosine of the input argument +@@ -2598,7 +2606,11 @@ extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ float sinpi + * + * \note_accuracy_double + */ ++#if defined(__GLIBC__) && __GLIBC__ == 2 && __GLIBC_MINOR__ >= 41 ++extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ double cospi(double x) noexcept (true); ++#else + extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ double cospi(double x); ++#endif + /** + * \ingroup CUDA_MATH_SINGLE + * \brief Calculate the cosine of the input argument +@@ -2620,7 +2632,11 @@ extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ double cospi + * + * \note_accuracy_single + */ ++#if defined(__GLIBC__) && __GLIBC__ == 2 && __GLIBC_MINOR__ >= 41 ++extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ float cospif(float x) noexcept (true); ++#else + extern __DEVICE_FUNCTIONS_DECL__ __device_builtin__ float cospif(float x); ++#endif + /** + * \ingroup CUDA_MATH_DOUBLE + * \brief Calculate the sine and cosine of the first input argument +-- +2.48.1 + diff --git a/dev-util/nvidia-cuda-toolkit/files/parse_manifest.py b/dev-util/nvidia-cuda-toolkit/files/parse_manifest.py new file mode 100644 index 0000000..57adad1 --- /dev/null +++ b/dev-util/nvidia-cuda-toolkit/files/parse_manifest.py @@ -0,0 +1,223 @@ +#!/usr/bin/env python +# Copyright 2024-2025 Gentoo Authors +# Distributed under the terms of the GNU General Public License v2 +# +# +# Takes the manifests/*.xml file from the NVIDIA CUDA Toolkit as input. +# Those files contain a nested tree of package items. +# +# For each package node a if block is output that checks the package's +# name attribute against the environment provided array SKIP_COMPONENTS +# and skips that whole package if it's listed in it. +# +# Each item contains four nodes that reference things to install, +# `dir`, `file`, `desktopFile`, & `pcfile`, and metadata that further +# detail these. This script will output calls to do* calls that +# use the metadata. +# - dodir would create an empty file - we handle this in dofile +# - dofile copies a regex file glob +# - dodesktopFile creates a .desktop file +# - dopcfile creates a pkgconfig file +# +# The resulting bash code can be run inside src_install(). +# +# Usage: python parse_manifest.py + + +import argparse +import xml.etree.ElementTree + +import defusedxml.ElementTree +from pathlib import Path + +ind = "\t" +indent = 1 + + +def main(): + parser = argparse.ArgumentParser() + parser.add_argument('filename') # positional argument + + args = parser.parse_args() + + basedir = Path(args.filename).parents[1] + + et = defusedxml.ElementTree.parse(args.filename) + + # Find all packages under the package with the id main (i.e. under "CUDA Installer") + for e in et.findall("[@id='main']/package"): + def p_package(el: xml.etree.ElementTree.Element, level: int = 0): + + skip = { + "Documentation", # obsolete + "Driver", # unused + # "Kernel Objects", # split + # "Demo Suite", + # "Visual Tools", + # old eclipse + # "nsight", + # old java + # "nvvp", + # "cuda-gdb-src" + } + + name = el.get("name") + + # trim leading CUDA and trailing version + if name.startswith("CUDA"): + name2 = ' '.join(name.split(" ")[1:-1]) + else: + name2 = name + + if name2 in skip: + return + + # avoid having to deal with whitespaces in bash + name2 = name2.replace(" ", "_") + + path = "" + + print(f"{ind * (level + 0) * indent}if ! has {name2} \"${{SKIP_COMPONENTS[@]}}\"; then # \"{name}\"") + + # output attributes from unhandled tags + for child in el: + if child.tag == "package": + continue + if child.tag == "file": + continue + if child.tag == "desktopFile": + continue + if child.tag == "pcfile": + continue + for attrib in child.attrib: + print(f"{child.tag} {attrib}={child.attrib[attrib]}") + + # CUDA Installer + # only for CUDA Installer + # unused + for node in el.findall("./name"): + print(f"{ind * (level + 1) * indent}# {node.tag}: \"{node.text}\"") + + # compiler + # category. We use the package name instead. + # unused + # for node in el.findall("./type"): + # print(f"{ind * (level + 1) * indent}# {node.tag}: \"{node.text}\"") + + # 1 + # probably sorting for the tui installer + # unused + # for node in el.findall("./priority"): + # print(f"{ind * (level + 1) * indent}# {node.tag}: \"{node.text}\"") + + # + # proably for tui installer + # unused + # for node in el.findall("./single-selection"): + # print(f"{ind * (level + 1) * indent}# {node.tag}: \"{node.text}\"") + + # 2.24.2 + # version of the installed kernel object (Kernel Objects only) + # unused + for node in el.findall("./koversion"): + print(f"{ind * (level + 1) * indent}# {node.tag}: \"{node.text}\"") + + # /usr/local/cuda-12.8 + # overrides the install location + # unused + # for node in el.findall("./installPath"): + # print(f"{ind * (level + 1) * indent}# {node.tag}: \"{node.text}\"") + + # ./builds/cuda_cccl/ + # path where the package files are found + # we cd into it + for node in el.findall("./buildPath"): + path = node.text.removeprefix('./') + print(f"{ind * (level + 1) * indent}cd \"${{S}}/{path}\" || die \"cd ${{S}}/{path} failed\"") + print() + + # bin + # would install empty dirs + # unused + # for node in el.findall("./dir"): + # pass + + # .* + # targets/x86_64-linux/lib/.*\.so + # regex glob of files to install. + for node in el.findall("./file"): + # unescape '.*' -> '*' & '\.' -> '.' + file = (node.text + .replace(".*", "*") + .replace(r"\.", ".") + .replace("x86_64", "${narch}") + .replace("sbsa", "${narch}") + ) + + # optional dir offset, we merge it into path + dir = "" + if "dir" in node.attrib: + dir = f" \"{Path(node.attrib["dir"])}\"" + + filepath = basedir / path / file + + # ignore existing symlinks ( include, lib* ) and the uninstallers + if not filepath.is_symlink() and not file.endswith("-uninstaller"): + print(f"{ind * (level + 1) * indent}dofile \"{file}\"{dir}") + + # opencl-12.8.pc + # create a pkgconfig file for the given description and lib name/version + for node in el.findall("./pcfile"): + offset = node.text.rfind('-') + if offset == -1: + raise RuntimeError(f"failed to split pcfile {node.text}") + + lib_name = node.text[:offset] + + if not node.text.endswith('.pc'): + raise RuntimeError(f"pcfile does not end in '.pc' {node.text}") + lib_version = node.text[offset+1:-3] + + if "description" not in node.attrib: + raise RuntimeError(f"no description for {node.text}") + + subdir = "" + if "subdir" in node.attrib: + subdir = f" \"{node.attrib["subdir"]}\"" + + print(f"{ind * (level + 1) * indent}dopcfile " + f"\"{lib_name}\" " + f"\"{lib_version}\" " + f"\"{node.attrib["description"]}\"{subdir}") + + # + # create a .desktop file + for node in el.findall("./desktopFile"): + print(f"{ind * (level + 1) * indent}dodesktopFile \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["filename"]}\" \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["name"]}\" \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["categories"]}\" \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["keywords"]}\" \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["iconPath"]}\" \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["execPath"]}\" \\") + print(f"{ind * (level + 2) * indent}\"{node.attrib["tryExecPath"]}\"") + + # iterator over all nested packages + for node in el.findall("./package"): + p_package(node, level + 1) + + print(f"{ind * (level + 0) * indent}fi") + + p_package(e) + + +if __name__ == "__main__": + main() diff --git a/dev-util/nvidia-cuda-toolkit/metadata.xml b/dev-util/nvidia-cuda-toolkit/metadata.xml new file mode 100644 index 0000000..ae4d401 --- /dev/null +++ b/dev-util/nvidia-cuda-toolkit/metadata.xml @@ -0,0 +1,16 @@ + + + + + sci@gentoo.org + Gentoo Science Project + + + Install the CUDA debugger + Install profiling and optimizing tools (nsight-compute, nsight-systems) + Install the NVIDIA CUDA profiler (nvprof) and the related libraries + Enable infiniband support via sys-cluster/rdma-core + Install compute-sanitizer tool + Install the NVIDIA CUDA visual profiler (nvvp) + + diff --git a/dev-util/nvidia-cuda-toolkit/nvidia-cuda-toolkit-12.8.1.ebuild b/dev-util/nvidia-cuda-toolkit/nvidia-cuda-toolkit-12.8.1.ebuild new file mode 100644 index 0000000..bb3eba4 --- /dev/null +++ b/dev-util/nvidia-cuda-toolkit/nvidia-cuda-toolkit-12.8.1.ebuild @@ -0,0 +1,372 @@ +# Copyright 1999-2025 Gentoo Authors +# Distributed under the terms of the GNU General Public License v2 + +# shellcheck disable=SC2317 + +EAPI=8 + +PYTHON_COMPAT=( python3_{10..13} ) +inherit check-reqs toolchain-funcs +inherit python-r1 + +DRIVER_PV="570.124.06" +GCC_MAX_VER="14" +CLANG_MAX_VER="19" + +DESCRIPTION="NVIDIA CUDA Toolkit (compiler and friends)" +HOMEPAGE="https://developer.nvidia.com/cuda-zone" +SRC_URI=" + amd64? ( + https://developer.download.nvidia.com/compute/cuda/${PV}/local_installers/cuda_${PV}_${DRIVER_PV}_linux.run + ) + arm64? ( + https://developer.download.nvidia.com/compute/cuda/${PV}/local_installers/cuda_${PV}_${DRIVER_PV}_linux_sbsa.run + ) +" +S="${WORKDIR}" + +LICENSE="NVIDIA-CUDA" + +SLOT="0/${PV}" # UNSLOTTED +# SLOT="${PV}" # SLOTTED + +KEYWORDS="-* ~amd64 ~arm64 ~amd64-linux ~arm64-linux" +IUSE="debugger examples profiler rdma sanitizer" +RESTRICT="bindist mirror strip test" + +REQUIRED_USE="${PYTHON_REQUIRED_USE}" + +# since CUDA 11, the bundled toolkit driver (== ${DRIVER_PV}) and the +# actual required minimum driver version are different. +RDEPEND=" + || ( + ${ED} ${_DESTDIR}" + } + + dopcfile() { + [[ $# -eq 0 ]] && return + + dodir "${CUDA_PATH}/pkgconfig" + cat > "${ED}${CUDA_PATH}/pkgconfig/${1}-${2}.pc" <<-EOF || die "dopcfile" + cudaroot=${EPREFIX}${CUDA_PATH} + libdir=\${cudaroot}/targets/${narch}-linux/lib${4} + includedir=\${cudaroot}/targets/${narch}-linux/include + + Name: ${1} + Description: ${3} + Version: ${2} + Libs: -L\${libdir} -l${1} + Cflags: -I\${includedir} + EOF + } + + pushd builds >/dev/null || die + fix_executable_bit=( + cuda_cupti/extras/CUPTI/samples/pc_sampling_utility/pc_sampling_utility_helper.h + cuda_cupti/extras/CUPTI/samples/pc_sampling_continuous/libpc_sampling_continuous.pl + + libcufile/gds/tools/run_gdsio.cfg + ) + + if use amd64; then + fix_executable_bit+=( + cuda_opencl/targets/*/include/CL/cl.hpp + + libcufile/targets/*/lib/libcufile_rdma_static.a + libcufile/targets/*/lib/libcufile_static.a + ) + fi + chmod -x "${fix_executable_bit[@]}" || die "failed chmod" + popd >/dev/null || die + + ebegin "parsing manifest" "${S}/manifests/cuda_"*.xml # {{{ + + "${EPYTHON}" "${FILESDIR}/parse_manifest.py" "${S}/manifests/cuda_"*".xml" &> "${T}/install.sh" \ + || die "failed to parse manifest" + # shellcheck disable=SC1091 + source "${T}/install.sh" || die "failed to source install script" + + eend $? # }}} + + if use debugger; then + if [[ -d "${ED}/${CUDA_PATH}/extras/Debugger/lib64" ]]; then + rmdir "${ED}/${CUDA_PATH}/extras/Debugger/lib64" || die "remove debugger lib64" + fi + + find "${ED}/${CUDA_PATH}/bin" -maxdepth 1 -name "cuda-gdb-*-tui" -print0 | while read -rd $'\0' tui_name; do + impl="$(basename "${tui_name}" | cut -d '-' -f 3 | tr '.' '_')" + + if ! has "${impl}" "${PYTHON_COMPAT[@]}" || ! use "python_targets_${impl}"; then + rm "${tui_name}" || die "tui-name rm ${tui_name}" + sed -e "/$(basename "${tui_name}")\"/d" -i "${ED}/${CUDA_PATH}/bin/cuda-gdb" || die "tui_name sed" + fi + done + fi + + # remove rdma libs (unless USE=rdma) + if ! use rdma; then + rm "${ED}/${CUDA_PATH}/targets/${narch}-linux/lib/libcufile_rdma"* || die "failed to remove rdma files" + fi + + # Add include and lib symlinks + dosym "targets/${narch}-linux/include" "${CUDA_PATH}/include" + dosym "targets/${narch}-linux/lib" "${CUDA_PATH}/lib64" + + find "${ED}/${CUDA_PATH}" -empty -delete || die + + local ldpathextradirs pathextradirs + + use debugger && ldpathextradirs+=":${EPREFIX}${CUDA_PATH}/extras/Debugger/lib64" + use profiler && ldpathextradirs+=":${EPREFIX}${CUDA_PATH}/extras/CUPTI/lib64" + + local revord=$(( 999999 - $(printf "%02d%02d%02d" "$(ver_cut 1)" "$(ver_cut 2)" "$(ver_cut 3)") )) + newenvd - "99cuda${revord}" <<-EOF + PATH=${EPREFIX}${CUDA_PATH}/bin${pathextradirs} + PKG_CONFIG_PATH=${EPREFIX}${CUDA_PATH}/pkgconfig + LDPATH=${EPREFIX}${CUDA_PATH}/lib64:${EPREFIX}${CUDA_PATH}/nvvm/lib64${ldpathextradirs} + EOF + + # CUDA prepackages libraries, don't revdep-build on them + insinto /etc/revdep-rebuild + newins - "80${PN}${revord}" <<-EOF + SEARCH_DIRS_MASK="${EPREFIX}${CUDA_PATH}" + EOF + + # https://bugs.gentoo.org/926116 + insinto /etc/sandbox.d + newins - "80${PN}" <<-EOF + SANDBOX_PREDICT="/proc/self/task" + EOF + + # TODO drop and replace with runtime detection similar to what python does {{{ + # ATTENTION: change requires revbump, see link below for supported GCC # versions + # https://docs.nvidia.com/cuda/cuda-installation-guide-linux/index.html#system-requirements + local cuda_supported_gcc=( 8.5 9.5 10 11 12 13 "${GCC_MAX_VER}" ) + + sed \ + -e "s:CUDA_SUPPORTED_GCC:${cuda_supported_gcc[*]}:g" \ + "${FILESDIR}"/cuda-config.in > "${ED}/${CUDA_PATH}/bin/cuda-config" || die + fperms +x "${CUDA_PATH}/bin/cuda-config" + # }}} + + # skip til cudnn has been changed #950207 + # if [[ "${SLOT}" != "${PV}" ]]; then + # dosym "${CUDA_PATH}" "${CUDA_PATH%"-${PV}"}" + # fi + + fowners -R root:root "${CUDA_PATH}" +} + +pkg_postinst_check() { + if tc-is-gcc && + ver_test "$(gcc-major-version)" -gt "${GCC_MAX_VER}"; then + ewarn + ewarn "gcc > ${GCC_MAX_VER} will not work with CUDA" + ewarn + ewarn "Append --ccbin= pointing to a gcc bindir to the nvcc compiler flags (NVCCFLAGS)" + ewarn "or set NVCC_CCBIN to the same bindir." + ewarn " NVCCFLAGS=\"--ccbin=$(eval echo "${EPREFIX}/usr/*-linux-gnu/gcc-bin/${GCC_MAX_VER}")\"" + ewarn " NVCC_CCBIN=$(eval echo "${EPREFIX}/usr/*-linux-gnu/gcc-bin/${GCC_MAX_VER}")" + ewarn + fi + + if tc-is-clang && + ver_test "$(clang-major-version)" -gt "${CLANG_MAX_VER}"; then + ewarn + ewarn "clang > ${CLANG_MAX_VER} will not work with CUDA" + ewarn + ewarn "Append --ccbin= pointing to a clang bindir to the nvcc compiler flags (NVCCFLAGS)" + ewarn "or set NVCC_CCBIN to the same bindir." + ewarn " NVCCFLAGS=\"--ccbin=$(eval echo "${EPREFIX}/usr/lib/llvm/*/bin${CLANG_MAX_VER}")\"" + ewarn " NVCC_CCBIN=$(eval echo "${EPREFIX}/usr/lib/llvm/*/bin${CLANG_MAX_VER}")" + ewarn + fi +} + +pkg_postinst() { + if [[ ${MERGE_TYPE} != binary ]]; then + pkg_postinst_check + fi + + if use profiler; then + einfo + einfo "nvidia-drivers restricts access to performance counters." + einfo "You'll need to run profiling tools (nvprof) " + einfo "using sudo (needs cap SYS_ADMIN) or add the following line to " + einfo "a modprobe configuration file " + einfo "(e.g. /etc/modprobe.d/nvidia-prof.conf): " + einfo + einfo "options nvidia NVreg_RestrictProfilingToAdminUsers=0" + einfo + fi +} diff --git a/metadata/md5-cache/dev-util/nvidia-cuda-toolkit-12.8.1 b/metadata/md5-cache/dev-util/nvidia-cuda-toolkit-12.8.1 new file mode 100644 index 0000000..05b436a --- /dev/null +++ b/metadata/md5-cache/dev-util/nvidia-cuda-toolkit-12.8.1 @@ -0,0 +1,16 @@ +BDEPEND=|| ( ( dev-lang/python:3.13 dev-python/defusedxml[python_targets_python3_13(-)] ) ( dev-lang/python:3.12 dev-python/defusedxml[python_targets_python3_12(-)] ) ( dev-lang/python:3.11 dev-python/defusedxml[python_targets_python3_11(-)] ) ( dev-lang/python:3.10 dev-python/defusedxml[python_targets_python3_10(-)] ) ) +DEFINED_PHASES=compile configure install postinst pretend setup unpack +DESCRIPTION=NVIDIA CUDA Toolkit (compiler and friends) +EAPI=8 +HOMEPAGE=https://developer.nvidia.com/cuda-zone +INHERIT=check-reqs toolchain-funcs python-r1 +IUSE=debugger examples profiler rdma sanitizer python_targets_python3_10 python_targets_python3_11 python_targets_python3_12 python_targets_python3_13 +KEYWORDS=-* ~amd64 ~arm64 ~amd64-linux ~arm64-linux +LICENSE=NVIDIA-CUDA +RDEPEND=|| (