Merge pull request #299578 from ConnorBaker/fix/treewide-cuda-reformat-nixfmt-rfc-style-2024-03-01

treewide: CUDA reformat with `nixfmt-rfc-style`
This commit is contained in:
Silvan Mosberger
2024-04-02 20:57:36 +02:00
committed by GitHub
36 changed files with 1027 additions and 994 deletions

View File

@@ -102,3 +102,6 @@ fb0e5be84331188a69b3edd31679ca6576edb75a
# systemd: break too long lines of Nix code # systemd: break too long lines of Nix code
67643f8ec84bef1482204709073e417c9f07eb87 67643f8ec84bef1482204709073e417c9f07eb87
# {pkgs/development/cuda-modules,pkgs/test/cuda,pkgs/top-level/cuda-packages.nix}: reformat all CUDA files with nixfmt-rfc-style 2024-03-01
802a1b4d3338f24cbc4efd704616654456d75a94

50
.github/workflows/check-nix-format.yml vendored Normal file
View File

@@ -0,0 +1,50 @@
# This file was copied mostly from check-maintainers-sorted.yaml.
# NOTE: Formatting with the RFC-style nixfmt command is not yet stable. See
# https://github.com/NixOS/rfcs/pull/166.
# Because of this, this action is not yet enabled for all files -- only for
# those that have opted in.
name: Check that Nix files are formatted

on:
  pull_request_target:

# The workflow only needs to read the repository contents.
permissions:
  contents: read

jobs:
  nixos:
    runs-on: ubuntu-latest
    # Skip the job on forks outside the NixOS organisation.
    if: github.repository_owner == 'NixOS'
    steps:
      - uses: actions/checkout@9bb56186c3b09b4f86b1c65136769dd318469633 # v4.1.2
        with:
          # pull_request_target checks out the base branch by default
          # NOTE(review): the merge ref contains code from the pull request,
          # and the "Install nixfmt" step below evaluates default.nix from
          # this checkout. The token is limited to `contents: read` above;
          # confirm that this is an acceptable exposure for
          # pull_request_target.
          ref: refs/pull/${{ github.event.pull_request.number }}/merge
      - uses: cachix/install-nix-action@8887e596b4ee1134dae06b98d573bd674693f47c # v26
        with:
          # explicitly enable sandbox
          extra_nix_config: sandbox = true
      - name: Install nixfmt
        run: nix-env -f default.nix -iAP nixfmt-rfc-style
      - name: Check that Nix files are formatted according to the RFC style
        # Each environment variable beginning with NIX_FMT_PATHS_ is a list of
        # paths to check with nixfmt, one path per line.
        env:
          # Format paths related to the Nixpkgs CUDA ecosystem.
          NIX_FMT_PATHS_CUDA: |
            pkgs/development/cuda-modules
            pkgs/test/cuda
            pkgs/top-level/cuda-packages.nix
        # Iterate over all environment variables beginning with NIX_FMT_PATHS_.
        run: |
          for env_var in "${!NIX_FMT_PATHS_@}"; do
            # Split the value on newlines and drop blank entries. The
            # here-string appends a newline, and a `|` block scalar may already
            # end with one, so a naive split can yield empty paths.
            paths=()
            while IFS= read -r path; do
              if [[ -n "$path" ]]; then
                paths+=("$path")
              fi
            done <<< "${!env_var}"
            # Fail loudly if a variable was declared without any real path.
            if (( ${#paths[@]} == 0 )); then
              echo "Error: $env_var is empty."
              exit 1
            fi
            # Use [*] so the list is joined into the single message string.
            echo "Checking paths: ${paths[*]}"
            if ! nixfmt --check "${paths[@]}"; then
              echo "Error: nixfmt failed."
              exit 1
            fi
          done

View File

@@ -21,6 +21,6 @@ let
assertCondition = true; assertCondition = true;
in in
/* TODO: Consider testing whether we in fact use the newer libstdc++ */ # TODO: Consider testing whether we in fact use the newer libstdc++
lib.extendDerivation assertCondition passthruExtra cudaStdenv lib.extendDerivation assertCondition passthruExtra cudaStdenv

View File

@@ -1,4 +1,4 @@
{hostPlatform, lib}: { hostPlatform, lib }:
let let
# Samples are built around the CUDA Toolkit, which is not available for # Samples are built around the CUDA Toolkit, which is not available for
# aarch64. Check for both CUDA version and platform. # aarch64. Check for both CUDA version and platform.
@@ -8,7 +8,7 @@ let
extension = extension =
final: _: final: _:
lib.attrsets.optionalAttrs platformIsSupported { lib.attrsets.optionalAttrs platformIsSupported {
cuda-library-samples = final.callPackage ./generic.nix {}; cuda-library-samples = final.callPackage ./generic.nix { };
}; };
in in
extension extension

View File

@@ -22,7 +22,7 @@ let
cmake cmake
addOpenGLRunpath addOpenGLRunpath
]; ];
buildInputs = [cudatoolkit]; buildInputs = [ cudatoolkit ];
postFixup = '' postFixup = ''
for exe in $out/bin/*; do for exe in $out/bin/*; do
addOpenGLRunpath $exe addOpenGLRunpath $exe
@@ -36,7 +36,7 @@ let
cuSPARSE, cuSOLVER, cuFFT, cuRAND, NPP and nvJPEG. cuSPARSE, cuSOLVER, cuFFT, cuRAND, NPP and nvJPEG.
''; '';
license = lib.licenses.bsd3; license = lib.licenses.bsd3;
maintainers = with lib.maintainers; [obsidian-systems-maintenance] ++ lib.teams.cuda.members; maintainers = with lib.maintainers; [ obsidian-systems-maintenance ] ++ lib.teams.cuda.members;
}; };
}; };
in in
@@ -69,9 +69,9 @@ in
src = "${src}/cuTENSOR"; src = "${src}/cuTENSOR";
buildInputs = [cutensor]; buildInputs = [ cutensor ];
cmakeFlags = ["-DCUTENSOR_EXAMPLE_BINARY_INSTALL_DIR=${builtins.placeholder "out"}/bin"]; cmakeFlags = [ "-DCUTENSOR_EXAMPLE_BINARY_INSTALL_DIR=${builtins.placeholder "out"}/bin" ];
# CUTENSOR_ROOT is double escaped # CUTENSOR_ROOT is double escaped
postPatch = '' postPatch = ''

View File

@@ -15,65 +15,63 @@
let let
inherit (lib) lists strings; inherit (lib) lists strings;
in in
backendStdenv.mkDerivation ( backendStdenv.mkDerivation (finalAttrs: {
finalAttrs: { strictDeps = true;
strictDeps = true;
pname = "cuda-samples"; pname = "cuda-samples";
version = cudaVersion; version = cudaVersion;
src = fetchFromGitHub { src = fetchFromGitHub {
owner = "NVIDIA"; owner = "NVIDIA";
repo = finalAttrs.pname; repo = finalAttrs.pname;
rev = "v${finalAttrs.version}"; rev = "v${finalAttrs.version}";
inherit hash; inherit hash;
}; };
nativeBuildInputs = nativeBuildInputs =
[ [
autoAddDriverRunpath autoAddDriverRunpath
pkg-config pkg-config
] ]
# CMake has to run as a native, build-time dependency for libNVVM samples. # CMake has to run as a native, build-time dependency for libNVVM samples.
# However, it's not the primary build tool -- that's still make. # However, it's not the primary build tool -- that's still make.
# As such, we disable CMake's build system. # As such, we disable CMake's build system.
++ lists.optionals (strings.versionAtLeast finalAttrs.version "12.2") [cmake]; ++ lists.optionals (strings.versionAtLeast finalAttrs.version "12.2") [ cmake ];
dontUseCmakeConfigure = true; dontUseCmakeConfigure = true;
buildInputs = [ buildInputs = [
cudatoolkit cudatoolkit
freeimage freeimage
glfw3 glfw3
]; ];
# See https://github.com/NVIDIA/cuda-samples/issues/75. # See https://github.com/NVIDIA/cuda-samples/issues/75.
patches = lib.optionals (finalAttrs.version == "11.3") [ patches = lib.optionals (finalAttrs.version == "11.3") [
(fetchpatch { (fetchpatch {
url = "https://github.com/NVIDIA/cuda-samples/commit/5c3ec60faeb7a3c4ad9372c99114d7bb922fda8d.patch"; url = "https://github.com/NVIDIA/cuda-samples/commit/5c3ec60faeb7a3c4ad9372c99114d7bb922fda8d.patch";
hash = "sha256-0XxdmNK9MPpHwv8+qECJTvXGlFxc+fIbta4ynYprfpU="; hash = "sha256-0XxdmNK9MPpHwv8+qECJTvXGlFxc+fIbta4ynYprfpU=";
}) })
]; ];
enableParallelBuilding = true; enableParallelBuilding = true;
preConfigure = '' preConfigure = ''
export CUDA_PATH=${cudatoolkit} export CUDA_PATH=${cudatoolkit}
''; '';
installPhase = '' installPhase = ''
runHook preInstall runHook preInstall
install -Dm755 -t $out/bin bin/${backendStdenv.hostPlatform.parsed.cpu.name}/${backendStdenv.hostPlatform.parsed.kernel.name}/release/* install -Dm755 -t $out/bin bin/${backendStdenv.hostPlatform.parsed.cpu.name}/${backendStdenv.hostPlatform.parsed.kernel.name}/release/*
runHook postInstall runHook postInstall
''; '';
meta = { meta = {
description = "Samples for CUDA Developers which demonstrates features in CUDA Toolkit"; description = "Samples for CUDA Developers which demonstrates features in CUDA Toolkit";
# CUDA itself is proprietary, but these sample apps are not. # CUDA itself is proprietary, but these sample apps are not.
license = lib.licenses.bsd3; license = lib.licenses.bsd3;
maintainers = with lib.maintainers; [obsidian-systems-maintenance] ++ lib.teams.cuda.members; maintainers = with lib.maintainers; [ obsidian-systems-maintenance ] ++ lib.teams.cuda.members;
}; };
} })
)

View File

@@ -1,4 +1,4 @@
{cudaVersion, lib}: { cudaVersion, lib }:
let let
inherit (lib) attrsets modules trivial; inherit (lib) attrsets modules trivial;
redistName = "cuda"; redistName = "cuda";
@@ -63,23 +63,21 @@ let
featureRelease featureRelease
; ;
}).overrideAttrs }).overrideAttrs
( (prevAttrs: {
prevAttrs: { # Add the package-specific license.
# Add the package-specific license. meta = prevAttrs.meta // {
meta = prevAttrs.meta // { license =
license = let
let licensePath =
licensePath = if redistribRelease.license_path != null then
if redistribRelease.license_path != null then redistribRelease.license_path
redistribRelease.license_path else
else "${pname}/LICENSE.txt";
"${pname}/LICENSE.txt"; url = "https://developer.download.nvidia.com/compute/cuda/redist/${licensePath}";
url = "https://developer.download.nvidia.com/compute/cuda/redist/${licensePath}"; in
in lib.licenses.nvidiaCudaRedist // { inherit url; };
lib.licenses.nvidiaCudaRedist // {inherit url;}; };
}; });
}
);
in in
drv; drv;

View File

@@ -1,4 +1,8 @@
{cudaVersion, lib, addDriverRunpath}: {
cudaVersion,
lib,
addDriverRunpath,
}:
let let
inherit (lib) attrsets lists strings; inherit (lib) attrsets lists strings;
# cudaVersionOlder : Version -> Boolean # cudaVersionOlder : Version -> Boolean
@@ -8,96 +12,92 @@ let
addBuildInputs = addBuildInputs =
drv: buildInputs: drv: buildInputs:
drv.overrideAttrs (prevAttrs: {buildInputs = prevAttrs.buildInputs ++ buildInputs;}); drv.overrideAttrs (prevAttrs: {
buildInputs = prevAttrs.buildInputs ++ buildInputs;
});
in in
# NOTE: Filter out attributes that are not present in the previous version of # NOTE: Filter out attributes that are not present in the previous version of
# the package set. This is necessary to prevent the appearance of attributes # the package set. This is necessary to prevent the appearance of attributes
# like `cuda_nvcc` in `cudaPackages_10_0`, which predates redistributables. # like `cuda_nvcc` in `cudaPackages_10_0`, which predates redistributables.
final: prev: final: prev:
attrsets.filterAttrs (attr: _: (builtins.hasAttr attr prev)) { attrsets.filterAttrs (attr: _: (builtins.hasAttr attr prev)) {
libcufile = prev.libcufile.overrideAttrs ( libcufile = prev.libcufile.overrideAttrs (prevAttrs: {
prevAttrs: { buildInputs = prevAttrs.buildInputs ++ [
buildInputs = prevAttrs.buildInputs ++ [ final.libcublas.lib
final.libcublas.lib final.pkgs.numactl
final.pkgs.numactl final.pkgs.rdma-core
final.pkgs.rdma-core ];
]; # Before 11.7 libcufile depends on itself for some reason.
# Before 11.7 libcufile depends on itself for some reason. autoPatchelfIgnoreMissingDeps =
autoPatchelfIgnoreMissingDeps = prevAttrs.autoPatchelfIgnoreMissingDeps
prevAttrs.autoPatchelfIgnoreMissingDeps ++ lists.optionals (cudaVersionOlder "11.7") [ "libcufile.so.0" ];
++ lists.optionals (cudaVersionOlder "11.7") [ "libcufile.so.0" ]; });
}
);
libcusolver = addBuildInputs prev.libcusolver ( libcusolver = addBuildInputs prev.libcusolver (
# Always depends on this # Always depends on this
[final.libcublas.lib] [ final.libcublas.lib ]
# Dependency from 12.0 and on # Dependency from 12.0 and on
++ lists.optionals (cudaVersionAtLeast "12.0") [final.libnvjitlink.lib] ++ lists.optionals (cudaVersionAtLeast "12.0") [ final.libnvjitlink.lib ]
# Dependency from 12.1 and on # Dependency from 12.1 and on
++ lists.optionals (cudaVersionAtLeast "12.1") [final.libcusparse.lib] ++ lists.optionals (cudaVersionAtLeast "12.1") [ final.libcusparse.lib ]
); );
libcusparse = addBuildInputs prev.libcusparse ( libcusparse = addBuildInputs prev.libcusparse (
lists.optionals (cudaVersionAtLeast "12.0") [final.libnvjitlink.lib] lists.optionals (cudaVersionAtLeast "12.0") [ final.libnvjitlink.lib ]
); );
cuda_cudart = prev.cuda_cudart.overrideAttrs ( cuda_cudart = prev.cuda_cudart.overrideAttrs (prevAttrs: {
prevAttrs: { # Remove once cuda-find-redist-features has a special case for libcuda
# Remove once cuda-find-redist-features has a special case for libcuda outputs =
outputs = prevAttrs.outputs
prevAttrs.outputs ++ lists.optionals (!(builtins.elem "stubs" prevAttrs.outputs)) [ "stubs" ];
++ lists.optionals (!(builtins.elem "stubs" prevAttrs.outputs)) [ "stubs" ];
allowFHSReferences = false; allowFHSReferences = false;
# The libcuda stub's pkg-config doesn't follow the general pattern: # The libcuda stub's pkg-config doesn't follow the general pattern:
postPatch = postPatch =
prevAttrs.postPatch or "" prevAttrs.postPatch or ""
+ '' + ''
while IFS= read -r -d $'\0' path ; do while IFS= read -r -d $'\0' path ; do
sed -i \ sed -i \
-e "s|^libdir\s*=.*/lib\$|libdir=''${!outputLib}/lib/stubs|" \ -e "s|^libdir\s*=.*/lib\$|libdir=''${!outputLib}/lib/stubs|" \
-e "s|^Libs\s*:\(.*\)\$|Libs: \1 -Wl,-rpath,${addDriverRunpath.driverLink}/lib|" \ -e "s|^Libs\s*:\(.*\)\$|Libs: \1 -Wl,-rpath,${addDriverRunpath.driverLink}/lib|" \
"$path" "$path"
done < <(find -iname 'cuda-*.pc' -print0) done < <(find -iname 'cuda-*.pc' -print0)
'' ''
+ '' + ''
# Namelink may not be enough, add a soname. # Namelink may not be enough, add a soname.
# Cf. https://gitlab.kitware.com/cmake/cmake/-/issues/25536 # Cf. https://gitlab.kitware.com/cmake/cmake/-/issues/25536
if [[ -f lib/stubs/libcuda.so && ! -f lib/stubs/libcuda.so.1 ]] ; then if [[ -f lib/stubs/libcuda.so && ! -f lib/stubs/libcuda.so.1 ]] ; then
ln -s libcuda.so lib/stubs/libcuda.so.1 ln -s libcuda.so lib/stubs/libcuda.so.1
fi fi
''; '';
postFixup = postFixup =
prevAttrs.postFixup or "" prevAttrs.postFixup or ""
+ '' + ''
moveToOutput lib/stubs "$stubs" moveToOutput lib/stubs "$stubs"
ln -s "$stubs"/lib/stubs/* "$stubs"/lib/ ln -s "$stubs"/lib/stubs/* "$stubs"/lib/
ln -s "$stubs"/lib/stubs "''${!outputLib}/lib/stubs" ln -s "$stubs"/lib/stubs "''${!outputLib}/lib/stubs"
''; '';
} });
);
cuda_compat = prev.cuda_compat.overrideAttrs ( cuda_compat = prev.cuda_compat.overrideAttrs (prevAttrs: {
prevAttrs: { autoPatchelfIgnoreMissingDeps = prevAttrs.autoPatchelfIgnoreMissingDeps ++ [
autoPatchelfIgnoreMissingDeps = prevAttrs.autoPatchelfIgnoreMissingDeps ++ [ "libnvrm_gpu.so"
"libnvrm_gpu.so" "libnvrm_mem.so"
"libnvrm_mem.so" "libnvdla_runtime.so"
"libnvdla_runtime.so" ];
]; # `cuda_compat` only works on aarch64-linux, and only when building for Jetson devices.
# `cuda_compat` only works on aarch64-linux, and only when building for Jetson devices. badPlatformsConditions = prevAttrs.badPlatformsConditions // {
badPlatformsConditions = prevAttrs.badPlatformsConditions // { "Trying to use cuda_compat on aarch64-linux targeting non-Jetson devices" =
"Trying to use cuda_compat on aarch64-linux targeting non-Jetson devices" = !final.flags.isJetsonBuild;
!final.flags.isJetsonBuild; };
}; });
}
);
cuda_gdb = addBuildInputs prev.cuda_gdb ( cuda_gdb = addBuildInputs prev.cuda_gdb (
# x86_64 only needs gmp from 12.0 and on # x86_64 only needs gmp from 12.0 and on
lists.optionals (cudaVersionAtLeast "12.0") [final.pkgs.gmp] lists.optionals (cudaVersionAtLeast "12.0") [ final.pkgs.gmp ]
); );
cuda_nvcc = prev.cuda_nvcc.overrideAttrs ( cuda_nvcc = prev.cuda_nvcc.overrideAttrs (
@@ -176,9 +176,9 @@ attrsets.filterAttrs (attr: _: (builtins.hasAttr attr prev)) {
} }
); );
cuda_nvprof = prev.cuda_nvprof.overrideAttrs ( cuda_nvprof = prev.cuda_nvprof.overrideAttrs (prevAttrs: {
prevAttrs: {buildInputs = prevAttrs.buildInputs ++ [final.cuda_cupti.lib];} buildInputs = prevAttrs.buildInputs ++ [ final.cuda_cupti.lib ];
); });
cuda_demo_suite = addBuildInputs prev.cuda_demo_suite [ cuda_demo_suite = addBuildInputs prev.cuda_demo_suite [
final.pkgs.freeglut final.pkgs.freeglut
@@ -189,26 +189,24 @@ attrsets.filterAttrs (attr: _: (builtins.hasAttr attr prev)) {
final.libcurand.lib final.libcurand.lib
]; ];
nsight_compute = prev.nsight_compute.overrideAttrs ( nsight_compute = prev.nsight_compute.overrideAttrs (prevAttrs: {
prevAttrs: { nativeBuildInputs =
nativeBuildInputs = prevAttrs.nativeBuildInputs
prevAttrs.nativeBuildInputs ++ (
++ ( if (strings.versionOlder prev.nsight_compute.version "2022.2.0") then
if (strings.versionOlder prev.nsight_compute.version "2022.2.0") then [ final.pkgs.qt5.wrapQtAppsHook ]
[final.pkgs.qt5.wrapQtAppsHook] else
else [ final.pkgs.qt6.wrapQtAppsHook ]
[final.pkgs.qt6.wrapQtAppsHook] );
); buildInputs =
buildInputs = prevAttrs.buildInputs
prevAttrs.buildInputs ++ (
++ ( if (strings.versionOlder prev.nsight_compute.version "2022.2.0") then
if (strings.versionOlder prev.nsight_compute.version "2022.2.0") then [ final.pkgs.qt5.qtwebview ]
[final.pkgs.qt5.qtwebview] else
else [ final.pkgs.qt6.qtwebview ]
[final.pkgs.qt6.qtwebview] );
); });
}
);
nsight_systems = prev.nsight_systems.overrideAttrs ( nsight_systems = prev.nsight_systems.overrideAttrs (
prevAttrs: prevAttrs:

View File

@@ -1,6 +1,6 @@
{ {
cudaVersion, cudaVersion,
runPatches ? [], runPatches ? [ ],
autoPatchelfHook, autoPatchelfHook,
autoAddDriverRunpath, autoAddDriverRunpath,
addOpenGLRunpath, addOpenGLRunpath,
@@ -61,7 +61,7 @@ backendStdenv.mkDerivation rec {
dontPatchELF = true; dontPatchELF = true;
dontStrip = true; dontStrip = true;
src = fetchurl {inherit (release) url sha256;}; src = fetchurl { inherit (release) url sha256; };
outputs = [ outputs = [
"out" "out"
@@ -79,9 +79,9 @@ backendStdenv.mkDerivation rec {
autoAddDriverRunpath autoAddDriverRunpath
markForCudatoolkitRootHook markForCudatoolkitRootHook
] ]
++ lib.optionals (lib.versionOlder version "11") [libsForQt5.wrapQtAppsHook] ++ lib.optionals (lib.versionOlder version "11") [ libsForQt5.wrapQtAppsHook ]
++ lib.optionals (lib.versionAtLeast version "11.8") [qt6Packages.wrapQtAppsHook]; ++ lib.optionals (lib.versionAtLeast version "11.8") [ qt6Packages.wrapQtAppsHook ];
propagatedBuildInputs = [setupCudaHook]; propagatedBuildInputs = [ setupCudaHook ];
buildInputs = buildInputs =
lib.optionals (lib.versionOlder version "11") [ lib.optionals (lib.versionOlder version "11") [
libsForQt5.qt5.qtwebengine libsForQt5.qt5.qtwebengine
@@ -130,7 +130,7 @@ backendStdenv.mkDerivation rec {
(lib.getLib libtiff) (lib.getLib libtiff)
qt6Packages.qtwayland qt6Packages.qtwayland
rdma-core rdma-core
(ucx.override {enableCuda = false;}) # Avoid infinite recursion (ucx.override { enableCuda = false; }) # Avoid infinite recursion
xorg.libxshmfence xorg.libxshmfence
xorg.libxkbfile xorg.libxkbfile
] ]
@@ -144,17 +144,15 @@ backendStdenv.mkDerivation rec {
gst_all_1.gstreamer gst_all_1.gstreamer
gst_all_1.gst-plugins-base gst_all_1.gst-plugins-base
]) ])
++ ( ++ (with qt6; [
with qt6; [ qtmultimedia
qtmultimedia qttools
qttools qtpositioning
qtpositioning qtscxml
qtscxml qtsvg
qtsvg qtwebchannel
qtwebchannel qtwebengine
qtwebengine ])
]
)
)); ));
# Prepended to runpaths by autoPatchelf. # Prepended to runpaths by autoPatchelf.
@@ -170,26 +168,28 @@ backendStdenv.mkDerivation rec {
"${placeholder "out"}/nvvm/lib64" "${placeholder "out"}/nvvm/lib64"
]; ];
autoPatchelfIgnoreMissingDeps = [ autoPatchelfIgnoreMissingDeps =
# This is the hardware-dependent userspace driver that comes from [
# nvidia_x11 package. It must be deployed at runtime in # This is the hardware-dependent userspace driver that comes from
# /run/opengl-driver/lib or pointed at by LD_LIBRARY_PATH variable, rather # nvidia_x11 package. It must be deployed at runtime in
# than pinned in runpath # /run/opengl-driver/lib or pointed at by LD_LIBRARY_PATH variable, rather
"libcuda.so.1" # than pinned in runpath
"libcuda.so.1"
# The krb5 expression ships libcom_err.so.3 but cudatoolkit asks for the # The krb5 expression ships libcom_err.so.3 but cudatoolkit asks for the
# older # older
# This dependency is asked for by target-linux-x64/CollectX/RedHat/x86_64/libssl.so.10 # This dependency is asked for by target-linux-x64/CollectX/RedHat/x86_64/libssl.so.10
# - do we even want to use nvidia-shipped libssl? # - do we even want to use nvidia-shipped libssl?
"libcom_err.so.2" "libcom_err.so.2"
] ++ lib.optionals (lib.versionOlder version "10.1") [ ]
# For Cuda 10.0, nVidia also shipped a jre implementation which needed ++ lib.optionals (lib.versionOlder version "10.1") [
# two old versions of ffmpeg which are not available in nixpkgs # For Cuda 10.0, nVidia also shipped a jre implementation which needed
"libavcodec.so.54" # two old versions of ffmpeg which are not available in nixpkgs
"libavcodec.so.53" "libavcodec.so.54"
"libavformat.so.54" "libavcodec.so.53"
"libavformat.so.53" "libavformat.so.54"
]; "libavformat.so.53"
];
preFixup = preFixup =
if (lib.versionAtLeast version "10.1" && lib.versionOlder version "11") then if (lib.versionAtLeast version "10.1" && lib.versionOlder version "11") then
@@ -282,7 +282,14 @@ backendStdenv.mkDerivation rec {
for qtlib in $out/host-linux-x64/Plugins/*/libq*.so; do for qtlib in $out/host-linux-x64/Plugins/*/libq*.so; do
qtdir=$(basename $(dirname $qtlib)) qtdir=$(basename $(dirname $qtlib))
filename=$(basename $qtlib) filename=$(basename $qtlib)
for qtpkgdir in ${lib.concatMapStringsSep " " (x: qt6Packages.${x}) ["qtbase" "qtimageformats" "qtsvg" "qtwayland"]}; do for qtpkgdir in ${
lib.concatMapStringsSep " " (x: qt6Packages.${x}) [
"qtbase"
"qtimageformats"
"qtsvg"
"qtwayland"
]
}; do
if [ -e $qtpkgdir/lib/qt-6/plugins/$qtdir/$filename ]; then if [ -e $qtpkgdir/lib/qt-6/plugins/$qtdir/$filename ]; then
ln -snf $qtpkgdir/lib/qt-6/plugins/$qtdir/$filename $qtlib ln -snf $qtpkgdir/lib/qt-6/plugins/$qtdir/$filename $qtlib
fi fi
@@ -303,8 +310,9 @@ backendStdenv.mkDerivation rec {
''} ''}
# Remove some cruft. # Remove some cruft.
${lib.optionalString ((lib.versionAtLeast version "7.0") && (lib.versionOlder version "10.1")) ${lib.optionalString (
"rm $out/bin/uninstall*"} (lib.versionAtLeast version "7.0") && (lib.versionOlder version "10.1")
) "rm $out/bin/uninstall*"}
# Fixup path to samples (needed for cuda 6.5 or else nsight will not find them) # Fixup path to samples (needed for cuda 6.5 or else nsight will not find them)
if [ -d "$out"/cuda-samples ]; then if [ -d "$out"/cuda-samples ]; then
@@ -360,19 +368,18 @@ backendStdenv.mkDerivation rec {
wrapProgram "$out/bin/$b" \ wrapProgram "$out/bin/$b" \
--set GDK_PIXBUF_MODULE_FILE "$GDK_PIXBUF_MODULE_FILE" --set GDK_PIXBUF_MODULE_FILE "$GDK_PIXBUF_MODULE_FILE"
done done
${ ${lib.optionalString (lib.versionAtLeast version "12")
lib.optionalString (lib.versionAtLeast version "12") # Check we don't have any lurking vendored qt libraries that weren't
# Check we don't have any lurking vendored qt libraries that weren't # replaced during installPhase
# replaced during installPhase ''
'' qtlibfiles=$(find $out -name "libq*.so" -type f)
qtlibfiles=$(find $out -name "libq*.so" -type f) if [ ! -z "$qtlibfiles" ]; then
if [ ! -z "$qtlibfiles" ]; then echo "Found unexpected vendored Qt library files in $out" >&2
echo "Found unexpected vendored Qt library files in $out" >&2 echo $qtlibfiles >&2
echo $qtlibfiles >&2 echo "These should be replaced with symlinks in installPhase" >&2
echo "These should be replaced with symlinks in installPhase" >&2 exit 1
exit 1 fi
fi ''
''
} }
''; '';
@@ -405,7 +412,7 @@ backendStdenv.mkDerivation rec {
meta = with lib; { meta = with lib; {
description = "A compiler for NVIDIA GPUs, math libraries, and tools"; description = "A compiler for NVIDIA GPUs, math libraries, and tools";
homepage = "https://developer.nvidia.com/cuda-toolkit"; homepage = "https://developer.nvidia.com/cuda-toolkit";
platforms = ["x86_64-linux"]; platforms = [ "x86_64-linux" ];
license = licenses.nvidiaCuda; license = licenses.nvidiaCuda;
maintainers = teams.cuda.members; maintainers = teams.cuda.members;
}; };

View File

@@ -17,7 +17,7 @@ let
; ;
in in
finalAttrs: prevAttrs: { finalAttrs: prevAttrs: {
src = fetchurl {inherit (package) url hash;}; src = fetchurl { inherit (package) url hash; };
# Useful for inspecting why something went wrong. # Useful for inspecting why something went wrong.
brokenConditions = brokenConditions =
@@ -34,9 +34,9 @@ finalAttrs: prevAttrs: {
buildInputs = buildInputs =
prevAttrs.buildInputs prevAttrs.buildInputs
++ [zlib] ++ [ zlib ]
++ lists.optionals finalAttrs.passthru.useCudatoolkitRunfile [final.cudatoolkit] ++ lists.optionals finalAttrs.passthru.useCudatoolkitRunfile [ final.cudatoolkit ]
++ lists.optionals (!finalAttrs.passthru.useCudatoolkitRunfile) [final.libcublas.lib]; ++ lists.optionals (!finalAttrs.passthru.useCudatoolkitRunfile) [ final.libcublas.lib ];
# Tell autoPatchelf about runtime dependencies. # Tell autoPatchelf about runtime dependencies.
# NOTE: Versions from CUDNN releases have four components. # NOTE: Versions from CUDNN releases have four components.
@@ -51,13 +51,11 @@ finalAttrs: prevAttrs: {
homepage = "https://developer.nvidia.com/cudnn"; homepage = "https://developer.nvidia.com/cudnn";
maintainers = maintainers =
prevAttrs.meta.maintainers prevAttrs.meta.maintainers
++ ( ++ (with maintainers; [
with maintainers; [ mdaiter
mdaiter samuela
samuela connorbaker
connorbaker ]);
]
);
license = { license = {
shortName = "cuDNN EULA"; shortName = "cuDNN EULA";
fullName = "NVIDIA cuDNN Software License Agreement (EULA)"; fullName = "NVIDIA cuDNN Software License Agreement (EULA)";

View File

@@ -13,7 +13,7 @@
} }
]; ];
# powerpc # powerpc
linux-ppc64le = []; linux-ppc64le = [ ];
# server-grade arm # server-grade arm
linux-sbsa = [ linux-sbsa = [
{ {

View File

@@ -65,12 +65,10 @@ let
# Un-nest the manifests attribute set. # Un-nest the manifests attribute set.
releaseGrabber = evaluatedModules: evaluatedModules.config.cutensor.manifests; releaseGrabber = evaluatedModules: evaluatedModules.config.cutensor.manifests;
in in
lists.map lists.map (trivial.flip trivial.pipe [
(trivial.flip trivial.pipe [ configEvaluator
configEvaluator releaseGrabber
releaseGrabber ]) cutensorVersions;
])
cutensorVersions;
# Our cudaVersion tells us which version of CUDA we're building against. # Our cudaVersion tells us which version of CUDA we're building against.
# The subdirectories in lib/ tell us which versions of CUDA are supported. # The subdirectories in lib/ tell us which versions of CUDA are supported.
@@ -96,15 +94,11 @@ let
redistArch = flags.getRedistArch hostPlatform.system; redistArch = flags.getRedistArch hostPlatform.system;
# platformIsSupported :: Manifests -> Boolean # platformIsSupported :: Manifests -> Boolean
platformIsSupported = platformIsSupported =
{feature, ...}: { feature, ... }:
(attrsets.attrByPath (attrsets.attrByPath [
[ pname
pname redistArch
redistArch ] null feature) != null;
]
null
feature
) != null;
# TODO(@connorbaker): With an auxiliary file keeping track of the CUDA versions each release supports, # TODO(@connorbaker): With an auxiliary file keeping track of the CUDA versions each release supports,
# we could filter out releases that don't support our CUDA version. # we could filter out releases that don't support our CUDA version.
@@ -116,41 +110,39 @@ let
# Compute versioned attribute name to be used in this package set # Compute versioned attribute name to be used in this package set
# Patch version changes should not break the build, so we only use major and minor # Patch version changes should not break the build, so we only use major and minor
# computeName :: RedistribRelease -> String # computeName :: RedistribRelease -> String
computeName = {version, ...}: mkVersionedPackageName redistName version; computeName = { version, ... }: mkVersionedPackageName redistName version;
in in
final: _: final: _:
let let
# buildCutensorPackage :: Manifests -> AttrSet Derivation # buildCutensorPackage :: Manifests -> AttrSet Derivation
buildCutensorPackage = buildCutensorPackage =
{redistrib, feature}: { redistrib, feature }:
let let
drv = final.callPackage ../generic-builders/manifest.nix { drv = final.callPackage ../generic-builders/manifest.nix {
inherit pname redistName libPath; inherit pname redistName libPath;
redistribRelease = redistrib.${pname}; redistribRelease = redistrib.${pname};
featureRelease = feature.${pname}; featureRelease = feature.${pname};
}; };
fixedDrv = drv.overrideAttrs ( fixedDrv = drv.overrideAttrs (prevAttrs: {
prevAttrs: { buildInputs =
buildInputs = prevAttrs.buildInputs
prevAttrs.buildInputs ++ lists.optionals (strings.versionOlder cudaVersion "11.4") [ final.cudatoolkit ]
++ lists.optionals (strings.versionOlder cudaVersion "11.4") [final.cudatoolkit] ++ lists.optionals (strings.versionAtLeast cudaVersion "11.4") (
++ lists.optionals (strings.versionAtLeast cudaVersion "11.4") ( [ final.libcublas.lib ]
[final.libcublas.lib] # For some reason, the 1.4.x release of cuTENSOR requires the cudart library.
# For some reason, the 1.4.x release of cuTENSOR requires the cudart library. ++ lists.optionals (strings.hasPrefix "1.4" redistrib.${pname}.version) [ final.cuda_cudart.lib ]
++ lists.optionals (strings.hasPrefix "1.4" redistrib.${pname}.version) [final.cuda_cudart.lib] );
); meta = prevAttrs.meta // {
meta = prevAttrs.meta // { description = "cuTENSOR: A High-Performance CUDA Library For Tensor Primitives";
description = "cuTENSOR: A High-Performance CUDA Library For Tensor Primitives"; homepage = "https://developer.nvidia.com/cutensor";
homepage = "https://developer.nvidia.com/cutensor"; maintainers = prevAttrs.meta.maintainers ++ [ lib.maintainers.obsidian-systems-maintenance ];
maintainers = prevAttrs.meta.maintainers ++ [lib.maintainers.obsidian-systems-maintenance]; license = lib.licenses.unfreeRedistributable // {
license = lib.licenses.unfreeRedistributable // { shortName = "cuTENSOR EULA";
shortName = "cuTENSOR EULA"; name = "cuTENSOR SUPPLEMENT TO SOFTWARE LICENSE AGREEMENT FOR NVIDIA SOFTWARE DEVELOPMENT KITS";
name = "cuTENSOR SUPPLEMENT TO SOFTWARE LICENSE AGREEMENT FOR NVIDIA SOFTWARE DEVELOPMENT KITS"; url = "https://docs.nvidia.com/cuda/cutensor/license.html";
url = "https://docs.nvidia.com/cuda/cutensor/license.html";
};
}; };
} };
); });
in in
attrsets.nameValuePair (computeName redistrib.${pname}) fixedDrv; attrsets.nameValuePair (computeName redistrib.${pname}) fixedDrv;
@@ -158,7 +150,7 @@ let
let let
nameOfNewest = computeName (lists.last supportedManifests).redistrib.${pname}; nameOfNewest = computeName (lists.last supportedManifests).redistrib.${pname};
drvs = builtins.listToAttrs (lists.map buildCutensorPackage supportedManifests); drvs = builtins.listToAttrs (lists.map buildCutensorPackage supportedManifests);
containsDefault = attrsets.optionalAttrs (drvs != {}) {cutensor = drvs.${nameOfNewest};}; containsDefault = attrsets.optionalAttrs (drvs != { }) { cutensor = drvs.${nameOfNewest}; };
in in
drvs // containsDefault; drvs // containsDefault;
in in

View File

@@ -3,7 +3,7 @@
# - See the documentation in ./gpus.nix. # - See the documentation in ./gpus.nix.
{ {
config, config,
cudaCapabilities ? (config.cudaCapabilities or []), cudaCapabilities ? (config.cudaCapabilities or [ ]),
cudaForwardCompat ? (config.cudaForwardCompat or true), cudaForwardCompat ? (config.cudaForwardCompat or true),
lib, lib,
cudaVersion, cudaVersion,
@@ -77,9 +77,9 @@ let
# cudaArchNameToVersions :: AttrSet String (List String) # cudaArchNameToVersions :: AttrSet String (List String)
# Maps the name of a GPU architecture to different versions of that architecture. # Maps the name of a GPU architecture to different versions of that architecture.
# For example, "Ampere" maps to [ "8.0" "8.6" "8.7" ]. # For example, "Ampere" maps to [ "8.0" "8.6" "8.7" ].
cudaArchNameToVersions = cudaArchNameToVersions = lists.groupBy' (versions: gpu: versions ++ [ gpu.computeCapability ]) [ ] (
lists.groupBy' (versions: gpu: versions ++ [gpu.computeCapability]) [] (gpu: gpu.archName) gpu: gpu.archName
supportedGpus; ) supportedGpus;
# cudaComputeCapabilityToName :: AttrSet String String # cudaComputeCapabilityToName :: AttrSet String String
# Maps the version of a GPU architecture to the name of that architecture. # Maps the version of a GPU architecture to the name of that architecture.
@@ -108,7 +108,7 @@ let
jetsonTargets = lists.intersectLists jetsonComputeCapabilities cudaCapabilities; jetsonTargets = lists.intersectLists jetsonComputeCapabilities cudaCapabilities;
# dropDot :: String -> String # dropDot :: String -> String
dropDot = ver: builtins.replaceStrings ["."] [""] ver; dropDot = ver: builtins.replaceStrings [ "." ] [ "" ] ver;
# archMapper :: String -> List String -> List String # archMapper :: String -> List String -> List String
# Maps a feature across a list of architecture versions to produce a list of architectures. # Maps a feature across a list of architecture versions to produce a list of architectures.
@@ -135,25 +135,29 @@ let
# `all-packages.nix`, which is evaluated on all systems. As such, we need to handle unsupported # `all-packages.nix`, which is evaluated on all systems. As such, we need to handle unsupported
# systems gracefully. # systems gracefully.
# getRedistArch :: String -> String # getRedistArch :: String -> String
getRedistArch = nixSystem: attrsets.attrByPath [ nixSystem ] "unsupported" { getRedistArch =
aarch64-linux = if jetsonTargets != [] then "linux-aarch64" else "linux-sbsa"; nixSystem:
x86_64-linux = "linux-x86_64"; attrsets.attrByPath [ nixSystem ] "unsupported" {
ppc64le-linux = "linux-ppc64le"; aarch64-linux = if jetsonTargets != [ ] then "linux-aarch64" else "linux-sbsa";
x86_64-windows = "windows-x86_64"; x86_64-linux = "linux-x86_64";
}; ppc64le-linux = "linux-ppc64le";
x86_64-windows = "windows-x86_64";
};
# Maps NVIDIA redist arch to Nix system. # Maps NVIDIA redist arch to Nix system.
# NOTE: This function *will* be called by unsupported systems because `cudaPackages` is part of # NOTE: This function *will* be called by unsupported systems because `cudaPackages` is part of
# `all-packages.nix`, which is evaluated on all systems. As such, we need to handle unsupported # `all-packages.nix`, which is evaluated on all systems. As such, we need to handle unsupported
# systems gracefully. # systems gracefully.
# getNixSystem :: String -> String # getNixSystem :: String -> String
getNixSystem = redistArch: attrsets.attrByPath [ redistArch ] "unsupported-${redistArch}" { getNixSystem =
linux-sbsa = "aarch64-linux"; redistArch:
linux-aarch64 = "aarch64-linux"; attrsets.attrByPath [ redistArch ] "unsupported-${redistArch}" {
linux-x86_64 = "x86_64-linux"; linux-sbsa = "aarch64-linux";
linux-ppc64le = "ppc64le-linux"; linux-aarch64 = "aarch64-linux";
windows-x86_64 = "x86_64-windows"; linux-x86_64 = "x86_64-linux";
}; linux-ppc64le = "ppc64le-linux";
windows-x86_64 = "x86_64-windows";
};
formatCapabilities = formatCapabilities =
{ {
@@ -194,7 +198,7 @@ let
gencode = gencode =
let let
base = gencodeMapper "sm" cudaCapabilities; base = gencodeMapper "sm" cudaCapabilities;
forward = gencodeMapper "compute" [(lists.last cudaCapabilities)]; forward = gencodeMapper "compute" [ (lists.last cudaCapabilities) ];
in in
base ++ lib.optionals enableForwardCompat forward; base ++ lib.optionals enableForwardCompat forward;
@@ -209,150 +213,151 @@ let
# isJetsonBuild :: Boolean # isJetsonBuild :: Boolean
isJetsonBuild = isJetsonBuild =
let let
requestedJetsonDevices = requestedJetsonDevices = lists.filter (
lists.filter (cap: cudaComputeCapabilityToIsJetson.${cap} or false) cap: cudaComputeCapabilityToIsJetson.${cap} or false
cudaCapabilities; ) cudaCapabilities;
requestedNonJetsonDevices = requestedNonJetsonDevices = lists.filter (
lists.filter (cap: !(builtins.elem cap requestedJetsonDevices)) cap: !(builtins.elem cap requestedJetsonDevices)
cudaCapabilities; ) cudaCapabilities;
jetsonBuildSufficientCondition = requestedJetsonDevices != []; jetsonBuildSufficientCondition = requestedJetsonDevices != [ ];
jetsonBuildNecessaryCondition = requestedNonJetsonDevices == [] && hostPlatform.isAarch64; jetsonBuildNecessaryCondition = requestedNonJetsonDevices == [ ] && hostPlatform.isAarch64;
in in
trivial.throwIf (jetsonBuildSufficientCondition && !jetsonBuildNecessaryCondition) trivial.throwIf (jetsonBuildSufficientCondition && !jetsonBuildNecessaryCondition) ''
'' Jetson devices cannot be targeted with non-Jetson devices. Additionally, they require hostPlatform to be aarch64.
Jetson devices cannot be targeted with non-Jetson devices. Additionally, they require hostPlatform to be aarch64. You requested ${builtins.toJSON cudaCapabilities} for host platform ${hostPlatform.system}.
You requested ${builtins.toJSON cudaCapabilities} for host platform ${hostPlatform.system}. Requested Jetson devices: ${builtins.toJSON requestedJetsonDevices}.
Requested Jetson devices: ${builtins.toJSON requestedJetsonDevices}. Requested non-Jetson devices: ${builtins.toJSON requestedNonJetsonDevices}.
Requested non-Jetson devices: ${builtins.toJSON requestedNonJetsonDevices}. Exactly one of the following must be true:
Exactly one of the following must be true: - All CUDA capabilities belong to Jetson devices and hostPlatform is aarch64.
- All CUDA capabilities belong to Jetson devices and hostPlatform is aarch64. - No CUDA capabilities belong to Jetson devices.
- No CUDA capabilities belong to Jetson devices. See ${./gpus.nix} for a list of architectures supported by this version of Nixpkgs.
See ${./gpus.nix} for a list of architectures supported by this version of Nixpkgs. '' jetsonBuildSufficientCondition
''
jetsonBuildSufficientCondition
&& jetsonBuildNecessaryCondition; && jetsonBuildNecessaryCondition;
}; };
in in
# When changing names or formats: pause, validate, and update the assert # When changing names or formats: pause, validate, and update the assert
assert let assert
expected = { let
cudaCapabilities = [ expected = {
"7.5" cudaCapabilities = [
"8.6" "7.5"
]; "8.6"
enableForwardCompat = true; ];
enableForwardCompat = true;
archNames = [ archNames = [
"Turing" "Turing"
"Ampere" "Ampere"
]; ];
realArches = [ realArches = [
"sm_75" "sm_75"
"sm_86" "sm_86"
]; ];
virtualArches = [ virtualArches = [
"compute_75" "compute_75"
"compute_86" "compute_86"
]; ];
arches = [ arches = [
"sm_75" "sm_75"
"sm_86" "sm_86"
"compute_86" "compute_86"
]; ];
gencode = [ gencode = [
"-gencode=arch=compute_75,code=sm_75" "-gencode=arch=compute_75,code=sm_75"
"-gencode=arch=compute_86,code=sm_86" "-gencode=arch=compute_86,code=sm_86"
"-gencode=arch=compute_86,code=compute_86" "-gencode=arch=compute_86,code=compute_86"
]; ];
gencodeString = "-gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_86,code=sm_86 -gencode=arch=compute_86,code=compute_86"; gencodeString = "-gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_86,code=sm_86 -gencode=arch=compute_86,code=compute_86";
isJetsonBuild = false; isJetsonBuild = false;
}; };
actual = formatCapabilities { actual = formatCapabilities {
cudaCapabilities = [ cudaCapabilities = [
"7.5" "7.5"
"8.6" "8.6"
]; ];
}; };
actualWrapped = (builtins.tryEval (builtins.deepSeq actual actual)).value; actualWrapped = (builtins.tryEval (builtins.deepSeq actual actual)).value;
in in
asserts.assertMsg ((strings.versionAtLeast cudaVersion "11.2") -> (expected == actualWrapped)) '' asserts.assertMsg ((strings.versionAtLeast cudaVersion "11.2") -> (expected == actualWrapped)) ''
This test should only fail when using a version of CUDA older than 11.2, the first to support This test should only fail when using a version of CUDA older than 11.2, the first to support
8.6. 8.6.
Expected: ${builtins.toJSON expected}
Actual: ${builtins.toJSON actualWrapped}
'';
# Check mixed Jetson and non-Jetson devices
assert let
expected = false;
actual = formatCapabilities {
cudaCapabilities = [
"7.2"
"7.5"
];
};
actualWrapped = (builtins.tryEval (builtins.deepSeq actual actual)).value;
in
asserts.assertMsg (expected == actualWrapped) ''
Jetson devices capabilities cannot be mixed with non-jetson devices.
Capability 7.5 is non-Jetson and should not be allowed with Jetson 7.2.
Expected: ${builtins.toJSON expected}
Actual: ${builtins.toJSON actualWrapped}
'';
# Check Jetson-only
assert let
expected = {
cudaCapabilities = [
"6.2"
"7.2"
];
enableForwardCompat = true;
archNames = [
"Pascal"
"Volta"
];
realArches = [
"sm_62"
"sm_72"
];
virtualArches = [
"compute_62"
"compute_72"
];
arches = [
"sm_62"
"sm_72"
"compute_72"
];
gencode = [
"-gencode=arch=compute_62,code=sm_62"
"-gencode=arch=compute_72,code=sm_72"
"-gencode=arch=compute_72,code=compute_72"
];
gencodeString = "-gencode=arch=compute_62,code=sm_62 -gencode=arch=compute_72,code=sm_72 -gencode=arch=compute_72,code=compute_72";
isJetsonBuild = true;
};
actual = formatCapabilities {
cudaCapabilities = [
"6.2"
"7.2"
];
};
actualWrapped = (builtins.tryEval (builtins.deepSeq actual actual)).value;
in
asserts.assertMsg
# We can't do this test unless we're targeting aarch64
(hostPlatform.isAarch64 -> (expected == actualWrapped))
''
Jetson devices can only be built with other Jetson devices.
Both 6.2 and 7.2 are Jetson devices.
Expected: ${builtins.toJSON expected} Expected: ${builtins.toJSON expected}
Actual: ${builtins.toJSON actualWrapped} Actual: ${builtins.toJSON actualWrapped}
''; '';
# Check mixed Jetson and non-Jetson devices
assert
let
expected = false;
actual = formatCapabilities {
cudaCapabilities = [
"7.2"
"7.5"
];
};
actualWrapped = (builtins.tryEval (builtins.deepSeq actual actual)).value;
in
asserts.assertMsg (expected == actualWrapped) ''
Jetson devices capabilities cannot be mixed with non-jetson devices.
Capability 7.5 is non-Jetson and should not be allowed with Jetson 7.2.
Expected: ${builtins.toJSON expected}
Actual: ${builtins.toJSON actualWrapped}
'';
# Check Jetson-only
assert
let
expected = {
cudaCapabilities = [
"6.2"
"7.2"
];
enableForwardCompat = true;
archNames = [
"Pascal"
"Volta"
];
realArches = [
"sm_62"
"sm_72"
];
virtualArches = [
"compute_62"
"compute_72"
];
arches = [
"sm_62"
"sm_72"
"compute_72"
];
gencode = [
"-gencode=arch=compute_62,code=sm_62"
"-gencode=arch=compute_72,code=sm_72"
"-gencode=arch=compute_72,code=compute_72"
];
gencodeString = "-gencode=arch=compute_62,code=sm_62 -gencode=arch=compute_72,code=sm_72 -gencode=arch=compute_72,code=compute_72";
isJetsonBuild = true;
};
actual = formatCapabilities {
cudaCapabilities = [
"6.2"
"7.2"
];
};
actualWrapped = (builtins.tryEval (builtins.deepSeq actual actual)).value;
in
asserts.assertMsg
# We can't do this test unless we're targeting aarch64
(hostPlatform.isAarch64 -> (expected == actualWrapped))
''
Jetson devices can only be built with other Jetson devices.
Both 6.2 and 7.2 are Jetson devices.
Expected: ${builtins.toJSON expected}
Actual: ${builtins.toJSON actualWrapped}
'';
{ {
# formatCapabilities :: { cudaCapabilities: List Capability, enableForwardCompat: Boolean } -> { ... } # formatCapabilities :: { cudaCapabilities: List Capability, enableForwardCompat: Boolean } -> { ... }
inherit formatCapabilities; inherit formatCapabilities;
@@ -376,6 +381,6 @@ asserts.assertMsg
; ;
} }
// formatCapabilities { // formatCapabilities {
cudaCapabilities = if cudaCapabilities == [] then defaultCapabilities else cudaCapabilities; cudaCapabilities = if cudaCapabilities == [ ] then defaultCapabilities else cudaCapabilities;
enableForwardCompat = cudaForwardCompat; enableForwardCompat = cudaForwardCompat;
} }

View File

@@ -50,144 +50,139 @@ let
sourceMatchesHost = flags.getNixSystem redistArch == stdenv.hostPlatform.system; sourceMatchesHost = flags.getNixSystem redistArch == stdenv.hostPlatform.system;
in in
backendStdenv.mkDerivation ( backendStdenv.mkDerivation (finalAttrs: {
finalAttrs: { # NOTE: Even though there's no actual buildPhase going on here, the derivations of the
# NOTE: Even though there's no actual buildPhase going on here, the derivations of the # redistributables are sensitive to the compiler flags provided to stdenv. The patchelf package
# redistributables are sensitive to the compiler flags provided to stdenv. The patchelf package # is sensitive to the compiler flags provided to stdenv, and we depend on it. As such, we are
# is sensitive to the compiler flags provided to stdenv, and we depend on it. As such, we are # also sensitive to the compiler flags provided to stdenv.
# also sensitive to the compiler flags provided to stdenv. inherit pname;
inherit pname; inherit (redistribRelease) version;
inherit (redistribRelease) version;
# Don't force serialization to string for structured attributes, like outputToPatterns # Don't force serialization to string for structured attributes, like outputToPatterns
# and brokenConditions. # and brokenConditions.
# Avoids "set cannot be coerced to string" errors. # Avoids "set cannot be coerced to string" errors.
__structuredAttrs = true; __structuredAttrs = true;
# Keep better track of dependencies. # Keep better track of dependencies.
strictDeps = true; strictDeps = true;
# NOTE: Outputs are evaluated jointly with meta, so in the case that this is an unsupported platform, # NOTE: Outputs are evaluated jointly with meta, so in the case that this is an unsupported platform,
# we still need to provide a list of outputs. # we still need to provide a list of outputs.
outputs = outputs =
let let
# Checks whether the redistributable provides an output. # Checks whether the redistributable provides an output.
hasOutput = hasOutput =
output: output:
attrsets.attrByPath attrsets.attrByPath [
[ redistArch
redistArch "outputs"
"outputs" output
output ] false featureRelease;
] # Order is important here so we use a list.
false possibleOutputs = [
featureRelease; "bin"
# Order is important here so we use a list.
possibleOutputs = [
"bin"
"lib"
"static"
"dev"
"doc"
"sample"
"python"
];
# Filter out outputs that don't exist in the redistributable.
# NOTE: In the case the redistributable isn't supported on the target platform,
# we will have `outputs = [ "out" ] ++ possibleOutputs`. This is of note because platforms which
# aren't supported would otherwise have evaluation errors when trying to access outputs other than `out`.
# The alternative would be to have `outputs = [ "out" ]` when`redistArch = "unsupported"`, but that would
# require adding guards throughout the entirety of the CUDA package set to ensure `cudaSupport` is true --
# recall that OfBorg will evaluate packages marked as broken and that `cudaPackages` will be evaluated with
# `cudaSupport = false`!
additionalOutputs =
if redistArch == "unsupported"
then possibleOutputs
else builtins.filter hasOutput possibleOutputs;
# The out output is special -- it's the default output and we always include it.
outputs = [ "out" ] ++ additionalOutputs;
in
outputs;
# Traversed in the order of the outputs speficied in outputs;
# entries are skipped if they don't exist in outputs.
outputToPatterns = {
bin = [ "bin" ];
dev = [
"share/pkgconfig"
"**/*.pc"
"**/*.cmake"
];
lib = [
"lib" "lib"
"lib64" "static"
"dev"
"doc"
"sample"
"python"
]; ];
static = ["**/*.a"]; # Filter out outputs that don't exist in the redistributable.
sample = ["samples"]; # NOTE: In the case the redistributable isn't supported on the target platform,
python = ["**/*.whl"]; # we will have `outputs = [ "out" ] ++ possibleOutputs`. This is of note because platforms which
}; # aren't supported would otherwise have evaluation errors when trying to access outputs other than `out`.
# The alternative would be to have `outputs = [ "out" ]` when`redistArch = "unsupported"`, but that would
# require adding guards throughout the entirety of the CUDA package set to ensure `cudaSupport` is true --
# recall that OfBorg will evaluate packages marked as broken and that `cudaPackages` will be evaluated with
# `cudaSupport = false`!
additionalOutputs =
if redistArch == "unsupported" then possibleOutputs else builtins.filter hasOutput possibleOutputs;
# The out output is special -- it's the default output and we always include it.
outputs = [ "out" ] ++ additionalOutputs;
in
outputs;
# Useful for introspecting why something went wrong. Maps descriptions of why the derivation would be marked as # Traversed in the order of the outputs speficied in outputs;
# broken on have badPlatforms include the current platform. # entries are skipped if they don't exist in outputs.
outputToPatterns = {
# brokenConditions :: AttrSet Bool bin = [ "bin" ];
# Sets `meta.broken = true` if any of the conditions are true. dev = [
# Example: Broken on a specific version of CUDA or when a dependency has a specific version. "share/pkgconfig"
brokenConditions = { }; "**/*.pc"
"**/*.cmake"
# badPlatformsConditions :: AttrSet Bool
# Sets `meta.badPlatforms = meta.platforms` if any of the conditions are true.
# Example: Broken on a specific architecture when some condition is met (like targeting Jetson).
badPlatformsConditions = {
"No source" = !sourceMatchesHost;
};
# src :: Optional Derivation
src = trivial.pipe redistArch [
# If redistArch doesn't exist in redistribRelease, return null.
(redistArch: redistribRelease.${redistArch} or null)
# If the release is non-null, fetch the source; otherwise, return null.
(trivial.mapNullable (
{ relative_path, sha256, ... }:
fetchurl {
url = "https://developer.download.nvidia.com/compute/${redistName}/redist/${relative_path}";
inherit sha256;
}
))
]; ];
lib = [
"lib"
"lib64"
];
static = [ "**/*.a" ];
sample = [ "samples" ];
python = [ "**/*.whl" ];
};
# Handle the pkg-config files: # Useful for introspecting why something went wrong. Maps descriptions of why the derivation would be marked as
# 1. No FHS # broken on have badPlatforms include the current platform.
# 2. Location expected by the pkg-config wrapper
# 3. Generate unversioned names too
postPatch = ''
for path in pkg-config pkgconfig ; do
[[ -d "$path" ]] || continue
mkdir -p share/pkgconfig
mv "$path"/* share/pkgconfig/
rmdir "$path"
done
for pc in share/pkgconfig/*.pc ; do # brokenConditions :: AttrSet Bool
sed -i \ # Sets `meta.broken = true` if any of the conditions are true.
-e "s|^cudaroot\s*=.*\$|cudaroot=''${!outputDev}|" \ # Example: Broken on a specific version of CUDA or when a dependency has a specific version.
-e "s|^libdir\s*=.*/lib\$|libdir=''${!outputLib}/lib|" \ brokenConditions = { };
-e "s|^includedir\s*=.*/include\$|includedir=''${!outputDev}/include|" \
"$pc"
done
# E.g. cuda-11.8.pc -> cuda.pc # badPlatformsConditions :: AttrSet Bool
for pc in share/pkgconfig/*-"$majorMinorVersion.pc" ; do # Sets `meta.badPlatforms = meta.platforms` if any of the conditions are true.
ln -s "$(basename "$pc")" "''${pc%-$majorMinorVersion.pc}".pc # Example: Broken on a specific architecture when some condition is met (like targeting Jetson).
done badPlatformsConditions = {
''; "No source" = !sourceMatchesHost;
};
env.majorMinorVersion = cudaMajorMinorVersion; # src :: Optional Derivation
src = trivial.pipe redistArch [
# If redistArch doesn't exist in redistribRelease, return null.
(redistArch: redistribRelease.${redistArch} or null)
# If the release is non-null, fetch the source; otherwise, return null.
(trivial.mapNullable (
{ relative_path, sha256, ... }:
fetchurl {
url = "https://developer.download.nvidia.com/compute/${redistName}/redist/${relative_path}";
inherit sha256;
}
))
];
# We do need some other phases, like configurePhase, so the multiple-output setup hook works. # Handle the pkg-config files:
dontBuild = true; # 1. No FHS
# 2. Location expected by the pkg-config wrapper
# 3. Generate unversioned names too
postPatch = ''
for path in pkg-config pkgconfig ; do
[[ -d "$path" ]] || continue
mkdir -p share/pkgconfig
mv "$path"/* share/pkgconfig/
rmdir "$path"
done
nativeBuildInputs = [ for pc in share/pkgconfig/*.pc ; do
sed -i \
-e "s|^cudaroot\s*=.*\$|cudaroot=''${!outputDev}|" \
-e "s|^libdir\s*=.*/lib\$|libdir=''${!outputLib}/lib|" \
-e "s|^includedir\s*=.*/include\$|includedir=''${!outputDev}/include|" \
"$pc"
done
# E.g. cuda-11.8.pc -> cuda.pc
for pc in share/pkgconfig/*-"$majorMinorVersion.pc" ; do
ln -s "$(basename "$pc")" "''${pc%-$majorMinorVersion.pc}".pc
done
'';
env.majorMinorVersion = cudaMajorMinorVersion;
# We do need some other phases, like configurePhase, so the multiple-output setup hook works.
dontBuild = true;
nativeBuildInputs =
[
autoPatchelfHook autoPatchelfHook
# This hook will make sure libcuda can be found # This hook will make sure libcuda can be found
# in typically /lib/opengl-driver by adding that # in typically /lib/opengl-driver by adding that
@@ -205,142 +200,140 @@ backendStdenv.mkDerivation (
autoAddCudaCompatRunpath autoAddCudaCompatRunpath
]; ];
buildInputs = buildInputs = [
[ # autoPatchelfHook will search for a libstdc++ and we're giving it
# autoPatchelfHook will search for a libstdc++ and we're giving it # one that is compatible with the rest of nixpkgs, even when
# one that is compatible with the rest of nixpkgs, even when # nvcc forces us to use an older gcc
# nvcc forces us to use an older gcc # NB: We don't actually know if this is the right thing to do
# NB: We don't actually know if this is the right thing to do stdenv.cc.cc.lib
stdenv.cc.cc.lib ];
];
# Picked up by autoPatchelf # Picked up by autoPatchelf
# Needed e.g. for libnvrtc to locate (dlopen) libnvrtc-builtins # Needed e.g. for libnvrtc to locate (dlopen) libnvrtc-builtins
appendRunpaths = ["$ORIGIN"]; appendRunpaths = [ "$ORIGIN" ];
# NOTE: We don't need to check for dev or doc, because those outputs are handled by # NOTE: We don't need to check for dev or doc, because those outputs are handled by
# the multiple-outputs setup hook. # the multiple-outputs setup hook.
# NOTE: moveToOutput operates on all outputs: # NOTE: moveToOutput operates on all outputs:
# https://github.com/NixOS/nixpkgs/blob/2920b6fc16a9ed5d51429e94238b28306ceda79e/pkgs/build-support/setup-hooks/multiple-outputs.sh#L105-L107 # https://github.com/NixOS/nixpkgs/blob/2920b6fc16a9ed5d51429e94238b28306ceda79e/pkgs/build-support/setup-hooks/multiple-outputs.sh#L105-L107
installPhase = installPhase =
let let
mkMoveToOutputCommand = mkMoveToOutputCommand =
output: output:
let
template = pattern: ''moveToOutput "${pattern}" "${"$" + output}"'';
patterns = finalAttrs.outputToPatterns.${output} or [];
in
strings.concatMapStringsSep "\n" template patterns;
in
# Pre-install hook
''
runHook preInstall
''
# Handle the existence of libPath, which requires us to re-arrange the lib directory
+ strings.optionalString (libPath != null) ''
full_lib_path="lib/${libPath}"
if [[ ! -d "$full_lib_path" ]] ; then
echo "${finalAttrs.pname}: '$full_lib_path' does not exist, only found:" >&2
find lib/ -mindepth 1 -maxdepth 1 >&2
echo "This release might not support your CUDA version" >&2
exit 1
fi
echo "Making libPath '$full_lib_path' the root of lib" >&2
mv "$full_lib_path" lib_new
rm -r lib
mv lib_new lib
''
# Create the primary output, out, and move the other outputs into it.
+ ''
mkdir -p "$out"
mv * "$out"
''
# Move the outputs into their respective outputs.
+ strings.concatMapStringsSep "\n" mkMoveToOutputCommand (builtins.tail finalAttrs.outputs)
# Add a newline to the end of the installPhase, so that the post-install hook doesn't
# get concatenated with the last moveToOutput command.
+ "\n"
# Post-install hook
+ ''
runHook postInstall
'';
doInstallCheck = true;
allowFHSReferences = true; # TODO: Default to `false`
postInstallCheck = ''
echo "Executing postInstallCheck"
if [[ -z "''${allowFHSReferences-}" ]] ; then
mapfile -t outputPaths < <(for o in $(getAllOutputNames); do echo "''${!o}"; done)
if grep --max-count=5 --recursive --exclude=LICENSE /usr/ "''${outputPaths[@]}" ; then
echo "Detected references to /usr" >&2
exit 1
fi
fi
'';
# libcuda needs to be resolved during runtime
autoPatchelfIgnoreMissingDeps = [
"libcuda.so"
"libcuda.so.*"
];
# The out output leverages the same functionality which backs the `symlinkJoin` function in
# Nixpkgs:
# https://github.com/NixOS/nixpkgs/blob/d8b2a92df48f9b08d68b0132ce7adfbdbc1fbfac/pkgs/build-support/trivial-builders/default.nix#L510
#
# That should allow us to emulate "fat" default outputs without having to actually create them.
#
# It is important that this run after the autoPatchelfHook, otherwise the symlinks in out will reference libraries in lib, creating a circular dependency.
postPhases = ["postPatchelf"];
# For each output, create a symlink to it in the out output.
# NOTE: We must recreate the out output here, because the setup hook will have deleted it if it was empty.
postPatchelf = ''
mkdir -p "$out"
for output in $(getAllOutputNames); do
if [[ "$output" != "out" ]]; then
${meta.getExe lndir} "''${!output}" "$out"
fi
done
'';
# Make the CUDA-patched stdenv available
passthru.stdenv = backendStdenv;
# Setting propagatedBuildInputs to false will prevent outputs known to the multiple-outputs
# from depending on `out` by default.
# https://github.com/NixOS/nixpkgs/blob/2920b6fc16a9ed5d51429e94238b28306ceda79e/pkgs/build-support/setup-hooks/multiple-outputs.sh#L196
# Indeed, we want to do the opposite -- fat "out" outputs that contain all the other outputs.
propagatedBuildOutputs = false;
# By default, if the dev output exists it just uses that.
# However, because we disabled propagatedBuildOutputs, dev doesn't contain libraries or
# anything of the sort. To remedy this, we set outputSpecified to true, and use
# outputsToInstall, which tells Nix which outputs to use when the package name is used
# unqualified (that is, without an explicit output).
outputSpecified = true;
meta = {
description = "${redistribRelease.name}. By downloading and using the packages you accept the terms and conditions of the ${finalAttrs.meta.license.shortName}";
sourceProvenance = [sourceTypes.binaryNativeCode];
broken = lists.any trivial.id (attrsets.attrValues finalAttrs.brokenConditions);
platforms = trivial.pipe supportedRedistArchs [
# Map each redist arch to the equivalent nix system or null if there is no equivalent.
(builtins.map flags.getNixSystem)
# Filter out unsupported systems
(builtins.filter (nixSystem: !(strings.hasPrefix "unsupported-" nixSystem)))
];
badPlatforms =
let let
isBadPlatform = lists.any trivial.id (attrsets.attrValues finalAttrs.badPlatformsConditions); template = pattern: ''moveToOutput "${pattern}" "${"$" + output}"'';
patterns = finalAttrs.outputToPatterns.${output} or [ ];
in in
lists.optionals isBadPlatform finalAttrs.meta.platforms; strings.concatMapStringsSep "\n" template patterns;
license = licenses.unfree; in
maintainers = teams.cuda.members; # Pre-install hook
# Force the use of the default, fat output by default (even though `dev` exists, which ''
# causes Nix to prefer that output over the others if outputSpecified isn't set). runHook preInstall
outputsToInstall = ["out"]; ''
}; # Handle the existence of libPath, which requires us to re-arrange the lib directory
} + strings.optionalString (libPath != null) ''
) full_lib_path="lib/${libPath}"
if [[ ! -d "$full_lib_path" ]] ; then
echo "${finalAttrs.pname}: '$full_lib_path' does not exist, only found:" >&2
find lib/ -mindepth 1 -maxdepth 1 >&2
echo "This release might not support your CUDA version" >&2
exit 1
fi
echo "Making libPath '$full_lib_path' the root of lib" >&2
mv "$full_lib_path" lib_new
rm -r lib
mv lib_new lib
''
# Create the primary output, out, and move the other outputs into it.
+ ''
mkdir -p "$out"
mv * "$out"
''
# Move the outputs into their respective outputs.
+ strings.concatMapStringsSep "\n" mkMoveToOutputCommand (builtins.tail finalAttrs.outputs)
# Add a newline to the end of the installPhase, so that the post-install hook doesn't
# get concatenated with the last moveToOutput command.
+ "\n"
# Post-install hook
+ ''
runHook postInstall
'';
doInstallCheck = true;
allowFHSReferences = true; # TODO: Default to `false`
postInstallCheck = ''
echo "Executing postInstallCheck"
if [[ -z "''${allowFHSReferences-}" ]] ; then
mapfile -t outputPaths < <(for o in $(getAllOutputNames); do echo "''${!o}"; done)
if grep --max-count=5 --recursive --exclude=LICENSE /usr/ "''${outputPaths[@]}" ; then
echo "Detected references to /usr" >&2
exit 1
fi
fi
'';
# libcuda needs to be resolved during runtime
autoPatchelfIgnoreMissingDeps = [
"libcuda.so"
"libcuda.so.*"
];
# The out output leverages the same functionality which backs the `symlinkJoin` function in
# Nixpkgs:
# https://github.com/NixOS/nixpkgs/blob/d8b2a92df48f9b08d68b0132ce7adfbdbc1fbfac/pkgs/build-support/trivial-builders/default.nix#L510
#
# That should allow us to emulate "fat" default outputs without having to actually create them.
#
# It is important that this run after the autoPatchelfHook, otherwise the symlinks in out will reference libraries in lib, creating a circular dependency.
postPhases = [ "postPatchelf" ];
# For each output, create a symlink to it in the out output.
# NOTE: We must recreate the out output here, because the setup hook will have deleted it if it was empty.
postPatchelf = ''
mkdir -p "$out"
for output in $(getAllOutputNames); do
if [[ "$output" != "out" ]]; then
${meta.getExe lndir} "''${!output}" "$out"
fi
done
'';
# Make the CUDA-patched stdenv available
passthru.stdenv = backendStdenv;
# Setting propagatedBuildInputs to false will prevent outputs known to the multiple-outputs
# from depending on `out` by default.
# https://github.com/NixOS/nixpkgs/blob/2920b6fc16a9ed5d51429e94238b28306ceda79e/pkgs/build-support/setup-hooks/multiple-outputs.sh#L196
# Indeed, we want to do the opposite -- fat "out" outputs that contain all the other outputs.
propagatedBuildOutputs = false;
# By default, if the dev output exists it just uses that.
# However, because we disabled propagatedBuildOutputs, dev doesn't contain libraries or
# anything of the sort. To remedy this, we set outputSpecified to true, and use
# outputsToInstall, which tells Nix which outputs to use when the package name is used
# unqualified (that is, without an explicit output).
outputSpecified = true;
meta = {
description = "${redistribRelease.name}. By downloading and using the packages you accept the terms and conditions of the ${finalAttrs.meta.license.shortName}";
sourceProvenance = [ sourceTypes.binaryNativeCode ];
broken = lists.any trivial.id (attrsets.attrValues finalAttrs.brokenConditions);
platforms = trivial.pipe supportedRedistArchs [
# Map each redist arch to the equivalent nix system or null if there is no equivalent.
(builtins.map flags.getNixSystem)
# Filter out unsupported systems
(builtins.filter (nixSystem: !(strings.hasPrefix "unsupported-" nixSystem)))
];
badPlatforms =
let
isBadPlatform = lists.any trivial.id (attrsets.attrValues finalAttrs.badPlatformsConditions);
in
lists.optionals isBadPlatform finalAttrs.meta.platforms;
license = licenses.unfree;
maintainers = teams.cuda.members;
# Force the use of the default, fat output by default (even though `dev` exists, which
# causes Nix to prefer that output over the others if outputSpecified isn't set).
outputsToInstall = [ "out" ];
};
})

View File

@@ -52,7 +52,9 @@ let
# - Package: ../modules/${pname}/releases/package.nix # - Package: ../modules/${pname}/releases/package.nix
# FIXME: do this at the module system level # FIXME: do this at the module system level
propagatePlatforms = lib.mapAttrs (redistArch: packages: map (p: { inherit redistArch; } // p) packages); propagatePlatforms = lib.mapAttrs (
redistArch: packages: map (p: { inherit redistArch; } // p) packages
);
# All releases across all platforms # All releases across all platforms
# See ../modules/${pname}/releases/releases.nix # See ../modules/${pname}/releases/releases.nix
@@ -61,7 +63,7 @@ let
# Compute versioned attribute name to be used in this package set # Compute versioned attribute name to be used in this package set
# Patch version changes should not break the build, so we only use major and minor # Patch version changes should not break the build, so we only use major and minor
# computeName :: Package -> String # computeName :: Package -> String
computeName = {version, ...}: mkVersionedPackageName pname version; computeName = { version, ... }: mkVersionedPackageName pname version;
# Check whether a package supports our CUDA version and platform. # Check whether a package supports our CUDA version and platform.
# isSupported :: Package -> Bool # isSupported :: Package -> Bool
@@ -81,16 +83,15 @@ let
# All the supported packages we can build for our platform. # All the supported packages we can build for our platform.
# perSystemReleases :: List Package # perSystemReleases :: List Package
allReleases = lib.pipe releaseSets allReleases = lib.pipe releaseSets [
[ (lib.attrValues)
(lib.attrValues) (lists.flatten)
(lists.flatten) (lib.groupBy (p: lib.versions.majorMinor p.version))
(lib.groupBy (p: lib.versions.majorMinor p.version)) (lib.mapAttrs (_: builtins.sort preferable))
(lib.mapAttrs (_: builtins.sort preferable)) (lib.mapAttrs (_: lib.take 1))
(lib.mapAttrs (_: lib.take 1)) (lib.attrValues)
(lib.attrValues) (lib.concatMap lib.trivial.id)
(lib.concatMap lib.trivial.id) ];
];
newest = builtins.head (builtins.sort preferable allReleases); newest = builtins.head (builtins.sort preferable allReleases);
@@ -115,7 +116,10 @@ let
buildPackage = buildPackage =
package: package:
let let
shims = final.callPackage shimsFn {inherit package; inherit (package) redistArch; }; shims = final.callPackage shimsFn {
inherit package;
inherit (package) redistArch;
};
name = computeName package; name = computeName package;
drv = final.callPackage ./manifest.nix { drv = final.callPackage ./manifest.nix {
inherit pname; inherit pname;
@@ -129,7 +133,9 @@ let
# versionedDerivations :: AttrSet Derivation # versionedDerivations :: AttrSet Derivation
versionedDerivations = builtins.listToAttrs (lists.map buildPackage allReleases); versionedDerivations = builtins.listToAttrs (lists.map buildPackage allReleases);
defaultDerivation = { ${pname} = (buildPackage newest).value; }; defaultDerivation = {
${pname} = (buildPackage newest).value;
};
in in
versionedDerivations // defaultDerivation; versionedDerivations // defaultDerivation;
in in

View File

@@ -1 +1,4 @@
{options, ...}: {options.cuda.manifests = options.generic.manifests;} { options, ... }:
{
options.cuda.manifests = options.generic.manifests;
}

View File

@@ -1,4 +1,4 @@
{options, ...}: { options, ... }:
{ {
options.cudnn.releases = options.generic.releases; options.cudnn.releases = options.generic.releases;
# TODO(@connorbaker): Figure out how to add additional options to the # TODO(@connorbaker): Figure out how to add additional options to the

View File

@@ -1 +1,4 @@
{options, ...}: {options.cutensor.manifests = options.generic.manifests;} { options, ... }:
{
options.cutensor.manifests = options.generic.manifests;
}

View File

@@ -1,7 +1,7 @@
{lib, config, ...}: { lib, config, ... }:
{ {
options.generic.manifests = { options.generic.manifests = {
feature = import ./feature/manifest.nix {inherit lib config;}; feature = import ./feature/manifest.nix { inherit lib config; };
redistrib = import ./redistrib/manifest.nix {inherit lib;}; redistrib = import ./redistrib/manifest.nix { inherit lib; };
}; };
} }

View File

@@ -1,7 +1,7 @@
{lib, config, ...}: { lib, config, ... }:
let let
inherit (lib) options trivial types; inherit (lib) options trivial types;
Release = import ./release.nix {inherit lib config;}; Release = import ./release.nix { inherit lib config; };
in in
options.mkOption { options.mkOption {
description = "A feature manifest is an attribute set which includes a mapping from package name to release"; description = "A feature manifest is an attribute set which includes a mapping from package name to release";

View File

@@ -1,4 +1,4 @@
{lib, ...}: { lib, ... }:
let let
inherit (lib) options types; inherit (lib) options types;
in in

View File

@@ -1,10 +1,10 @@
{lib, ...}: { lib, ... }:
let let
inherit (lib) options types; inherit (lib) options types;
Outputs = import ./outputs.nix {inherit lib;}; Outputs = import ./outputs.nix { inherit lib; };
in in
options.mkOption { options.mkOption {
description = "A package in the manifest"; description = "A package in the manifest";
example = (import ./release.nix {inherit lib;}).linux-x86_64; example = (import ./release.nix { inherit lib; }).linux-x86_64;
type = types.submodule {options.outputs = Outputs;}; type = types.submodule { options.outputs = Outputs; };
} }

View File

@@ -1,10 +1,10 @@
{lib, config, ...}: { lib, config, ... }:
let let
inherit (lib) options types; inherit (lib) options types;
Package = import ./package.nix {inherit lib config;}; Package = import ./package.nix { inherit lib config; };
in in
options.mkOption { options.mkOption {
description = "A release is an attribute set which includes a mapping from platform to package"; description = "A release is an attribute set which includes a mapping from platform to package";
example = (import ./manifest.nix {inherit lib;}).cuda_cccl; example = (import ./manifest.nix { inherit lib; }).cuda_cccl;
type = types.attrsOf Package.type; type = types.attrsOf Package.type;
} }

View File

@@ -1,7 +1,7 @@
{lib, ...}: { lib, ... }:
let let
inherit (lib) options trivial types; inherit (lib) options trivial types;
Release = import ./release.nix {inherit lib;}; Release = import ./release.nix { inherit lib; };
in in
options.mkOption { options.mkOption {
description = "A redistributable manifest is an attribute set which includes a mapping from package name to release"; description = "A redistributable manifest is an attribute set which includes a mapping from package name to release";

View File

@@ -1,10 +1,10 @@
{lib, ...}: { lib, ... }:
let let
inherit (lib) options types; inherit (lib) options types;
in in
options.mkOption { options.mkOption {
description = "A package in the manifest"; description = "A package in the manifest";
example = (import ./release.nix {inherit lib;}).linux-x86_64; example = (import ./release.nix { inherit lib; }).linux-x86_64;
type = types.submodule { type = types.submodule {
options = { options = {
relative_path = options.mkOption { relative_path = options.mkOption {

View File

@@ -1,11 +1,11 @@
{lib, ...}: { lib, ... }:
let let
inherit (lib) options types; inherit (lib) options types;
Package = import ./package.nix {inherit lib;}; Package = import ./package.nix { inherit lib; };
in in
options.mkOption { options.mkOption {
description = "A release is an attribute set which includes a mapping from platform to package"; description = "A release is an attribute set which includes a mapping from platform to package";
example = (import ./manifest.nix {inherit lib;}).cuda_cccl; example = (import ./manifest.nix { inherit lib; }).cuda_cccl;
type = types.submodule { type = types.submodule {
# Allow any attribute name as these will be the platform names # Allow any attribute name as these will be the platform names
freeformType = types.attrsOf Package.type; freeformType = types.attrsOf Package.type;

View File

@@ -1,4 +1,4 @@
{lib, config, ...}: { lib, config, ... }:
let let
inherit (config.generic.types) majorMinorVersion majorMinorPatchBuildVersion; inherit (config.generic.types) majorMinorVersion majorMinorPatchBuildVersion;
inherit (lib) options types; inherit (lib) options types;

View File

@@ -1,11 +1,11 @@
{lib, ...}: { lib, ... }:
let let
inherit (lib) options types; inherit (lib) options types;
in in
{ {
options.generic.types = options.mkOption { options.generic.types = options.mkOption {
type = types.attrsOf types.optionType; type = types.attrsOf types.optionType;
default = {}; default = { };
description = "A set of generic types."; description = "A set of generic types.";
}; };
config.generic.types = { config.generic.types = {

View File

@@ -1,4 +1,4 @@
{options, ...}: { options, ... }:
{ {
options.tensorrt.releases = options.generic.releases; options.tensorrt.releases = options.generic.releases;
# TODO(@connorbaker): Figure out how to add additional options to the # TODO(@connorbaker): Figure out how to add additional options to the

View File

@@ -22,63 +22,61 @@ let
nccl nccl
; ;
in in
backendStdenv.mkDerivation ( backendStdenv.mkDerivation (finalAttrs: {
finalAttrs: {
pname = "nccl-tests"; pname = "nccl-tests";
version = "2.13.9"; version = "2.13.9";
src = fetchFromGitHub { src = fetchFromGitHub {
owner = "NVIDIA"; owner = "NVIDIA";
repo = finalAttrs.pname; repo = finalAttrs.pname;
rev = "v${finalAttrs.version}"; rev = "v${finalAttrs.version}";
hash = "sha256-QYuMBPhvHHVo2ku14jD1CVINLPW0cyiXJkXxb77IxbE="; hash = "sha256-QYuMBPhvHHVo2ku14jD1CVINLPW0cyiXJkXxb77IxbE=";
}; };
strictDeps = true; strictDeps = true;
nativeBuildInputs = nativeBuildInputs =
[which] [ which ]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit] ++ lib.optionals (lib.versionOlder cudaVersion "11.4") [ cudatoolkit ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [cuda_nvcc]; ++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [ cuda_nvcc ];
buildInputs = buildInputs =
[nccl] [ nccl ]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit] ++ lib.optionals (lib.versionOlder cudaVersion "11.4") [ cudatoolkit ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [ ++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
cuda_nvcc.dev # crt/host_config.h cuda_nvcc.dev # crt/host_config.h
cuda_cudart cuda_cudart
] ]
++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [ ++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [
cuda_cccl.dev # <nv/target> cuda_cccl.dev # <nv/target>
] ]
++ lib.optionals mpiSupport [mpi]; ++ lib.optionals mpiSupport [ mpi ];
makeFlags = makeFlags =
["NCCL_HOME=${nccl}"] [ "NCCL_HOME=${nccl}" ]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") ["CUDA_HOME=${cudatoolkit}"] ++ lib.optionals (lib.versionOlder cudaVersion "11.4") [ "CUDA_HOME=${cudatoolkit}" ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") ["CUDA_HOME=${cuda_nvcc}"] ++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [ "CUDA_HOME=${cuda_nvcc}" ]
++ lib.optionals mpiSupport ["MPI=1"]; ++ lib.optionals mpiSupport [ "MPI=1" ];
enableParallelBuilding = true; enableParallelBuilding = true;
installPhase = '' installPhase = ''
mkdir -p $out/bin mkdir -p $out/bin
cp -r build/* $out/bin/ cp -r build/* $out/bin/
''; '';
passthru.updateScript = gitUpdater { passthru.updateScript = gitUpdater {
inherit (finalAttrs) pname version; inherit (finalAttrs) pname version;
rev-prefix = "v"; rev-prefix = "v";
}; };
meta = with lib; { meta = with lib; {
description = "Tests to check both the performance and the correctness of NVIDIA NCCL operations"; description = "Tests to check both the performance and the correctness of NVIDIA NCCL operations";
homepage = "https://github.com/NVIDIA/nccl-tests"; homepage = "https://github.com/NVIDIA/nccl-tests";
platforms = platforms.linux; platforms = platforms.linux;
license = licenses.bsd3; license = licenses.bsd3;
broken = !config.cudaSupport || (mpiSupport && mpi == null); broken = !config.cudaSupport || (mpiSupport && mpi == null);
maintainers = with maintainers; [jmillerpdt] ++ teams.cuda.members; maintainers = with maintainers; [ jmillerpdt ] ++ teams.cuda.members;
}; };
} })
)

View File

@@ -22,94 +22,92 @@ let
cudaVersion cudaVersion
; ;
in in
backendStdenv.mkDerivation ( backendStdenv.mkDerivation (finalAttrs: {
finalAttrs: { pname = "nccl";
pname = "nccl"; version = "2.20.5-1";
version = "2.20.5-1";
src = fetchFromGitHub { src = fetchFromGitHub {
owner = "NVIDIA"; owner = "NVIDIA";
repo = finalAttrs.pname; repo = finalAttrs.pname;
rev = "v${finalAttrs.version}"; rev = "v${finalAttrs.version}";
hash = "sha256-ModIjD6RaRD/57a/PA1oTgYhZsAQPrrvhl5sNVXnO6c="; hash = "sha256-ModIjD6RaRD/57a/PA1oTgYhZsAQPrrvhl5sNVXnO6c=";
}; };
strictDeps = true; strictDeps = true;
outputs = [ outputs = [
"out" "out"
"dev" "dev"
];
nativeBuildInputs =
[
which
autoAddDriverRunpath
python3
]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [ cudatoolkit ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [ cuda_nvcc ];
buildInputs =
lib.optionals (lib.versionOlder cudaVersion "11.4") [ cudatoolkit ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
cuda_nvcc.dev # crt/host_config.h
cuda_cudart
]
# NOTE: CUDA versions in Nixpkgs only use a major and minor version. When we do comparisons
# against other version, like below, it's important that we use the same format. Otherwise,
# we'll get incorrect results.
# For example, lib.versionAtLeast "12.0" "12.0.0" == false.
++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [ cuda_cccl ];
env.NIX_CFLAGS_COMPILE = toString [ "-Wno-unused-function" ];
preConfigure = ''
patchShebangs ./src/device/generate.py
makeFlagsArray+=(
"NVCC_GENCODE=${lib.concatStringsSep " " cudaFlags.gencode}"
)
'';
makeFlags =
[ "PREFIX=$(out)" ]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [
"CUDA_HOME=${cudatoolkit}"
"CUDA_LIB=${lib.getLib cudatoolkit}/lib"
"CUDA_INC=${lib.getDev cudatoolkit}/include"
]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
"CUDA_HOME=${cuda_nvcc}"
"CUDA_LIB=${lib.getLib cuda_cudart}/lib"
"CUDA_INC=${lib.getDev cuda_cudart}/include"
]; ];
nativeBuildInputs = enableParallelBuilding = true;
postFixup = ''
moveToOutput lib/libnccl_static.a $dev
'';
passthru.updateScript = gitUpdater {
inherit (finalAttrs) pname version;
rev-prefix = "v";
};
meta = with lib; {
description = "Multi-GPU and multi-node collective communication primitives for NVIDIA GPUs";
homepage = "https://developer.nvidia.com/nccl";
license = licenses.bsd3;
platforms = platforms.linux;
# NCCL is not supported on Jetson, because it does not use NVLink or PCI-e for inter-GPU communication.
# https://forums.developer.nvidia.com/t/can-jetson-orin-support-nccl/232845/9
badPlatforms = lib.optionals cudaFlags.isJetsonBuild [ "aarch64-linux" ];
maintainers =
with maintainers;
[ [
which mdaiter
autoAddDriverRunpath orivej
python3
] ]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit] ++ teams.cuda.members;
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [cuda_nvcc]; };
})
buildInputs =
lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
cuda_nvcc.dev # crt/host_config.h
cuda_cudart
]
# NOTE: CUDA versions in Nixpkgs only use a major and minor version. When we do comparisons
# against other version, like below, it's important that we use the same format. Otherwise,
# we'll get incorrect results.
# For example, lib.versionAtLeast "12.0" "12.0.0" == false.
++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [cuda_cccl];
env.NIX_CFLAGS_COMPILE = toString ["-Wno-unused-function"];
preConfigure = ''
patchShebangs ./src/device/generate.py
makeFlagsArray+=(
"NVCC_GENCODE=${lib.concatStringsSep " " cudaFlags.gencode}"
)
'';
makeFlags =
["PREFIX=$(out)"]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [
"CUDA_HOME=${cudatoolkit}"
"CUDA_LIB=${lib.getLib cudatoolkit}/lib"
"CUDA_INC=${lib.getDev cudatoolkit}/include"
]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
"CUDA_HOME=${cuda_nvcc}"
"CUDA_LIB=${lib.getLib cuda_cudart}/lib"
"CUDA_INC=${lib.getDev cuda_cudart}/include"
];
enableParallelBuilding = true;
postFixup = ''
moveToOutput lib/libnccl_static.a $dev
'';
passthru.updateScript = gitUpdater {
inherit (finalAttrs) pname version;
rev-prefix = "v";
};
meta = with lib; {
description = "Multi-GPU and multi-node collective communication primitives for NVIDIA GPUs";
homepage = "https://developer.nvidia.com/nccl";
license = licenses.bsd3;
platforms = platforms.linux;
# NCCL is not supported on Jetson, because it does not use NVLink or PCI-e for inter-GPU communication.
# https://forums.developer.nvidia.com/t/can-jetson-orin-support-nccl/232845/9
badPlatforms = lib.optionals cudaFlags.isJetsonBuild [ "aarch64-linux" ];
maintainers =
with maintainers;
[
mdaiter
orivej
]
++ teams.cuda.members;
};
}
)

View File

@@ -31,18 +31,18 @@ backendStdenv.mkDerivation {
cmake cmake
autoAddDriverRunpath autoAddDriverRunpath
] ]
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit] ++ lib.optionals (lib.versionOlder cudaVersion "11.4") [ cudatoolkit ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [cuda_nvcc]; ++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [ cuda_nvcc ];
buildInputs = buildInputs =
lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit] lib.optionals (lib.versionOlder cudaVersion "11.4") [ cudatoolkit ]
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [ ++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
(getDev libcublas) (getDev libcublas)
(getLib libcublas) (getLib libcublas)
(getOutput "static" libcublas) (getOutput "static" libcublas)
cuda_cudart cuda_cudart
] ]
++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [cuda_cccl]; ++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [ cuda_cccl ];
cmakeFlags = [ cmakeFlags = [
(lib.cmakeBool "CMAKE_VERBOSE_MAKEFILE" true) (lib.cmakeBool "CMAKE_VERBOSE_MAKEFILE" true)

View File

@@ -2,63 +2,50 @@ final: _: {
# Helper hook used in both autoAddCudaCompatRunpath and # Helper hook used in both autoAddCudaCompatRunpath and
# autoAddDriverRunpath that applies a generic patching action to all elf # autoAddDriverRunpath that applies a generic patching action to all elf
# files with a dynamic linking section. # files with a dynamic linking section.
autoFixElfFiles = autoFixElfFiles = final.callPackage (
final.callPackage { makeSetupHook }: makeSetupHook { name = "auto-fix-elf-files"; } ./auto-fix-elf-files.sh
( ) { };
{makeSetupHook}:
makeSetupHook
{
name = "auto-fix-elf-files";
}
./auto-fix-elf-files.sh
)
{};
# Internal hook, used by cudatoolkit and cuda redist packages # Internal hook, used by cudatoolkit and cuda redist packages
# to accommodate automatic CUDAToolkit_ROOT construction # to accommodate automatic CUDAToolkit_ROOT construction
markForCudatoolkitRootHook = markForCudatoolkitRootHook = final.callPackage (
final.callPackage { makeSetupHook }:
( makeSetupHook { name = "mark-for-cudatoolkit-root-hook"; } ./mark-for-cudatoolkit-root-hook.sh
{makeSetupHook}: ) { };
makeSetupHook {name = "mark-for-cudatoolkit-root-hook";} ./mark-for-cudatoolkit-root-hook.sh
)
{};
# Currently propagated by cuda_nvcc or cudatoolkit, rather than used directly # Currently propagated by cuda_nvcc or cudatoolkit, rather than used directly
setupCudaHook = setupCudaHook = (
(final.callPackage final.callPackage (
( { makeSetupHook, backendStdenv }:
{makeSetupHook, backendStdenv}: makeSetupHook {
makeSetupHook name = "setup-cuda-hook";
{
name = "setup-cuda-hook";
substitutions.setupCudaHook = placeholder "out"; substitutions.setupCudaHook = placeholder "out";
# Point NVCC at a compatible compiler # Point NVCC at a compatible compiler
substitutions.ccRoot = "${backendStdenv.cc}"; substitutions.ccRoot = "${backendStdenv.cc}";
# Required in addition to ccRoot as otherwise bin/gcc is looked up # Required in addition to ccRoot as otherwise bin/gcc is looked up
# when building CMakeCUDACompilerId.cu # when building CMakeCUDACompilerId.cu
substitutions.ccFullPath = "${backendStdenv.cc}/bin/${backendStdenv.cc.targetPrefix}c++"; substitutions.ccFullPath = "${backendStdenv.cc}/bin/${backendStdenv.cc.targetPrefix}c++";
} } ./setup-cuda-hook.sh
./setup-cuda-hook.sh ) { }
) );
{}
);
autoAddDriverRunpath = autoAddDriverRunpath = final.callPackage (
final.callPackage {
( addDriverRunpath,
{addDriverRunpath, autoFixElfFiles, makeSetupHook}: autoFixElfFiles,
makeSetupHook makeSetupHook,
{ }:
name = "auto-add-opengl-runpath-hook"; makeSetupHook {
propagatedBuildInputs = [addDriverRunpath autoFixElfFiles]; name = "auto-add-opengl-runpath-hook";
} propagatedBuildInputs = [
./auto-add-driver-runpath-hook.sh addDriverRunpath
) autoFixElfFiles
{}; ];
} ./auto-add-driver-runpath-hook.sh
) { };
# Deprecated: an alias kept for compatibility. Consider removing after 24.11 # Deprecated: an alias kept for compatibility. Consider removing after 24.11
autoAddOpenGLRunpathHook = final.autoAddDriverRunpath; autoAddOpenGLRunpathHook = final.autoAddDriverRunpath;
@@ -68,27 +55,26 @@ final: _: {
# patched elf files, but `cuda_compat` path must take precedence (otherwise, # patched elf files, but `cuda_compat` path must take precedence (otherwise,
# it doesn't have any effect) and thus appear first. Meaning this hook must be # it doesn't have any effect) and thus appear first. Meaning this hook must be
# executed last. # executed last.
autoAddCudaCompatRunpath = autoAddCudaCompatRunpath = final.callPackage (
final.callPackage {
( makeSetupHook,
{makeSetupHook, autoFixElfFiles, cuda_compat ? null }: autoFixElfFiles,
makeSetupHook cuda_compat ? null,
{ }:
name = "auto-add-cuda-compat-runpath-hook"; makeSetupHook {
propagatedBuildInputs = [autoFixElfFiles]; name = "auto-add-cuda-compat-runpath-hook";
propagatedBuildInputs = [ autoFixElfFiles ];
substitutions = { substitutions = {
# Hotfix Ofborg evaluation # Hotfix Ofborg evaluation
libcudaPath = if final.flags.isJetsonBuild then "${cuda_compat}/compat" else null; libcudaPath = if final.flags.isJetsonBuild then "${cuda_compat}/compat" else null;
}; };
meta.broken = !final.flags.isJetsonBuild; meta.broken = !final.flags.isJetsonBuild;
# Pre-cuda_compat CUDA release: # Pre-cuda_compat CUDA release:
meta.badPlatforms = final.lib.optionals (cuda_compat == null) final.lib.platforms.all; meta.badPlatforms = final.lib.optionals (cuda_compat == null) final.lib.platforms.all;
meta.platforms = cuda_compat.meta.platforms or [ ]; meta.platforms = cuda_compat.meta.platforms or [ ];
} } ./auto-add-cuda-compat-runpath.sh
./auto-add-cuda-compat-runpath.sh ) { };
)
{};
} }

View File

@@ -108,6 +108,6 @@ finalAttrs: prevAttrs: {
prevAttrs.meta.badPlatforms or [ ] prevAttrs.meta.badPlatforms or [ ]
++ lib.optionals (targetArch == "unsupported") [ hostPlatform.system ]; ++ lib.optionals (targetArch == "unsupported") [ hostPlatform.system ];
homepage = "https://developer.nvidia.com/tensorrt"; homepage = "https://developer.nvidia.com/tensorrt";
maintainers = prevAttrs.meta.maintainers ++ [maintainers.aidalgol]; maintainers = prevAttrs.meta.maintainers ++ [ maintainers.aidalgol ];
}; };
} }

View File

@@ -3,9 +3,9 @@
{ {
tensorrt.releases = { tensorrt.releases = {
# jetson # jetson
linux-aarch64 = []; linux-aarch64 = [ ];
# powerpc # powerpc
linux-ppc64le = []; linux-ppc64le = [ ];
# server-grade arm # server-grade arm
linux-sbsa = [ linux-sbsa = [
{ {

View File

@@ -40,78 +40,75 @@ let
# Backbone # Backbone
gpus = builtins.import ../development/cuda-modules/gpus.nix; gpus = builtins.import ../development/cuda-modules/gpus.nix;
nvccCompatibilities = builtins.import ../development/cuda-modules/nvcc-compatibilities.nix; nvccCompatibilities = builtins.import ../development/cuda-modules/nvcc-compatibilities.nix;
flags = callPackage ../development/cuda-modules/flags.nix {inherit cudaVersion gpus;}; flags = callPackage ../development/cuda-modules/flags.nix { inherit cudaVersion gpus; };
passthruFunction = passthruFunction = final: ({
final: inherit cudaVersion lib pkgs;
( inherit gpus nvccCompatibilities flags;
{ cudaMajorVersion = versions.major cudaVersion;
inherit cudaVersion lib pkgs; cudaMajorMinorVersion = versions.majorMinor cudaVersion;
inherit gpus nvccCompatibilities flags; cudaOlder = strings.versionOlder cudaVersion;
cudaMajorVersion = versions.major cudaVersion; cudaAtLeast = strings.versionAtLeast cudaVersion;
cudaMajorMinorVersion = versions.majorMinor cudaVersion;
cudaOlder = strings.versionOlder cudaVersion;
cudaAtLeast = strings.versionAtLeast cudaVersion;
# Maintain a reference to the final cudaPackages. # Maintain a reference to the final cudaPackages.
# Without this, if we use `final.callPackage` and a package accepts `cudaPackages` as an argument, # Without this, if we use `final.callPackage` and a package accepts `cudaPackages` as an argument,
# it's provided with `cudaPackages` from the top-level scope, which is not what we want. We want to # it's provided with `cudaPackages` from the top-level scope, which is not what we want. We want to
# provide the `cudaPackages` from the final scope -- that is, the *current* scope. # provide the `cudaPackages` from the final scope -- that is, the *current* scope.
cudaPackages = final; cudaPackages = final;
# TODO(@connorbaker): `cudaFlags` is an alias for `flags` which should be removed in the future. # TODO(@connorbaker): `cudaFlags` is an alias for `flags` which should be removed in the future.
cudaFlags = flags; cudaFlags = flags;
# Exposed as cudaPackages.backendStdenv. # Exposed as cudaPackages.backendStdenv.
# This is what nvcc uses as a backend, # This is what nvcc uses as a backend,
# and it has to be an officially supported one (e.g. gcc11 for cuda11). # and it has to be an officially supported one (e.g. gcc11 for cuda11).
# #
# It, however, propagates current stdenv's libstdc++ to avoid "GLIBCXX_* not found errors" # It, however, propagates current stdenv's libstdc++ to avoid "GLIBCXX_* not found errors"
# when linked with other C++ libraries. # when linked with other C++ libraries.
# E.g. for cudaPackages_11_8 we use gcc11 with gcc12's libstdc++ # E.g. for cudaPackages_11_8 we use gcc11 with gcc12's libstdc++
# Cf. https://github.com/NixOS/nixpkgs/pull/218265 for context # Cf. https://github.com/NixOS/nixpkgs/pull/218265 for context
backendStdenv = final.callPackage ../development/cuda-modules/backend-stdenv.nix {}; backendStdenv = final.callPackage ../development/cuda-modules/backend-stdenv.nix { };
# Loose packages # Loose packages
cudatoolkit = final.callPackage ../development/cuda-modules/cudatoolkit {}; cudatoolkit = final.callPackage ../development/cuda-modules/cudatoolkit { };
saxpy = final.callPackage ../development/cuda-modules/saxpy {}; saxpy = final.callPackage ../development/cuda-modules/saxpy { };
nccl = final.callPackage ../development/cuda-modules/nccl {}; nccl = final.callPackage ../development/cuda-modules/nccl { };
nccl-tests = final.callPackage ../development/cuda-modules/nccl-tests {}; nccl-tests = final.callPackage ../development/cuda-modules/nccl-tests { };
} });
);
mkVersionedPackageName = mkVersionedPackageName =
name: version: name: version:
strings.concatStringsSep "_" [ strings.concatStringsSep "_" [
name name
(strings.replaceStrings ["."] ["_"] (versions.majorMinor version)) (strings.replaceStrings [ "." ] [ "_" ] (versions.majorMinor version))
]; ];
composedExtension = fixedPoints.composeManyExtensions ([ composedExtension = fixedPoints.composeManyExtensions (
(import ../development/cuda-modules/setup-hooks/extension.nix) [
(callPackage ../development/cuda-modules/cuda/extension.nix {inherit cudaVersion;}) (import ../development/cuda-modules/setup-hooks/extension.nix)
(callPackage ../development/cuda-modules/cuda/overrides.nix {inherit cudaVersion;}) (callPackage ../development/cuda-modules/cuda/extension.nix { inherit cudaVersion; })
(callPackage ../development/cuda-modules/generic-builders/multiplex.nix { (callPackage ../development/cuda-modules/cuda/overrides.nix { inherit cudaVersion; })
inherit cudaVersion flags mkVersionedPackageName; (callPackage ../development/cuda-modules/generic-builders/multiplex.nix {
pname = "cudnn"; inherit cudaVersion flags mkVersionedPackageName;
releasesModule = ../development/cuda-modules/cudnn/releases.nix; pname = "cudnn";
shimsFn = ../development/cuda-modules/cudnn/shims.nix; releasesModule = ../development/cuda-modules/cudnn/releases.nix;
fixupFn = ../development/cuda-modules/cudnn/fixup.nix; shimsFn = ../development/cuda-modules/cudnn/shims.nix;
}) fixupFn = ../development/cuda-modules/cudnn/fixup.nix;
(callPackage ../development/cuda-modules/cutensor/extension.nix { })
inherit cudaVersion flags mkVersionedPackageName; (callPackage ../development/cuda-modules/cutensor/extension.nix {
}) inherit cudaVersion flags mkVersionedPackageName;
(callPackage ../development/cuda-modules/generic-builders/multiplex.nix { })
inherit cudaVersion flags mkVersionedPackageName; (callPackage ../development/cuda-modules/generic-builders/multiplex.nix {
pname = "tensorrt"; inherit cudaVersion flags mkVersionedPackageName;
releasesModule = ../development/cuda-modules/tensorrt/releases.nix; pname = "tensorrt";
shimsFn = ../development/cuda-modules/tensorrt/shims.nix; releasesModule = ../development/cuda-modules/tensorrt/releases.nix;
fixupFn = ../development/cuda-modules/tensorrt/fixup.nix; shimsFn = ../development/cuda-modules/tensorrt/shims.nix;
}) fixupFn = ../development/cuda-modules/tensorrt/fixup.nix;
(callPackage ../development/cuda-modules/cuda-samples/extension.nix {inherit cudaVersion;}) })
(callPackage ../development/cuda-modules/cuda-library-samples/extension.nix {}) (callPackage ../development/cuda-modules/cuda-samples/extension.nix { inherit cudaVersion; })
] ++ lib.optionals config.allowAliases [ (callPackage ../development/cuda-modules/cuda-library-samples/extension.nix { })
(import ../development/cuda-modules/aliases.nix) ]
]); ++ lib.optionals config.allowAliases [ (import ../development/cuda-modules/aliases.nix) ]
);
cudaPackages = customisation.makeScope newScope ( cudaPackages = customisation.makeScope newScope (
fixedPoints.extends composedExtension passthruFunction fixedPoints.extends composedExtension passthruFunction