63746cac08
This PR refactor CUDA setup hooks, and in particular autoAddOpenGLRunpath and autoAddCudaCompatRunpathHook, that were using a lot of code in common (in fact, I introduced the latter by copy pasting most of the bash script of the former). This is not satisfying for maintenance, as a recent patch showed, because we need to duplicate changes to both hooks. This commit abstract the common part in a single shell script that applies a generic patch action to every elf file in the output. For autoAddOpenGLRunpath the action is just addOpenGLRunpath (now addDriverRunpath), and is few line function for autoAddCudaCompatRunpathHook. Doing so, we also takes the occasion to use the newer addDriverRunpath instead of the previous addOpenGLRunpath, and rename the CUDA hook to reflect that as well. Co-Authored-By: Connor Baker <connor.baker@tweag.io>
62 lines
1.4 KiB
Nix
62 lines
1.4 KiB
Nix
{
|
|
cmake,
|
|
cudaPackages,
|
|
lib,
|
|
}:
|
|
let
|
|
inherit (cudaPackages)
|
|
autoAddDriverRunpath
|
|
backendStdenv
|
|
cuda_cccl
|
|
cuda_cudart
|
|
cuda_nvcc
|
|
cudatoolkit
|
|
cudaVersion
|
|
flags
|
|
libcublas
|
|
setupCudaHook
|
|
;
|
|
inherit (lib) getDev getLib getOutput;
|
|
in
|
|
backendStdenv.mkDerivation {
|
|
pname = "saxpy";
|
|
version = "unstable-2023-07-11";
|
|
|
|
src = ./.;
|
|
|
|
strictDeps = true;
|
|
|
|
nativeBuildInputs =
|
|
[
|
|
cmake
|
|
autoAddDriverRunpath
|
|
]
|
|
++ lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit]
|
|
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [cuda_nvcc];
|
|
|
|
buildInputs =
|
|
lib.optionals (lib.versionOlder cudaVersion "11.4") [cudatoolkit]
|
|
++ lib.optionals (lib.versionAtLeast cudaVersion "11.4") [
|
|
(getDev libcublas)
|
|
(getLib libcublas)
|
|
(getOutput "static" libcublas)
|
|
cuda_cudart
|
|
]
|
|
++ lib.optionals (lib.versionAtLeast cudaVersion "12.0") [cuda_cccl];
|
|
|
|
cmakeFlags = [
|
|
(lib.cmakeBool "CMAKE_VERBOSE_MAKEFILE" true)
|
|
(lib.cmakeFeature "CMAKE_CUDA_ARCHITECTURES" (
|
|
with flags; lib.concatStringsSep ";" (lib.lists.map dropDot cudaCapabilities)
|
|
))
|
|
];
|
|
|
|
meta = rec {
|
|
description = "A simple (Single-precision AX Plus Y) FindCUDAToolkit.cmake example for testing cross-compilation";
|
|
license = lib.licenses.mit;
|
|
maintainers = lib.teams.cuda.members;
|
|
platforms = lib.platforms.unix;
|
|
badPlatforms = lib.optionals flags.isJetsonBuild platforms;
|
|
};
|
|
}
|