2024-08-22 19:51:54 +02:00
|
|
|
{ pkgs, lib, ... }:
|
|
|
|
let
|
|
|
|
# Shell script, installed as `test-cdi`, that is used as the container's command.
# It walks a fixed set of directories and, for every regular file that `file`
# identifies as ELF, runs `ldd` and fails if any dependency is reported as
# "not found".
testCDIScript = pkgs.writeShellScriptBin "test-cdi" ''
  # Print the given message and terminate the script with a failing status.
  die() {
    echo "$1"
    exit 1
  }

  # Returns 1 when ldd reports at least one unresolved dependency for $1,
  # 0 otherwise.
  check_file_referential_integrity() {
    echo "checking $1 referential integrity"
    if ${pkgs.glibc.bin}/bin/ldd "$1" | ${lib.getExe pkgs.gnugrep} "not found" &> /dev/null; then
      return 1
    fi
    return 0
  }

  # Checks every ELF file below directory $1. The loop runs on the right-hand
  # side of a pipe, so "exit 1" leaves only that subshell; its status becomes
  # the status of the pipeline and therefore of this function.
  check_directory_referential_integrity() {
    # IFS= and -r keep file names with surrounding whitespace or backslashes
    # intact; entries are NUL-delimited to match find's -print0.
    ${lib.getExe pkgs.findutils} "$1" -type f -print0 | while IFS= read -r -d $'\0' file; do
      # --brief omits the file name from the output, so a path that happens
      # to contain "ELF" is not mistaken for an ELF binary.
      if ${lib.getExe pkgs.file} --brief "$file" | ${lib.getExe pkgs.gnugrep} ELF &> /dev/null; then
        check_file_referential_integrity "$file" || exit 1
      else
        echo "skipping $file: not an ELF file"
      fi
    done
  }

  for dir in "/usr/bin" "${pkgs.addDriverRunpath.driverLink}" "/usr/local/nvidia"; do
    check_directory_referential_integrity "$dir" || die "referential integrity check failed in $dir"
  done
'';
|
|
|
|
# Container image `cdi-test:latest` whose command is the `test-cdi` script.
# NOTE(review): usrBinEnv and binSh presumably provide /usr/bin/env and /bin/sh
# inside the image — confirm against the dockerTools documentation.
testContainerImage = pkgs.dockerTools.buildImage {
  name = "cdi-test";
  tag = "latest";
  config.Cmd = [ (lib.getExe testCDIScript) ];
  copyToRoot = [
    pkgs.dockerTools.usrBinEnv
    pkgs.dockerTools.binSh
  ];
};
|
|
|
|
# Canned CDI specification (JSON text) for kind "nvidia.com/gpu". It declares a
# single device named "all" whose only device node is /dev/urandom, with no
# hooks and no mounts, plus empty top-level container edits.
emptyCDISpec = ''
  {
    "cdiVersion": "0.5.0",
    "kind": "nvidia.com/gpu",
    "devices": [
      {
        "name": "all",
        "containerEdits": {
          "deviceNodes": [
            {
              "path": "/dev/urandom"
            }
          ],
          "hooks": [],
          "mounts": []
        }
      }
    ],
    "containerEdits": {
      "deviceNodes": [],
      "hooks": [],
      "mounts": []
    }
  }
'';
|
|
|
|
# Settings assigned to `hardware.nvidia-container-toolkit` on the test nodes.
# The package is a stand-in for the real toolkit: its `nvidia-ctk` executable
# ignores its arguments and just prints the canned CDI spec.
nvidia-container-toolkit = {
  enable = true;
  package = pkgs.stdenv.mkDerivation {
    pname = "nvidia-ctk-dummy";
    version = "1.0.0";
    dontUnpack = true;
    dontBuild = true;

    # The spec is handed to the builder as a file; installPhase reads it
    # through $emptyCDISpecPath.
    inherit emptyCDISpec;
    passAsFile = [ "emptyCDISpec" ];

    # The heredoc delimiter is unquoted on purpose: $out is expanded at build
    # time, so the generated script contains the absolute path of spec.json.
    # (A former `echo -n "$emptyCDISpec" > "$out/bin/nvidia-ctk"` was dropped:
    # the heredoc truncates the same file immediately afterwards.)
    installPhase = ''
      mkdir -p "$out/bin" "$out/share/nvidia-container-toolkit"
      cp "$emptyCDISpecPath" "$out/share/nvidia-container-toolkit/spec.json"
      cat << EOF > "$out/bin/nvidia-ctk"
      #!${pkgs.runtimeShell}
      cat "$out/share/nvidia-container-toolkit/spec.json"
      EOF
      chmod +x "$out/bin/nvidia-ctk"
    '';
    meta.mainProgram = "nvidia-ctk";
  };
};
|
|
|
|
in
|
|
|
|
{
|
|
|
|
# Test name and maintainer metadata.
name = "nvidia-container-toolkit";
meta.maintainers = [ lib.maintainers.ereslibre ];
|
|
|
|
# Configuration shared by all nodes: jq is installed, container support and
# graphics are enabled by default (overridable per node via mkDefault), and the
# dummy nvidia-container-toolkit settings are applied together with the open
# NVIDIA driver package of the configured kernel.
defaults =
  { config, ... }:
  {
    environment.systemPackages = [ pkgs.jq ];

    virtualisation = {
      diskSize = lib.mkDefault 10240;
      containers.enable = lib.mkDefault true;
    };

    hardware.nvidia-container-toolkit = nvidia-container-toolkit;
    hardware.nvidia.open = true;
    hardware.nvidia.package = config.boot.kernelPackages.nvidiaPackages.stable.open;
    hardware.graphics.enable = lib.mkDefault true;
  };
|
2024-08-22 19:51:54 +02:00
|
|
|
# The three test machines.
nodes = {
  # Containers and graphics are both switched off on this node.
  no-gpus = {
    virtualisation.containers.enable = false;
    hardware.graphics.enable = false;
  };

  # Graphics enabled and podman installed, so the test image can be run.
  one-gpu =
    { pkgs, ... }:
    {
      environment.systemPackages = [ pkgs.podman ];
      hardware.graphics.enable = true;
    };

  # Requests a mount whose host path is not expected to exist.
  one-gpu-invalid-host-paths = {
    hardware.nvidia-container-toolkit.mounts = [
      {
        hostPath = "/non-existant-path";
        containerPath = "/some/path";
      }
    ];
  };
};
|
|
|
|
# Python test script. On every node it waits for the CDI generator unit and
# checks the generated spec; on `one_gpu` it additionally loads the test image
# and runs it with the "nvidia.com/gpu=all" CDI device.
testScript = ''
  start_all()

  with subtest("Generate an empty CDI spec for a machine with no Nvidia GPUs"):
      no_gpus.wait_for_unit("nvidia-container-toolkit-cdi-generator.service")
      no_gpus.succeed("jq . /var/run/cdi/nvidia-container-toolkit.json")

  with subtest("Podman loads the generated CDI spec for a machine with an Nvidia GPU"):
      one_gpu.wait_for_unit("nvidia-container-toolkit-cdi-generator.service")
      one_gpu.succeed("jq . /var/run/cdi/nvidia-container-toolkit.json")
      one_gpu.succeed("podman load < ${testContainerImage}")
      print(one_gpu.succeed("podman run --pull=never --device=nvidia.com/gpu=all -v /run/opengl-driver:/run/opengl-driver:ro cdi-test:latest"))

  # Issue: https://github.com/NixOS/nixpkgs/issues/319201
  with subtest("The generated CDI spec skips specified non-existant paths in the host"):
      one_gpu_invalid_host_paths.wait_for_unit("nvidia-container-toolkit-cdi-generator.service")
      # Make sure the spec exists and parses first: grep also exits non-zero
      # when the file is missing, which would let fail() pass vacuously.
      one_gpu_invalid_host_paths.succeed("jq . /var/run/cdi/nvidia-container-toolkit.json")
      one_gpu_invalid_host_paths.fail("grep 'non-existant-path' /var/run/cdi/nvidia-container-toolkit.json")
'';
|
|
|
|
}
|