Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -10,6 +10,8 @@
- ensure the toolkit exits if NRI Plugin init fails
- feat(nvcdi): Allow IPC sockets to not be discovered
- fix(cudacompat): Fix handling of CUDA compat on Orin
- Update systemd unit conditions to execute nvidia-smi
- Reintroduce restart logic to nvidia-cdi-refresh.service

## v1.19.0
- Promote v1.19.0-rc.7 to v1.19.0
Expand Down
8 changes: 8 additions & 0 deletions deployments/systemd/nvidia-cdi-refresh.service
Original file line number Diff line number Diff line change
Expand Up @@ -18,15 +18,23 @@ ConditionPathExists=|/usr/bin/nvidia-smi
ConditionPathExists=|/usr/sbin/nvidia-smi
ConditionPathExists=|/usr/lib/wsl/lib/nvidia-smi
ConditionPathExists=/usr/bin/nvidia-ctk
# Limit the number of successive restarts to 5 in 10 seconds.
StartLimitBurst=5
StartLimitIntervalSec=10s

# Service section: run `nvidia-ctk cdi generate` once, guarded by checks that
# an NVIDIA driver and a working nvidia-smi are present.
[Service]
Type=oneshot
# Values from Environment will be replaced if defined in EnvironmentFile.
# The leading "-" on the EnvironmentFile path means a missing file is ignored
# rather than treated as an error.
Environment=NVIDIA_CTK_CDI_OUTPUT_FILE_PATH=/var/run/cdi/nvidia.yaml
EnvironmentFile=-/etc/nvidia-container-toolkit/nvidia-cdi-refresh.env
# ExecCondition commands run in order before ExecStart. Per systemd.service(5),
# an exit status of 1-254 skips the remaining commands without marking the
# unit as failed; 255 or an abnormal exit marks the unit as failed.
#
# Condition 1: modules.dep for the running kernel release (%v) lists an
# nvidia.ko or nvidia-current.ko module, or the /dev/dxg device node exists.
ExecCondition=/bin/sh -c '/usr/bin/grep -qE "/(nvidia|nvidia-current)[.]ko" /lib/modules/%v/modules.dep || [ -e /dev/dxg ]'
# Condition 2: `nvidia-smi -L` succeeds from at least one of the three
# candidate install locations.
ExecCondition=/bin/sh -c '/usr/bin/nvidia-smi -L || /usr/sbin/nvidia-smi -L || /usr/lib/wsl/lib/nvidia-smi -L'
ExecStart=/usr/bin/nvidia-ctk cdi generate
# Restrict the capability bounding set to the three capabilities listed here.
CapabilityBoundingSet=CAP_SYS_MODULE CAP_SYS_ADMIN CAP_MKNOD
# We set the service to restart on failure to ensure that a CDI spec is
# eventually generated. Each retry is delayed by RestartSec; the number of
# successive restarts is bounded by StartLimitBurst / StartLimitIntervalSec
# in the [Unit] section.
Restart=on-failure
RestartSec=1s

# Install section: when the unit is enabled, it is pulled in as a "wants"
# dependency of multi-user.target.
[Install]
WantedBy=multi-user.target
Loading