Hi,
I am working on a custom system that uses an AGX Orin 64GB SOM, with custom software based on Yocto Kirkstone.
I think I have a problem with nvidia-container-runtime; for example, `nvidia-container-cli info` doesn’t print the GPU information:
root@ubuntu:~# nvidia-container-cli info
libnvrm_gpu.so: NvRmGpuLibOpen failed, error=4
nvidia-container-cli: initialization error: cuda error: unknown error
Docker runtime configuration:
root@change-me:~# cat /etc/docker/daemon.json
{
"bip": "240.10.0.1/24",
"fixed-cidr": "240.10.0.0/24" ,
"runtimes": {
"nvidia": {
"path": "/usr/bin/nvidia-container-runtime",
"runtimeArgs": []
}},
"default-runtime": "nvidia"
}
I have checked if the drivers are loaded:
root@ubuntu:~# lsmod | grep nvgpu
nvgpu 2662400 0
nvmap 229376 2 nvgpu
I have checked whether the GPU device nodes exist:
root@ubuntu:~# ls -l /dev/nv*
crw-rw---- 1 root video 506, 0 Apr 28 2022 /dev/nvhost-ctrl
crw-rw---- 1 root video 506, 58 Apr 28 2022 /dev/nvhost-ctrl-isp
crw-rw---- 1 root video 506, 22 Apr 28 2022 /dev/nvhost-ctrl-nvdec
crw-rw---- 1 root video 506, 50 Apr 28 2022 /dev/nvhost-ctrl-nvdla0
crw-rw---- 1 root video 506, 54 Apr 28 2022 /dev/nvhost-ctrl-nvdla1
crw-rw---- 1 root video 506, 46 Apr 28 2022 /dev/nvhost-ctrl-pva0
crw-rw---- 1 root video 506, 57 Apr 28 2022 /dev/nvhost-isp
crw-rw---- 1 root video 506, 41 Apr 28 2022 /dev/nvhost-isp-thi
crw-rw---- 1 root video 506, 13 Apr 28 2022 /dev/nvhost-msenc
crw-rw---- 1 root video 506, 29 Apr 28 2022 /dev/nvhost-nvcsi
crw-rw---- 1 root video 506, 21 Apr 28 2022 /dev/nvhost-nvdec
crw-rw---- 1 root video 506, 49 Apr 28 2022 /dev/nvhost-nvdla0
crw-rw---- 1 root video 506, 53 Apr 28 2022 /dev/nvhost-nvdla1
crw-rw---- 1 root video 506, 5 Apr 28 2022 /dev/nvhost-nvjpg
crw-rw---- 1 root video 506, 9 Apr 28 2022 /dev/nvhost-nvjpg1
crw-rw---- 1 root video 506, 17 Apr 28 2022 /dev/nvhost-ofa
crw-rw---- 1 root video 505, 0 Apr 28 2022 /dev/nvhost-power-gpu
crw-rw---- 1 root video 506, 45 Apr 28 2022 /dev/nvhost-pva0
crw-rw---- 1 root video 506, 25 Apr 28 2022 /dev/nvhost-tsec
crw-rw---- 1 root video 506, 61 Apr 28 2022 /dev/nvhost-vi0
crw-rw---- 1 root video 506, 33 Apr 28 2022 /dev/nvhost-vi0-thi
crw-rw---- 1 root video 506, 65 Apr 28 2022 /dev/nvhost-vi1
crw-rw---- 1 root video 506, 37 Apr 28 2022 /dev/nvhost-vi1-thi
crw-rw---- 1 root video 506, 1 Apr 28 2022 /dev/nvhost-vic
crw-rw-rw- 1 root root 195, 254 Apr 28 2022 /dev/nvidia-modeset
crw-rw-rw- 1 root root 195, 0 Apr 28 2022 /dev/nvidia0
crw-rw-rw- 1 root root 195, 255 Apr 28 2022 /dev/nvidiactl
crw-rw---- 1 root video 10, 55 Apr 28 2022 /dev/nvmap
crw------- 1 root root 234, 0 Apr 28 2022 /dev/nvme0
brw-rw---- 1 root disk 259, 0 Apr 28 2022 /dev/nvme0n1
crw-rw-rw- 1 root root 235, 0 Apr 28 2022 /dev/nvsciipc
/dev/nvgpu:
total 0
drwxr-xr-x 2 root root 60 Apr 28 2022 igpu0
I have verified that the library exists:
root@change-me:/usr/lib# ls -l /usr/lib/libnvrm_gpu.so
-rw-r--r-- 1 root root 379584 Mar 9 2018 /usr/lib/libnvrm_gpu.so
I am not sure how to track down the root cause of the problem.