nvidia-bug-report.log.gz (1.4 MB)
I don’t have anything in .bashrc or .bash_profile. Root and other users can run the command successfully. I restarted the cuda-driver and nvidia-persistenced services. Is this a permission issue? An strace and the debug log are attached.
strace nvidia-smi
execve("/cm/local/apps/cuda/libs/current/bin/nvidia-smi", ["nvidia-smi"], 0x7fffffffc480 /* 122 vars */) = 0
brk(NULL) = 0x69d000
arch_prctl(0x3001 /* ARCH_??? */, 0x7fffffffc2c0) = -1 EINVAL (Invalid argument)
mmap(NULL, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x155555516000
access("/etc/ld.so.preload", R_OK) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/glibc-hwcaps/x86-64-v3/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/glibc-hwcaps/x86-64-v3", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/glibc-hwcaps/x86-64-v2/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/glibc-hwcaps/x86-64-v2", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/tls", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64", {st_mode=S_IFDIR|0755, st_size=4096, ...}, 0) = 0
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/glibc-hwcaps/x86-64-v3/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/glibc-hwcaps/x86-64-v3", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/glibc-hwcaps/x86-64-v2/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/glibc-hwcaps/x86-64-v2", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/tls", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib", {st_mode=S_IFDIR|0755, st_size=8192, ...}, 0) = 0
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/glibc-hwcaps/x86-64-v3/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/glibc-hwcaps/x86-64-v3", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/glibc-hwcaps/x86-64-v2/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/glibc-hwcaps/x86-64-v2", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/tls", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm", {st_mode=S_IFDIR|0755, st_size=8192, ...}, 0) = 0
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/glibc-hwcaps/x86-64-v3/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/glibc-hwcaps/x86-64-v3", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/glibc-hwcaps/x86-64-v2/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/glibc-hwcaps/x86-64-v2", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/tls", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/x86_64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/x86_64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/x86_64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/x86_64", 0x7fffffffb500, 0) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
newfstatat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64", {st_mode=S_IFDIR|0755, st_size=4096, ...}, 0) = 0
openat(AT_FDCWD, "/etc/ld.so.cache", O_RDONLY|O_CLOEXEC) = 3
newfstatat(3, "", {st_mode=S_IFREG|0644, st_size=58087, ...}, AT_EMPTY_PATH) = 0
mmap(NULL, 58087, PROT_READ, MAP_PRIVATE, 3, 0) = 0x155555507000
close(3) = 0
openat(AT_FDCWD, "/lib64/libpthread.so.0", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0P\20\0\0\0\0\0\0"..., 832) = 832
newfstatat(3, "", {st_mode=S_IFREG|0755, st_size=15960, ...}, AT_EMPTY_PATH) = 0
mmap(NULL, 16392, PROT_READ, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x155555502000
mmap(0x155555503000, 4096, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1000) = 0x155555503000
mmap(0x155555504000, 4096, PROT_READ, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x155555504000
mmap(0x155555505000, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x155555505000
mmap(0x155555506000, 8, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x155555506000
close(3) = 0
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/libm.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/libm.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/libm.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/libm.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib64/libm.so.6", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\3\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220\363\0\0\0\0\0\0"..., 832) = 832
newfstatat(3, "", {st_mode=S_IFREG|0755, st_size=905848, ...}, AT_EMPTY_PATH) = 0
mmap(NULL, 892944, PROT_READ, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x155555427000
mmap(0x155555436000, 458752, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0xf000) = 0x155555436000
mmap(0x1555554a6000, 368640, PROT_READ, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x7f000) = 0x1555554a6000
mmap(0x155555500000, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0xd8000) = 0x155555500000
close(3) = 0
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/libdl.so.2", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/libdl.so.2", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/libdl.so.2", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/libdl.so.2", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib64/libdl.so.2", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0P\20\0\0\0\0\0\0"..., 832) = 832
newfstatat(3, "", {st_mode=S_IFREG|0755, st_size=15936, ...}, AT_EMPTY_PATH) = 0
mmap(NULL, 16392, PROT_READ, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x155555422000
mmap(0x155555423000, 4096, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1000) = 0x155555423000
mmap(0x155555424000, 4096, PROT_READ, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x155555424000
mmap(0x155555425000, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x155555425000
mmap(0x155555426000, 8, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x155555426000
close(3) = 0
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/libc.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/libc.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/libc.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/libc.so.6", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib64/libc.so.6", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\3\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220P\4\0\0\0\0\0"..., 832) = 832
pread64(3, "\6\0\0\0\4\0\0\0@\0\0\0\0\0\0\0@\0\0\0\0\0\0\0@\0\0\0\0\0\0\0"..., 784, 64) = 784
pread64(3, "\4\0\0\0 \0\0\0\5\0\0\0GNU\0\2\0\0\300\4\0\0\0\3\0\0\0\0\0\0\0"..., 48, 848) = 48
pread64(3, "\4\0\0\0\24\0\0\0\3\0\0\0GNU\0y\356%$[\271\321\0350\340\225\347\356&)\252"..., 68, 896) = 68
newfstatat(3, "", {st_mode=S_IFREG|0755, st_size=2389384, ...}, AT_EMPTY_PATH) = 0
pread64(3, "\6\0\0\0\4\0\0\0@\0\0\0\0\0\0\0@\0\0\0\0\0\0\0@\0\0\0\0\0\0\0"..., 784, 64) = 784
mmap(NULL, 2136752, PROT_READ, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x155555218000
mprotect(0x155555244000, 1880064, PROT_NONE) = 0
mmap(0x155555244000, 1531904, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2c000) = 0x155555244000
mmap(0x1555553ba000, 344064, PROT_READ, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1a2000) = 0x1555553ba000
mmap(0x15555540f000, 24576, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1f6000) = 0x15555540f000
mmap(0x155555415000, 51888, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x155555415000
close(3) = 0
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/librt.so.1", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/cuda12.1/toolkit/12.1.1/targets/x86_64-linux/lib/librt.so.1", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/slurm/librt.so.1", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/cm/shared/apps/slurm/current/lib64/librt.so.1", O_RDONLY|O_CLOEXEC) = -1 ENOENT (No such file or directory)
openat(AT_FDCWD, "/lib64/librt.so.1", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0\220\20\0\0\0\0\0\0"..., 832) = 832
newfstatat(3, "", {st_mode=S_IFREG|0755, st_size=16656, ...}, AT_EMPTY_PATH) = 0
mmap(NULL, 16392, PROT_READ, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x155555213000
mmap(0x155555214000, 4096, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x1000) = 0x155555214000
mmap(0x155555215000, 4096, PROT_READ, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x155555215000
mmap(0x155555216000, 4096, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x2000) = 0x155555216000
mmap(0x155555217000, 8, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x155555217000
close(3) = 0
mmap(NULL, 8192, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_ANONYMOUS, -1, 0) = 0x155555211000
arch_prctl(ARCH_SET_FS, 0x155555212300) = 0
set_tid_address(0x1555552125d0) = 299934
set_robust_list(0x1555552125e0, 24) = 0
mprotect(0x15555540f000, 12288, PROT_READ) = 0
mprotect(0x155555216000, 4096, PROT_READ) = 0
mprotect(0x155555425000, 4096, PROT_READ) = 0
mprotect(0x155555500000, 4096, PROT_READ) = 0
mprotect(0x155555505000, 4096, PROT_READ) = 0
mprotect(0x681000, 86016, PROT_READ) = 0
mprotect(0x155555552000, 8192, PROT_READ) = 0
prlimit64(0, RLIMIT_STACK, NULL, {rlim_cur=RLIM64_INFINITY, rlim_max=RLIM64_INFINITY}) = 0
munmap(0x155555507000, 58087) = 0
getrandom("\x15\x46\xca\xb7\x72\x26\x83\x4a", 8, GRND_NONBLOCK) = 8
brk(NULL) = 0x69d000
brk(0x6be000) = 0x6be000
openat(AT_FDCWD, "/cm/local/apps/cuda/libs/current/lib64/libnvidia-ml.so.1", O_RDONLY|O_CLOEXEC) = 3
read(3, "\177ELF\2\1\1\0\0\0\0\0\0\0\0\0\3\0>\0\1\0\0\0 <\1\0\0\0\0\0"..., 832) = 832
newfstatat(3, "", {st_mode=S_IFREG|0755, st_size=1806968, ...}, AT_EMPTY_PATH) = 0
mmap(NULL, 16449256, PROT_READ|PROT_EXEC, MAP_PRIVATE|MAP_DENYWRITE, 3, 0) = 0x155554261000
mprotect(0x1555543c9000, 2093056, PROT_NONE) = 0
mmap(0x1555545c8000, 335872, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_DENYWRITE, 3, 0x167000) = 0x1555545c8000
mmap(0x15555461a000, 12545768, PROT_READ|PROT_WRITE, MAP_PRIVATE|MAP_FIXED|MAP_ANONYMOUS, -1, 0) = 0x15555461a000
close(3) = 0
mprotect(0x1555545c8000, 331776, PROT_READ) = 0
getpid() = 299934
openat(AT_FDCWD, "/proc/modules", O_RDONLY) = 3
newfstatat(3, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(3, "nvidia_peermem 16384 0 - Live 0x"..., 1024) = 1024
read(3, "0000000000000\nrpcrdma 98304 4 - "..., 1024) = 1024
close(3) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 3
newfstatat(3, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(3, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(3) = 0
stat("/dev/nvidiactl", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0xff), ...}) = 0
openat(AT_FDCWD, "/dev/nvidiactl", O_RDWR) = 3
fcntl(3, F_SETFD, FD_CLOEXEC) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0xd2, 0x48), 0x7fffffffba30) = 0
openat(AT_FDCWD, "/sys/devices/system/memory/block_size_bytes", O_RDONLY) = 4
read(4, "80000000\n", 99) = 9
close(4) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0xd6, 0x8), 0x7fffffffbac0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0xc8, 0x900), 0x15555520f4a0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2b, 0x20), 0x7fffffffbb90) = 0
openat(AT_FDCWD, "/proc/devices", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "Character devices:\n 1 mem\n 4 /"..., 1024) = 888
close(4) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/capabilities/mig/config", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "DeviceFileMinor: 1\nDeviceFileMod"..., 1024) = 59
close(4) = 0
mkdir("/dev/nvidia-caps", 0755) = -1 EEXIST (File exists)
openat(AT_FDCWD, "/proc/driver/nvidia/capabilities/mig/config", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "DeviceFileMinor: 1\nDeviceFileMod"..., 1024) = 59
read(4, "", 1024) = 0
close(4) = 0
stat("/dev/nvidia-caps/nvidia-cap1", {st_mode=S_IFCHR|0400, st_rdev=makedev(0x1fa, 0x1), ...}) = 0
access("/dev/nvidia-caps/nvidia-cap1", R_OK) = -1 EACCES (Permission denied)
openat(AT_FDCWD, "/proc/devices", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "Character devices:\n 1 mem\n 4 /"..., 1024) = 888
close(4) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/capabilities/mig/monitor", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "DeviceFileMinor: 2\nDeviceFileMod"..., 1024) = 59
close(4) = 0
mkdir("/dev/nvidia-caps", 0755) = -1 EEXIST (File exists)
openat(AT_FDCWD, "/proc/driver/nvidia/capabilities/mig/monitor", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "DeviceFileMinor: 2\nDeviceFileMod"..., 1024) = 59
read(4, "", 1024) = 0
close(4) = 0
stat("/dev/nvidia-caps/nvidia-cap2", {st_mode=S_IFCHR|0444, st_rdev=makedev(0x1fa, 0x2), ...}) = 0
access("/dev/nvidia-caps/nvidia-cap2", R_OK) = 0
openat(AT_FDCWD, "/dev/nvidia-caps/nvidia-cap2", O_RDONLY|O_CLOEXEC) = 4
fcntl(4, F_GETFD) = 0x1 (flags FD_CLOEXEC)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2b, 0x28), 0x7fffffffbb00) = 0
close(4) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia2", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x2), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia2", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia2", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia3", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x3), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia3", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia3", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia1", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x1), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia1", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia1", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia0", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia0", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia0", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia6", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x6), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia6", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia6", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia7", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x7), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia7", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia7", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia5", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x5), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia5", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia5", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffb0f0) = 0
openat(AT_FDCWD, "/proc/driver/nvidia/params", O_RDONLY) = 4
newfstatat(4, "", {st_mode=S_IFREG|0444, st_size=0, ...}, AT_EMPTY_PATH) = 0
read(4, "ResmanDebugLevel: 4294967295\nRmL"..., 1024) = 900
close(4) = 0
stat("/dev/nvidia4", {st_mode=S_IFCHR|0666, st_rdev=makedev(0xc3, 0x4), ...}) = 0
openat(AT_FDCWD, "/dev/nvidia4", O_RDWR|O_CLOEXEC) = -1 EPERM (Operation not permitted)
openat(AT_FDCWD, "/dev/nvidia4", O_RDWR) = -1 EPERM (Operation not permitted)
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffff8c80) = 0
getpid() = 299934
newfstatat(1, "", {st_mode=S_IFCHR|0620, st_rdev=makedev(0x88, 0x2), ...}, AT_EMPTY_PATH) = 0
write(1, "No devices were found\n", 22No devices were found
) = 22
getpid() = 299934
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x2a, 0x20), 0x7fffffffaef0) = 0
ioctl(3, _IOC(_IOC_READ|_IOC_WRITE, 0x46, 0x29, 0x10), 0x7fffffffb960) = 0
close(3) = 0
exit_group(6) = ?
+++ exited with 6 +++