Could you please help check this and advise on the next steps to fix it? Thanks a lot!
[root@xxx]# nvidia-smi
No devices were found
[root@xxx]# tail -f /var/log/messages
Aug 9 13:57:34 localhost kernel: resource sanity check: requesting [mem 0xd0700000-0xd16fffff], which spans more than PCI Bus 0000:0b [mem 0xd0000000-0xd0ffffff]
Aug 9 13:57:34 localhost kernel: caller os_map_kernel_space.part.7+0xd6/0xf0 [nvidia] mapping multiple BARs
Aug 9 13:57:34 localhost kernel: NVRM: GPU 0000:0b:00.0: RmInitAdapter failed! (0x24:0x72:1436)
Aug 9 13:57:34 localhost kernel: NVRM: GPU 0000:0b:00.0: rm_init_adapter failed, device minor number 0
Aug 9 13:57:34 localhost kernel: resource sanity check: requesting [mem 0xd0700000-0xd16fffff], which spans more than PCI Bus 0000:0b [mem 0xd0000000-0xd0ffffff]
Aug 9 13:57:34 localhost kernel: caller os_map_kernel_space.part.7+0xd6/0xf0 [nvidia] mapping multiple BARs
Aug 9 13:57:34 localhost kernel: NVRM: GPU 0000:0b:00.0: RmInitAdapter failed! (0x24:0x72:1436)
Aug 9 13:57:34 localhost kernel: NVRM: GPU 0000:0b:00.0: rm_init_adapter failed, device minor number 0
[root@xxx]# lspci | grep NVIDIA
0b:00.0 3D controller: NVIDIA Corporation GP100GL [Tesla P100 PCIe 16GB] (rev a1)
[root@xxx]# hostnamectl
Static hostname: xxx
Icon name: computer
Deployment: ImageHubNetBoot17Nov2022
Machine ID: 75e5103042c24b5181f3702e763daab7
Boot ID: 580dd9f211c74f9f9776980a4f537d6b
Operating System: CentOS Linux 7 (Core)
CPE OS Name: cpe:/o:centos:centos:7
Kernel: Linux 3.10.0-1160.95.1.el7.x86_64
Architecture: x86-64
[root@xxx]# uname -a
Linux xxx 3.10.0-1160.95.1.el7.x86_64 #1 SMP Mon Jul 24 13:59:37 UTC 2023 x86_64 x86_64 x86_64 GNU/Linux
[root@xxx]# yum list installed | grep nvidia
Loaded plugins: fastestmirror, langpacks, nvidia
Repository cuda-rhel7-x86_64 is listed more than once in the configuration
kmod-nvidia-latest-dkms.x86_64 3:535.86.10-1.el7 @cuda-rhel7-x86_64
nvidia-driver-latest-dkms.x86_64 3:535.86.10-1.el7 @cuda-rhel7-x86_64
nvidia-driver-latest-dkms-NVML.x86_64
nvidia-driver-latest-dkms-NvFBCOpenGL.x86_64
nvidia-driver-latest-dkms-cuda.x86_64
nvidia-driver-latest-dkms-cuda-libs.x86_64
nvidia-driver-latest-dkms-devel.x86_64
nvidia-driver-latest-dkms-libs.x86_64
nvidia-libXNVCtrl.x86_64 3:535.86.10-1.el7 @cuda-rhel7-x86_64
nvidia-libXNVCtrl-devel.x86_64 3:535.86.10-1.el7 @cuda-rhel7-x86_64
nvidia-modprobe-latest-dkms.x86_64
nvidia-persistenced-latest-dkms.x86_64
nvidia-settings.x86_64 3:535.86.10-1.el7 @cuda-rhel7-x86_64
nvidia-xconfig-latest-dkms.x86_64
yum-plugin-nvidia.noarch 0.5-1.el7 @cuda-rhel7-x86_64
[root@xxx]# gcc --version
gcc (GCC) 4.8.5 20150623 (Red Hat 4.8.5-44)
Copyright (C) 2015 Free Software Foundation, Inc.
This is free software; see the source for copying conditions. There is NO
warranty; not even for MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
[root@xxx]# nvcc --version
nvcc: NVIDIA (R) Cuda compiler driver
Copyright (c) 2005-2023 NVIDIA Corporation
Built on Tue_Jul_11_02:20:44_PDT_2023
Cuda compilation tools, release 12.2, V12.2.128
Build cuda_12.2.r12.2/compiler.33053471_0
nvidia-bug-report.log.gz (118.8 KB)