Toolkit 11.4, RTX A4000 (compute capability 8.6) - but it's the same with Toolkit 11.8 on a T4 (7.5)
Device Id : 0
Device Name : NVIDIA RTX A4000
MultiProcessorCount : 48
maxThreadsPerMultiProcessor : 1536
ClockRate(kilohertz) : 1560000
compute Capability : 8.6
Global Memory : 16504128(KB)
Const Memory : 64(KB)
shared Memory per Block : 48(KB)
MaxGridSize : 2147483647.65535.65535
maxThreadsDim : 1024.1024.64
MaxThreadsPerBlock : 1024
warpSize : 32
concurrentKernels : 1
streamPrioritiesSupported : Supported
StreamPriorityRange :(0 to -5)
MemoryClockRate(kilohertz) : 7001000
MemoryBusWidth : 256
a.h
// Declaration of lib1rt(); its definition in a.cpp writes "lib1" and a line break to std::cout.
void lib1rt();
a.cpp
#include <iostream>
#include "a.h"
// Emits the marker text "lib1" on standard output, then ends the line and
// flushes the stream (std::endl).
void lib1rt()
{
    std::ostream& out = std::cout;
    out << "lib1";
    out << std::endl;
}
make all
Building file: ../a.cpp
Invoking: NVCC Compiler
/usr/local/cuda/bin/nvcc --debug -gencode arch=compute_86,code=compute_86 -Xcompiler -fPIC -ccbin g++ -c -o "a.o" "../a.cpp"
Finished building: ../a.cpp
Building target: libNirSharedLib1.so
Invoking: NVCC linker
/usr/local/cuda/bin/nvcc --cudart=static -ccbin g++ --shared -gencode arch=compute_86,code=compute_86 -o "libNirSharedLib1.so" ./a.o
Finished building target: libNirSharedLib1.so
b.h
// Declaration of lib2rt(); its definition in b.cpp writes "lib2" and a line break to std::cout.
void lib2rt();
b.cpp
#include <iostream>
#include "b.h"
// Emits the marker text "lib2" on standard output, then ends the line and
// flushes the stream (std::endl).
void lib2rt()
{
    std::ostream& out = std::cout;
    out << "lib2";
    out << std::endl;
}
Building file: ../b.cpp
Invoking: NVCC Compiler
/usr/local/cuda/bin/nvcc --device-debug --debug -gencode arch=compute_86,code=compute_86 -Xcompiler -fPIC -ccbin g++ -c -o "b.o" "../b.cpp"
Finished building: ../b.cpp
Building target: libNirSharedLib2.so
Invoking: NVCC linker
/usr/local/cuda/bin/nvcc --cudart=static -ccbin g++ --shared -gencode arch=compute_86,code=compute_86 -o "libNirSharedLib2.so" ./b.o
Finished building target: libNirSharedLib2.so
LibTest.cpp
#include <iostream>
#include <cuda_runtime.h>
#include <a.h>
#include <b.h>
int main() {
std::cout << “!!!Hello World!!!” << std::endl; // prints !!!Hello World!!!
cudaError_t err;
err = cudaDeviceSynchronize();
if (err != cudaSuccess)
{
std::cout << "error" << std::endl;
}
lib1rt();
lib2rt();
return 0;
}
Building file: ../src/LibTest.cpp
Invoking: NVCC Compiler
/usr/local/cuda/bin/nvcc -I"/home/zinir/eclipse-workspaceLib/NirSharedLib1" -I"/home/zinir/eclipse-workspaceLib/NirSharedLib2" --debug -gencode arch=compute_86,code=compute_86 -ccbin g++ -c -o "src/LibTest.o" "../src/LibTest.cpp"
Finished building: ../src/LibTest.cpp
Building target: LibTest
Invoking: NVCC linker
/usr/local/cuda/bin/nvcc --cudart=static -L"/home/zinir/eclipse-workspaceLib/NirSharedLib1/Debug" -L"/home/zinir/eclipse-workspaceLib/NirSharedLib2/Debug" -ccbin g++ -gencode arch=compute_86,code=compute_86 -o "LibTest" ./src/LibTest.o -lNirSharedLib1 -lNirSharedLib2
Finished building target: LibTest