NVIDIA Developer Forums

"setting the device when a process is active is not allowed"

Accelerated Computing CUDA CUDA Programming and Performance

Racz_Tamas October 5, 2010, 5:36pm 1

Hi guys!

I’m getting the error in the title when I try to call cudaSetDevice(i);

after I have called my CUDA DLL function from C#.

From what I have read, I probably still have some CUDA device memory that has not been freed, but that's not likely because I use only 2 device arrays and I free them every time. Did I do something wrong? Could anything else cause my problem?

Shortened CUDA DLL function code:

int *a is my array of numbers in the range 0-255

int *eredmenytomb is my calculated (result) array of numbers in the range 0-12750

[codebox]// Shortened CUDA DLL entry point (forum excerpt).
#include <string.h>  // strcmp / NULL, used by the helper below

// Returns true when a message produced by checkCUDAError() reports success.
// The text is compared by content: the earlier `error != "noerr"` compared
// pointer values, and whether two identical string literals share an address
// is unspecified, so a successful stage could be treated as a failure.
static bool dllfun2StageOk(const char *msg)
{
    return msg != NULL && strcmp(msg, "noerr") == 0;
}

// DLLfun2
//
// Copies dimX*dimY ints from `a` to the device, launches reverseArrayBlock on
// them, and copies the dimX*dimY ints the kernel wrote back into
// `eredmenytomb`.
//
// Parameters:
//   a            host input array, dimX*dimY ints
//   eredmenytomb host output array, dimX*dimY ints (written only on success)
//   dimX, dimY   dimensions; their product is the element count. The product
//                is not validated here -- it is assumed to be positive and to
//                fit in an int (TODO confirm at the call site).
//   filter       not used in this excerpt
//   offset       forwarded unchanged to the kernel
//
// Returns a malloc'ed stuktura_tipus whose cuda_err holds the message of the
// last checkCUDAError() call (the first failing stage, or the final stage on
// success). Returns NULL if the result struct itself cannot be allocated.
// The caller presumably owns the returned struct -- verify against the C# side.
//
// Both device buffers are released on every path. Note, per the replies in
// this thread: the CUDA calls made here leave a device associated with the
// caller, so a later cudaSetDevice() is rejected until that association is
// released (the thread's suggestion is cudaThreadExit()).
stuktura_tipus* DLLfun2(int *a, int *eredmenytomb, int dimX, int dimY, int filter, int offset)
{
    stuktura_tipus *my_stuktura = (stuktura_tipus*) malloc(sizeof(stuktura_tipus));
    if (my_stuktura == NULL) {
        // Nowhere to store an error message; previously this was dereferenced.
        return NULL;
    }

    int dimA = dimX * dimY;
    size_t memSize = dimA * sizeof(int);

    // Launch configuration: one thread per element, rounded up to whole blocks.
    // NOTE(review): 16 threads per block is below the 32-lane warp size; kept
    // as-is because the kernel is not visible here and may depend on it.
    int numThreadsPerBlock = 16;
    int n_blocks = dimA / numThreadsPerBlock + (dimA % numThreadsPerBlock == 0 ? 0 : 1);

    // Start from NULL so the cudaFree calls below are harmless even when an
    // allocation failed (cudaFree on a null pointer performs no operation).
    int *d_a = NULL;
    int *d_b = NULL;
    char *error;

    // Stage 1: device allocations. Previously unchecked, so a failed
    // allocation only surfaced later as a memcpy error on a garbage pointer.
    // checkCUDAError presumably reads the runtime's last-error state, as the
    // other stages already rely on it to do.
    cudaMalloc((void **) &d_a, memSize);
    cudaMalloc((void **) &d_b, memSize);
    error = checkCUDAError(" malloc_device ");
    bool ok = dllfun2StageOk(error);

    // Stage 2: host -> device copy of the input.
    if (ok) {
        cudaMemcpy(d_a, a, memSize, cudaMemcpyHostToDevice);
        error = checkCUDAError(" memcpy_todevice ");
        ok = dllfun2StageOk(error);
    }

    // Stage 3: kernel launch; block until the device has finished so that
    // execution errors are visible to the check that follows.
    if (ok) {
        reverseArrayBlock<<< n_blocks, numThreadsPerBlock >>>(d_b, d_a, dimA, dimX, dimY, offset);
        cudaThreadSynchronize();
        error = checkCUDAError(" kernel invocation ");
        ok = dllfun2StageOk(error);
    }

    // Stage 4: device -> host copy of the result.
    if (ok) {
        cudaMemcpy(eredmenytomb, d_b, memSize, cudaMemcpyDeviceToHost);
        error = checkCUDAError(" memcpy_backtoHost ");
    }

    // Single cleanup path shared by success and every failure.
    cudaFree(d_a);
    cudaFree(d_b);

    my_stuktura->cuda_err = error;
    return my_stuktura;
}[/codebox]

Racz_Tamas October 5, 2010, 5:36pm 2

Hi guys!

I’m getting the error in the title when I try to call cudaSetDevice(i);

after I have called my CUDA DLL function from C#.

From what I have read, I probably still have some CUDA device memory that has not been freed, but that's not likely because I use only 2 device arrays and I free them every time. Did I do something wrong? Could anything else cause my problem?

Shortened CUDA DLL function code:

int *a is my array of numbers in the range 0-255

int *eredmenytomb is my calculated (result) array of numbers in the range 0-12750

[codebox]// Shortened CUDA DLL entry point (forum excerpt).
#include <string.h>  // strcmp / NULL, used by the helper below

// Returns true when a message produced by checkCUDAError() reports success.
// The text is compared by content: the earlier `error != "noerr"` compared
// pointer values, and whether two identical string literals share an address
// is unspecified, so a successful stage could be treated as a failure.
static bool dllfun2StageOk(const char *msg)
{
    return msg != NULL && strcmp(msg, "noerr") == 0;
}

// DLLfun2
//
// Copies dimX*dimY ints from `a` to the device, launches reverseArrayBlock on
// them, and copies the dimX*dimY ints the kernel wrote back into
// `eredmenytomb`.
//
// Parameters:
//   a            host input array, dimX*dimY ints
//   eredmenytomb host output array, dimX*dimY ints (written only on success)
//   dimX, dimY   dimensions; their product is the element count. The product
//                is not validated here -- it is assumed to be positive and to
//                fit in an int (TODO confirm at the call site).
//   filter       not used in this excerpt
//   offset       forwarded unchanged to the kernel
//
// Returns a malloc'ed stuktura_tipus whose cuda_err holds the message of the
// last checkCUDAError() call (the first failing stage, or the final stage on
// success). Returns NULL if the result struct itself cannot be allocated.
// The caller presumably owns the returned struct -- verify against the C# side.
//
// Both device buffers are released on every path. Note, per the replies in
// this thread: the CUDA calls made here leave a device associated with the
// caller, so a later cudaSetDevice() is rejected until that association is
// released (the thread's suggestion is cudaThreadExit()).
stuktura_tipus* DLLfun2(int *a, int *eredmenytomb, int dimX, int dimY, int filter, int offset)
{
    stuktura_tipus *my_stuktura = (stuktura_tipus*) malloc(sizeof(stuktura_tipus));
    if (my_stuktura == NULL) {
        // Nowhere to store an error message; previously this was dereferenced.
        return NULL;
    }

    int dimA = dimX * dimY;
    size_t memSize = dimA * sizeof(int);

    // Launch configuration: one thread per element, rounded up to whole blocks.
    // NOTE(review): 16 threads per block is below the 32-lane warp size; kept
    // as-is because the kernel is not visible here and may depend on it.
    int numThreadsPerBlock = 16;
    int n_blocks = dimA / numThreadsPerBlock + (dimA % numThreadsPerBlock == 0 ? 0 : 1);

    // Start from NULL so the cudaFree calls below are harmless even when an
    // allocation failed (cudaFree on a null pointer performs no operation).
    int *d_a = NULL;
    int *d_b = NULL;
    char *error;

    // Stage 1: device allocations. Previously unchecked, so a failed
    // allocation only surfaced later as a memcpy error on a garbage pointer.
    // checkCUDAError presumably reads the runtime's last-error state, as the
    // other stages already rely on it to do.
    cudaMalloc((void **) &d_a, memSize);
    cudaMalloc((void **) &d_b, memSize);
    error = checkCUDAError(" malloc_device ");
    bool ok = dllfun2StageOk(error);

    // Stage 2: host -> device copy of the input.
    if (ok) {
        cudaMemcpy(d_a, a, memSize, cudaMemcpyHostToDevice);
        error = checkCUDAError(" memcpy_todevice ");
        ok = dllfun2StageOk(error);
    }

    // Stage 3: kernel launch; block until the device has finished so that
    // execution errors are visible to the check that follows.
    if (ok) {
        reverseArrayBlock<<< n_blocks, numThreadsPerBlock >>>(d_b, d_a, dimA, dimX, dimY, offset);
        cudaThreadSynchronize();
        error = checkCUDAError(" kernel invocation ");
        ok = dllfun2StageOk(error);
    }

    // Stage 4: device -> host copy of the result.
    if (ok) {
        cudaMemcpy(eredmenytomb, d_b, memSize, cudaMemcpyDeviceToHost);
        error = checkCUDAError(" memcpy_backtoHost ");
    }

    // Single cleanup path shared by success and every failure.
    cudaFree(d_a);
    cudaFree(d_b);

    my_stuktura->cuda_err = error;
    return my_stuktura;
}[/codebox]

ceearem October 5, 2010, 6:03pm 3

Hi

You cannot call cudaSetDevice if a device is still associated with your process. A device is implicitly associated with your process as soon as you call any CUDA function (except for the device management functions themselves). I think you can release the device again with cudaThreadExit() (which will also free all memory on the device), but I'm not too sure about that.

Ceearem

ceearem October 5, 2010, 6:03pm 4

Hi

You cannot call cudaSetDevice if a device is still associated with your process. A device is implicitly associated with your process as soon as you call any CUDA function (except for the device management functions themselves). I think you can release the device again with cudaThreadExit() (which will also free all memory on the device), but I'm not too sure about that.

Ceearem

Racz_Tamas October 5, 2010, 7:15pm 5

It worked… I called cudaThreadExit() at the end of my function and there was no longer any problem with cudaSetDevice.

THX External Media

Racz_Tamas October 5, 2010, 7:15pm 6

It worked… I called cudaThreadExit() at the end of my function and there was no longer any problem with cudaSetDevice.

THX External Media

Topic		Replies	Views	Activity
Error: "Setting the device when a process is active is not allowed." CUDA Programming and Performance	9	36975	May 1, 2010
cudaErrorInvalidDeviceFunction CUDA Programming and Performance cuda , jetson	6	2776	September 26, 2022
strange behavior with device emulation CUDA Programming and Performance	5	2693	May 20, 2008
How to pass a struct to a kernel? CUDA Programming and Performance	8	2376	March 19, 2019
cudaErrorInvalidDeviceFunction Simple program throwing cudaErrorInvalidDeviceFunction error CUDA Programming and Performance	1	2513	April 24, 2010
cudaSetDevice bug? CUDA Programming and Performance	13	7527	November 16, 2010
Got out of memory from cudaMemcpy CUDA Programming and Performance	13	4024	January 28, 2022
CudaAPI calls in functions, compiler/linking bug? CUDA Programming and Performance	6	367	August 17, 2023
Invalid Device Ordinal CUDA Programming and Performance cuda	2	603	August 12, 2024
Pls help!Problem with CUDA Structure CUDA Programming and Performance	1	665	October 21, 2010