CUDA bug in dealing with cudaMemcpyToSymbol

pacard · December 28, 2009, 9:12am

This is a CUDA toolkit bug that exists in both 2.3 and 3.0 (the only two versions I have tried).

For the following code, an “invalid device symbol” error message is always generated, which shouldn’t happen.

#include <stdio.h>

#include <cuda.h>

/* CUT_CHECK_ERROR(errorMessage)
 *
 * Checks the CUDA runtime for a pending error via cudaGetLastError(), then
 * calls cudaThreadSynchronize() and checks its return value as well.  On
 * either failure it prints errorMessage, the file and line of the macro
 * expansion and the CUDA error string to stderr, then exits with
 * EXIT_FAILURE.
 *
 * Every line of the definition except the last must end in a backslash that
 * is immediately followed by the next macro line: a blank line after a
 * continuation backslash terminates the #define and leaves the remaining
 * statements at file scope.
 */
#  define CUT_CHECK_ERROR(errorMessage) do {                                 \
	cudaError_t err = cudaGetLastError();                                    \
	if( cudaSuccess != err) {                                                \
		fprintf(stderr, "Cuda error: %s in file '%s' in line %i : %s.\n",    \
				errorMessage, __FILE__, __LINE__, cudaGetErrorString( err) );\
		exit(EXIT_FAILURE);                                                  \
	}                                                                        \
	err = cudaThreadSynchronize();                                           \
	if( cudaSuccess != err) {                                                \
		fprintf(stderr, "Cuda error: %s in file '%s' in line %i : %s.\n",    \
				errorMessage, __FILE__, __LINE__, cudaGetErrorString( err) );\
		exit(EXIT_FAILURE);                                                  \
	} } while (0)

/* CE(call)
 *
 * Evaluates `call` (its return value is discarded) and then runs
 * CUT_CHECK_ERROR, which picks up any resulting error from the CUDA runtime.
 * The macro lines are kept contiguous so that each continuation backslash is
 * followed directly by the next line of the definition.
 */
#  define CE(call) do {                                 \
		call; CUT_CHECK_ERROR("------- Error ------\n"); \
	 } while (0)

// Namespace holding the __constant__ symbol that bar() copies to and from.
namespace HMM_GPU {

__constant__ char *a;  // pointer-typed symbol declared with __constant__

}  // namespace HMM_GPU

// Make `a` visible unqualified in the rest of the file.
using namespace HMM_GPU;

// Round-trips the pointer value referred to by x through the symbol `a`:
// first copies sizeof(a) bytes from the caller's pointer into `a`, then
// copies sizeof(a) bytes from `a` back into the caller's pointer.
// Each call is wrapped in CE(), which aborts the program on a CUDA error.
//
// NOTE(review): `a` has type char *, so overload resolution presumably
// prefers the non-template `char *symbol` overload quoted later in this
// post over the template `const T &symbol` one; that overload forwards the
// pointer's VALUE rather than the symbol's address, which would explain the
// "invalid device symbol" error -- confirm against cuda_runtime.h.
void bar(char * & x){

		// Host -> symbol: &x is the address of the caller's pointer variable.
		CE(cudaMemcpyToSymbol(a, &x, sizeof(a), 0, cudaMemcpyHostToDevice));

		// Symbol -> host: overwrites the caller's pointer with the symbol's contents.
		CE(cudaMemcpyFromSymbol(&x, a, sizeof(a), 0, cudaMemcpyDeviceToHost));

}

// Entry point of the repro: passes a null pointer through bar() and prints
// whatever value comes back.
int main()
{
	char *hostPtr = 0;        // starts out as a null pointer

	bar(hostPtr);             // bar() takes the pointer by reference and may overwrite it
	printf("%p\n", hostPtr);

	return 0;
}

Doing any one of the following gets rid of the message:

do not use a namespace
change the type of a to void *
change the type of a to int

I looked into the header files, and I think the bug lies in the following code in cuda_runtime.h:

// Non-template overload (quoted from cuda_runtime.h): takes the symbol as a
// plain `char *` and forwards that pointer VALUE, cast to `const char *`, to
// another cudaMemcpyToSymbol overload that is not shown in this excerpt.
// offset defaults to 0 and kind defaults to cudaMemcpyHostToDevice.
// NOTE(review): presumably intended for callers passing the symbol's name as
// a character string -- confirm against the toolkit documentation.
static __inline__ __host__ cudaError_t cudaMemcpyToSymbol(

		char				*symbol,

  const void				*src,

		size_t			   count,

		size_t			   offset = 0,

		enum cudaMemcpyKind  kind   = cudaMemcpyHostToDevice

)

{

  // The pointer itself (not its address) is what gets forwarded.
  return cudaMemcpyToSymbol((const char*)symbol, src, count, offset, kind);

}

// Template overload (quoted from cuda_runtime.h): takes the symbol by const
// reference and forwards the ADDRESS of the referenced object, cast to
// `const char *`, to another cudaMemcpyToSymbol overload that is not shown
// in this excerpt.
// offset defaults to 0 and kind defaults to cudaMemcpyHostToDevice.
// NOTE(review): presumably the runtime uses that address as a handle to
// locate the device symbol -- confirm against the toolkit documentation.
template<class T>

__inline__ __host__ cudaError_t cudaMemcpyToSymbol(

  const T				   &symbol,

  const void				*src,

		size_t			   count,

		size_t			   offset = 0,

		enum cudaMemcpyKind  kind   = cudaMemcpyHostToDevice

)

{

  // &symbol: the address of the variable, not the value stored in it.
  return cudaMemcpyToSymbol((const char*)&symbol, src, count, offset, kind);

}

I commented out the first definition (also the corresponding definition for cudaMemcpyFromSymbol), and the code runs smoothly.

There are some things I don’t understand, though:

Why does the error not occur when I don’t use a namespace?
What is the first definition for?
In the second definition, the address of symbol is taken and converted into const char *, what is that for?

Topic		Replies	Views
cudaMemcpyToSymbol returnes "invalid device symbol" CUDA Programming and Performance	12	35865	May 2, 2011
Problem with cudaMemcpyToSymbol CUDA Programming and Performance	2	975	January 28, 2011
Cuda 5 issue with MemcpyToSymbol Not working when symbol is in a namespace CUDA Programming and Performance	2	1246	May 19, 2012
cudaMemcpyToSymbol(.....) input parameter issue CUDA Programming and Performance	2	4464	October 20, 2009
cudaMemcpyToSymbol returns "invalid device symbol" problem with __constant__ memory (Linux CUDA Programming and Performance	4	2095	September 17, 2010
Why I got a cudaErrorInvalidSymbol CUDA Programming and Performance	1	7172	June 19, 2009
invalid argument with cudaMemcpyToSymbol CUDA Programming and Performance	1	8287	November 28, 2011
cudaMemcpyFromSymbol not working as spec'ed CUDA Programming and Performance	5	11851	September 15, 2008
invalid device symbol when copying to constant memory CUDA Programming and Performance	4	10869	May 11, 2009
cudaMemcpyToSymbol fails when called from member functions, works ok frm static function CUDA Programming and Performance	0	4262	May 8, 2009

CUDA bug in dealing with cudaMemcpyToSymbol

Related topics