Dynamic Parallilism in cuda gives unresolved externals error in visual studio 2005

I Have simple dynamic parallilism code calculating square as

#include <stdio.h>
#include <cuda.h>


__global__ void square(float *a, int N)
{
  int idx = blockIdx.x * blockDim.x + threadIdx.x;
  a[idx] = a[idx] * a[idx];
}
// Kernel that executes on the CUDA device
__global__ void first(float *arr, int N)
{
  int idx = blockIdx.x * blockDim.x + threadIdx.x;
  square <<< 1, N >>> (arr, N);
 /*for(int i=0;i<N;i++)
 {
     a[i]=a[i]*a[i];
 }*/
}

// main routine that executes on the host
int main(void)
{
  float *a_h, *a_d;  // Pointer to host & device arrays
  const int N = 10;  // Number of elements in arrays
  size_t size = N * sizeof(float);
  a_h = (float *)malloc(size);        // Allocate array on host
  cudaMalloc((void **) &a_d, size);   // Allocate array on device
  // Initialize host array and copy it to CUDA device
  for (int i=0; i<N; i++) a_h[i] = (float)i;
  cudaMemcpy(a_d, a_h, size, cudaMemcpyHostToDevice);
  // Do calculation on device:
  int block_size = 4;
  int n_blocks = N/block_size + (N%block_size == 0 ? 0:1);
  first <<< 1, 1 >>> (a_d, N);
  // Retrieve result from device and store it in host array
  cudaMemcpy(a_h, a_d, sizeof(float)*N, cudaMemcpyDeviceToHost);
  // Print results
  for (int i=0; i<N; i++) printf("%d %f\n", i, a_h[i]);
  // Cleanup
  free(a_h); cudaFree(a_d);
}

I have included necessary cudadevrt.lib and also enabled cuda relocatable device code to yes and compiled with sm 35 but it gives the error as

Error   6   error LNK2019: unresolved external symbol ___cudaRegisterLinkedBinary_53_tmpxft_000014f0_00000000_8_dynamicparallilism_cpp1_ii_fa75b653 referenced in function "void __cdecl __sti____cudaRegisterAll_53_tmpxft_000014f0_00000000_8_dynamicparallilism_cpp1_ii_fa75b653(void)" (?__sti____cudaRegisterAll_53_tmpxft_000014f0_00000000_8_dynamicparallilism_cpp1_ii_fa75b653@@YAXXZ) dynamicparallilism.cu.obj

and

Error   7   fatal error LNK1120: 1 unresolved externals E:\cuda\dynamic_parallilism\Debug\dynamic_parallilism.exe

and the visual studio command output windows shows

1>------ Rebuild All started: Project: dynamic_parallilism, Configuration: Debug Win32 ------
1>Deleting intermediate and output files for project 'dynamic_parallilism', configuration 'Debug|Win32'
1>Compiling with CUDA Build Rule...
1>"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v5.0\bin\nvcc.exe"     -gencode=arch=compute_35,code=\"sm_35,compute_35\" -gencode=arch=compute_35,code=\"sm_35,compute_35\"  --machine 32 -ccbin "C:\Program Files (x86)\Microsoft Visual Studio 8\VC\bin"    -Xcompiler "/EHsc /W3 /nologo /O2 /Zi   /MTd  "  -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v5.0\include" -maxrregcount=0  -rdc=true --compile -o "Debug/dynamicparallilism.cu.obj" dynamicparallilism.cu  
1>nvcc : warning : nvcc support for MSVC 8.0 and earlier has been deprecated and is no longer being maintained
1>dynamicparallilism.cu
1>e:/cuda/dynamic_parallilism/dynamic_parallilism/dynamicparallilism.cu(14): warning: variable "idx" was declared but never referenced
1>e:/cuda/dynamic_parallilism/dynamic_parallilism/dynamicparallilism.cu(36): warning: variable "n_blocks" was declared but never referenced
1>tmpxft_00000718_00000000-5_dynamicparallilism.cudafe1.gpu
1>tmpxft_00000718_00000000-10_dynamicparallilism.cudafe2.gpu
1>dynamicparallilism.cu
1>e:/cuda/dynamic_parallilism/dynamic_parallilism/dynamicparallilism.cu(14): warning: variable "idx" was declared but never referenced
1>e:/cuda/dynamic_parallilism/dynamic_parallilism/dynamicparallilism.cu(36): warning: variable "n_blocks" was declared but never referenced
1>tmpxft_00000718_00000000-5_dynamicparallilism.cudafe1.cpp
1>tmpxft_00000718_00000000-15_dynamicparallilism.ii
1>Linking...
1>dynamicparallilism.cu.obj : error LNK2019: unresolved external symbol ___cudaRegisterLinkedBinary_53_tmpxft_00000718_00000000_8_dynamicparallilism_cpp1_ii_fa75b653 referenced in function "void __cdecl __sti____cudaRegisterAll_53_tmpxft_00000718_00000000_8_dynamicparallilism_cpp1_ii_fa75b653(void)" (?__sti____cudaRegisterAll_53_tmpxft_00000718_00000000_8_dynamicparallilism_cpp1_ii_fa75b653@@YAXXZ)
1>E:\cuda\dynamic_parallilism\Debug\dynamic_parallilism.exe : fatal error LNK1120: 1 unresolved externals
1>Project : warning PRJ0018 : The following environment variables were not found:
1>$(CUDA_LIB_PATH)
1>$(NVSDKCOMPUTE_ROOT)
1>Build log was saved at "file://e:\cuda\dynamic_parallilism\dynamic_parallilism\Debug\BuildLog.htm"
1>dynamic_parallilism - 2 error(s), 5 warning(s)
========== Rebuild All: 0 succeeded, 1 failed, 0 skipped ==========