problem of compile matrixMul error of compilation

smeil · August 11, 2010, 5:14pm

sorry this is my code

// includes, system
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <math.h>

// includes, project
#include <cutil_inline.h>

////////////////////////////////////////////////////////////////////////////////
// declaration, forward
void MatrixMulOnDevice(float * M, float * N, float * P, int Width);
void MatrixMulKernel(float * Md, float * Nd, float * Pd, int Width);

float* Md;
float* Nd;
float* Pd;

////////////////////////////////////////////////////////////////////////////////
// Program main
////////////////////////////////////////////////////////////////////////////////
int
main(int argc, char** argv)
{

MatrixMulOnDevice(Md, Nd, Pd, 10);

}

////////////////////////////////////////////////////////////////////////////////
//! Run a simple test for CUDA
////////////////////////////////////////////////////////////////////////////////

void MatrixMulKernel(float * Md, float * Nd, float * Pd, int Width)
{

int tx = threadIdx.x;
int ty = threadIdx.y;

float Pvaleur = 0;
for (int i = 0; i < Width; ++i)
{
    float MdElement = Md[ty * Width + i];
    float NdElement = Nd[i  * Width + tx];
    Pvaleur        += MdElement * NdElement;
}


Pd[ty * Width + tx] = Pvaleur;

}

void MatrixMulOnDevice(float * M, float * N, float * P, int Width)
{
int size = Width*Width * sizeof(float);

// allocate arrays on host
float* Ma = (float*) malloc(size);
float* Na = (float*) malloc(size);
float* Pa = (float*) malloc(size);

// initialize host memory
for (int i=0; i<size; i++) Ma[i] = (float)i;
for (int j=0; j<size; j++) Na[j] = (float)j;

// allocate array on device
cudaMalloc((void **) &Md, size);
cudaMemcpy(Md, Ma, size, cudaMemcpyHostToDevice) ;
cudaMalloc((void **) &Nd, size);
cudaMemcpy(Nd, Na, size, cudaMemcpyHostToDevice);
cudaMalloc((void **) &Pd, size);

dim3 dimGrid(1, 1);

dim3 dimBlock(Width, Width);

//Call of MatrixMulKernel
MatrixMulKernel<<<dimGrid, dimBlock>>>(Md, Nd, Pd, Width);

// copy data from host to device
cudaMemcpy(P, Pd, size, cudaMemcpyDeviceToHost);

//destruction des matrices, dÃ©sormais inutilisÃ©es
free(Ma);
free(Na);
free(Pa);
cudaFree(Md);
cudaFree(Nd);
cudaFree(Pd);

}

Topic		Replies	Views
problem of compile matrixMul error of compilation CUDA Programming and Performance	8	1326	August 12, 2010
Matrix multiplcation peoblem CUDA Programming and Performance	2	1171	July 9, 2010
CUDA kernel from matlab CUDA kernel for matrix operations from matlab CUDA Programming and Performance	1	1070	May 12, 2012
Matrix Multiplication Help CUDA Programming and Performance	5	3938	August 19, 2009
multiplication of no square matrix general code of multiplication of two matrix CUDA Programming and Performance	0	801	August 12, 2010
matrix multiplication--wrong answer CUDA Programming and Performance	6	3884	August 20, 2009
Matrix multiplication---not getting correct answer? answer for matrix multiplicatin seems to be wron CUDA Programming and Performance	0	3232	August 1, 2009
Matrix multiplication CUDA Programming and Performance	7	2261	July 2, 2010
mutrix multiplication CUDA Programming and Performance	4	2207	November 20, 2011
Matrix Multiplication CUDA Programming and Performance	5	1739	September 17, 2009

problem of compile matrixMul error of compilation

Related topics