How can I add vector elements in a cuda kernel?

Question

#include 
#include 
#include 
#include 
using namespace std;

// Per-thread add: each thread takes its threadIdx.x as `index` and stores
// a[index] + b[index] into c[index].
//
// NOTE(review): a, b and c are declared as pointers to `vector` (the element
// type appears to have been lost from this listing), so a[index] is pointer
// indexing and yields a whole vector object rather than a single element.
// `+` is then applied to two vector objects, which is consistent with the
// "no operator "+" matches these operands" error the question reports.
// NOTE(review): only threadIdx.x is used (blockIdx is ignored) and there is no
// bounds check on `index` against the number of elements.
__global__ void kernel(vector  *a,vector  *b, vector  *c)
{
    // Index is taken from the thread's position within its block only.
    int index=threadIdx.x;
    c[index]=a[index]+b[index];
};

// Host driver: constructs three 3-element host vectors (a and b filled with 1,
// c filled with 0), calls cudaMalloc/cudaMemcpy, launches `kernel`, copies
// back, and prints a[1] and c[1] before the launch and c[1] after it.
// NOTE(review): no CUDA call's return value is checked, and nothing allocated
// here is released with cudaFree.
int main ()
{
    // Initialize a few constants
    int N=3;
    vector  a (3,1);
    vector  b (3,1);
    vector  c (3,0);
    // NOTE(review): this is N times the size of the vector object itself, not
    // N times the size of one element.
    int size=N*sizeof(vector );
    // Device variables
    // NOTE(review): these are declared as vector objects, not as pointers that
    // could receive a device address from cudaMalloc.
    vector  d_a;
    vector  d_b;
    vector  d_c;

    // Reserve `size` bytes of device memory at location &a
    // NOTE(review): the addresses of the host vectors a, b and c are passed
    // here; d_a, d_b and d_c are never given to cudaMalloc.
    cudaMalloc( (void **) &a, size);
    cudaMalloc ( (void **) &b, size);
    cudaMalloc ( (void **) &c, size);

    // Copy inputs from &a to &d_a
    // NOTE(review): source and destination are the addresses of the vector
    // objects themselves, not of their element storage.
    cudaMemcpy(&d_a,&a,size,cudaMemcpyHostToDevice);
    cudaMemcpy(&d_b,&b,size,cudaMemcpyHostToDevice);

    // NOTE(review): the element value is cast to char * and used as the printf
    // format string; presumably printing the number was intended - confirm.
    printf( (char *) a[1]);
    printf( (char *) c[1]);
    // Run the kernel
    // NOTE(review): the launch configuration between the angle brackets is
    // empty in this listing (possibly lost when the page was extracted).

    kernel<<>>(&d_a,&d_b,&d_c);

    // Copy the result back to the host
    cudaMemcpy(&c,&d_c,size,cudaMemcpyDeviceToHost);

    printf( (char *) c[1]);

    return 0;
};

So this is my basic C++ vector addition program, but it won't compile: the compiler doesn't know what to do with the "+" when adding the indexed elements ("no operator "+" matches these operands"). Does anyone have an idea why this doesn't work inside the kernel? I think it may have to do with the fact that it's a host function or something like that, though I wouldn't know how to get around that problem.

Greetings and thanks in advance.

Jason · Accepted Answer

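You can't use the STL in device code: `std::vector` and its member functions are host-only, so a kernel cannot take, index, or add `vector` objects. You're going to have to use an array (for example, plain `int *` device buffers allocated with `cudaMalloc` and filled with `cudaMemcpy` from the host vector's element storage) or some other CUDA construct like the Thrust Library (e.g. `thrust::device_vector`).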

How can I add vector elements in a cuda kernel?

Answers (1)

Related Questions