1 #ifndef H_VECTOR_MBP_REDUCE_H__
2 #define H_VECTOR_MBP_REDUCE_H__
8 #include <cuda_runtime_api.h>
// Compile-time sizing constants. Each is declared `static`, so every
// translation unit that includes this header gets its own private copy.
// NOTE(review): none of these is referenced in the visible part of this file;
// the roles described below are inferred from the names only -- confirm
// against the implementation file before relying on them.
// Presumably the number of elements in the array being reduced -- TODO confirm.
11 static const int wholeArraySize = 100000000;
// Presumably the number of threads per block used for the launch -- TODO confirm.
12 static const int blockSize = 1024;
// Presumably the number of blocks in the launch grid -- TODO confirm.
13 static const int gridSize = 24;
// Kernel entry point (`__global__`). Takes a read-only float pointer `a` and
// a writable float pointer `out`; no element count is passed as a parameter.
// NOTE(review): neither a body nor a terminating `;` is visible here, so what
// is read from `a`, what is written to `out`, and the expected launch
// configuration cannot be determined from this view -- confirm against the
// definition.
__global__ void cuda_vector_mbp_reduce(const float *a, float *out)
// Host function (no CUDA execution-space qualifier) taking two float pointers
// `a` and `b` and an int `n`.
// NOTE(review): presumably the host-side wrapper for the reduce kernel, with
// `n` as the element count -- confirm. Whether `a` and `b` are host or device
// pointers, and which of them receives the result, is not visible from here.
void vector_mbp_reduce(float *a, float *b, int n)