我正在尝试创建一个 CUDA + C++ 项目,基本上是一个需要调用若干 CUDA 内核的 .cpp 项目。所以我参照了下面这个例子,它的功能基本上是将两个向量相加,求和工作由内核完成:http://blog.norture.com/2012/10/gpu-parallel-programming-in-vs2012-with-nvidia-cuda/
代码如下:
#include <iostream>
#include "cuda_runtime.h"
#include "cuda.h"
#include "device_launch_parameters.h"
using namespace std;
/**
 * SAXPY kernel: updates y in place so that y[i] = a * x[i] + y[i] for every
 * index i in [0, n).
 *
 * Launch layout: 1D grid of 1D blocks (only the .x components of blockIdx,
 * blockDim, gridDim and threadIdx are used). Each thread starts at its flat
 * global index and advances by the total number of launched threads, so the
 * whole range is covered for any grid size, including grids with fewer than
 * n threads. No shared memory is used.
 *
 * @param n  number of elements to process; nothing is done when n <= 0
 * @param a  scalar multiplier applied to each x[i]
 * @param x  input vector, only read here; must hold at least n floats
 * @param y  input/output vector, read and overwritten; at least n floats
 */
__global__ void saxpy(int n, float a, float *x, float *y)
{
    // Clamp a non-positive n to zero before widening so a negative value
    // cannot turn into a huge unsigned element count.
    const size_t count = (n > 0) ? static_cast<size_t>(n) : 0;

    // Total threads in the launch; computed in size_t so the product of
    // grid and block dimensions cannot wrap in 32-bit arithmetic.
    const size_t stride = static_cast<size_t>(gridDim.x) * blockDim.x;

    for (size_t i = static_cast<size_t>(blockIdx.x) * blockDim.x + threadIdx.x;
         i < count;
         i += stride)
    {
        y[i] = a*x[i] + y[i];
    }
}
int main(void)
{
int N = 1<<20;
float *x, *y, *d_x, *d_y;
x = (float*)malloc(N*sizeof(float));
y = (float*)malloc(N*sizeof(float));
cudaMalloc(&d_x, N*sizeof(float));
cudaMalloc(&d_y, N*sizeof(float));
for (int i = 0; i < …Run Code Online (Sandbox Code Playgroud)