GPGPU编程技术(仇德元 编著)中第四章一个实例 “第一个CUDA程序”我是在VS2008+CUDA5.0下运行的老出错
1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(66): error : identifier "CUTFalse" is undefined1> 1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(66): error : identifier "cutCheckCondition" is undefined1> 1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(73): error : identifier "cutCheckCmdLineFlag" is undefined1> 1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(343): error : identifier "CUTBoolean" is undefined1> 1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(345): error : identifier "CUTTrue" is undefined1> 1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(397): error : identifier "cutGetCmdLineArgumenti" is undefined1> 1>C:\ProgramData\NVIDIA Corporation\NVIDIA GPU Computing SDK 4.1\C\common\inc\cutil_inline_runtime.h(425): error : identifier "cutCheckCmdLineFlag" is undefined
怎么这么多标示符都未定义啊 文件也包含进来了 搭配环境也建成功了 这个问题我换了个低版本的CUDA4.1的试了试还是会出现 高手指点迷津啊
以下是源代码高手可以在自己电脑上运行下 跪求真理
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include <math.h>
#include <cutil_inline_runtime.h>
__global__ void my_first_kernel(float *x)
{
int tid=threadIdx.x+blockDim.x*blockIdx.x;
x[tid]=(float)threadIdx.x;
}
int main(int argc, char **argv)
{
float *pfHost,*pfDevice;
int nBlocks,nThreads,nSize,n;
//初始化GPU
cutilDeviceInit(argc,argv);
//设置block数、每个block的线程数
nBlocks=2;
nThreads=8;
nSize=nBlocks*nThreads;
//分配主机、设备存储空间
pfHost=(float *)malloc(nSize *sizeof(float));
cutilSafeCall(cudaMalloc((void **)&pfDevice,nSize*sizeof(float)));
//执行全局函数
my_first_kernel<<<nBlocks,nThreads>>>(pfDevice);
cutilCheckMsg("my_first_kernel execution failed\n");
//取回计算结果,并打印输出
cutilSafeCall(cudaMemcpy(pfHost,pfDevice,nSize*sizeof(float),cudaMemcpyDeviceToHost));
for (n=0;n<nSize;n++)
{
printf("%d %f",n,pfHost[n]);
}
//回收存储空间
cutilSafeCall(cudaFree(pfDevice));
free(pfHost);
cutilExit(argc,argv);
}