求问这个是怎么回事?

VS2010安装了nsight之后可以直接建立CUDA工程,建立了以后,里面自带了一段代码,但是这段代码唯一的一个错误就是在调用kernel函数的时候编译器不认<<< >>>这个东西。请问这个定义是在哪个库文件里的?

#include "cuda_runtime.h"
#include "device_launch_parameters.h"

#include <stdio.h>

cudaError_t addWithCuda(int *c, const int *a, const int *b, size_t size);

// Element-wise vector add on the device: c[i] = a[i] + b[i].
//
// Launch layout: a single 1-D block with one thread per element. The kernel
// indexes by threadIdx.x only and performs no bounds check, so the block size
// must equal the number of elements in all three device arrays.
__global__ void addKernel(int *c, const int *a, const int *b)
{
    int i = threadIdx.x;
    c[i] = a[i] + b[i];
}

// Adds two fixed 5-element vectors on the GPU and prints the result.
// Returns 0 on success, 1 if the addition or the device reset fails.
int main()
{
    const int arraySize = 5;
    const int a[arraySize] = { 1, 2, 3, 4, 5 };
    const int b[arraySize] = { 10, 20, 30, 40, 50 };
    int c[arraySize] = { 0 };

    // Add vectors in parallel.
    cudaError_t cudaStatus = addWithCuda(c, a, b, arraySize);
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "addWithCuda failed!");
        return 1;
    }

    printf("{1,2,3,4,5} + {10,20,30,40,50} = {%d,%d,%d,%d,%d}\n",
           c[0], c[1], c[2], c[3], c[4]);

    // cudaDeviceReset must be called before exiting in order for profiling and
    // tracing tools such as Parallel Nsight and Visual Profiler to show complete traces.
    cudaStatus = cudaDeviceReset();
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaDeviceReset failed!");
        return 1;
    }

    return 0;
}

// Helper function for using CUDA to add vectors in parallel.
//
// Parameters:
//   c    - host output array, receives a[i] + b[i] for i in [0, size)
//   a, b - host input arrays of `size` ints each
//   size - number of elements; launched as the thread count of one block, so
//          it must not exceed the device's per-block thread limit (a larger
//          value is reported as a launch error)
//
// Returns cudaSuccess on success (including size == 0, which is a no-op),
// otherwise the first CUDA error encountered. Device buffers are always
// released before returning.
cudaError_t addWithCuda(int *c, const int *a, const int *b, size_t size)
{
    // All locals are declared up front so that no `goto Cleanup` jumps over
    // an initialization.
    int *dev_a = 0;
    int *dev_b = 0;
    int *dev_c = 0;
    cudaError_t cudaStatus;

    // Choose which GPU to run on, change this on a multi-GPU system.
    cudaStatus = cudaSetDevice(0);
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaSetDevice failed!  Do you have a CUDA-capable GPU installed?");
        goto Cleanup;
    }

    // A zero-thread launch is an invalid configuration, so treat an empty
    // input as a successful no-op instead of attempting it.
    if (size == 0) {
        goto Cleanup;
    }

    // Allocate GPU buffers for three vectors (two input, one output).
    cudaStatus = cudaMalloc((void**)&dev_c, size * sizeof(int));
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaMalloc failed!");
        goto Cleanup;
    }

    cudaStatus = cudaMalloc((void**)&dev_a, size * sizeof(int));
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaMalloc failed!");
        goto Cleanup;
    }

    cudaStatus = cudaMalloc((void**)&dev_b, size * sizeof(int));
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaMalloc failed!");
        goto Cleanup;
    }

    // Copy input vectors from host memory to GPU buffers.
    cudaStatus = cudaMemcpy(dev_a, a, size * sizeof(int), cudaMemcpyHostToDevice);
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaMemcpy failed!");
        goto Cleanup;
    }

    cudaStatus = cudaMemcpy(dev_b, b, size * sizeof(int), cudaMemcpyHostToDevice);
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaMemcpy failed!");
        goto Cleanup;
    }

    // Launch a kernel on the GPU with one thread for each element.
    addKernel<<<1, (unsigned int)size>>>(dev_c, dev_a, dev_b);

    // A kernel launch returns nothing; configuration errors (for example too
    // many threads per block) are only visible through cudaGetLastError.
    cudaStatus = cudaGetLastError();
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "addKernel launch failed: %s\n", cudaGetErrorString(cudaStatus));
        goto Cleanup;
    }

    // cudaDeviceSynchronize waits for the kernel to finish, and returns
    // any errors encountered during the launch.
    cudaStatus = cudaDeviceSynchronize();
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaDeviceSynchronize returned error code %d after launching addKernel!\n", cudaStatus);
        goto Cleanup;
    }

    // Copy output vector from GPU buffer to host memory.
    cudaStatus = cudaMemcpy(c, dev_c, size * sizeof(int), cudaMemcpyDeviceToHost);
    if (cudaStatus != cudaSuccess) {
        fprintf(stderr, "cudaMemcpy failed!");
        goto Cleanup;
    }

Cleanup:
    // Reached on both success and failure; pointers that were never
    // allocated are still 0 here.
    cudaFree(dev_c);
    cudaFree(dev_a);
    cudaFree(dev_b);

    return cudaStatus;
}

 

那个输出窗口中有没有提示NVCC在编译呀。

提示了,这个是输出的结果,另外,我这个机器是想拿来做双机调试的,只装了toolkit和SDK,没装驱动。难道跟这个有关吗?
1>------ Build started: Project: test, Configuration: Debug Win32 ------
1>Build started 2011/10/21 9:45:50.
1>PrepareForBuild:
1> Creating directory “D:\我的文档\sourcecode\test\Debug".
1>InitializeBuildStatus:
1> Creating “Debug\test.unsuccessfulbuild” because “AlwaysCreate” was specified.
1>AddCudaCompilePropsDeps:
1> Found “CudaToolkitCustomDir”.
1> Found “AdditionalDeps”.
1> Found “CompileOut”.
1> Found “Include”.
1> Found “Keep”.
1> Found “KeepDir”.
1> Found “NvccCompilation”.
1> Found “NvccPath”.
1> Found “RequiredIncludes”.
1> Found “TargetMachinePlatform”.
1> Found “CInterleavedPTX”.
1> Found “CodeGeneration”.
1> Found “GPUDebugInfo”.
1> Found “MaxRegCount”.
1> Found “PtxAsOptionV”.
1> Found “Defines”.
1> Found “Emulation”.
1> Found “HostDebugInfo”.
1> Found “FastMath”.
1> Found “Optimization”.
1> Found “Runtime”.
1> Found “RuntimeChecks”.
1> Found “TypeInfo”.
1> Found “Warning”.
1> Found “AdditionalOptions”.
1> Found “CommandLineTemplate”.
1>CudaBuild:
1> Compiling CUDA source file kernel.cu…
1>
1> D:\我的文档\sourcecode\test\test>“C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v4.0\bin\nvcc.exe” -gencode=arch=compute_10,code="sm_10,compute_10" --use-local-env --cl-version 2010 -ccbin “C:\Program Files\Microsoft Visual Studio 10.0\VC\bin” -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v4.0\include” -G0 --keep-dir “Debug” -maxrregcount=0 --machine 32 --compile -D_NEXUS_DEBUG -g -Xcompiler "/EHsc /nologo /Od /Zi /MDd " -o “Debug\kernel.cu.obj” “D:????\sourcecode\test\test\kernel.cu”
1> kernel.cu
1>c1xx : fatal error C1083: Cannot open source file: ‘D:/???/sourcecode/test/test/kernel.cu’: Invalid argument
1>C:\Program Files\MSBuild\Microsoft.Cpp\v4.0\BuildCustomizations\CUDA 4.0.targets(352,9): error MSB3721: The command ““C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v4.0\bin\nvcc.exe” -gencode=arch=compute_10,code="sm_10,compute_10" --use-local-env --cl-version 2010 -ccbin “C:\Program Files\Microsoft Visual Studio 10.0\VC\bin” -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v4.0\include” -G0 --keep-dir “Debug” -maxrregcount=0 --machine 32 --compile -D_NEXUS_DEBUG -g -Xcompiler “/EHsc /nologo /Od /Zi /MDd " -o “Debug\kernel.cu.obj” “D:\我的文档\sourcecode\test\test\kernel.cu”” exited with code 2.
1>
1>Build FAILED.
1>
1>Time Elapsed 00:00:02.15
========== Build: 0 succeeded, 1 failed, 0 up-to-date, 0 skipped ==========

移出中文目录试试吧。:lol

很久没有用过nsight了~

我是从来没用过啊,本来想用的,结果导师不给力,不给买电脑。

换了目录名以后确实可以编译了,不过那个<<<下面一直有道红线提示错误,看着很不爽啊。

那条小红线只占一个字节的长度。安心吧。我没有解决它。:slight_smile:

纠结,能运行就不错啦,嘿嘿:lol

没事,忍忍吧~

改成英文项目名果然就好了,不知这是怎么回事

项目路径中不能包含中文字符,这是一个已知的限制:从上面的编译日志可以看到,nvcc 把源文件路径传给 cl 时中文部分变成了 “????”,所以编译器找不到 kernel.cu。

请Dabai不要挖坟。

此贴将被立即下沉处理。