我使用此站点http://code.google.com/p/stanford-cs193g-sp2010/wiki/TutorialHelloWorld在 cuda 中复制了一个 hello world 程序
代码是
#include "util/cuPrintf.cu"
#include <stdio.h>
__global__ void device_greetings(void)
{
cuPrintf("Hello, world from the device!\n");
}
int main(void)
{
// greet from the host
printf("Hello, world from the host!\n");
// initialize cuPrintf
cudaPrintfInit();
// launch a kernel with a single thread to greet from the device
device_greetings<<<1,1>>>();
// display the device's greeting
cudaPrintfDisplay();
// clean up after cuPrintf
cudaPrintfEnd();
return 0;
}
然后使用编译,nvcc hello_world.cu -o hello_world
但是我只看到 hello fom 主机而不是设备。
我什至试过
printf("{CudaPrintfInt => %s}\n",cudaGetErrorString(cudaPrintfInit()));
printf("{cudaPrintfDisplay => %s}\n",cudaGetErrorString(cudaPrintfDisplay(stdout, true)));
并用 编译nvcc -arch=sm_11 hello_world.cu -o hello_world
,但是我得到:
$ ./hello_world
Hello, world from the host!
{CudaPrintfInt => initialization error}
{cudaPrintfDisplay => __global__ function call is not configured}
$
图形模型为:
$/sbin/lspci -v | grep VGA
07:01.0 VGA compatible controller: Matrox Graphics, Inc. MGA G200eW WPCM450 (rev 0a) (prog-if 00 [VGA controller])
cuda版本是4:
$ ls /usr/local/cuda/lib/
libcublas.so libcudart.so.4.0.17 libcurand.so.4 libnpp.so
libcublas.so.4 libcufft.so libcurand.so.4.0.17 libnpp.so.4
libcublas.so.4.0.17 libcufft.so.4 libcusparse.so libnpp.so.4.0.17
libcudart.so libcufft.so.4.0.17 libcusparse.so.4
libcudart.so.4 libcurand.so libcusparse.so.4.0.17