CUDA编程之:cudaMemcpy()函数
cudaMemcpy用于在主机(Host)和设备(Device)之间往返地传递数据,其中nBytes是要拷贝的字节数(而不是元素个数),用法如下:
主机到设备:cudaMemcpy(d_A,h_A,nBytes,cudaMemcpyHostToDevice)
设备到主机:cudaMemcpy(h_A,d_A,nBytes,cudaMemcpyDeviceToHost)
注意:该函数是同步(阻塞)函数,在数据拷贝完成之前会一直阻塞调用它的主机(CPU)线程,直到拷贝结束才返回,所以拷贝之后不需要再额外调用cudaDeviceSynchronize()来等待这次拷贝
示例:
#include <cstdio>  // fprintf: used only to report failed copies on stderr

/**
 * Copies data between a host float array and the buffer referenced by a
 * realVecHandle, using a blocking cudaMemcpy.
 *
 * @param addr     Handle whose `data` member is used as the device-side
 *                 pointer and whose `size` member is passed to cudaMemcpy as
 *                 the number of bytes to copy. A null handle is reported on
 *                 stderr and the copy is skipped.
 *                 NOTE(review): cudaMemcpy expects a byte count; if `size`
 *                 holds an element count it must be multiplied by
 *                 sizeof(float) - confirm against the realVecHandle definition.
 * @param hostArr  Host-side array: the source when copying to the device, the
 *                 destination when copying to the host.
 * @param buffer   Not used by this function; kept so the signature stays
 *                 compatible with existing callers.
 * @param tohost   true copies device -> host, false copies host -> device.
 * @param copyMode Only mode 0 performs a copy; any other value is a no-op.
 *
 * The function returns void, so a cudaMemcpy failure cannot be propagated to
 * the caller; it is reported on stderr instead of being silently dropped.
 */
void VectorReal_copyBuffer(realVecHandle* addr, float hostArr[], long buffer, bool tohost, int copyMode) {
    (void)buffer;  // intentionally unused

    // Modes other than 0 are not handled here.
    if (copyMode != 0) {
        return;
    }

    // The handle is dereferenced below, so a null handle must be rejected first.
    if (!addr) {
        fprintf(stderr, "VectorReal_copyBuffer: null handle, copy skipped\n");
        return;
    }

    cudaError_t status;
    if (tohost) {
        status = cudaMemcpy(hostArr, addr->data, addr->size, cudaMemcpyDeviceToHost);
    } else {
        status = cudaMemcpy(addr->data, hostArr, addr->size, cudaMemcpyHostToDevice);
    }

    // Surface the failure (e.g. an invalid pointer or size) rather than ignoring it.
    if (status != cudaSuccess) {
        fprintf(stderr, "VectorReal_copyBuffer: cudaMemcpy (%s) failed: %s\n",
                tohost ? "device to host" : "host to device",
                cudaGetErrorString(status));
    }
}