// Fragment of a CUDA host program (initVector helper + tail of the driver).
//
// NOTE(review): this text looks damaged -- TODO restore from the original file:
//   * the four #include directives have no header names;
//   * initVector() breaks off inside its for-loop header ("for (i=0; i") and
//     the text resumes at the tail of what looks like a kernel launch
//     (">>(u_dev, v_dev, z_dev, N)"). Presumably the rest of initVector, the
//     kernel definition and the start of main() sat in between -- confirm.
//
// What the surviving statements do, in order:
//   1. cudaDeviceSynchronize() is called; its return value is discarded.
//   2. gpuID and the value returned by cudaGetLastError() are printed.
//      NOTE(review): this streams the raw cudaError_t (presumably shown as a
//      number), while the print after the copy uses cudaGetErrorString --
//      confirm whether the difference is intended.
//   3. N floats are copied from z_dev to z (cudaMemcpyDeviceToHost); the
//      returned status is stored in `error` and printed as a string with gpuID.
//   4. z[0], z[1] and z[2] are printed.
//      NOTE(review): assumes z holds at least 3 elements -- N is not visible.
//   5. u_dev, v_dev and z_dev are released with cudaFree.
// The "}" just before "return 0;" closes a scope whose opening is not visible
// here; presumably a per-GPU loop, since gpuID is printed -- confirm.
#include #include #include #include using namespace std; void initVector(float *u, int n, float c) { int i; for (i=0; i>>(u_dev, v_dev, z_dev, N); cudaDeviceSynchronize(); cout << "From GPU: " << gpuID << " " << cudaGetLastError() << endl; error = cudaMemcpy(z, z_dev, N*sizeof(float), cudaMemcpyDeviceToHost); cout << "From GPU: " << gpuID << " " << cudaGetErrorString(error) << endl; cout << z[0] << " " << z[1] << " " << z[2] << endl; cudaFree(u_dev); cudaFree(v_dev); cudaFree(z_dev); } return 0; }