1 2 3 4 5 6 7 8 9 10 11 12 13 14
// Measure how long the addFromGPU launch takes using a pair of CUDA events
// recorded immediately before and after the kernel.
cudaEvent_t start, stop;
ErrorCheck(cudaEventCreate(&start), __FILE__, __LINE__);
ErrorCheck(cudaEventCreate(&stop), __FILE__, __LINE__);

ErrorCheck(cudaEventRecord(start), __FILE__, __LINE__);
{
    // Non-blocking poll of the start event. cudaErrorNotReady only means the
    // event has not completed yet, so it must not be treated as a failure;
    // any other non-success status is a real error and is reported.
    // NOTE(review): presumably this query is here to nudge the driver into
    // submitting the queued record right away (a common WDDM workaround) -- confirm.
    const cudaError_t queryStatus = cudaEventQuery(start);
    if (queryStatus == cudaErrorNotReady)
    {
        // Clear the benign status so the launch check below cannot mistake
        // it for a kernel launch failure.
        (void)cudaGetLastError();
    }
    else if (queryStatus != cudaSuccess)
    {
        ErrorCheck(queryStatus, __FILE__, __LINE__);
    }
}

addFromGPU<<<grid, block>>>(fpDevice_A, fpDevice_B, fpDevice_C, iElemCount);
// A kernel launch returns no status itself; configuration errors only show
// up through cudaGetLastError().
ErrorCheck(cudaGetLastError(), __FILE__, __LINE__);

ErrorCheck(cudaEventRecord(stop), __FILE__, __LINE__);
// Block the host until the stop event (and therefore the kernel) has completed.
ErrorCheck(cudaEventSynchronize(stop), __FILE__, __LINE__);

// Time between the two events, in milliseconds.
float elapsed_time = 0.0f;
ErrorCheck(cudaEventElapsedTime(&elapsed_time, start, stop), __FILE__, __LINE__);

ErrorCheck(cudaEventDestroy(start), __FILE__, __LINE__);
ErrorCheck(cudaEventDestroy(stop), __FILE__, __LINE__);