Skip to content

Commit

Permalink
array sum
Browse files: browse the repository at this point in the history
  • Loading branch information
Tony Tan authored and committed on Mar 9, 2018
1 parent 7d3ecbd commit e58c021
Showing 1 changed file with 3 additions and 0 deletions.
3 changes: 3 additions & 0 deletions 6_sum_matrix/sum_matrix.cu
Original file line number Diff line number Diff line change
Expand Up @@ -76,6 +76,7 @@ int main(int argc,char** argv)
iElaps=cpuSecond()-iStart;
printf("GPU Execution configuration<<<(%d,%d),(%d,%d)>>> Time elapsed %f sec\n",
grid_0.x,grid_0.y,block_0.x,block_0.y,iElaps);
CHECK(cudaMemcpy(C_from_gpu,C_dev,nBytes,cudaMemcpyDeviceToHost));
checkResult(C_host,C_from_gpu,nxy);
// 1d block and 1d grid
dimx=32;
Expand All @@ -87,6 +88,7 @@ int main(int argc,char** argv)
iElaps=cpuSecond()-iStart;
printf("GPU Execution configuration<<<(%d,%d),(%d,%d)>>> Time elapsed %f sec\n",
grid_1.x,grid_1.y,block_1.x,block_1.y,iElaps);
CHECK(cudaMemcpy(C_from_gpu,C_dev,nBytes,cudaMemcpyDeviceToHost));
checkResult(C_host,C_from_gpu,nxy);
// 2d block and 1d grid
dimx=32;
Expand All @@ -98,6 +100,7 @@ int main(int argc,char** argv)
iElaps=cpuSecond()-iStart;
printf("GPU Execution configuration<<<(%d,%d),(%d,%d)>>> Time elapsed %f sec\n",
grid_2.x,grid_2.y,block_2.x,block_2.y,iElaps);
CHECK(cudaMemcpy(C_from_gpu,C_dev,nBytes,cudaMemcpyDeviceToHost));
checkResult(C_host,C_from_gpu,nxy);


Expand Down

0 comments on commit e58c021

Please sign in to comment.