... | ... | @@ -70,3 +70,8 @@ nvprof --metrics achieved_occupancy,executed_ipc -o metrics.prof ./testcuda -p 8 |
|
|
nvprof --source-level-analysis pc_sampling -o pcsampling.prof ./testcuda -p 8 -r 10
|
|
|
nvprof --analysis-metrics -o analysis_metrics.prof ./testcuda -p 8 -r 10
|
|
|
```
|
|
|
|
|
|
### GPU Profiling Results
|
|
|
|
|
|
##### `do_test_pair p=8 r=10` initial kernel run
|
|
|
![Profiler screenshot of the initial do_test_pair kernel run (p=8, r=10)](/uploads/48634931462502aac88a804f99dfa2c9/Screen_Shot_2017-09-06_at_09.24.45.png) |