24 lines
779 B
Bash
Executable File
24 lines
779 B
Bash
Executable File
#!/usr/bin/env bash
|
|
|
|
#
|
|
# prof.sh <exec> <report.file>
|
|
#
|
|
|
|
sudo /usr/local/cuda-11.4/bin/ncu \
|
|
--target-processes all \
|
|
--metrics "$(echo -n \
|
|
"smsp__inst_executed,"\
|
|
"smsp__cycles_active.avg,"\
|
|
"smsp__cycles_active.sum,"\
|
|
"gpu__time_duration.sum,"\
|
|
"smsp__average_warp_latency_issue_stalled_barrier,"\
|
|
"smsp__warp_issue_stalled_barrier_per_warp_active,"\
|
|
"l1tex__average_t_sectors_per_request_pipe_lsu_mem_global_op_ld,"\
|
|
"l1tex__average_t_sectors_per_request_pipe_lsu_mem_global_op_st,"\
|
|
"l1tex__data_pipe_lsu_wavefronts_mem_shared_cmd_read,"\
|
|
"l1tex__data_pipe_lsu_wavefronts_mem_shared_cmd_write,"\
|
|
"l1tex__data_bank_conflicts_pipe_lsu_mem_shared_op_ld.sum,"\
|
|
"l1tex__data_bank_conflicts_pipe_lsu_mem_shared_op_st.sum "\
|
|
)" \
|
|
"$1" -q 20 -b 512 > "$2"
|