File: WarpStateStatistics.section

package info (click to toggle)
nvidia-cuda-toolkit 12.4.1-2
  • links: PTS, VCS
  • area: non-free
  • in suites: trixie
  • size: 18,505,836 kB
  • sloc: ansic: 203,477; cpp: 64,769; python: 34,699; javascript: 22,006; xml: 13,410; makefile: 3,085; sh: 2,343; perl: 352
file content (126 lines) | stat: -rw-r--r-- 4,545 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
# Section definition for "Warp State Statistics" (identifier "WarpStateStats").
# Identifier is the machine-readable name; DisplayName is the human-readable title.
Identifier: "WarpStateStats"
DisplayName: "Warp State Statistics"
# Free-text explanation of the section. It states that the chart reports, for
# each warp state, the average number of cycles spent in that state per issued
# instruction, and that stalls only matter when schedulers fail to issue every cycle.
Description: "Analysis of the states in which all warps spent cycles during the kernel execution. The warp states describe a warp's readiness or inability to issue its next instruction. The warp cycles per instruction define the latency between two consecutive instructions. The higher the value, the more warp parallelism is required to hide this latency. For each warp state, the chart shows the average number of cycles spent in that state per issued instruction. Stalls are not always impacting the overall performance nor are they completely avoidable. Only focus on stall reasons if the schedulers fail to issue every cycle. When executing a kernel with mixed library and user code, these metrics show the combined values."
# NOTE(review): presumably the sort position of this section relative to other
# sections in a report -- confirm against the section-file schema.
Order: 50
# NOTE(review): presumably registers this section as a member of the section
# set named "full" -- confirm against the section-file schema.
Sets {
  Identifier: "full"
}
# Section-level metric list. It holds a single entry, "Issued Warp Per
# Scheduler", declared directly under the section rather than inside the
# Header or Body.
# NOTE(review): presumably such metrics are collected with the section without
# being rendered in the header table or the chart -- confirm against the
# section-file schema.
Metrics {
  Metrics {
    Label: "Issued Warp Per Scheduler"
    Name: "smsp__issue_active.avg.per_cycle_active"
  }
}
# Header metrics: four labeled ".ratio" metrics.
# Two are warp-cycle figures per instruction (issued vs. executed) and two are
# per-warp thread averages (active vs. not predicated off).
# NOTE(review): the entries presumably appear in the order listed here -- keep
# the order stable unless the rendering rules are confirmed.
Header {
  # Warp cycles per *issued* instruction.
  Metrics {
    Label: "Warp Cycles Per Issued Instruction"
    Name: "smsp__average_warp_latency_per_inst_issued.ratio"
  }
  # Thread-level executed instructions per warp-level executed instruction.
  Metrics {
    Label: "Avg. Active Threads Per Warp"
    Name: "smsp__thread_inst_executed_per_inst_executed.ratio"
  }
  # Warp cycles per *executed* instruction.
  Metrics {
    Label: "Warp Cycles Per Executed Instruction"
    Name: "smsp__average_warps_active_per_inst_executed.ratio"
  }
  # Same ratio as "Avg. Active Threads Per Warp", restricted to the "pred_on"
  # variant of the thread-level counter.
  Metrics {
    Label: "Avg. Not Predicated Off Threads Per Warp"
    Name: "smsp__thread_inst_executed_pred_on_per_inst_executed.ratio"
  }
}
# Body of the section: a single item, the "Warp State (All Cycles)" bar chart.
# Every chart entry uses a metric named
#   smsp__average_warps_issue_stalled_<state>_per_issue_active.ratio
# which, per the section Description, is the average number of cycles spent in
# that warp state per issued instruction.
Body {
  Items {
    BarChart {
      Label: "Warp State (All Cycles)"
      # Bars are ordered by their value, largest first, so the order of the
      # Metrics entries below is not the display order.
      SortKey: ByValue
      SortDirection: Descending
      CategoryAxis {
        Label: "Warp States"
      }
      ValueAxis {
        Label: "Cycles per Instruction"
      }
      # NOTE(review): presumably places the value axis on both sides of the
      # chart -- confirm against the section-file schema.
      ValueAxisAlignment: ValueAxisAlignments_Both
      Metrics {
        Label: "Stall Drain"
        Name: "smsp__average_warps_issue_stalled_drain_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall IMC Miss"
        Name: "smsp__average_warps_issue_stalled_imc_miss_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Barrier"
        Name: "smsp__average_warps_issue_stalled_barrier_per_issue_active.ratio"
      }
      # The only entry with a Filter: it carries a minimum-architecture
      # constraint of CC_90.
      # NOTE(review): presumably the bar is omitted on architectures below
      # compute capability 9.0 -- confirm.
      Metrics {
        Label: "Stall GMMA"
        Name: "smsp__average_warps_issue_stalled_gmma_per_issue_active.ratio"
        Filter {
          MinArch: CC_90
        }
      }
      Metrics {
        Label: "Stall Branch Resolving"
        Name: "smsp__average_warps_issue_stalled_branch_resolving_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Membar"
        Name: "smsp__average_warps_issue_stalled_membar_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Short Scoreboard"
        Name: "smsp__average_warps_issue_stalled_short_scoreboard_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Sleeping"
        Name: "smsp__average_warps_issue_stalled_sleeping_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Wait"
        Name: "smsp__average_warps_issue_stalled_wait_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall No Instruction"
        Name: "smsp__average_warps_issue_stalled_no_instruction_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Math Pipe Throttle"
        Name: "smsp__average_warps_issue_stalled_math_pipe_throttle_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Tex Throttle"
        Name: "smsp__average_warps_issue_stalled_tex_throttle_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall LG Throttle"
        Name: "smsp__average_warps_issue_stalled_lg_throttle_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Dispatch Stall"
        Name: "smsp__average_warps_issue_stalled_dispatch_stall_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Misc"
        Name: "smsp__average_warps_issue_stalled_misc_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Not Selected"
        Name: "smsp__average_warps_issue_stalled_not_selected_per_issue_active.ratio"
      }
      # The label deliberately has no "Stall" prefix even though the metric
      # name follows the same "issue_stalled_<state>" pattern as the others.
      Metrics {
        Label: "Selected"
        Name: "smsp__average_warps_issue_stalled_selected_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall Long Scoreboard"
        Name: "smsp__average_warps_issue_stalled_long_scoreboard_per_issue_active.ratio"
      }
      Metrics {
        Label: "Stall MIO Throttle"
        Name: "smsp__average_warps_issue_stalled_mio_throttle_per_issue_active.ratio"
      }
    }
  }
}