File: InstructionStatistics.section

package info (click to toggle)
nvidia-cuda-toolkit 12.4.1-2
  • links: PTS, VCS
  • area: non-free
  • in suites: trixie
  • size: 18,505,836 kB
  • sloc: ansic: 203,477; cpp: 64,769; python: 34,699; javascript: 22,006; xml: 13,410; makefile: 3,085; sh: 2,343; perl: 352
file content (66 lines) | stat: -rw-r--r-- 1,975 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
# Top-level fields of the "Instruction Statistics" section definition:
# its identifier, the display name, and the description text.
Identifier: "InstructionStats"
DisplayName: "Instruction Statistics"
Description: "Statistics of the executed low-level assembly instructions (SASS). The instruction mix provides insight into the types and frequency of the executed instructions. A narrow mix of instruction types implies a dependency on few instruction pipelines, while others remain unused. Using multiple pipelines allows hiding latencies and enables parallel execution. Note that 'Instructions/Opcode' and 'Executed Instructions' are measured differently and can diverge if cycles are spent in system calls."
# NOTE(review): presumably the position of this section relative to other
# sections' Order values -- confirm against the section file schema.
Order: 60
# Section sets this section is listed in; only "full" is declared here.
Sets {
  Identifier: "full"
}
# Section-level metric list. It declares a single metric, "inst_executed",
# with a collection filter naming the Launch and Cmdlist collection scopes.
# NOTE(review): unlike the metric names in the Header block of this file
# (e.g. "smsp__inst_executed.sum"), this name has no unit prefix or rollup
# suffix -- confirm that this is the intended metric name.
Metrics {
  Metrics {
    Label: "Instructions Executed"
    Name: "inst_executed"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
        CollectionScopes: CollectionScope_Cmdlist
      }
    }
  }
}
# Header metrics: four labelled entries covering the ".sum" and ".avg"
# variants of smsp__inst_executed and smsp__inst_issued. No filter is
# declared on any of them.
Header {
  # Executed instructions: .sum, then .avg (labelled "Per Scheduler").
  Metrics {
    Label: "Executed Instructions"
    Name: "smsp__inst_executed.sum"
  }
  Metrics {
    Label: "Avg. Executed Instructions Per Scheduler"
    Name: "smsp__inst_executed.avg"
  }
  # Issued instructions: .sum, then .avg (labelled "Per Scheduler").
  Metrics {
    Label: "Issued Instructions"
    Name: "smsp__inst_issued.sum"
  }
  Metrics {
    Label: "Avg. Issued Instructions Per Scheduler"
    Name: "smsp__inst_issued.avg"
  }
}
# Body layout: one horizontal container whose single Items entry holds a bar
# chart of sass__inst_executed_per_opcode together with a collection filter.
Body {
  Items {
    HorizontalContainer {
      Items {
        # Bar chart with opcodes on the category axis and executed warp-level
        # instruction counts on the value axis.
        BarChart {
          Label: "Executed Instruction Mix"
          CategoryAxis {
            Label: "Opcodes"
          }
         ValueAxis {
            Label: "Executed Warp-Level Instructions/Opcode"
          }
          ValueAxisAlignment: ValueAxisAlignments_Both
          Metrics {
            Label: "Executed Warp-Level Instructions By Basic SASS Opcode"
            Name: "sass__inst_executed_per_opcode"
            # NOTE(review): presumably expands the metric into one value per
            # instance (here, per opcode) -- confirm against the schema.
            ShowInstances: 1
          }
        }
        # Filter declared next to the BarChart inside the same Items entry;
        # it names the same two collection scopes (Launch, Cmdlist) as the
        # filter on the section-level "inst_executed" metric.
        Filter {
          CollectionFilter {
            CollectionScopes: CollectionScope_Launch
            CollectionScopes: CollectionScope_Cmdlist
          }
        }
      }
    }
  }
}