File: WorkloadDistribution.section

package info (click to toggle)
nvidia-cuda-toolkit 12.4.1-2
  • links: PTS, VCS
  • area: non-free
  • in suites: trixie
  • size: 18,505,836 kB
  • sloc: ansic: 203,477; cpp: 64,769; python: 34,699; javascript: 22,006; xml: 13,410; makefile: 3,085; sh: 2,343; perl: 352
file content (145 lines) | stat: -rw-r--r-- 3,517 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
Identifier: "WorkloadDistribution"
DisplayName: "GPU and Memory Workload Distribution"
Description: "Analysis of workload distribution in active cycles of SM, SMP, SMSP, L1 & L2 caches, and DRAM"
Order: 100

Sets {
  Identifier: "basic"
}
Sets {
  Identifier: "detailed"
}
Sets {
  Identifier: "full"
}
Sets {
  Identifier: "roofline"
}

Header {
    Metrics {
        Label: "Average SM Active Cycles"
        Name: "sm__cycles_active.avg"
    }
    Metrics {
        Label: "Average L1 Active Cycles"
        Name: "l1tex__cycles_active.avg"
    }
    Metrics {
        Label: "Average L2 Active Cycles"
        Name: "lts__cycles_active.avg"
    }
    Metrics {
        Label: "Average SMSP Active Cycles"
        Name: "smsp__cycles_active.avg"
    }
    Metrics {
        Label: "Average DRAM Active Cycles"
        Name: "dram__cycles_active.avg"
        Filter {
          Items {
            MaxArch: CC_70
          }
          Items {
            MinArch: CC_75
            MaxArch: CC_86
          }
          Items {
            MinArch: CC_89
          }
        }
    }
    Metrics {
        Label: "Total SM Elapsed Cycles"
        Name: "sm__cycles_elapsed.sum"
    }
    Metrics {
        Label: "Total L1 Elapsed Cycles"
        Name: "l1tex__cycles_elapsed.sum"
    }
    Metrics {
        Label: "Total L2 Elapsed Cycles"
        Name: "lts__cycles_elapsed.sum"
    }
    Metrics {
        Label: "Total SMSP Elapsed Cycles"
        Name: "smsp__cycles_elapsed.sum"
    }
    Metrics {
        Label: "Total DRAM Elapsed Cycles"
        Name: "dram__cycles_elapsed.sum"
        Filter {
          Items {
            MaxArch: CC_70
          }
          Items {
            MinArch: CC_75
            MaxArch: CC_86
          }
          Items {
            MinArch: CC_89
          }
        }
    }
}

Body {
    Items {
        SuffixTable {
            Label: "Workload Distribution"
            Suffixes {
                Suffix {
                    Label: "Average"
                    Name: ".avg"
                }
                Suffix {
                    Label: "Min"
                    Name: ".min"
                }
                Suffix {
                    Label: "Max"
                    Name: ".max"
                }
                Suffix {
                    Label: "Sum"
                    Name: ".sum"
                }
            }
            BaseNames {
                BaseName {
                    Label: "SM Active Cycles"
                    Name: "sm__cycles_active"
                }
                BaseName {
                    Label: "SMSP Active Cycles"
                    Name: "smsp__cycles_active"
                }
                BaseName {
                    Label: "L1 Active Cycles"
                    Name: "l1tex__cycles_active"
                }
                BaseName {
                    Label: "L2 Active Cycles"
                    Name: "lts__cycles_active"
                }
                BaseName {
                    Label: "DRAM Active Cycles"
                    Name: "dram__cycles_active"
                    Filter {
                      Items {
                          MaxArch: CC_70
                      }
                      Items {
                          MinArch: CC_75
                          MaxArch: CC_86
                      }
                      Items {
                          MinArch: CC_89
                      }
                      }
                }

            }
        }
    }
}