File: MemoryWorkloadAnalysis_Tables.section

package info (click to toggle)
nvidia-cuda-toolkit 12.4.1-3
  • links: PTS, VCS
  • area: non-free
  • in suites: forky, sid
  • size: 18,505,836 kB
  • sloc: ansic: 203,477; cpp: 64,769; python: 34,699; javascript: 22,006; xml: 13,410; makefile: 3,085; sh: 2,343; perl: 352
file content (155 lines) | stat: -rw-r--r-- 3,824 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
# Section header: names this section and ties it to the section it extends.
Identifier: "MemoryWorkloadAnalysis_Tables"
DisplayName: "Memory Workload Analysis Tables"
# Extends refers to another section by its Identifier; that parent section
# ("MemoryWorkloadAnalysis") is defined outside this file.
Extends: "MemoryWorkloadAnalysis"
Description: "Detailed tables with data for each memory unit."
# NOTE(review): Order presumably positions this section relative to other
# sections in the report -- confirm against the section-file documentation.
Order: 32
# This section is listed under a single set, "full".
Sets {
  Identifier: "full"
}
# Metrics requested by this section. Each inner Metrics entry pairs a
# human-readable Label with the metric Name to collect. Entries fall into
# five groups: average bytes per sector, maximum bytes per sector, L1TEX hit
# rates, L2 hit rates, and unit throughputs.
Metrics {
  # --- Average bytes per sector (".ratio" suffix) for global/local loads and
  # stores. Every entry in this group carries a CollectionFilter limited to
  # CollectionScope_Launch.
  Metrics {
    Label: "Average Bytes Per Sector For Global Loads"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_global_op_ld.ratio"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  Metrics {
    Label: "Average Bytes Per Sector For Global Stores"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_global_op_st.ratio"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  Metrics {
    Label: "Average Bytes Per Sector For Local Loads"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_local_op_ld.ratio"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  Metrics {
    Label: "Average Bytes Per Sector For Local Stores"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_local_op_st.ratio"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  # --- Maximum bytes per sector. These reuse the same
  # "..._average_data_bytes_per_sector_..." base metric names as the group
  # above, but with the ".max_rate" suffix instead of ".ratio". Same
  # CollectionScope_Launch filter on every entry.
  Metrics {
    Label: "Maximum Bytes Per Sector For Global Loads"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_global_op_ld.max_rate"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  Metrics {
    Label: "Maximum Bytes Per Sector For Global Stores"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_global_op_st.max_rate"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  Metrics {
    Label: "Maximum Bytes Per Sector For Local Loads"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_local_op_ld.max_rate"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  Metrics {
    Label: "Maximum Bytes Per Sector For Local Stores"
    Name: "smsp__sass_average_data_bytes_per_sector_mem_local_op_st.max_rate"
    Filter {
      CollectionFilter {
        CollectionScopes: CollectionScope_Launch
      }
    }
  }
  # --- L1TEX hit rates (".pct") for global/local loads and stores.
  # No Filter is attached to these or any of the remaining entries.
  Metrics {
    Label: "L1TEX Hit Rate For Global Loads"
    Name: "l1tex__t_sector_pipe_lsu_mem_global_op_ld_hit_rate.pct"
  }
  Metrics {
    Label: "L1TEX Hit Rate For Global Stores"
    Name: "l1tex__t_sector_pipe_lsu_mem_global_op_st_hit_rate.pct"
  }
  Metrics {
    Label: "L1TEX Hit Rate For Local Loads"
    Name: "l1tex__t_sector_pipe_lsu_mem_local_op_ld_hit_rate.pct"
  }
  Metrics {
    Label: "L1TEX Hit Rate For Local Stores"
    Name: "l1tex__t_sector_pipe_lsu_mem_local_op_st_hit_rate.pct"
  }
  # --- L2 hit rates: the "Loads" label maps to the op_read metric and the
  # "Stores" label maps to the op_write metric.
  Metrics {
    Label: "L2 Hit Rate For Loads"
    Name: "lts__t_sector_op_read_hit_rate.pct"
  }
  Metrics {
    Label: "L2 Hit Rate For Stores"
    Name: "lts__t_sector_op_write_hit_rate.pct"
  }
  # --- Throughput of each memory unit, all using the
  # ".avg.pct_of_peak_sustained_elapsed" suffix.
  Metrics {
    Label: "L1TEX Throughput"
    Name: "l1tex__throughput.avg.pct_of_peak_sustained_elapsed"
  }
  Metrics {
    Label: "L2 Throughput"
    Name: "lts__throughput.avg.pct_of_peak_sustained_elapsed"
  }
  Metrics {
    Label: "DRAM Throughput"
    Name: "gpu__dram_throughput.avg.pct_of_peak_sustained_elapsed"
  }
}
# Body of the section: five table items listed in the order Shared Memory,
# L1/TEX Cache, L2 Cache, L2 Cache Eviction Policies, Device Memory.
# Each item declares only a Label here; no columns or metrics are listed
# inside the table items in this file.
Body {
  DisplayName: "Memory Tables"
  Items {
    MemorySharedTable {
      Label: "Shared Memory"
    }
  }
  Items {
    MemoryL1TEXCacheTable {
      Label: "L1/TEX Cache"
    }
  }
  Items {
    MemoryL2CacheTable {
      Label: "L2 Cache"
    }
  }
  # The eviction-policy table is the only item with a Filter. The filter
  # lists two architecture ranges: 80 through 86, and 89 with no upper bound.
  # NOTE(review): the values look like compute capability x10, and the ranges
  # leave out 87-88 -- confirm the gap is intentional before changing bounds.
  Items {
    MemoryL2CacheEvictPolicyTable {
      Label: "L2 Cache Eviction Policies"
    }
    Filter {
      Items {
        MinArch: 80
        MaxArch: 86
      }
      Items {
        MinArch: 89
      }
    }
  }
  Items {
    MemoryDeviceMemoryTable {
      Label: "Device Memory"
    }
  }
}