File: LaunchStatistics.section

package info (click to toggle)
nvidia-cuda-toolkit 12.4.1-2
  • links: PTS, VCS
  • area: non-free
  • in suites: forky, trixie
  • size: 18,505,836 kB
  • sloc: ansic: 203,477; cpp: 64,769; python: 34,699; javascript: 22,006; xml: 13,410; makefile: 3,085; sh: 2,343; perl: 352
file content (94 lines) | stat: -rw-r--r-- 2,100 bytes parent folder | download | duplicates (6)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
# Section definition for the "Launch Statistics" section (protobuf text format).
# Identifier is the machine-readable name; DisplayName and Description are the
# human-readable title and explanatory text for the section.
Identifier: "LaunchStats"
DisplayName: "Launch Statistics"
Description: "Summary of the configuration used to launch the kernel. The launch configuration defines the size of the kernel grid, the division of the grid into blocks, and the GPU resources needed to execute the kernel. Choosing an efficient launch configuration maximizes device utilization."
# NOTE(review): Order presumably positions this section relative to other
# sections in the report — confirm against the tool's customization guide.
Order: 70
# This section is listed in three sets: "basic", "detailed", and "full".
Sets {
  Identifier: "basic"
}
Sets {
  Identifier: "detailed"
}
Sets {
  Identifier: "full"
}

# Section-level filter: restricts collection to the CollectionScope_Launch scope.
# NOTE(review): presumably this means the section's metrics are gathered per
# kernel launch — confirm the scope semantics in the tool documentation.
Filter {
  CollectionFilter {
    CollectionScopes: CollectionScope_Launch
  }
}

# Header entries. Each Metrics entry pairs a display Label with the metric Name
# to look up. Two entries (Cluster Size, Cluster Scheduling Policy) carry their
# own Filter with MinArch: CC_90.
# NOTE(review): entry order likely determines the layout of the rendered header
# table, so keep the order when adding or removing entries — confirm.
Header {
  Metrics {
    Label: "Grid Size"
    Name: "launch__grid_size"
  }
  Metrics {
    Label: "Function Cache Configuration"
    Name: "launch__func_cache_config"
  }
  Metrics {
    Label: "Cluster Size"
    Name: "launch__cluster_size"
    # Entry is gated by MinArch: CC_90 (presumably compute capability 9.0 and
    # newer — confirm).
    Filter {
      MinArch: CC_90
    }
  }
  Metrics {
    Label: "Registers Per Thread"
    Name: "launch__registers_per_thread"
  }
  Metrics {
    Label: "Cluster Scheduling Policy"
    Name: "launch__cluster_scheduling_policy"
    # Same MinArch: CC_90 gate as the "Cluster Size" entry.
    Filter {
      MinArch: CC_90
    }
  }
  Metrics {
    Label: "Static Shared Memory Per Block"
    Name: "launch__shared_mem_per_block_static"
  }
  Metrics {
    Label: "Block Size"
    Name: "launch__block_size"
  }
  Metrics {
    Label: "Dynamic Shared Memory Per Block"
    Name: "launch__shared_mem_per_block_dynamic"
  }
  Metrics {
    Label: "Threads"
    Name: "launch__thread_count"
  }
  Metrics {
    Label: "Driver Shared Memory Per Block"
    Name: "launch__shared_mem_per_block_driver"
  }
  Metrics {
    Label: "Waves Per SM"
    Name: "launch__waves_per_multiprocessor"
  }
  Metrics {
    Label: "Shared Memory Configuration Size"
    Name: "launch__shared_mem_config_size"
  }
  Metrics {
    Label: "Uses Green Context"
    Name: "launch__uses_green_context"
  }
  Metrics {
    Label: "# SMs"
    Name: "launch__sm_count"
  }
}
# Metrics listed outside the Header block: achieved and theoretical occupancy.
# NOTE(review): presumably these are collected with the section but not shown
# in the header table — confirm how the tool treats a top-level Metrics group.
Metrics {
  Metrics {
    Label: "Achieved Occupancy"
    Name: "sm__warps_active.avg.pct_of_peak_sustained_active"
  }
  Metrics {
    Label: "Theoretical Occupancy"
    Name: "sm__maximum_warps_per_active_cycle_pct"
  }
}