File: flatten-and-annotate.ll

package info (click to toggle)
llvm-toolchain-21 1%3A21.1.6-3
  • links: PTS, VCS
  • area: main
  • in suites: forky, sid
  • size: 2,245,028 kB
  • sloc: cpp: 7,619,726; ansic: 1,434,018; asm: 1,058,748; python: 252,740; f90: 94,671; objc: 70,685; lisp: 42,813; pascal: 18,401; sh: 8,601; ml: 5,111; perl: 4,720; makefile: 3,675; awk: 3,523; javascript: 2,409; xml: 892; fortran: 770
file content (119 lines) | stat: -rw-r--r-- 4,214 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
; REQUIRES: x86_64-linux
;
; RUN: rm -rf %t
; RUN: split-file %s %t
; RUN: llvm-ctxprof-util fromYAML --input=%t/profile.yaml --output=%t/profile.ctxprofdata
; RUN: opt -module-summary -passes='thinlto-pre-link<O2>' -use-ctx-profile=%t/profile.ctxprofdata \
; RUN:   %t/example.ll -S -o %t/4909520559318251808.ll
; RUN: FileCheck --input-file %t/4909520559318251808.ll %s --check-prefix=PRELINK

; RUN: opt -passes='ctx-prof-flatten' -use-ctx-profile=%t/profile.ctxprofdata %t/4909520559318251808.ll -S  | FileCheck %s --check-prefix=POSTLINK
;
;
; Check that instrumentation occurs where expected: the "no" block for both foo and
; @an_entrypoint - which explains the subsequent branch weights
;
; PRELINK-LABEL: @foo
; PRELINK-LABEL: yes:
; PRELINK-LABEL: no:
; PRELINK-NEXT:     call void @llvm.instrprof.increment(ptr @foo, i64 [[#]], i32 2, i32 1)

; PRELINK-LABEL: @an_entrypoint
; PRELINK:       br i1 %t, label %yes, label %common.ret, !prof ![[PREPROF:[0-9]+]]
; PRELINK-LABEL: yes:
; PRELINK-NEXT:    call void @llvm.instrprof.increment(ptr @an_entrypoint, i64 [[#]], i32 2, i32 1)
; PRELINK:      ![[#]] = !{i32 1, !"ProfileSummary", !1}
; PRELINK:      ![[#]] = !{!"TotalCount", i64 151600}
; PRELINK:      ![[#]] = !{!"MaxCount", i64 102000}
; PRELINK:      ![[#]] = !{!"MaxInternalCount", i64 102000}
; PRELINK:      ![[#]] = !{!"MaxFunctionCount", i64 20100}
; PRELINK:      ![[#]] = !{!"NumCounts", i64 6}
; PRELINK:      ![[#]] = !{!"NumFunctions", i64 3}
; PRELINK:       ![[PREPROF]] = !{!"branch_weights", i32 4000, i32 6000}

; Check that the output has:
;  - no instrumentation
;  - the 2 functions have an entry count
;  - each conditional branch has profile annotation
;
; POSTLINK-NOT:   call void @llvm.instrprof
;
; make sure we have function entry counts, branch weights, and a profile summary.
; POSTLINK-LABEL: @foo
; POSTLINK-SAME:    !prof ![[FOO_EP:[0-9]+]]
; POSTLINK:          br i1 %t, label %yes, label %no, !prof ![[FOO_BW:[0-9]+]]
; POSTLINK-LABEL: @an_entrypoint
; POSTLINK-SAME:    !prof ![[AN_ENTRYPOINT_EP:[0-9]+]]
; POSTLINK:          br i1 %t, label %yes, label %common.ret, !prof ![[AN_ENTRYPOINT_BW:[0-9]+]]

; The postlink summary is restricted to the stuff under the root - including the
; "unhandled" data.
; POSTLINK:      ![[#]] = !{i32 1, !"ProfileSummary", !1}
; POSTLINK:      ![[#]] = !{!"TotalCount", i64 149500}
; POSTLINK:      ![[#]] = !{!"MaxCount", i64 100000}
; POSTLINK:      ![[#]] = !{!"MaxInternalCount", i64 100000}
; POSTLINK:      ![[#]] = !{!"MaxFunctionCount", i64 20000}
; POSTLINK:      ![[#]] = !{!"NumCounts", i64 6}
; POSTLINK:      ![[#]] = !{!"NumFunctions", i64 3}

;
; @foo will be called both unconditionally and conditionally, on the "yes" branch
; which has a count of 40. So 140 times.

; POSTLINK:       ![[FOO_EP]] = !{!"function_entry_count", i64 14000} 

; foo's "no" branch is taken 10+5 times (from the 2 contexts belonging to foo).
; Which means its "yes" branch is taken 140 - 15 times.

; POSTLINK:       ![[FOO_BW]] = !{!"branch_weights", i32 12500, i32 1500} 
; POSTLINK:       ![[AN_ENTRYPOINT_EP]] = !{!"function_entry_count", i64 10000}
; POSTLINK:       ![[AN_ENTRYPOINT_BW]] = !{!"branch_weights", i32 4000, i32 6000} 

;--- profile.yaml
Contexts:
  - Guid: 4909520559318251808
    TotalRootEntryCount: 100
    Unhandled:
      - Guid: 1234
        Counters: [200, 1000]
    Counters: [100, 40]
    Callsites: -
                - Guid: 11872291593386833696
                  Counters: [ 100, 5 ]
               -
                - Guid: 11872291593386833696
                  Counters: [ 40, 10 ]
FlatProfiles:
  - Guid: 1234
    Counters: [ 100, 2000 ]
;--- example.ll
declare void @bar()

define void @foo(i32 %a, ptr %fct) #0 !guid !0 {
  %t = icmp sgt i32 %a, 7
  br i1 %t, label %yes, label %no
yes:
  call void %fct(i32 %a)
  br label %exit
no:
  call void @bar()
  br label %exit
exit:
  ret void
}

define void @an_entrypoint(i32 %a) !guid !1 {
  %t = icmp sgt i32 %a, 0
  call void @foo(i32 10, ptr null)
  br i1 %t, label %yes, label %no

yes:
  call void @foo(i32 1, ptr null)
  ret void
no:
  ret void
}

attributes #0 = { noinline }
!0 = !{ i64 11872291593386833696 }
!1 = !{i64 4909520559318251808}