File: tailcall-speculatable-callee.ll

package info (click to toggle)
llvm-toolchain-11 1%3A11.0.1-2
  • links: PTS, VCS
  • area: main
  • in suites: bullseye
  • size: 995,808 kB
  • sloc: cpp: 4,767,656; ansic: 760,916; asm: 477,436; python: 170,940; objc: 69,804; lisp: 29,914; sh: 23,855; f90: 18,173; pascal: 7,551; perl: 7,471; ml: 5,603; awk: 3,489; makefile: 2,573; xml: 915; cs: 573; fortran: 503; javascript: 452
file content (96 lines) | stat: -rw-r--r-- 3,338 bytes parent folder | download | duplicates (2)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
; RUN: llc -verify-machineinstrs -mtriple=powerpc64le-unknown-linux-gnu \
; RUN:   -ppc-asm-full-reg-names -ppc-vsr-nums-as-vr < %s | FileCheck %s

; The tests check the behavior of the tail call decision when the callee is speculatable.

; Callee should be tail called in this function since it is at a tail call position.
define dso_local double @speculatable_callee_return_use_only (double* nocapture %res, double %a) #0 {
; The value produced by the call is handed straight to `ret`, and %res is not
; used in this function. The expected output is a bare `b callee` immediately
; after the block header.
; CHECK-LABEL: speculatable_callee_return_use_only:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: b callee
entry:
  %ret = tail call double @callee(double %a) #2
  ret double %ret
}

; Callee should not be tail called: its result is stored to %res after the
; call, so the call is not at a tail call position.
define dso_local void @speculatable_callee_non_return_use_only (double* nocapture %res, double %a) #0 {
; The call result is consumed only by the store below, and the function itself
; returns void. The expected output saves the link register and r30, copies r3
; into r30 ahead of a real `bl callee`, stores f1 through r30 afterwards, then
; tears the frame down and returns with `blr`.
; CHECK-LABEL: speculatable_callee_non_return_use_only:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr r0
; CHECK-NEXT: std r30, -16(r1)  # 8-byte Folded Spill
; CHECK-NEXT: std r0, 16(r1)
; CHECK-NEXT: stdu r1, -48(r1)
; CHECK-NEXT: mr r30, r3
; CHECK-NEXT: bl callee
; CHECK-NEXT: stfdx f1, 0, r30
; CHECK-NEXT: addi r1, r1, 48
; CHECK-NEXT: ld r0, 16(r1)
; CHECK-NEXT: ld r30, -16(r1) # 8-byte Folded Reload
; CHECK-NEXT: mtlr r0
; CHECK-NEXT: blr
entry:
  %stored = tail call double @callee(double %a) #2
  ; The store needs the call's result, so it has to run after the call.
  store double %stored, double* %res, align 8
  ret void
}

; Callee should not be tail called: its result is stored to %res as well as
; returned, so the call is not at a tail call position.
define dso_local double @speculatable_callee_multi_use (double* nocapture %res, double %a) #0 {
; The call result has two users: the store to %res and the return. The expected
; output is a full frame around a real `bl callee`, with f1 stored through r30
; after the call and the function returning via `blr`.
; CHECK-LABEL: speculatable_callee_multi_use:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr r0
; CHECK-NEXT: std r30, -16(r1)  # 8-byte Folded Spill
; CHECK-NEXT: std r0, 16(r1)
; CHECK-NEXT: stdu r1, -48(r1)
; CHECK-NEXT: mr r30, r3
; CHECK-NEXT: bl callee
; CHECK-NEXT: stfdx f1, 0, r30
; CHECK-NEXT: addi r1, r1, 48
; CHECK-NEXT: ld r0, 16(r1)
; CHECK-NEXT: ld r30, -16(r1) # 8-byte Folded Reload
; CHECK-NEXT: mtlr r0
; CHECK-NEXT: blr
entry:
  %shared = tail call double @callee(double %a) #2
  ; First use: written out through %res.
  store double %shared, double* %res, align 8
  ; Second use: also the function's return value.
  ret double %shared
}

; Callee should not be tail called: an unrelated store sits between the call
; and the return, so the call is not at a tail call position.
; FIXME: A speculatable callee can be tail called if it is moved into a valid tail call position.
define dso_local double @speculatable_callee_intermediate_instructions (double* nocapture %res, double %a) #0 {
; The call result is used only by the return, but a store of the constant 5.2
; is placed between the call and the `ret`. The expected output is a real
; `bl callee` inside a full frame. After the call, the lis/ori/sldi/oris/ori
; sequence assembles 0x4014CCCCCCCCCCCD (the bit pattern of double 5.2) in r3,
; and `std` writes it through r30.
; CHECK-LABEL: speculatable_callee_intermediate_instructions:
; CHECK: # %bb.0: # %entry
; CHECK-NEXT: mflr r0
; CHECK-NEXT: std r30, -16(r1)  # 8-byte Folded Spill
; CHECK-NEXT: std r0, 16(r1)
; CHECK-NEXT: stdu r1, -48(r1)
; CHECK-NEXT: mr r30, r3
; CHECK-NEXT: bl callee
; CHECK-NEXT: lis r3, 16404
; CHECK-NEXT: ori r3, r3, 52428
; CHECK-NEXT: sldi r3, r3, 32
; CHECK-NEXT: oris r3, r3, 52428
; CHECK-NEXT: ori r3, r3, 52429
; CHECK-NEXT: std r3, 0(r30)
; CHECK-NEXT: addi r1, r1, 48
; CHECK-NEXT: ld r0, 16(r1)
; CHECK-NEXT: ld r30, -16(r1)  # 8-byte Folded Reload
; CHECK-NEXT: mtlr r0
; CHECK-NEXT: blr
entry:
  %returned = tail call double @callee(double %a) #2
  ; This store does not use the call result; it only separates the call from the return.
  store double 5.2, double* %res, align 8
  ret double %returned
}


define double @callee(double %ignored) #1 {
  ; The argument is never read; the function always returns the constant 4.5.
  ret double 4.5
}

; #0 is attached to each caller definition in this file.
attributes #0 = { nounwind }
; #1 is attached to @callee; `speculatable` is the property these tests exercise.
attributes #1 = { speculatable readnone }
; #2 is attached to every call site of @callee.
attributes #2 = { noinline nounwind }