1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117
|
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=aarch64-unknown-linux-gnu | FileCheck %s --check-prefixes=AARCH
define { i128, i8 } @muloti_test(i128 %l, i128 %r) unnamed_addr #0 {
; AARCH-LABEL: muloti_test:
; AARCH: // %bb.0: // %start
; AARCH-NEXT: mul x8, x3, x0
; AARCH-NEXT: umulh x9, x0, x2
; AARCH-NEXT: madd x8, x1, x2, x8
; AARCH-NEXT: umulh x10, x1, x2
; AARCH-NEXT: adds x8, x9, x8
; AARCH-NEXT: cset w9, hs
; AARCH-NEXT: cmp x1, #0
; AARCH-NEXT: ccmp x3, #0, #4, ne
; AARCH-NEXT: mov x1, x8
; AARCH-NEXT: ccmp xzr, x10, #0, eq
; AARCH-NEXT: umulh x10, x3, x0
; AARCH-NEXT: mul x0, x0, x2
; AARCH-NEXT: ccmp xzr, x10, #0, eq
; AARCH-NEXT: cset w10, ne
; AARCH-NEXT: orr w2, w10, w9
; AARCH-NEXT: ret
start:
%0 = tail call { i128, i1 } @llvm.umul.with.overflow.i128(i128 %l, i128 %r) #2
%1 = extractvalue { i128, i1 } %0, 0
%2 = extractvalue { i128, i1 } %0, 1
%3 = zext i1 %2 to i8
%4 = insertvalue { i128, i8 } undef, i128 %1, 0
%5 = insertvalue { i128, i8 } %4, i8 %3, 1
ret { i128, i8 } %5
}
; PR56403
; We avoid lowering the intrinsic as a libcall because this function has the same name as
; the libcall we wanted to generate (that would create an infinite loop).
define i128 @__muloti4(i128 %0, i128 %1, i32* nocapture nonnull writeonly align 4 %2) #2 {
; AARCH-LABEL: __muloti4:
; AARCH: // %bb.0: // %Entry
; AARCH-NEXT: asr x9, x1, #63
; AARCH-NEXT: asr x10, x3, #63
; AARCH-NEXT: umulh x14, x0, x2
; AARCH-NEXT: mov x8, x1
; AARCH-NEXT: mul x11, x2, x9
; AARCH-NEXT: str wzr, [x4]
; AARCH-NEXT: umulh x12, x10, x0
; AARCH-NEXT: umulh x13, x2, x9
; AARCH-NEXT: madd x12, x10, x1, x12
; AARCH-NEXT: add x13, x13, x11
; AARCH-NEXT: mul x10, x10, x0
; AARCH-NEXT: madd x9, x3, x9, x13
; AARCH-NEXT: add x12, x12, x10
; AARCH-NEXT: adds x10, x10, x11
; AARCH-NEXT: mul x11, x1, x2
; AARCH-NEXT: adc x9, x12, x9
; AARCH-NEXT: umulh x13, x1, x2
; AARCH-NEXT: mul x12, x0, x3
; AARCH-NEXT: adds x11, x11, x14
; AARCH-NEXT: umulh x14, x0, x3
; AARCH-NEXT: cinc x13, x13, hs
; AARCH-NEXT: adds x1, x12, x11
; AARCH-NEXT: mul x12, x8, x3
; AARCH-NEXT: cinc x11, x14, hs
; AARCH-NEXT: mul x0, x0, x2
; AARCH-NEXT: adds x11, x13, x11
; AARCH-NEXT: umulh x13, x8, x3
; AARCH-NEXT: cset w14, hs
; AARCH-NEXT: adds x11, x12, x11
; AARCH-NEXT: adc x12, x13, x14
; AARCH-NEXT: adds x10, x11, x10
; AARCH-NEXT: adc x9, x12, x9
; AARCH-NEXT: asr x11, x1, #63
; AARCH-NEXT: eor x9, x9, x11
; AARCH-NEXT: eor x10, x10, x11
; AARCH-NEXT: orr x9, x10, x9
; AARCH-NEXT: cmp x9, #0
; AARCH-NEXT: cset w9, ne
; AARCH-NEXT: tbz x8, #63, .LBB1_2
; AARCH-NEXT: // %bb.1: // %Entry
; AARCH-NEXT: eor x8, x3, #0x8000000000000000
; AARCH-NEXT: orr x8, x2, x8
; AARCH-NEXT: cbz x8, .LBB1_3
; AARCH-NEXT: .LBB1_2: // %Else2
; AARCH-NEXT: cbz w9, .LBB1_4
; AARCH-NEXT: .LBB1_3: // %Then7
; AARCH-NEXT: mov w8, #1
; AARCH-NEXT: str w8, [x4]
; AARCH-NEXT: .LBB1_4: // %Block9
; AARCH-NEXT: ret
Entry:
store i32 0, i32* %2, align 4
%.fr = freeze i128 %1
%mul = tail call { i128, i1 } @llvm.smul.with.overflow.i128(i128 %0, i128 %.fr)
%3 = icmp slt i128 %0, 0
%4 = icmp eq i128 %.fr, -170141183460469231731687303715884105728
%5 = and i1 %3, %4
br i1 %5, label %Then7, label %Else2
Else2: ; preds = %Entry
%mul.ov = extractvalue { i128, i1 } %mul, 1
br i1 %mul.ov, label %Then7, label %Block9
Then7: ; preds = %Else2, %Entry
store i32 1, i32* %2, align 4
br label %Block9
Block9: ; preds = %Else2, %Then7
%mul.val = extractvalue { i128, i1 } %mul, 0
ret i128 %mul.val
}
declare { i128, i1 } @llvm.umul.with.overflow.i128(i128, i128) #1
declare { i128, i1 } @llvm.smul.with.overflow.i128(i128, i128) #1
attributes #0 = { nounwind readnone uwtable }
attributes #1 = { nounwind readnone speculatable }
attributes #2 = { nounwind }
|