aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/AArch64/umulo-128-legalisation-lowering.ll
blob: edfd80b4f27061b29095adfb6f670499d657affb (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
; NOTE: Assertions have been autogenerated by utils/update_llc_test_checks.py
; RUN: llc < %s -mtriple=aarch64-unknown-linux-gnu | FileCheck %s --check-prefixes=AARCH

define { i128, i8 } @muloti_test(i128 %l, i128 %r) unnamed_addr #0 {
; AARCH-LABEL: muloti_test:
; AARCH:       // %bb.0: // %start
; AARCH-NEXT:    mul x9, x3, x0
; AARCH-NEXT:    cmp x1, #0
; AARCH-NEXT:    ccmp x3, #0, #4, ne
; AARCH-NEXT:    umulh x8, x1, x2
; AARCH-NEXT:    umulh x10, x3, x0
; AARCH-NEXT:    madd x9, x1, x2, x9
; AARCH-NEXT:    ccmp xzr, x8, #0, eq
; AARCH-NEXT:    umulh x11, x0, x2
; AARCH-NEXT:    ccmp xzr, x10, #0, eq
; AARCH-NEXT:    mul x0, x0, x2
; AARCH-NEXT:    cset w8, ne
; AARCH-NEXT:    adds x1, x11, x9
; AARCH-NEXT:    csinc w2, w8, wzr, lo
; AARCH-NEXT:    ret
start:
  %0 = tail call { i128, i1 } @llvm.umul.with.overflow.i128(i128 %l, i128 %r) #2
  %1 = extractvalue { i128, i1 } %0, 0
  %2 = extractvalue { i128, i1 } %0, 1
  %3 = zext i1 %2 to i8
  %4 = insertvalue { i128, i8 } undef, i128 %1, 0
  %5 = insertvalue { i128, i8 } %4, i8 %3, 1
  ret { i128, i8 } %5
}

; PR56403
; We avoid lowering the intrinsic as a libcall because this function has the same name as
; the libcall we wanted to generate (that would create an infinite loop).

define i128 @__muloti4(i128 %0, i128 %1, ptr nocapture nonnull writeonly align 4 %2) #2 {
; AARCH-LABEL: __muloti4:
; AARCH:       // %bb.0: // %Entry
; AARCH-NEXT:    asr x11, x1, #63
; AARCH-NEXT:    asr x9, x3, #63
; AARCH-NEXT:    umulh x12, x0, x2
; AARCH-NEXT:    mov x8, x1
; AARCH-NEXT:    str wzr, [x4]
; AARCH-NEXT:    mul x13, x1, x2
; AARCH-NEXT:    umulh x10, x1, x2
; AARCH-NEXT:    mul x11, x11, x2
; AARCH-NEXT:    adds x12, x13, x12
; AARCH-NEXT:    mul x15, x0, x3
; AARCH-NEXT:    umulh x14, x0, x3
; AARCH-NEXT:    adc x10, x10, x11
; AARCH-NEXT:    mul x9, x0, x9
; AARCH-NEXT:    mul x16, x1, x3
; AARCH-NEXT:    adds x1, x15, x12
; AARCH-NEXT:    asr x12, x10, #63
; AARCH-NEXT:    smulh x11, x8, x3
; AARCH-NEXT:    adc x9, x14, x9
; AARCH-NEXT:    asr x13, x9, #63
; AARCH-NEXT:    adds x9, x10, x9
; AARCH-NEXT:    asr x10, x1, #63
; AARCH-NEXT:    mul x0, x0, x2
; AARCH-NEXT:    adc x12, x12, x13
; AARCH-NEXT:    adds x9, x16, x9
; AARCH-NEXT:    adc x11, x11, x12
; AARCH-NEXT:    cmp x9, x10
; AARCH-NEXT:    ccmp x11, x10, #0, eq
; AARCH-NEXT:    cset w9, ne
; AARCH-NEXT:    tbz x8, #63, .LBB1_2
; AARCH-NEXT:  // %bb.1: // %Entry
; AARCH-NEXT:    eor x8, x3, #0x8000000000000000
; AARCH-NEXT:    orr x8, x2, x8
; AARCH-NEXT:    cbz x8, .LBB1_3
; AARCH-NEXT:  .LBB1_2: // %Else2
; AARCH-NEXT:    cbz w9, .LBB1_4
; AARCH-NEXT:  .LBB1_3: // %Then7
; AARCH-NEXT:    mov w8, #1 // =0x1
; AARCH-NEXT:    str w8, [x4]
; AARCH-NEXT:  .LBB1_4: // %Block9
; AARCH-NEXT:    ret
Entry:
  store i32 0, ptr %2, align 4
  %.fr = freeze i128 %1
  %mul = tail call { i128, i1 } @llvm.smul.with.overflow.i128(i128 %0, i128 %.fr)
  %3 = icmp slt i128 %0, 0
  %4 = icmp eq i128 %.fr, -170141183460469231731687303715884105728
  %5 = and i1 %3, %4
  br i1 %5, label %Then7, label %Else2

Else2:                                            ; preds = %Entry
  %mul.ov = extractvalue { i128, i1 } %mul, 1
  br i1 %mul.ov, label %Then7, label %Block9

Then7:                                            ; preds = %Else2, %Entry
  store i32 1, ptr %2, align 4
  br label %Block9

Block9:                                           ; preds = %Else2, %Then7
  %mul.val = extractvalue { i128, i1 } %mul, 0
  ret i128 %mul.val
}

declare { i128, i1 } @llvm.umul.with.overflow.i128(i128, i128) #1
declare { i128, i1 } @llvm.smul.with.overflow.i128(i128, i128) #1

attributes #0 = { nounwind readnone uwtable }
attributes #1 = { nounwind readnone speculatable }
attributes #2 = { nounwind }