aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/CodeGen/AArch64/cgdata-merge-local.ll
blob: 608fe29e17398a6c23801bdfc12806c3d0b570fe (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
; This test checks if two similar functions, f1 and f2, can be merged locally within a single module
; while parameterizing a difference in their global variables, g1 and g2.
; To achieve this, we create two instances of the global merging function, f1.Tgm and f2.Tgm,
; which are tail-called from thunks f1 and f2 respectively.
; These identical functions, f1.Tgm and f2.Tgm, will be folded by the linker via Identical Code Folding (ICF).

; RUN: opt -mtriple=arm64-apple-darwin -S --passes=global-merge-func %s | FileCheck %s

; A merging instance is created with additional parameter.
; CHECK: define internal i32 @f1.Tgm(i32 %0, ptr %1)
; CHECK-NEXT: entry:
; CHECK-NEXT:  %idxprom = sext i32 %0 to i64
; CHECK-NEXT:  %arrayidx = getelementptr inbounds [0 x i32], ptr @g, i64 0, i64 %idxprom
; CHECK-NEXT:  %2 = load i32, ptr %arrayidx, align 4
; CHECK-NEXT:  %3 = load volatile i32, ptr %1, align 4
; CHECK-NEXT:  %mul = mul nsw i32 %3, %2
; CHECK-NEXT:  %add = add nsw i32 %mul, 1
; CHECK-NEXT:  ret i32 %add

; The original function becomes a thunk passing g1.
; CHECK: define i32 @f1(i32 %a)
; CHECK-NEXT:  %1 = tail call i32 @f1.Tgm(i32 %a, ptr @g1)
; CHECK-NEXT:  ret i32 %1

; A same sequence is produced for f2.Tgm.
; CHECK: define internal i32 @f2.Tgm(i32 %0, ptr %1)
; CHECK-NEXT: entry:
; CHECK-NEXT:  %idxprom = sext i32 %0 to i64
; CHECK-NEXT:  %arrayidx = getelementptr inbounds [0 x i32], ptr @g, i64 0, i64 %idxprom
; CHECK-NEXT:  %2 = load i32, ptr %arrayidx, align 4
; CHECK-NEXT:  %3 = load volatile i32, ptr %1, align 4
; CHECK-NEXT:  %mul = mul nsw i32 %3, %2
; CHECK-NEXT:  %add = add nsw i32 %mul, 1
; CHECK-NEXT:  ret i32 %add

; The original function becomes a thunk passing g2.
; CHECK: define i32 @f2(i32 %a)
; CHECK-NEXT:  %1 = tail call i32 @f2.Tgm(i32 %a, ptr @g2)
; CHECK-NEXT:  ret i32 %1

; RUN: llc -mtriple=arm64-apple-darwin -enable-global-merge-func=true < %s | FileCheck %s --check-prefix=MERGE
; RUN: llc -mtriple=arm64-apple-darwin -enable-global-merge-func=false < %s | FileCheck %s --check-prefix=NOMERGE

; MERGE: _f1.Tgm
; MERGE: _f2.Tgm

; NOMERGE-NOT: _f1.Tgm
; NOMERGE-NOT: _f2.Tgm

@g = external local_unnamed_addr global [0 x i32], align 4
@g1 = external global i32, align 4
@g2 = external global i32, align 4

define i32 @f1(i32 %a) {
entry:
  %idxprom = sext i32 %a to i64
  %arrayidx = getelementptr inbounds [0 x i32], [0 x i32]* @g, i64 0, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %1 = load volatile i32, i32* @g1, align 4
  %mul = mul nsw i32 %1, %0
  %add = add nsw i32 %mul, 1
  ret i32 %add
}

define i32 @f2(i32 %a) {
entry:
  %idxprom = sext i32 %a to i64
  %arrayidx = getelementptr inbounds [0 x i32], [0 x i32]* @g, i64 0, i64 %idxprom
  %0 = load i32, i32* %arrayidx, align 4
  %1 = load volatile i32, i32* @g2, align 4
  %mul = mul nsw i32 %1, %0
  %add = add nsw i32 %mul, 1
  ret i32 %add
}