aboutsummaryrefslogtreecommitdiff
path: root/llvm/test/Transforms/LoopInterchange/delay-cachecost-calculation.ll
blob: d80b4420c034cc509443c13f0686c255722738f1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
; REQUIRES: asserts

; RUN: opt -passes=loop-interchange -debug -disable-output %s 2>&1 | FileCheck %s

; 16 x 16 array of i32, zero-initialized. Both test functions below index it
; with their loop induction variables.
@A = global [16 x [16 x i32]] zeroinitializer

; Check that the CacheCost is calculated only when required. In this case, it
; is computed after passing the legality check.
;
; for (i = 0; i < 16; i++)
;   for (j = 0; j < 16; j++)
;     A[j][i] += 1;

; CHECK: Loops are legal to interchange
; CHECK: Compute CacheCost
; Fixture: a two-level loop nest that increments A[j][i] in place. The inner
; loop block is also its own latch (it branches back to itself), and each loop
; counts up from 0 by 1 and exits when the incremented counter equals 16.
define void @legal_to_interchange() {
entry:
  br label %for.i.header

; Outer loop header: %i is the outer induction variable.
for.i.header:
  %i = phi i32 [ 0, %entry ], [ %i.next, %for.i.latch ]
  br label %for.j

; Inner loop body: %j is the inner induction variable.
for.j:
  %j = phi i32 [ 0, %for.i.header ], [ %j.next, %for.j ]
  ; Address of A[j][i]: the inner variable %j selects the outer array
  ; dimension and the outer variable %i selects the inner one.
  %idx = getelementptr inbounds [16 x [16 x i32]], ptr @A, i32 0, i32 %j, i32 %i
  ; Read-modify-write through the same pointer.
  %val = load i32, ptr %idx
  %inc = add i32 %val, 1
  store i32 %inc, ptr %idx
  %j.next = add i32 %j, 1
  %j.exit = icmp eq i32 %j.next, 16
  br i1 %j.exit, label %for.i.latch, label %for.j

; Outer loop latch: advance %i and either exit or start the next outer
; iteration.
for.i.latch:
  %i.next = add i32 %i, 1
  %i.exit = icmp eq i32 %i.next, 16
  br i1 %i.exit, label %exit, label %for.i.header

exit:
  ret void
}

; Check that the CacheCost is not calculated when it is not required. In this
; case the legality check always fails, so the CacheCost never needs to be
; computed.
;
; for (i = 0; i < 16; i++)
;   for (j = 0; j < 16; j++)
;     A[j][i] = A[i][j];

; CHECK-NOT: Compute CacheCost
; Fixture: a two-level loop nest that copies A[i][j] into A[j][i]. The loop
; structure matches @legal_to_interchange (same bounds, same block layout);
; only the memory accesses in the inner block differ.
; NOTE(review): presumably the transposed load/store pair on the same array is
; what makes the legality check reject the interchange -- confirm against the
; pass's debug output.
define void @illegal_to_interchange() {
entry:
  br label %for.i.header

; Outer loop header: %i is the outer induction variable.
for.i.header:
  %i = phi i32 [ 0, %entry ], [ %i.next, %for.i.latch ]
  br label %for.j

; Inner loop body: %j is the inner induction variable.
for.j:
  %j = phi i32 [ 0, %for.i.header ], [ %j.next, %for.j ]
  ; The load address is A[i][j]; the store address swaps the two subscripts
  ; to A[j][i].
  %idx.load = getelementptr inbounds [16 x [16 x i32]], ptr @A, i32 0, i32 %i, i32 %j
  %idx.store = getelementptr inbounds [16 x [16 x i32]], ptr @A, i32 0, i32 %j, i32 %i
  %val = load i32, ptr %idx.load
  store i32 %val, ptr %idx.store
  %j.next = add i32 %j, 1
  %j.exit = icmp eq i32 %j.next, 16
  br i1 %j.exit, label %for.i.latch, label %for.j

; Outer loop latch: advance %i and either exit or start the next outer
; iteration.
for.i.latch:
  %i.next = add i32 %i, 1
  %i.exit = icmp eq i32 %i.next, 16
  br i1 %i.exit, label %exit, label %for.i.header

exit:
  ret void
}