blob: 0263e93a6ca6f0a4aca619416cd08c637df294bf [file] [log] [blame]
Silviu Barangaac920f72017-09-12 07:48:22 +00001; RUN: opt -basicaa -loop-accesses -analyze < %s | FileCheck %s
2
3target datalayout = "e-m:e-i8:8:32-i16:16:32-i64:64-i128:128-n32:64-S128"
4
5; i and i + 1 can overflow in the following kernel:
6; void test1(unsigned long long x, int *a, int *b) {
7; for (unsigned i = 0; i < x; ++i)
8; b[i] = a[i+1] + 1;
9; }
10;
11; If accesses to a and b can alias, we need to emit a run-time alias check
12; between accesses to a and b. However, when i and i + 1 can wrap, their
13; SCEV expression is not an AddRec. We need to create SCEV predicates and
14; coerce the expressions to AddRecs in order to be able to emit the run-time
15; alias check.
16;
17; The accesses at b[i] and a[i+1] correspond to the addresses %arrayidx and
18; %arrayidx4 in the test. The SCEV expressions for these are:
19; ((4 * (zext i32 {1,+,1}<%for.body> to i64))<nuw><nsw> + %a)<nsw>
20; ((4 * (zext i32 {0,+,1}<%for.body> to i64))<nuw><nsw> + %b)<nsw>
21;
22; The transformed expressions are:
23; i64 {(4 + %a),+,4}<%for.body>
24; i64 {(4 + %b),+,4}<%for.body>
25
26; CHECK-LABEL: test1
27; CHECK: Memory dependences are safe with run-time checks
28; CHECK-NEXT: Dependences:
29; CHECK-NEXT: Run-time memory checks:
30; CHECK-NEXT: Check 0:
31; CHECK-NEXT: Comparing group
32; CHECK-NEXT: %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
33; CHECK-NEXT: Against group
34; CHECK-NEXT: %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %conv11
35; CHECK-NEXT: Grouped accesses:
36; CHECK-NEXT: Group
37; CHECK-NEXT: (Low: (4 + %a) High: (4 + (4 * (1 umax %x)) + %a))
38; CHECK-NEXT: Member: {(4 + %a),+,4}<%for.body>
39; CHECK-NEXT: Group
40; CHECK-NEXT: (Low: %b High: ((4 * (1 umax %x)) + %b))
41; CHECK-NEXT: Member: {%b,+,4}<%for.body>
42; CHECK: Store to invariant address was not found in loop.
43; CHECK-NEXT: SCEV assumptions:
44; CHECK-NEXT: {1,+,1}<%for.body> Added Flags: <nusw>
45; CHECK-NEXT: {0,+,1}<%for.body> Added Flags: <nusw>
46; CHECK: Expressions re-written:
47; CHECK-NEXT: [PSE] %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom:
48; CHECK-NEXT: ((4 * (zext i32 {1,+,1}<%for.body> to i64))<nuw><nsw> + %a)<nsw>
49; CHECK-NEXT: --> {(4 + %a),+,4}<%for.body>
50; CHECK-NEXT: [PSE] %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %conv11:
51; CHECK-NEXT: ((4 * (zext i32 {0,+,1}<%for.body> to i64))<nuw><nsw> + %b)<nsw>
52; CHECK-NEXT: --> {%b,+,4}<%for.body>
53define void @test1(i64 %x, i32* %a, i32* %b) {
54entry:
55 br label %for.body
56
57for.body: ; preds = %for.body.preheader, %for.body
58 %conv11 = phi i64 [ %conv, %for.body ], [ 0, %entry ]
59 %i.010 = phi i32 [ %add, %for.body ], [ 0, %entry ]
60 %add = add i32 %i.010, 1
61 %idxprom = zext i32 %add to i64
62 %arrayidx = getelementptr inbounds i32, i32* %a, i64 %idxprom
63 %ld = load i32, i32* %arrayidx, align 4
64 %add2 = add nsw i32 %ld, 1
65 %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %conv11
66 store i32 %add2, i32* %arrayidx4, align 4
67 %conv = zext i32 %add to i64
68 %cmp = icmp ult i64 %conv, %x
69 br i1 %cmp, label %for.body, label %exit
70
71exit:
72 ret void
73}
74
75; i can overflow in the following kernel:
76; void test2(unsigned long long x, int *a) {
77; for (unsigned i = 0; i < x; ++i)
78; a[i] = a[i] + 1;
79; }
80;
81; We need to check that i doesn't wrap, but we don't need a run-time alias
82; check. We also need an extra no-wrap check to get the backedge taken count.
83
84; CHECK-LABEL: test2
85; CHECK: Memory dependences are safe
86; CHECK: SCEV assumptions:
87; CHECK-NEXT: {1,+,1}<%for.body> Added Flags: <nusw>
88; CHECK-NEXT: {0,+,1}<%for.body> Added Flags: <nusw>
89 define void @test2(i64 %x, i32* %a) {
90entry:
91 br label %for.body
92
93for.body:
94 %conv11 = phi i64 [ %conv, %for.body ], [ 0, %entry ]
95 %i.010 = phi i32 [ %inc, %for.body ], [ 0, %entry ]
96 %arrayidx = getelementptr inbounds i32, i32* %a, i64 %conv11
97 %ld = load i32, i32* %arrayidx, align 4
98 %add = add nsw i32 %ld, 1
99 store i32 %add, i32* %arrayidx, align 4
100 %inc = add i32 %i.010, 1
101 %conv = zext i32 %inc to i64
102 %cmp = icmp ult i64 %conv, %x
103 br i1 %cmp, label %for.body, label %exit
104
105exit:
106 ret void
107}