; RUN: opt < %s -basicaa -loop-interchange -S | FileCheck %s
;; We test the complete .ll for adjustment in outer loop header/latch and inner loop header/latch.

; Target configuration: little-endian layout with ELF name mangling, for
; x86-64 Linux.
target datalayout = "e-m:e-i64:64-f80:128-n8:16:32:64-S128"
target triple = "x86_64-unknown-linux-gnu"

; @A is the 100 x 100 i32 matrix updated by @interchange_02.
; @B is not referenced by any code visible in this part of the file.
@A = common global [100 x [100 x i32]] zeroinitializer
@B = common global [100 x i32] zeroinitializer

;; for(int i=0;i<100;i++)
;;   for(int j=100;j>=0;j--)
;;     A[j][i] = A[j][i]+k;
;;
;; Two-level loop nest over @A: the outer loop counts i up from 0 to 99, the
;; inner loop counts j down from 100 to 0, and each iteration adds %k to
;; A[j][i] in place.
;; NOTE(review): j starts at 100 although @A is declared with 100 rows, so the
;; first inner iteration addresses row 100. This matches the pseudo-code above;
;; confirm the start value is intended before changing any bound.

define void @interchange_02(i32 %k) {
entry:
  br label %for.cond1.preheader

; Outer loop header: %indvars.iv19 is i.
for.cond1.preheader:
  %indvars.iv19 = phi i64 [ 0, %entry ], [ %indvars.iv.next20, %for.inc10 ]
  br label %for.body3

; Inner loop, header and latch in a single block: %indvars.iv is j.
for.body3:
  %indvars.iv = phi i64 [ 100, %for.cond1.preheader ], [ %indvars.iv.next, %for.body3 ]
  %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %indvars.iv, i64 %indvars.iv19
  %0 = load i32, i32* %arrayidx5
  %add = add nsw i32 %0, %k
  store i32 %add, i32* %arrayidx5
  %indvars.iv.next = add nsw i64 %indvars.iv, -1
  ; The exit test reads the pre-decrement value, so the body also runs for j == 0.
  %cmp2 = icmp sgt i64 %indvars.iv, 0
  br i1 %cmp2, label %for.body3, label %for.inc10

; Outer loop latch: advance i and leave the nest once it reaches 100.
for.inc10:
  %indvars.iv.next20 = add nuw nsw i64 %indvars.iv19, 1
  %exitcond = icmp eq i64 %indvars.iv.next20, 100
  br i1 %exitcond, label %for.end11, label %for.cond1.preheader

for.end11:
  ret void
}

; CHECK-LABEL: @interchange_02
; CHECK: entry:
; CHECK: br label %for.body3.preheader
; CHECK: for.cond1.preheader.preheader:
; CHECK: br label %for.cond1.preheader
; CHECK: for.cond1.preheader:
; CHECK: %indvars.iv19 = phi i64 [ %indvars.iv.next20, %for.inc10 ], [ 0, %for.cond1.preheader.preheader ]
; CHECK: br label %for.body3.split1
; CHECK: for.body3.preheader:
; CHECK: br label %for.body3
; CHECK: for.body3:
; CHECK: %indvars.iv = phi i64 [ %indvars.iv.next, %for.body3.split ], [ 100, %for.body3.preheader ]
; CHECK: br label %for.cond1.preheader.preheader
; CHECK: for.body3.split1: ; preds = %for.cond1.preheader
; CHECK: %arrayidx5 = getelementptr inbounds [100 x [100 x i32]], [100 x [100 x i32]]* @A, i64 0, i64 %indvars.iv, i64 %indvars.iv19
; CHECK: %0 = load i32, i32* %arrayidx5
; CHECK: %add = add nsw i32 %0, %k
; CHECK: store i32 %add, i32* %arrayidx5
; CHECK: br label %for.inc10
; CHECK: for.body3.split:
; CHECK: %indvars.iv.next = add nsw i64 %indvars.iv, -1
; CHECK: %cmp2 = icmp sgt i64 %indvars.iv, 0
; CHECK: br i1 %cmp2, label %for.body3, label %for.end11
; CHECK: for.inc10:
; CHECK: %indvars.iv.next20 = add nuw nsw i64 %indvars.iv19, 1
; CHECK: %exitcond = icmp eq i64 %indvars.iv.next20, 100
; CHECK: br i1 %exitcond, label %for.body3.split, label %for.cond1.preheader
; CHECK: for.end11:
; CHECK: ret void