Adam Nemet | ce48250 | 2015-04-08 17:48:40 +0000 | [diff] [blame] | 1 | ; RUN: opt < %s -loop-accesses -analyze | FileCheck %s |
Sean Silva | 284b032 | 2016-07-07 01:01:53 +0000 | [diff] [blame] | 2 | ; RUN: opt -passes='require<scalar-evolution>,require<aa>,loop(print-access-info)' -disable-output < %s 2>&1 | FileCheck %s |
Adam Nemet | ce48250 | 2015-04-08 17:48:40 +0000 | [diff] [blame] | 3 | |
Anna Thomas | 6f732bf | 2018-10-16 15:46:26 +0000 | [diff] [blame] | 4 | ; Inner loop has a store to invariant address, but LAA does not need to identify |
| 5 | ; the store to invariant address, since it is a single store. |
Adam Nemet | ce48250 | 2015-04-08 17:48:40 +0000 | [diff] [blame] | 6 | ; |
| 7 | ; for(; i < itr; i++) { |
| 8 | ; for(; j < itr; j++) { |
| 9 | ; var1[j] = ++var2[i] + var1[j]; |
| 10 | ; } |
| 11 | ; } |
| 12 | |
Anna Thomas | 5e9215f | 2018-11-19 15:39:59 +0000 | [diff] [blame] | 13 | ; CHECK: Non vectorizable stores to invariant address were not found in loop. |
Adam Nemet | ce48250 | 2015-04-08 17:48:40 +0000 | [diff] [blame] | 14 | |
; @foo is the IR form of the nested loop sketched in the comment at the top of
; this file: the inner loop both increments var2[i] (an address that does not
; change while the inner loop runs) and updates var1[j].
;   %var1 - array indexed by the inner induction variable j.
;   %var2 - array indexed by the outer induction variable i.
;   %itr  - shared upper bound for both loops.
| 15 | define void @foo(i32* nocapture %var1, i32* nocapture %var2, i32 %itr) #0 { |
| 16 | entry: |
; Guard: skip both loops entirely unless itr > 0 (signed compare).
| 17 | %cmp20 = icmp sgt i32 %itr, 0 |
| 18 | br i1 %cmp20, label %for.cond1.preheader, label %for.end11 |
| 19 | |
; Outer loop header. %indvars.iv23 is the 64-bit outer counter i (starts at 0);
; %j.022 carries j across outer iterations (0 on entry, %j.1.lcssa afterwards).
| 20 | for.cond1.preheader: ; preds = %entry, %for.inc9 |
| 21 | %indvars.iv23 = phi i64 [ %indvars.iv.next24, %for.inc9 ], [ 0, %entry ] |
| 22 | %j.022 = phi i32 [ %j.1.lcssa, %for.inc9 ], [ 0, %entry ] |
; The inner loop is entered only while j < itr; otherwise go straight to the
; outer latch.
| 23 | %cmp218 = icmp slt i32 %j.022, %itr |
| 24 | br i1 %cmp218, label %for.body3.lr.ph, label %for.inc9 |
| 25 | |
; Inner loop preheader: &var2[i] is computed once here, outside the inner loop,
; so every inner iteration accesses the same address through %arrayidx.
| 26 | for.body3.lr.ph: ; preds = %for.cond1.preheader |
| 27 | %arrayidx = getelementptr inbounds i32, i32* %var2, i64 %indvars.iv23 |
; Sign-extend the current j to seed the 64-bit inner induction variable.
| 28 | %0 = sext i32 %j.022 to i64 |
| 29 | br label %for.body3 |
| 30 | |
; Inner loop body (single block, branches back to itself).
| 31 | for.body3: ; preds = %for.body3, %for.body3.lr.ph |
| 32 | %indvars.iv = phi i64 [ %0, %for.body3.lr.ph ], [ %indvars.iv.next, %for.body3 ] |
; ++var2[i]: load, add 1, and store back to the same inner-loop-invariant
; address. This is the only store through %arrayidx in the loop.
| 33 | %1 = load i32, i32* %arrayidx, align 4 |
| 34 | %inc = add nsw i32 %1, 1 |
| 35 | store i32 %inc, i32* %arrayidx, align 4 |
; var1[j] = (incremented var2[i]) + var1[j].
| 36 | %arrayidx5 = getelementptr inbounds i32, i32* %var1, i64 %indvars.iv |
| 37 | %2 = load i32, i32* %arrayidx5, align 4 |
| 38 | %add = add nsw i32 %inc, %2 |
| 39 | store i32 %add, i32* %arrayidx5, align 4 |
; Advance j and leave the inner loop once the truncated next value equals itr.
| 40 | %indvars.iv.next = add nsw i64 %indvars.iv, 1 |
| 41 | %lftr.wideiv = trunc i64 %indvars.iv.next to i32 |
| 42 | %exitcond = icmp eq i32 %lftr.wideiv, %itr |
| 43 | br i1 %exitcond, label %for.inc9, label %for.body3 |
| 44 | |
; Outer loop latch. j is left unchanged if the inner loop was skipped, and is
; itr if the inner loop ran to completion.
| 45 | for.inc9: ; preds = %for.body3, %for.cond1.preheader |
| 46 | %j.1.lcssa = phi i32 [ %j.022, %for.cond1.preheader ], [ %itr, %for.body3 ] |
; Advance i and leave the outer loop once the truncated next value equals itr.
| 47 | %indvars.iv.next24 = add nuw nsw i64 %indvars.iv23, 1 |
| 48 | %lftr.wideiv25 = trunc i64 %indvars.iv.next24 to i32 |
| 49 | %exitcond26 = icmp eq i32 %lftr.wideiv25, %itr |
| 50 | br i1 %exitcond26, label %for.end11, label %for.cond1.preheader |
| 51 | |
; Common exit for the guard and the outer loop.
| 52 | for.end11: ; preds = %for.inc9, %entry |
| 53 | ret void |
| 54 | } |