; Runs the loop-idiom pass (with basicaa) over this file and verifies the
; printed IR with FileCheck.
; RUN: opt -basicaa -loop-idiom < %s -S | FileCheck %s

; Pointer widths per address space in this layout: 32 bits for the default
; address space, 64 bits for addrspace(1) and 16 bits for addrspace(2).
target datalayout = "e-p:32:32:32-p1:64:64:64-p2:16:16:16-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:32:32-n8:16:32:64"
target triple = "x86_64-apple-darwin10.0.0"
| 5 | |
; A 100 x 100 loop nest that zeroes consecutive bytes through an addrspace(2)
; pointer. The whole nest is expected to collapse into a single memset in the
; entry block whose length (10000) is an i16, with no stores left behind.
define void @test10(i8 addrspace(2)* %X) nounwind ssp {
; CHECK-LABEL: @test10(
; CHECK: entry:
; CHECK-NEXT: call void @llvm.memset.p2i8.i16(i8 addrspace(2)* %X, i8 0, i16 10000, i32 1, i1 false)
; CHECK-NOT: store
; CHECK: ret void

entry:
  br label %outer.header

outer.header:                                     ; preds = %entry, %outer.latch
  ; Outer induction variable: row index, 0..99.
  %row = phi i16 [ 0, %entry ], [ %row.next, %outer.latch ]
  br label %inner.body

inner.body:                                       ; preds = %inner.body, %outer.header
  ; Inner induction variable: column index, 0..99.
  %col = phi i16 [ 0, %outer.header ], [ %col.next, %inner.body ]
  ; Linearised offset = row * 100 + col.
  %row.base = mul nsw i16 %row, 100
  %offset = add nsw i16 %col, %row.base
  %slot = getelementptr inbounds i8, i8 addrspace(2)* %X, i16 %offset
  store i8 0, i8 addrspace(2)* %slot, align 1
  %col.next = add nsw i16 %col, 1
  %inner.done = icmp eq i16 %col.next, 100
  br i1 %inner.done, label %outer.latch, label %inner.body

outer.latch:                                      ; preds = %inner.body
  %row.next = add nsw i16 %row, 1
  %outer.done = icmp eq i16 %row.next, 100
  br i1 %outer.done, label %exit, label %outer.header

exit:                                             ; preds = %outer.latch
  ret void
}
| 39 | |
; Fills 10000 consecutive i32 slots behind an addrspace(2) pointer with the
; value 1. The checks require that the pass does not emit a memset_pattern
; call for this loop (presumably because the destination is not in the
; default address space -- confirm against the pass implementation).
define void @test11_pattern(i32 addrspace(2)* nocapture %P) nounwind ssp {
; CHECK-LABEL: @test11_pattern(
; CHECK-NOT: memset_pattern
entry:
  br label %loop

loop:                                             ; preds = %entry, %loop
  %i = phi i64 [ 0, %entry ], [ %i.next, %loop ]
  %elt = getelementptr i32, i32 addrspace(2)* %P, i64 %i
  store i32 1, i32 addrspace(2)* %elt, align 4
  %i.next = add i64 %i, 1
  %done = icmp eq i64 %i.next, 10000
  br i1 %done, label %exit, label %loop

exit:                                             ; preds = %loop
  ret void
}
| 57 | |
; PR9815 - partial overlap: every iteration loads g_50[i + 4] and stores it to
; g_50[i + 5], so the element written by one iteration is the element read by
; the next. Such a loop cannot be safely rewritten as a memcpy, and the checks
; require the load/store pair to remain in the loop body.
@g_50 = addrspace(2) global [7 x i32] [i32 0, i32 0, i32 0, i32 0, i32 1, i32 0, i32 0], align 16


define i32 @test14() nounwind {
; CHECK-LABEL: @test14(
; CHECK: for.body:
; CHECK: load i32
; CHECK: store i32
; CHECK: br i1 %cmp

entry:
  br label %for.body

for.body:                                         ; preds = %for.body, %entry
  %iv = phi i32 [ %iv.next, %for.body ], [ 0, %entry ]
  ; Source element: g_50[iv + 4].
  %src.idx = add nsw i32 %iv, 4
  %src.idx.ext = sext i32 %src.idx to i64
  %src.ptr = getelementptr inbounds [7 x i32], [7 x i32] addrspace(2)* @g_50, i32 0, i64 %src.idx.ext
  %val = load i32, i32 addrspace(2)* %src.ptr, align 4
  ; Destination element: g_50[iv + 5], one slot past the source.
  %dst.idx = add nsw i32 %iv, 5
  %dst.idx.ext = sext i32 %dst.idx to i64
  %dst.ptr = getelementptr inbounds [7 x i32], [7 x i32] addrspace(2)* @g_50, i32 0, i64 %dst.idx.ext
  store i32 %val, i32 addrspace(2)* %dst.ptr, align 4
  ; The loop runs for iv = 0 and iv = 1.
  %iv.next = add nsw i32 %iv, 1
  %cmp = icmp slt i32 %iv.next, 2
  br i1 %cmp, label %for.body, label %exit

exit:                                             ; preds = %for.body
  ; Return the last array element, which the final iteration wrote.
  %last = load i32, i32 addrspace(2)* getelementptr inbounds ([7 x i32] addrspace(2)* @g_50, i32 0, i64 6), align 4
  ret i32 %last
}
| 91 | |