Dan Gohman | becfb88 | 2011-05-04 23:14:02 +0000 | [diff] [blame] | 1 | ; RUN: llc -regalloc=greedy < %s | FileCheck %s |
Dan Gohman | cca8214 | 2011-05-03 00:46:49 +0000 | [diff] [blame] | 2 | |
| 3 | ; LSR shouldn't introduce more induction variables than needed, increasing |
| 4 | ; register pressure and therefore spilling. There is more room for improvement |
| 5 | ; here. |
| 6 | |
Jakob Stoklund Olesen | 51458ed | 2011-07-08 20:46:18 +0000 | [diff] [blame^] | 7 | ; CHECK: sub sp, #{{32|28|24}} |
Dan Gohman | cca8214 | 2011-05-03 00:46:49 +0000 | [diff] [blame] | 8 | |
Jakob Stoklund Olesen | 51458ed | 2011-07-08 20:46:18 +0000 | [diff] [blame^] | 9 | ; CHECK: %for.inc |
| 10 | ; CHECK: ldr{{(.w)?}} r{{.*}}, [sp, # |
| 11 | ; CHECK: ldr{{(.w)?}} r{{.*}}, [sp, # |
| 12 | ; CHECK: ldr{{(.w)?}} r{{.*}}, [sp, # |
| 13 | ; CHECK: add |
Dan Gohman | cca8214 | 2011-05-03 00:46:49 +0000 | [diff] [blame] | 14 | |
| 15 | target datalayout = "e-p:32:32:32-i1:8:32-i8:8:32-i16:16:32-i32:32:32-i64:32:32-f32:32:32-f64:32:32-v64:32:64-v128:32:128-a0:0:32-n32" |
| 16 | target triple = "thumbv7-apple-macosx10.7.0" |
| 17 | |
| 18 | %struct.partition_entry = type { i32, i32, i64, i64 } |
| 19 | |
| 20 | define i32 @partition_overlap_check(%struct.partition_entry* nocapture %part, i32 %num_entries) nounwind readonly optsize ssp { |
| 21 | entry: |
| 22 | %cmp79 = icmp sgt i32 %num_entries, 0 |
| 23 | br i1 %cmp79, label %outer.loop, label %for.end72 |
| 24 | |
| 25 | outer.loop: ; preds = %for.inc69, %entry |
| 26 | %overlap.081 = phi i32 [ %overlap.4, %for.inc69 ], [ 0, %entry ] |
| 27 | %0 = phi i32 [ %inc71, %for.inc69 ], [ 0, %entry ] |
| 28 | %offset = getelementptr %struct.partition_entry* %part, i32 %0, i32 2 |
| 29 | %len = getelementptr %struct.partition_entry* %part, i32 %0, i32 3 |
| 30 | %tmp5 = load i64* %offset, align 4, !tbaa !0 |
| 31 | %tmp15 = load i64* %len, align 4, !tbaa !0 |
| 32 | %add = add nsw i64 %tmp15, %tmp5 |
| 33 | br label %inner.loop |
| 34 | |
| 35 | inner.loop: ; preds = %for.inc, %outer.loop |
| 36 | %overlap.178 = phi i32 [ %overlap.081, %outer.loop ], [ %overlap.4, %for.inc ] |
| 37 | %1 = phi i32 [ 0, %outer.loop ], [ %inc, %for.inc ] |
| 38 | %cmp23 = icmp eq i32 %0, %1 |
| 39 | br i1 %cmp23, label %for.inc, label %if.end |
| 40 | |
| 41 | if.end: ; preds = %inner.loop |
| 42 | %len39 = getelementptr %struct.partition_entry* %part, i32 %1, i32 3 |
| 43 | %offset28 = getelementptr %struct.partition_entry* %part, i32 %1, i32 2 |
| 44 | %tmp29 = load i64* %offset28, align 4, !tbaa !0 |
| 45 | %tmp40 = load i64* %len39, align 4, !tbaa !0 |
| 46 | %add41 = add nsw i64 %tmp40, %tmp29 |
| 47 | %cmp44 = icmp sge i64 %tmp29, %tmp5 |
| 48 | %cmp47 = icmp slt i64 %tmp29, %add |
| 49 | %or.cond = and i1 %cmp44, %cmp47 |
| 50 | %overlap.2 = select i1 %or.cond, i32 1, i32 %overlap.178 |
| 51 | %cmp52 = icmp sle i64 %add41, %add |
| 52 | %cmp56 = icmp sgt i64 %add41, %tmp5 |
| 53 | %or.cond74 = and i1 %cmp52, %cmp56 |
| 54 | %overlap.3 = select i1 %or.cond74, i32 1, i32 %overlap.2 |
| 55 | %cmp61 = icmp sgt i64 %tmp29, %tmp5 |
| 56 | %cmp65 = icmp slt i64 %add41, %add |
| 57 | %or.cond75 = or i1 %cmp61, %cmp65 |
| 58 | br i1 %or.cond75, label %for.inc, label %if.then66 |
| 59 | |
| 60 | if.then66: ; preds = %if.end |
| 61 | br label %for.inc |
| 62 | |
| 63 | for.inc: ; preds = %if.end, %if.then66, %inner.loop |
| 64 | %overlap.4 = phi i32 [ %overlap.178, %inner.loop ], [ 1, %if.then66 ], [ %overlap.3, %if.end ] |
| 65 | %inc = add nsw i32 %1, 1 |
| 66 | %exitcond = icmp eq i32 %inc, %num_entries |
| 67 | br i1 %exitcond, label %for.inc69, label %inner.loop |
| 68 | |
| 69 | for.inc69: ; preds = %for.inc |
| 70 | %inc71 = add nsw i32 %0, 1 |
| 71 | %exitcond83 = icmp eq i32 %inc71, %num_entries |
| 72 | br i1 %exitcond83, label %for.end72, label %outer.loop |
| 73 | |
| 74 | for.end72: ; preds = %for.inc69, %entry |
| 75 | %overlap.0.lcssa = phi i32 [ 0, %entry ], [ %overlap.4, %for.inc69 ] |
| 76 | ret i32 %overlap.0.lcssa |
| 77 | } |
| 78 | |
| 79 | !0 = metadata !{metadata !"long long", metadata !1} |
| 80 | !1 = metadata !{metadata !"omnipotent char", metadata !2} |
| 81 | !2 = metadata !{metadata !"Simple C/C++ TBAA", null} |