blob: 9291faca19c2cd17086557f9ee12fe33d6202fad [file] [log] [blame]
Sanjay Patel28f53ef2017-07-08 16:10:42 +00001; NOTE: Assertions have been autogenerated by utils/update_test_checks.py
Sanjay Patelb653de12014-09-10 17:58:16 +00002; RUN: opt < %s -loop-vectorize -force-vector-interleave=1 -force-vector-width=4 -enable-if-conversion -dce -instcombine -S | FileCheck %s
Nadav Rotem628c2db2012-12-04 06:15:11 +00003
4target datalayout = "e-p:64:64:64-i1:8:8-i8:8:8-i16:16:16-i32:32:32-i64:64:64-f32:32:32-f64:64:64-v64:64:64-v128:128:128-a0:0:64-s0:64:64-f80:128:128-n8:16:32:64-S128"
Nadav Rotem628c2db2012-12-04 06:15:11 +00005
6; This is the loop in this example:
7;
8;int function0(int *a, int *b, int start, int end) {
9;
10; for (int i=start; i<end; ++i) {
11; unsigned k = a[i];
12;
13; if (a[i] > b[i]) <------ notice the IF inside the loop.
14; k = k * 5 + 3;
15;
16; a[i] = k; <---- K is a phi node that becomes vector-select.
17; }
18;}
19
Nadav Rotem628c2db2012-12-04 06:15:11 +000020define i32 @function0(i32* nocapture %a, i32* nocapture %b, i32 %start, i32 %end) nounwind uwtable ssp {
Sanjay Patel28f53ef2017-07-08 16:10:42 +000021; CHECK-LABEL: @function0(
22; CHECK-NEXT: entry:
23; CHECK-NEXT: [[CMP16:%.*]] = icmp slt i32 [[START:%.*]], [[END:%.*]]
24; CHECK-NEXT: br i1 [[CMP16]], label [[FOR_BODY_LR_PH:%.*]], label [[FOR_END:%.*]]
25; CHECK: for.body.lr.ph:
26; CHECK-NEXT: [[TMP0:%.*]] = sext i32 [[START]] to i64
27; CHECK-NEXT: [[TMP1:%.*]] = add i32 [[END]], -1
28; CHECK-NEXT: [[TMP2:%.*]] = sub i32 [[TMP1]], [[START]]
29; CHECK-NEXT: [[TMP3:%.*]] = zext i32 [[TMP2]] to i64
30; CHECK-NEXT: [[TMP4:%.*]] = add nuw nsw i64 [[TMP3]], 1
31; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[TMP4]], 4
32; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[SCALAR_PH:%.*]], label [[MIN_ITERS_CHECKED:%.*]]
33; CHECK: min.iters.checked:
34; CHECK-NEXT: [[TMP5:%.*]] = add i32 [[TMP2]], 1
35; CHECK-NEXT: [[TMP6:%.*]] = and i32 [[TMP5]], 3
36; CHECK-NEXT: [[N_MOD_VF:%.*]] = zext i32 [[TMP6]] to i64
37; CHECK-NEXT: [[N_VEC:%.*]] = sub nsw i64 [[TMP4]], [[N_MOD_VF]]
38; CHECK-NEXT: [[CMP_ZERO:%.*]] = icmp eq i64 [[N_VEC]], 0
39; CHECK-NEXT: br i1 [[CMP_ZERO]], label [[SCALAR_PH]], label [[VECTOR_MEMCHECK:%.*]]
40; CHECK: vector.memcheck:
41; CHECK-NEXT: [[SCEVGEP:%.*]] = getelementptr i32, i32* [[A:%.*]], i64 [[TMP0]]
42; CHECK-NEXT: [[TMP7:%.*]] = add i32 [[END]], -1
43; CHECK-NEXT: [[TMP8:%.*]] = sub i32 [[TMP7]], [[START]]
44; CHECK-NEXT: [[TMP9:%.*]] = zext i32 [[TMP8]] to i64
45; CHECK-NEXT: [[TMP10:%.*]] = add nsw i64 [[TMP0]], [[TMP9]]
46; CHECK-NEXT: [[TMP11:%.*]] = add nsw i64 [[TMP10]], 1
47; CHECK-NEXT: [[SCEVGEP2:%.*]] = getelementptr i32, i32* [[A]], i64 [[TMP11]]
48; CHECK-NEXT: [[SCEVGEP4:%.*]] = getelementptr i32, i32* [[B:%.*]], i64 [[TMP0]]
49; CHECK-NEXT: [[SCEVGEP6:%.*]] = getelementptr i32, i32* [[B]], i64 [[TMP11]]
50; CHECK-NEXT: [[BOUND0:%.*]] = icmp ult i32* [[SCEVGEP]], [[SCEVGEP6]]
51; CHECK-NEXT: [[BOUND1:%.*]] = icmp ult i32* [[SCEVGEP4]], [[SCEVGEP2]]
52; CHECK-NEXT: [[MEMCHECK_CONFLICT:%.*]] = and i1 [[BOUND0]], [[BOUND1]]
53; CHECK-NEXT: [[IND_END:%.*]] = add nsw i64 [[N_VEC]], [[TMP0]]
54; CHECK-NEXT: br i1 [[MEMCHECK_CONFLICT]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
55; CHECK: vector.ph:
56; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
57; CHECK: vector.body:
58; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
59; CHECK-NEXT: [[TMP12:%.*]] = add i64 [[INDEX]], [[TMP0]]
60; CHECK-NEXT: [[TMP13:%.*]] = getelementptr inbounds i32, i32* [[A]], i64 [[TMP12]]
61; CHECK-NEXT: [[TMP14:%.*]] = bitcast i32* [[TMP13]] to <4 x i32>*
62; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <4 x i32>, <4 x i32>* [[TMP14]], align 4, !alias.scope !0, !noalias !3
63; CHECK-NEXT: [[TMP15:%.*]] = getelementptr inbounds i32, i32* [[B]], i64 [[TMP12]]
64; CHECK-NEXT: [[TMP16:%.*]] = bitcast i32* [[TMP15]] to <4 x i32>*
65; CHECK-NEXT: [[WIDE_LOAD8:%.*]] = load <4 x i32>, <4 x i32>* [[TMP16]], align 4, !alias.scope !3
66; CHECK-NEXT: [[TMP17:%.*]] = mul <4 x i32> [[WIDE_LOAD]], <i32 5, i32 5, i32 5, i32 5>
67; CHECK-NEXT: [[TMP18:%.*]] = add <4 x i32> [[TMP17]], <i32 3, i32 3, i32 3, i32 3>
68; CHECK-NEXT: [[TMP19:%.*]] = icmp sgt <4 x i32> [[WIDE_LOAD]], [[WIDE_LOAD8]]
69; CHECK-NEXT: [[PREDPHI:%.*]] = select <4 x i1> [[TMP19]], <4 x i32> [[TMP18]], <4 x i32> [[WIDE_LOAD]]
70; CHECK-NEXT: [[TMP20:%.*]] = bitcast i32* [[TMP13]] to <4 x i32>*
71; CHECK-NEXT: store <4 x i32> [[PREDPHI]], <4 x i32>* [[TMP20]], align 4, !alias.scope !0, !noalias !3
72; CHECK-NEXT: [[INDEX_NEXT]] = add i64 [[INDEX]], 4
73; CHECK-NEXT: [[TMP21:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]]
74; CHECK-NEXT: br i1 [[TMP21]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop !5
75; CHECK: middle.block:
76; CHECK-NEXT: [[CMP_N:%.*]] = icmp eq i32 [[TMP6]], 0
77; CHECK-NEXT: br i1 [[CMP_N]], label [[FOR_END_LOOPEXIT:%.*]], label [[SCALAR_PH]]
78; CHECK: scalar.ph:
79; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[IND_END]], [[MIDDLE_BLOCK]] ], [ [[TMP0]], [[FOR_BODY_LR_PH]] ], [ [[TMP0]], [[MIN_ITERS_CHECKED]] ], [ [[TMP0]], [[VECTOR_MEMCHECK]] ]
80; CHECK-NEXT: br label [[FOR_BODY:%.*]]
81; CHECK: for.body:
82; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i64 [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ], [ [[INDVARS_IV_NEXT:%.*]], [[IF_END:%.*]] ]
83; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[A]], i64 [[INDVARS_IV]]
84; CHECK-NEXT: [[TMP22:%.*]] = load i32, i32* [[ARRAYIDX]], align 4
85; CHECK-NEXT: [[ARRAYIDX4:%.*]] = getelementptr inbounds i32, i32* [[B]], i64 [[INDVARS_IV]]
86; CHECK-NEXT: [[TMP23:%.*]] = load i32, i32* [[ARRAYIDX4]], align 4
87; CHECK-NEXT: [[CMP5:%.*]] = icmp sgt i32 [[TMP22]], [[TMP23]]
88; CHECK-NEXT: br i1 [[CMP5]], label [[IF_THEN:%.*]], label [[IF_END]]
89; CHECK: if.then:
90; CHECK-NEXT: [[MUL:%.*]] = mul i32 [[TMP22]], 5
91; CHECK-NEXT: [[ADD:%.*]] = add i32 [[MUL]], 3
92; CHECK-NEXT: br label [[IF_END]]
93; CHECK: if.end:
94; CHECK-NEXT: [[K_0:%.*]] = phi i32 [ [[ADD]], [[IF_THEN]] ], [ [[TMP22]], [[FOR_BODY]] ]
95; CHECK-NEXT: store i32 [[K_0]], i32* [[ARRAYIDX]], align 4
96; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add i64 [[INDVARS_IV]], 1
97; CHECK-NEXT: [[TMP24:%.*]] = trunc i64 [[INDVARS_IV_NEXT]] to i32
98; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[TMP24]], [[END]]
99; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_END_LOOPEXIT]], !llvm.loop !8
100; CHECK: for.end.loopexit:
101; CHECK-NEXT: br label [[FOR_END]]
102; CHECK: for.end:
103; CHECK-NEXT: ret i32 undef
104;
Nadav Rotem628c2db2012-12-04 06:15:11 +0000105entry:
106 %cmp16 = icmp slt i32 %start, %end
107 br i1 %cmp16, label %for.body.lr.ph, label %for.end
108
109for.body.lr.ph:
110 %0 = sext i32 %start to i64
111 br label %for.body
112
113for.body:
114 %indvars.iv = phi i64 [ %0, %for.body.lr.ph ], [ %indvars.iv.next, %if.end ]
David Blaikie79e6c742015-02-27 19:29:02 +0000115 %arrayidx = getelementptr inbounds i32, i32* %a, i64 %indvars.iv
David Blaikiea79ac142015-02-27 21:17:42 +0000116 %1 = load i32, i32* %arrayidx, align 4
David Blaikie79e6c742015-02-27 19:29:02 +0000117 %arrayidx4 = getelementptr inbounds i32, i32* %b, i64 %indvars.iv
David Blaikiea79ac142015-02-27 21:17:42 +0000118 %2 = load i32, i32* %arrayidx4, align 4
Nadav Rotem628c2db2012-12-04 06:15:11 +0000119 %cmp5 = icmp sgt i32 %1, %2
120 br i1 %cmp5, label %if.then, label %if.end
121
122if.then:
123 %mul = mul i32 %1, 5
124 %add = add i32 %mul, 3
125 br label %if.end
126
127if.end:
128 %k.0 = phi i32 [ %add, %if.then ], [ %1, %for.body ]
129 store i32 %k.0, i32* %arrayidx, align 4
130 %indvars.iv.next = add i64 %indvars.iv, 1
131 %3 = trunc i64 %indvars.iv.next to i32
132 %cmp = icmp slt i32 %3, %end
133 br i1 %cmp, label %for.body, label %for.end
134
135for.end:
136 ret i32 undef
137}
Nadav Rotema10b3112012-12-04 18:17:33 +0000138
139
140
141; int func(int *A, int n) {
142; unsigned sum = 0;
143; for (int i = 0; i < n; ++i)
144; if (A[i] > 30)
145; sum += A[i] + 2;
146;
147; return sum;
148; }
149
Nadav Rotema10b3112012-12-04 18:17:33 +0000150define i32 @reduction_func(i32* nocapture %A, i32 %n) nounwind uwtable readonly ssp {
Sanjay Patel28f53ef2017-07-08 16:10:42 +0000151; CHECK-LABEL: @reduction_func(
152; CHECK-NEXT: entry:
153; CHECK-NEXT: [[CMP10:%.*]] = icmp sgt i32 [[N:%.*]], 0
154; CHECK-NEXT: br i1 [[CMP10]], label [[FOR_BODY_PREHEADER:%.*]], label [[FOR_END:%.*]]
155; CHECK: for.body.preheader:
156; CHECK-NEXT: [[TMP0:%.*]] = add i32 [[N]], -1
157; CHECK-NEXT: [[TMP1:%.*]] = zext i32 [[TMP0]] to i64
158; CHECK-NEXT: [[TMP2:%.*]] = add nuw nsw i64 [[TMP1]], 1
159; CHECK-NEXT: [[MIN_ITERS_CHECK:%.*]] = icmp ult i64 [[TMP2]], 4
160; CHECK-NEXT: br i1 [[MIN_ITERS_CHECK]], label [[SCALAR_PH:%.*]], label [[MIN_ITERS_CHECKED:%.*]]
161; CHECK: min.iters.checked:
162; CHECK-NEXT: [[TMP3:%.*]] = and i32 [[N]], 3
163; CHECK-NEXT: [[N_MOD_VF:%.*]] = zext i32 [[TMP3]] to i64
164; CHECK-NEXT: [[N_VEC:%.*]] = sub nsw i64 [[TMP2]], [[N_MOD_VF]]
165; CHECK-NEXT: [[CMP_ZERO:%.*]] = icmp eq i64 [[N_VEC]], 0
166; CHECK-NEXT: br i1 [[CMP_ZERO]], label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
167; CHECK: vector.ph:
168; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
169; CHECK: vector.body:
170; CHECK-NEXT: [[INDEX:%.*]] = phi i64 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
171; CHECK-NEXT: [[VEC_PHI:%.*]] = phi <4 x i32> [ zeroinitializer, [[VECTOR_PH]] ], [ [[PREDPHI:%.*]], [[VECTOR_BODY]] ]
172; CHECK-NEXT: [[TMP4:%.*]] = getelementptr inbounds i32, i32* [[A:%.*]], i64 [[INDEX]]
173; CHECK-NEXT: [[TMP5:%.*]] = bitcast i32* [[TMP4]] to <4 x i32>*
174; CHECK-NEXT: [[WIDE_LOAD:%.*]] = load <4 x i32>, <4 x i32>* [[TMP5]], align 4
175; CHECK-NEXT: [[TMP6:%.*]] = add <4 x i32> [[VEC_PHI]], <i32 2, i32 2, i32 2, i32 2>
176; CHECK-NEXT: [[TMP7:%.*]] = add <4 x i32> [[TMP6]], [[WIDE_LOAD]]
177; CHECK-NEXT: [[TMP8:%.*]] = icmp slt <4 x i32> [[WIDE_LOAD]], <i32 31, i32 31, i32 31, i32 31>
178; CHECK-NEXT: [[PREDPHI]] = select <4 x i1> [[TMP8]], <4 x i32> [[VEC_PHI]], <4 x i32> [[TMP7]]
179; CHECK-NEXT: [[INDEX_NEXT]] = add i64 [[INDEX]], 4
180; CHECK-NEXT: [[TMP9:%.*]] = icmp eq i64 [[INDEX_NEXT]], [[N_VEC]]
181; CHECK-NEXT: br i1 [[TMP9]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop !9
182; CHECK: middle.block:
183; CHECK-NEXT: [[RDX_SHUF:%.*]] = shufflevector <4 x i32> [[PREDPHI]], <4 x i32> undef, <4 x i32> <i32 2, i32 3, i32 undef, i32 undef>
184; CHECK-NEXT: [[BIN_RDX:%.*]] = add <4 x i32> [[PREDPHI]], [[RDX_SHUF]]
185; CHECK-NEXT: [[RDX_SHUF1:%.*]] = shufflevector <4 x i32> [[BIN_RDX]], <4 x i32> undef, <4 x i32> <i32 1, i32 undef, i32 undef, i32 undef>
186; CHECK-NEXT: [[BIN_RDX2:%.*]] = add <4 x i32> [[BIN_RDX]], [[RDX_SHUF1]]
187; CHECK-NEXT: [[TMP10:%.*]] = extractelement <4 x i32> [[BIN_RDX2]], i32 0
188; CHECK-NEXT: [[CMP_N:%.*]] = icmp eq i32 [[TMP3]], 0
189; CHECK-NEXT: br i1 [[CMP_N]], label [[FOR_END_LOOPEXIT:%.*]], label [[SCALAR_PH]]
190; CHECK: scalar.ph:
191; CHECK-NEXT: [[BC_RESUME_VAL:%.*]] = phi i64 [ [[N_VEC]], [[MIDDLE_BLOCK]] ], [ 0, [[FOR_BODY_PREHEADER]] ], [ 0, [[MIN_ITERS_CHECKED]] ]
192; CHECK-NEXT: [[BC_MERGE_RDX:%.*]] = phi i32 [ [[TMP10]], [[MIDDLE_BLOCK]] ], [ 0, [[FOR_BODY_PREHEADER]] ], [ 0, [[MIN_ITERS_CHECKED]] ]
193; CHECK-NEXT: br label [[FOR_BODY:%.*]]
194; CHECK: for.body:
195; CHECK-NEXT: [[INDVARS_IV:%.*]] = phi i64 [ [[INDVARS_IV_NEXT:%.*]], [[FOR_INC:%.*]] ], [ [[BC_RESUME_VAL]], [[SCALAR_PH]] ]
196; CHECK-NEXT: [[SUM_011:%.*]] = phi i32 [ [[SUM_1:%.*]], [[FOR_INC]] ], [ [[BC_MERGE_RDX]], [[SCALAR_PH]] ]
197; CHECK-NEXT: [[ARRAYIDX:%.*]] = getelementptr inbounds i32, i32* [[A]], i64 [[INDVARS_IV]]
198; CHECK-NEXT: [[TMP11:%.*]] = load i32, i32* [[ARRAYIDX]], align 4
199; CHECK-NEXT: [[CMP1:%.*]] = icmp sgt i32 [[TMP11]], 30
200; CHECK-NEXT: br i1 [[CMP1]], label [[IF_THEN:%.*]], label [[FOR_INC]]
201; CHECK: if.then:
202; CHECK-NEXT: [[ADD:%.*]] = add i32 [[SUM_011]], 2
203; CHECK-NEXT: [[ADD4:%.*]] = add i32 [[ADD]], [[TMP11]]
204; CHECK-NEXT: br label [[FOR_INC]]
205; CHECK: for.inc:
206; CHECK-NEXT: [[SUM_1]] = phi i32 [ [[ADD4]], [[IF_THEN]] ], [ [[SUM_011]], [[FOR_BODY]] ]
207; CHECK-NEXT: [[INDVARS_IV_NEXT]] = add i64 [[INDVARS_IV]], 1
208; CHECK-NEXT: [[LFTR_WIDEIV:%.*]] = trunc i64 [[INDVARS_IV_NEXT]] to i32
209; CHECK-NEXT: [[EXITCOND:%.*]] = icmp eq i32 [[LFTR_WIDEIV]], [[N]]
210; CHECK-NEXT: br i1 [[EXITCOND]], label [[FOR_END_LOOPEXIT]], label [[FOR_BODY]], !llvm.loop !10
211; CHECK: for.end.loopexit:
212; CHECK-NEXT: [[SUM_1_LCSSA:%.*]] = phi i32 [ [[SUM_1]], [[FOR_INC]] ], [ [[TMP10]], [[MIDDLE_BLOCK]] ]
213; CHECK-NEXT: br label [[FOR_END]]
214; CHECK: for.end:
215; CHECK-NEXT: [[SUM_0_LCSSA:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[SUM_1_LCSSA]], [[FOR_END_LOOPEXIT]] ]
216; CHECK-NEXT: ret i32 [[SUM_0_LCSSA]]
217;
Nadav Rotema10b3112012-12-04 18:17:33 +0000218entry:
219 %cmp10 = icmp sgt i32 %n, 0
220 br i1 %cmp10, label %for.body, label %for.end
221
222for.body: ; preds = %entry, %for.inc
223 %indvars.iv = phi i64 [ %indvars.iv.next, %for.inc ], [ 0, %entry ]
224 %sum.011 = phi i32 [ %sum.1, %for.inc ], [ 0, %entry ]
David Blaikie79e6c742015-02-27 19:29:02 +0000225 %arrayidx = getelementptr inbounds i32, i32* %A, i64 %indvars.iv
David Blaikiea79ac142015-02-27 21:17:42 +0000226 %0 = load i32, i32* %arrayidx, align 4
Nadav Rotema10b3112012-12-04 18:17:33 +0000227 %cmp1 = icmp sgt i32 %0, 30
228 br i1 %cmp1, label %if.then, label %for.inc
229
230if.then: ; preds = %for.body
231 %add = add i32 %sum.011, 2
232 %add4 = add i32 %add, %0
233 br label %for.inc
234
235for.inc: ; preds = %for.body, %if.then
236 %sum.1 = phi i32 [ %add4, %if.then ], [ %sum.011, %for.body ]
237 %indvars.iv.next = add i64 %indvars.iv, 1
238 %lftr.wideiv = trunc i64 %indvars.iv.next to i32
239 %exitcond = icmp eq i32 %lftr.wideiv, %n
240 br i1 %exitcond, label %for.end, label %for.body
241
242for.end: ; preds = %for.inc, %entry
243 %sum.0.lcssa = phi i32 [ 0, %entry ], [ %sum.1, %for.inc ]
244 ret i32 %sum.0.lcssa
245}
246
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000247@a = common global [1 x i32*] zeroinitializer, align 8
248@c = common global i32* null, align 8
249
250; We use to if convert this loop. This is not safe because there is a trapping
251; constant expression.
252; PR16729
253
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000254define i32 @trapping_constant_expression() {
Sanjay Patel28f53ef2017-07-08 16:10:42 +0000255; CHECK-LABEL: @trapping_constant_expression(
256; CHECK-NEXT: entry:
257; CHECK-NEXT: br i1 false, label [[SCALAR_PH:%.*]], label [[MIN_ITERS_CHECKED:%.*]]
258; CHECK: min.iters.checked:
259; CHECK-NEXT: br i1 false, label [[SCALAR_PH]], label [[VECTOR_PH:%.*]]
260; CHECK: vector.ph:
261; CHECK-NEXT: br label [[VECTOR_BODY:%.*]]
262; CHECK: vector.body:
263; CHECK-NEXT: [[INDEX:%.*]] = phi i32 [ 0, [[VECTOR_PH]] ], [ [[INDEX_NEXT:%.*]], [[VECTOR_BODY]] ]
264; CHECK-NEXT: [[INDEX_NEXT]] = add i32 [[INDEX]], 4
265; CHECK-NEXT: [[TMP0:%.*]] = icmp eq i32 [[INDEX_NEXT]], 128
266; CHECK-NEXT: br i1 [[TMP0]], label [[MIDDLE_BLOCK:%.*]], label [[VECTOR_BODY]], !llvm.loop !12
267; CHECK: middle.block:
268; CHECK-NEXT: br i1 true, label [[FOR_END:%.*]], label [[SCALAR_PH]]
269; CHECK: scalar.ph:
270; CHECK-NEXT: br label [[FOR_BODY:%.*]]
271; CHECK: for.body:
272; CHECK-NEXT: br i1 false, label [[COND_FALSE:%.*]], label [[COND_END:%.*]]
273; CHECK: cond.false:
274; CHECK-NEXT: br label [[COND_END]]
275; CHECK: cond.end:
276; CHECK-NEXT: br i1 undef, label [[FOR_BODY]], label [[FOR_END]], !llvm.loop !13
277; CHECK: for.end:
278; CHECK-NEXT: ret i32 0
279;
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000280entry:
281 br label %for.body
282
283for.body:
284 %inc3 = phi i32 [ 0, %entry ], [ %inc, %cond.end ]
285 %or2 = phi i32 [ 0, %entry ], [ %or, %cond.end ]
David Blaikief72d05b2015-03-13 18:20:45 +0000286 br i1 icmp eq (i32** getelementptr inbounds ([1 x i32*], [1 x i32*]* @a, i64 0, i64 0), i32** @c), label %cond.false, label %cond.end
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000287
288cond.false:
289 br label %cond.end
290
291cond.end:
David Blaikief72d05b2015-03-13 18:20:45 +0000292 %cond = phi i32 [ sdiv (i32 1, i32 zext (i1 icmp eq (i32** getelementptr inbounds ([1 x i32*], [1 x i32*]* @a, i64 0, i64 0), i32** @c) to i32)), %cond.false ], [ 0, %for.body ]
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000293 %or = or i32 %or2, %cond
294 %inc = add nsw i32 %inc3, 1
295 %cmp = icmp slt i32 %inc, 128
296 br i1 %cmp, label %for.body, label %for.end
297
298for.end:
299 ret i32 %or
300}
301
302; Neither should we if-convert if there is an instruction operand that is a
303; trapping constant expression.
304; PR16729
305
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000306define i32 @trapping_constant_expression2() {
Sanjay Patel28f53ef2017-07-08 16:10:42 +0000307; CHECK-LABEL: @trapping_constant_expression2(
308; CHECK-NEXT: entry:
309; CHECK-NEXT: br label [[FOR_BODY:%.*]]
310; CHECK: for.body:
311; CHECK-NEXT: [[INC3:%.*]] = phi i32 [ 0, [[ENTRY:%.*]] ], [ [[INC:%.*]], [[COND_END:%.*]] ]
312; CHECK-NEXT: [[OR2:%.*]] = phi i32 [ 0, [[ENTRY]] ], [ [[OR:%.*]], [[COND_END]] ]
313; CHECK-NEXT: br i1 false, label [[COND_FALSE:%.*]], label [[COND_END]]
314; CHECK: cond.false:
315; CHECK-NEXT: br label [[COND_END]]
316; CHECK: cond.end:
317; CHECK-NEXT: [[OR]] = or i32 [[OR2]], [[INC3]]
318; CHECK-NEXT: [[INC]] = add nsw i32 [[INC3]], 1
319; CHECK-NEXT: [[CMP:%.*]] = icmp slt i32 [[INC3]], 127
320; CHECK-NEXT: br i1 [[CMP]], label [[FOR_BODY]], label [[FOR_END:%.*]]
321; CHECK: for.end:
322; CHECK-NEXT: ret i32 [[OR]]
323;
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000324entry:
325 br label %for.body
326
327for.body:
328 %inc3 = phi i32 [ 0, %entry ], [ %inc, %cond.end ]
329 %or2 = phi i32 [ 0, %entry ], [ %or, %cond.end ]
David Blaikief72d05b2015-03-13 18:20:45 +0000330 br i1 icmp eq (i32** getelementptr inbounds ([1 x i32*], [1 x i32*]* @a, i64 0, i64 0), i32** @c), label %cond.false, label %cond.end
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000331
332cond.false:
David Blaikief72d05b2015-03-13 18:20:45 +0000333 %cond.1 = or i32 %inc3, sdiv (i32 1, i32 zext (i1 icmp eq (i32** getelementptr inbounds ([1 x i32*], [1 x i32*]* @a, i64 0, i64 1), i32** @c) to i32))
Arnold Schwaighofer50b83022013-12-17 01:11:01 +0000334 br label %cond.end
335
336cond.end:
337 %cond = phi i32 [ %cond.1, %cond.false ], [ %inc3, %for.body ]
338 %or = or i32 %or2, %cond
339 %inc = add nsw i32 %inc3, 1
340 %cmp = icmp slt i32 %inc, 128
341 br i1 %cmp, label %for.body, label %for.end
342
343for.end:
344 ret i32 %or
345}