blob: 420df631a10fcc37d6d801ad0b8acfcc559e4263 [file] [log] [blame]
Sam Parker8c4b9642018-08-10 13:57:13 +00001; RUN: llc -mtriple=thumbv8.main -mcpu=cortex-m33 %s -arm-disable-cgp=false -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-NODSP
2; RUN: llc -mtriple=thumbv7-linux-android %s -arm-disable-cgp=false -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-NODSP
3; RUN: llc -mtriple=thumbv7em %s -arm-disable-cgp=false -arm-enable-scalar-dsp=true -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-DSP
4; RUN: llc -mtriple=thumbv8 %s -arm-disable-cgp=false -arm-enable-scalar-dsp=true -arm-enable-scalar-dsp-imms=true -o - | FileCheck %s --check-prefix=CHECK-COMMON --check-prefix=CHECK-DSP-IMM
5
6; Transform will fail because the trunc is not a sink.
7; CHECK-COMMON-LABEL: dsp_trunc
8; CHECK-COMMON: add [[ADD:[^ ]+]],
9; CHECK-DSP-NEXT: ldrh r1, [r3]
10; CHECK-DSP-NEXT: ldrh r2, [r2]
11; CHECK-DSP-NEXT: subs r1, r1, [[ADD]]
12; CHECK-DSP-NEXT: add r0, r2
13; CHECK-DSP-NEXT: uxth r3, r1
14; CHECK-DSP-NEXT: uxth r2, r0
15; CHECK-DSP-NEXT: cmp r2, r3
16
17; With DSP-IMM, we could have:
18; movs r1, #0
19; uxth r0, r0
20; usub16 r1, r1, r0
21; ldrh r0, [r2]
22; ldrh r3, [r3]
23; usub16 r0, r0, r1
24; uadd16 r1, r3, r1
25; cmp r0, r1
26define i16 @dsp_trunc(i32 %arg0, i32 %arg1, i16* %gep0, i16* %gep1) {
27entry:
28 %add0 = add i32 %arg0, %arg1
29 %conv0 = trunc i32 %add0 to i16
30 %sub0 = sub i16 0, %conv0
31 %load0 = load i16, i16* %gep0, align 2
32 %load1 = load i16, i16* %gep1, align 2
33 %sub1 = sub i16 %load0, %sub0
34 %add1 = add i16 %load1, %sub0
35 %cmp = icmp ult i16 %sub1, %add1
36 %res = select i1 %cmp, i16 %add1, i16 %sub1
37 ret i16 %res
38}
39
40; CHECK-COMMON-LABEL: trunc_i16_i8
41; CHECK-COMMON: ldrh
42; CHECK-COMMON: uxtb
43; CHECK-COMMON: cmp
44define i8 @trunc_i16_i8(i16* %ptr, i16 zeroext %arg0, i8 zeroext %arg1) {
45entry:
46 %0 = load i16, i16* %ptr
47 %1 = add i16 %0, %arg0
48 %2 = trunc i16 %1 to i8
49 %3 = icmp ugt i8 %2, %arg1
50 %4 = select i1 %3, i8 %2, i8 %arg1
51 ret i8 %4
52}
53
Sam Parker0e2f0bd2018-08-16 11:54:09 +000054; The pass perform the transform, but a uxtb will still be inserted to handle
55; the zext to the icmp.
Sam Parker8c4b9642018-08-10 13:57:13 +000056; CHECK-COMMON-LABEL: icmp_i32_zext:
Sam Parker0e2f0bd2018-08-16 11:54:09 +000057; CHECK-COMMON: sub
Sam Parker8c4b9642018-08-10 13:57:13 +000058; CHECK-COMMON: uxtb
Sam Parker0e2f0bd2018-08-16 11:54:09 +000059; CHECK-COMMON: cmp
Sam Parker8c4b9642018-08-10 13:57:13 +000060define i8 @icmp_i32_zext(i8* %ptr) {
61entry:
62 %gep = getelementptr inbounds i8, i8* %ptr, i32 0
63 %0 = load i8, i8* %gep, align 1
64 %1 = sub nuw nsw i8 %0, 1
65 %conv44 = zext i8 %0 to i32
66 br label %preheader
67
68preheader:
69 br label %body
70
71body:
72 %2 = phi i8 [ %1, %preheader ], [ %3, %if.end ]
73 %si.0274 = phi i32 [ %conv44, %preheader ], [ %inc, %if.end ]
74 %conv51266 = zext i8 %2 to i32
75 %cmp52267 = icmp eq i32 %si.0274, %conv51266
76 br i1 %cmp52267, label %if.end, label %exit
77
78if.end:
79 %inc = add i32 %si.0274, 1
80 %gep1 = getelementptr inbounds i8, i8* %ptr, i32 %inc
81 %3 = load i8, i8* %gep1, align 1
82 br label %body
83
84exit:
85 ret i8 %2
86}
87
Sam Parker481cdab2018-09-17 13:57:39 +000088; TODO: We should be able to remove both extends from this example, by looking
89; back through the zexts and accepting a type size <= than the icmp.
90; CHECK-COMMON-LABEL: icmp_i16_zext
91; CHECK-COMMON: uxt
92; CHECK-COMMON: uxt
93define i8 @icmp_i16_zext(i8* %ptr) {
94entry:
95 %gep = getelementptr inbounds i8, i8* %ptr, i32 0
96 %0 = load i8, i8* %gep, align 1
97 %1 = sub nuw nsw i8 %0, 1
98 %conv44 = zext i8 %0 to i16
99 br label %preheader
100
101preheader:
102 br label %body
103
104body:
105 %2 = phi i8 [ %1, %preheader ], [ %3, %if.end ]
106 %si.0274 = phi i16 [ %conv44, %preheader ], [ %inc, %if.end ]
107 %conv51266 = zext i8 %2 to i16
108 %cmp52267 = icmp eq i16 %si.0274, %conv51266
109 br i1 %cmp52267, label %if.end, label %exit
110
111if.end:
112 %inc = add nuw i16 %si.0274, 1
113 %conv = zext i16 %inc to i32
114 %gep1 = getelementptr inbounds i8, i8* %ptr, i32 %conv
115 %3 = load i8, i8* %gep1, align 1
116 br label %body
117
118exit:
119 ret i8 %2
120}
121
Sam Parker0e2f0bd2018-08-16 11:54:09 +0000122; Won't don't handle sext
Sam Parker8c4b9642018-08-10 13:57:13 +0000123; CHECK-COMMON-LABEL: icmp_sext_zext_store_i8_i16
Sam Parker0e2f0bd2018-08-16 11:54:09 +0000124; CHECK-COMMON: ldrb
125; CHECK-COMMON: ldrsh
Sam Parker8c4b9642018-08-10 13:57:13 +0000126define i32 @icmp_sext_zext_store_i8_i16() {
127entry:
128 %0 = load i8, i8* getelementptr inbounds ([16 x i8], [16 x i8]* @d_uch, i32 0, i32 2), align 1
129 %conv = zext i8 %0 to i16
130 store i16 %conv, i16* @sh1, align 2
131 %conv1 = zext i8 %0 to i32
132 %1 = load i16, i16* getelementptr inbounds ([16 x i16], [16 x i16]* @d_sh, i32 0, i32 2), align 2
133 %conv2 = sext i16 %1 to i32
134 %cmp = icmp eq i32 %conv1, %conv2
135 %conv3 = zext i1 %cmp to i32
136 ret i32 %conv3
137}
138
Sam Parker8c4b9642018-08-10 13:57:13 +0000139; CHECK-COMMON-LABEL: or_icmp_ugt:
Sam Parker0e2f0bd2018-08-16 11:54:09 +0000140; CHECK-COMMON: ldrb
141; CHECK-COMMON: sub.w
142; CHECK-COMMON-NOT: uxt
143; CHECK-COMMON: cmp.w
144; CHECK-COMMON-NOT: uxt
145; CHECK-COMMON: cmp
Sam Parker8c4b9642018-08-10 13:57:13 +0000146define i1 @or_icmp_ugt(i32 %arg, i8* %ptr) {
147entry:
148 %0 = load i8, i8* %ptr
149 %1 = zext i8 %0 to i32
150 %mul = shl nuw nsw i32 %1, 1
151 %add0 = add nuw nsw i32 %mul, 6
152 %cmp0 = icmp ne i32 %arg, %add0
153 %add1 = add i8 %0, -1
154 %cmp1 = icmp ugt i8 %add1, 3
155 %or = or i1 %cmp0, %cmp1
156 ret i1 %or
157}
158
159; CHECK-COMMON-LABEL: icmp_switch_trunc:
160; CHECK-COMMON-NOT: uxt
161define i16 @icmp_switch_trunc(i16 zeroext %arg) {
162entry:
163 %conv = add nuw i16 %arg, 15
164 %mul = mul nuw nsw i16 %conv, 3
165 %trunc = trunc i16 %arg to i3
166 switch i3 %trunc, label %default [
167 i3 0, label %sw.bb
168 i3 1, label %sw.bb.i
169 ]
170
171sw.bb:
172 %cmp0 = icmp ult i16 %mul, 127
173 %select = select i1 %cmp0, i16 %mul, i16 127
174 br label %exit
175
176sw.bb.i:
177 %cmp1 = icmp ugt i16 %mul, 34
178 %select.i = select i1 %cmp1, i16 %mul, i16 34
179 br label %exit
180
181default:
182 br label %exit
183
184exit:
185 %res = phi i16 [ %select, %sw.bb ], [ %select.i, %sw.bb.i ], [ %mul, %default ]
186 ret i16 %res
187}
188
Sam Parker0e2f0bd2018-08-16 11:54:09 +0000189; We currently only handle truncs as sinks, so a uxt will still be needed for
190; the icmp ugt instruction.
Sam Parker8c4b9642018-08-10 13:57:13 +0000191; CHECK-COMMON-LABEL: urem_trunc_icmps
Sam Parker0e2f0bd2018-08-16 11:54:09 +0000192; CHECK-COMMON: cmp
Sam Parker8c4b9642018-08-10 13:57:13 +0000193; CHECK-COMMON: uxt
Sam Parker0e2f0bd2018-08-16 11:54:09 +0000194; CHECK-COMMON: cmp
Sam Parker8c4b9642018-08-10 13:57:13 +0000195define void @urem_trunc_icmps(i16** %in, i32* %g, i32* %k) {
196entry:
197 %ptr = load i16*, i16** %in, align 4
198 %ld = load i16, i16* %ptr, align 2
199 %cmp.i = icmp eq i16 %ld, 0
200 br i1 %cmp.i, label %exit, label %cond.false.i
201
202cond.false.i:
203 %rem = urem i16 5, %ld
204 %extract.t = trunc i16 %rem to i8
205 br label %body
206
207body:
208 %cond.in.i.off0 = phi i8 [ %extract.t, %cond.false.i ], [ %add, %for.inc ]
209 %cmp = icmp ugt i8 %cond.in.i.off0, 7
210 %conv5 = zext i1 %cmp to i32
211 store i32 %conv5, i32* %g, align 4
212 %.pr = load i32, i32* %k, align 4
213 %tobool13150 = icmp eq i32 %.pr, 0
214 br i1 %tobool13150, label %for.inc, label %exit
215
216for.inc:
217 %add = add nuw i8 %cond.in.i.off0, 1
218 br label %body
219
220exit:
221 ret void
222}
223
224; CHECK-COMMON-LABEL: phi_feeding_switch
225; CHECK-COMMON: ldrb
226; CHECK-COMMON: uxtb
Sam Parker8c4b9642018-08-10 13:57:13 +0000227define void @phi_feeding_switch(i8* %memblock, i8* %store, i16 %arg) {
228entry:
229 %pre = load i8, i8* %memblock, align 1
230 %conv = trunc i16 %arg to i8
231 br label %header
232
233header:
234 %phi.0 = phi i8 [ %pre, %entry ], [ %count, %latch ]
235 %phi.1 = phi i8 [ %conv, %entry ], [ %phi.3, %latch ]
236 %phi.2 = phi i8 [ 0, %entry], [ %count, %latch ]
237 switch i8 %phi.0, label %default [
238 i8 43, label %for.inc.i
239 i8 45, label %for.inc.i.i
240 ]
241
242for.inc.i:
243 %xor = xor i8 %phi.1, 1
244 br label %latch
245
246for.inc.i.i:
247 %and = and i8 %phi.1, 3
248 br label %latch
249
250default:
251 %sub = sub i8 %phi.0, 1
252 %cmp2 = icmp ugt i8 %sub, 4
253 br i1 %cmp2, label %latch, label %exit
254
255latch:
256 %phi.3 = phi i8 [ %xor, %for.inc.i ], [ %and, %for.inc.i.i ], [ %phi.2, %default ]
257 %count = add nuw i8 %phi.2, 1
258 store i8 %count, i8* %store, align 1
259 br label %header
260
261exit:
262 ret void
263}
264
Sam Parker8c4b9642018-08-10 13:57:13 +0000265; Check that %exp requires uxth in all cases, and will also be required to
266; promote %1 for the call - unless we can generate a uadd16.
267; CHECK-COMMON-LABEL: zext_load_sink_call:
268; CHECK-COMMON: uxt
269; uadd16
270; cmp
271; CHECK-COMMON: uxt
272define i32 @zext_load_sink_call(i16* %ptr, i16 %exp) {
273entry:
274 %0 = load i16, i16* %ptr, align 4
275 %1 = add i16 %exp, 3
276 %cmp = icmp eq i16 %0, %exp
277 br i1 %cmp, label %exit, label %if.then
278
279if.then:
280 %conv0 = zext i16 %0 to i32
281 %conv1 = zext i16 %1 to i32
282 %call = tail call arm_aapcs_vfpcc i32 @dummy(i32 %conv0, i32 %conv1)
283 br label %exit
284
285exit:
286 %exitval = phi i32 [ %call, %if.then ], [ 0, %entry ]
287 ret i32 %exitval
288}
289
290%class.ae = type { i8 }
291%class.x = type { i8 }
292%class.v = type { %class.q }
293%class.q = type { i16 }
294
295; CHECK-COMMON-LABEL: trunc_i16_i9_switch
296; CHECK-COMMON-NOT: uxt
297define i32 @trunc_i16_i9_switch(%class.ae* %this) {
298entry:
299 %call = tail call %class.x* @_ZNK2ae2afEv(%class.ae* %this)
300 %call2 = tail call %class.v* @_ZN1x2acEv(%class.x* %call)
301 %0 = getelementptr inbounds %class.v, %class.v* %call2, i32 0, i32 0, i32 0
302 %1 = load i16, i16* %0, align 2
303 %2 = trunc i16 %1 to i9
304 %trunc = and i9 %2, -64
305 switch i9 %trunc, label %cleanup.fold.split [
306 i9 0, label %cleanup
307 i9 -256, label %if.then7
308 ]
309
310if.then7:
311 %3 = and i16 %1, 7
312 %tobool = icmp eq i16 %3, 0
313 %cond = select i1 %tobool, i32 2, i32 1
314 br label %cleanup
315
316cleanup.fold.split:
317 br label %cleanup
318
319cleanup:
320 %retval.0 = phi i32 [ %cond, %if.then7 ], [ 0, %entry ], [ 2, %cleanup.fold.split ]
321 ret i32 %retval.0
322}
323
Sam Parker569b2452018-09-12 09:11:48 +0000324; CHECK-COMMON-LABEL: bitcast_i16
325; CHECK-COMMON-NOT: uxt
326define i16 @bitcast_i16(i16 zeroext %arg0, i16 zeroext %arg1) {
327entry:
328 %cast = bitcast i16 12345 to i16
329 %add = add nuw i16 %arg0, 1
330 %cmp = icmp ule i16 %add, %cast
331 %res = select i1 %cmp, i16 %arg1, i16 32657
332 ret i16 %res
333}
334
335; CHECK-COMMON-LABEL: bitcast_i8
336; CHECK-COMMON-NOT: uxt
337define i8 @bitcast_i8(i8 zeroext %arg0, i8 zeroext %arg1) {
338entry:
339 %cast = bitcast i8 127 to i8
340 %mul = shl nuw i8 %arg0, 1
341 %cmp = icmp uge i8 %mul, %arg1
342 %res = select i1 %cmp, i8 %cast, i8 128
343 ret i8 %res
344}
345
346; CHECK-COMMON-LABEL: bitcast_i16_minus
347; CHECK-COMMON-NOT: uxt
348define i16 @bitcast_i16_minus(i16 zeroext %arg0, i16 zeroext %arg1) {
349entry:
350 %cast = bitcast i16 -12345 to i16
351 %xor = xor i16 %arg0, 7
352 %cmp = icmp eq i16 %xor, %arg1
353 %res = select i1 %cmp, i16 %cast, i16 32657
354 ret i16 %res
355}
356
357; CHECK-COMMON-LABEL: bitcast_i8_minus
358; CHECK-COMMON-NOT: uxt
359define i8 @bitcast_i8_minus(i8 zeroext %arg0, i8 zeroext %arg1) {
360entry:
361 %cast = bitcast i8 -127 to i8
362 %and = and i8 %arg0, 3
363 %cmp = icmp ne i8 %and, %arg1
364 %res = select i1 %cmp, i8 %cast, i8 128
365 ret i8 %res
366}
367
Sam Parker8c4b9642018-08-10 13:57:13 +0000368declare %class.x* @_ZNK2ae2afEv(%class.ae*) local_unnamed_addr
369declare %class.v* @_ZN1x2acEv(%class.x*) local_unnamed_addr
370declare i32 @dummy(i32, i32)
371
372@d_uch = hidden local_unnamed_addr global [16 x i8] zeroinitializer, align 1
373@sh1 = hidden local_unnamed_addr global i16 0, align 2
374@d_sh = hidden local_unnamed_addr global [16 x i16] zeroinitializer, align 2