; RUN: llc < %s -asm-verbose=false -verify-machineinstrs | FileCheck %s

; Test the register stackifier pass.

target datalayout = "e-m:e-p:32:32-i64:64-n32:64-S128"
target triple = "wasm32-unknown-unknown"

; No because of pointer aliasing: the store through %p may alias the load
; from %q, so the load cannot be sunk past the store into the return.

; CHECK-LABEL: no0:
; CHECK: return $1{{$}}
define i32 @no0(i32* %p, i32* %q) {
  %t = load i32, i32* %q
  store i32 0, i32* %p
  ret i32 %t
}

; No because of side effects: both the load and the store are volatile, so
; the load must stay where it is even though it is marked !invariant.load.

; CHECK-LABEL: no1:
; CHECK: return $1{{$}}
define i32 @no1(i32* %p, i32* dereferenceable(4) %q) {
  %t = load volatile i32, i32* %q, !invariant.load !0
  store volatile i32 0, i32* %p
  ret i32 %t
}

; Yes because of invariant load and no side effects.

; CHECK-LABEL: yes0:
; CHECK: return $pop0{{$}}
define i32 @yes0(i32* %p, i32* dereferenceable(4) %q) {
  %t = load i32, i32* %q, !invariant.load !0
  store i32 0, i32* %p
  ret i32 %t
}

; Yes because of no intervening side effects: nothing sits between the
; volatile load and its single use in the return.

; CHECK-LABEL: yes1:
; CHECK: return $pop0{{$}}
define i32 @yes1(i32* %q) {
  %t = load volatile i32, i32* %q
  ret i32 %t
}

; Yes because undefined behavior can be sunk past a store.

; CHECK-LABEL: sink_trap:
; CHECK: return $pop0{{$}}
define i32 @sink_trap(i32 %x, i32 %y, i32* %p) {
  %t = sdiv i32 %x, %y
  store volatile i32 0, i32* %p
  ret i32 %t
}

; Yes because the call is readnone.

; CHECK-LABEL: sink_readnone_call:
; CHECK: return $pop0{{$}}
declare i32 @readnone_callee() readnone nounwind
define i32 @sink_readnone_call(i32 %x, i32 %y, i32* %p) {
  %t = call i32 @readnone_callee()
  store volatile i32 0, i32* %p
  ret i32 %t
}

; No because the call is readonly and there's an intervening store.

; CHECK-LABEL: no_sink_readonly_call:
; CHECK: return ${{[0-9]+}}{{$}}
declare i32 @readonly_callee() readonly nounwind
define i32 @no_sink_readonly_call(i32 %x, i32 %y, i32* %p) {
  %t = call i32 @readonly_callee()
  store i32 0, i32* %p
  ret i32 %t
}

; Don't schedule stack uses into the stack. To reduce register pressure, the
; scheduler might be tempted to move the definition of $2 down. However, this
; would risk getting incorrect liveness if the instructions are later
; rearranged to make the stack contiguous.

; CHECK-LABEL: stack_uses:
; CHECK: .param i32, i32, i32, i32{{$}}
; CHECK-NEXT: .result i32{{$}}
; CHECK-NEXT: block{{$}}
; CHECK-NEXT: i32.const $push13=, 1{{$}}
; CHECK-NEXT: i32.lt_s $push0=, $0, $pop13{{$}}
; CHECK-NEXT: i32.const $push1=, 2{{$}}
; CHECK-NEXT: i32.lt_s $push2=, $1, $pop1{{$}}
; CHECK-NEXT: i32.xor $push5=, $pop0, $pop2{{$}}
; CHECK-NEXT: i32.const $push12=, 1{{$}}
; CHECK-NEXT: i32.lt_s $push3=, $2, $pop12{{$}}
; CHECK-NEXT: i32.const $push11=, 2{{$}}
; CHECK-NEXT: i32.lt_s $push4=, $3, $pop11{{$}}
; CHECK-NEXT: i32.xor $push6=, $pop3, $pop4{{$}}
; CHECK-NEXT: i32.xor $push7=, $pop5, $pop6{{$}}
; CHECK-NEXT: i32.const $push10=, 1{{$}}
; CHECK-NEXT: i32.ne $push8=, $pop7, $pop10{{$}}
; CHECK-NEXT: br_if 0, $pop8{{$}}
; CHECK-NEXT: i32.const $push9=, 0{{$}}
; CHECK-NEXT: return $pop9{{$}}
; CHECK-NEXT: .LBB7_2:
; CHECK-NEXT: end_block{{$}}
; CHECK-NEXT: i32.const $push14=, 1{{$}}
; CHECK-NEXT: return $pop14{{$}}
define i32 @stack_uses(i32 %x, i32 %y, i32 %z, i32 %w) {
entry:
  %c = icmp sle i32 %x, 0
  %d = icmp sle i32 %y, 1
  %e = icmp sle i32 %z, 0
  %f = icmp sle i32 %w, 1
  %g = xor i1 %c, %d
  %h = xor i1 %e, %f
  %i = xor i1 %g, %h
  br i1 %i, label %true, label %false
true:
  ret i32 0
false:
  ret i32 1
}

; Test an interesting case where the load has multiple uses and cannot
; be trivially stackified. However, it can be stackified with a tee_local.

; CHECK-LABEL: multiple_uses:
; CHECK: .param i32, i32, i32{{$}}
; CHECK-NEXT: .local i32{{$}}
; CHECK-NEXT: block{{$}}
; CHECK-NEXT: i32.load $push[[NUM0:[0-9]+]]=, 0($2){{$}}
; CHECK-NEXT: tee_local $push[[NUM1:[0-9]+]]=, $3=, $pop[[NUM0]]{{$}}
; CHECK-NEXT: i32.ge_u $push[[NUM2:[0-9]+]]=, $pop[[NUM1]], $1{{$}}
; CHECK-NEXT: br_if 0, $pop[[NUM2]]{{$}}
; CHECK-NEXT: i32.lt_u $push[[NUM3:[0-9]+]]=, $3, $0{{$}}
; CHECK-NEXT: br_if 0, $pop[[NUM3]]{{$}}
; CHECK-NEXT: i32.store $discard=, 0($2), $3{{$}}
; CHECK-NEXT: .LBB8_3:
; CHECK-NEXT: end_block{{$}}
; CHECK-NEXT: return{{$}}
define void @multiple_uses(i32* %arg0, i32* %arg1, i32* %arg2) nounwind {
bb:
  br label %loop

loop:
  %tmp7 = load i32, i32* %arg2
  %tmp8 = inttoptr i32 %tmp7 to i32*
  %tmp9 = icmp uge i32* %tmp8, %arg1
  %tmp10 = icmp ult i32* %tmp8, %arg0
  %tmp11 = or i1 %tmp9, %tmp10
  br i1 %tmp11, label %back, label %then

then:
  store i32 %tmp7, i32* %arg2
  br label %back

back:
  br i1 undef, label %return, label %loop

return:
  ret void
}

; Don't stackify stores across other instructions with side effects: each
; store must be emitted immediately before the call that follows it.

; CHECK-LABEL: stackify_store_across_side_effects:
; CHECK: store
; CHECK-NEXT: call
; CHECK-NEXT: store
; CHECK-NEXT: call
declare void @evoke_side_effects()
define hidden void @stackify_store_across_side_effects(double* nocapture %d) {
entry:
  store double 2.0, double* %d
  call void @evoke_side_effects()
  store double 2.0, double* %d
  call void @evoke_side_effects()
  ret void
}

; Div instructions have side effects and can't be reordered, but this entire
; function should still be able to be stackified because it's already in
; tree order.

; CHECK-LABEL: div_tree:
; CHECK: .param i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32, i32{{$}}
; CHECK-NEXT: .result i32{{$}}
; CHECK-NEXT: i32.div_s $push0=, $0, $1
; CHECK-NEXT: i32.div_s $push1=, $2, $3
; CHECK-NEXT: i32.div_s $push2=, $pop0, $pop1
; CHECK-NEXT: i32.div_s $push3=, $4, $5
; CHECK-NEXT: i32.div_s $push4=, $6, $7
; CHECK-NEXT: i32.div_s $push5=, $pop3, $pop4
; CHECK-NEXT: i32.div_s $push6=, $pop2, $pop5
; CHECK-NEXT: i32.div_s $push7=, $8, $9
; CHECK-NEXT: i32.div_s $push8=, $10, $11
; CHECK-NEXT: i32.div_s $push9=, $pop7, $pop8
; CHECK-NEXT: i32.div_s $push10=, $12, $13
; CHECK-NEXT: i32.div_s $push11=, $14, $15
; CHECK-NEXT: i32.div_s $push12=, $pop10, $pop11
; CHECK-NEXT: i32.div_s $push13=, $pop9, $pop12
; CHECK-NEXT: i32.div_s $push14=, $pop6, $pop13
; CHECK-NEXT: return $pop14
define i32 @div_tree(i32 %a, i32 %b, i32 %c, i32 %d, i32 %e, i32 %f, i32 %g, i32 %h, i32 %i, i32 %j, i32 %k, i32 %l, i32 %m, i32 %n, i32 %o, i32 %p) {
entry:
  %div = sdiv i32 %a, %b
  %div1 = sdiv i32 %c, %d
  %div2 = sdiv i32 %div, %div1
  %div3 = sdiv i32 %e, %f
  %div4 = sdiv i32 %g, %h
  %div5 = sdiv i32 %div3, %div4
  %div6 = sdiv i32 %div2, %div5
  %div7 = sdiv i32 %i, %j
  %div8 = sdiv i32 %k, %l
  %div9 = sdiv i32 %div7, %div8
  %div10 = sdiv i32 %m, %n
  %div11 = sdiv i32 %o, %p
  %div12 = sdiv i32 %div10, %div11
  %div13 = sdiv i32 %div9, %div12
  %div14 = sdiv i32 %div6, %div13
  ret i32 %div14
}

; A simple multiple-use case: the product feeds two separate calls, so the
; first use is expected to go through a tee_local and the second to read the
; local it defines.

; CHECK-LABEL: simple_multiple_use:
; CHECK: .param i32, i32{{$}}
; CHECK-NEXT: i32.mul $push[[NUM0:[0-9]+]]=, $1, $0{{$}}
; CHECK-NEXT: tee_local $push[[NUM1:[0-9]+]]=, $[[NUM2:[0-9]+]]=, $pop[[NUM0]]{{$}}
; CHECK-NEXT: call use_a@FUNCTION, $pop[[NUM1]]{{$}}
; CHECK-NEXT: call use_b@FUNCTION, $[[NUM2]]{{$}}
; CHECK-NEXT: return{{$}}
declare void @use_a(i32)
declare void @use_b(i32)
define void @simple_multiple_use(i32 %x, i32 %y) {
  %mul = mul i32 %y, %x
  call void @use_a(i32 %mul)
  call void @use_b(i32 %mul)
  ret void
}

; Multiple uses of the same value in one instruction.

; CHECK-LABEL: multiple_uses_in_same_insn:
; CHECK: .param i32, i32{{$}}
; CHECK-NEXT: i32.mul $push[[NUM0:[0-9]+]]=, $1, $0{{$}}
; CHECK-NEXT: tee_local $push[[NUM1:[0-9]+]]=, $[[NUM2:[0-9]+]]=, $pop[[NUM0]]{{$}}
; CHECK-NEXT: call use_2@FUNCTION, $pop[[NUM1]], $[[NUM2]]{{$}}
; CHECK-NEXT: return{{$}}
declare void @use_2(i32, i32)
define void @multiple_uses_in_same_insn(i32 %x, i32 %y) {
  %mul = mul i32 %y, %x
  call void @use_2(i32 %mul, i32 %mul)
  ret void
}

; Commute operands to achieve better stackifying: the first add names its
; operands in the opposite order to the calls that produce them.

; CHECK-LABEL: commute:
; CHECK-NOT: param
; CHECK: .result i32{{$}}
; CHECK-NEXT: i32.call $push0=, red@FUNCTION{{$}}
; CHECK-NEXT: i32.call $push1=, green@FUNCTION{{$}}
; CHECK-NEXT: i32.add $push2=, $pop0, $pop1{{$}}
; CHECK-NEXT: i32.call $push3=, blue@FUNCTION{{$}}
; CHECK-NEXT: i32.add $push4=, $pop2, $pop3{{$}}
; CHECK-NEXT: return $pop4{{$}}
declare i32 @red()
declare i32 @green()
declare i32 @blue()
define i32 @commute() {
  %call = call i32 @red()
  %call1 = call i32 @green()
  %add = add i32 %call1, %call
  %call2 = call i32 @blue()
  %add3 = add i32 %add, %call2
  ret i32 %add3
}

; Don't stackify a register when it would move the def of the register past
; an implicit get_local for the register.

; CHECK-LABEL: no_stackify_past_use:
; CHECK: i32.call $1=, callee@FUNCTION, $0
; CHECK: i32.const $push0=, 1
; CHECK: i32.add $push1=, $0, $pop0
; CHECK: i32.call $push2=, callee@FUNCTION, $pop1
; CHECK: i32.add $push3=, $1, $pop2
; CHECK: i32.mul $push4=, $1, $pop3
; CHECK: return $pop4
declare i32 @callee(i32)
define i32 @no_stackify_past_use(i32 %arg) {
  %tmp1 = call i32 @callee(i32 %arg)
  %tmp2 = add i32 %arg, 1
  %tmp3 = call i32 @callee(i32 %tmp2)
  %tmp5 = add i32 %tmp3, %tmp1
  %tmp6 = mul i32 %tmp5, %tmp1
  ret i32 %tmp6
}

; Stackify individual defs of virtual registers with multiple defs.

; CHECK-LABEL: multiple_defs:
; CHECK: f64.add $push[[NUM0:[0-9]+]]=, ${{[0-9]+}}, $pop{{[0-9]+}}{{$}}
; CHECK-NEXT: tee_local $push[[NUM1:[0-9]+]]=, $[[NUM2:[0-9]+]]=, $pop[[NUM0]]{{$}}
; CHECK-NEXT: f64.select $push{{[0-9]+}}=, $pop{{[0-9]+}}, $pop[[NUM1]], ${{[0-9]+}}{{$}}
; CHECK: $[[NUM2]]=,
define void @multiple_defs(i32 %arg, i32 %arg1, i1 %arg2, i1 %arg3, i1 %arg4) {
bb:
  br label %bb5

bb5:                                              ; preds = %bb21, %bb
  %tmp = phi double [ 0.000000e+00, %bb ], [ %tmp22, %bb21 ]
  %tmp6 = phi double [ 0.000000e+00, %bb ], [ %tmp23, %bb21 ]
  %tmp7 = fcmp olt double %tmp6, 2.323450e+01
  br i1 %tmp7, label %bb8, label %bb21

bb8:                                              ; preds = %bb17, %bb5
  %tmp9 = phi double [ %tmp19, %bb17 ], [ %tmp, %bb5 ]
  %tmp10 = fadd double %tmp6, -1.000000e+00
  %tmp11 = select i1 %arg2, double -1.135357e+04, double %tmp10
  %tmp12 = fadd double %tmp11, %tmp9
  br i1 %arg3, label %bb17, label %bb13

bb13:                                             ; preds = %bb8
  %tmp14 = or i32 %arg1, 2
  %tmp15 = icmp eq i32 %tmp14, 14
  %tmp16 = select i1 %tmp15, double -1.135357e+04, double 0xBFCE147AE147B000
  br label %bb17

bb17:                                             ; preds = %bb13, %bb8
  %tmp18 = phi double [ %tmp16, %bb13 ], [ %tmp10, %bb8 ]
  %tmp19 = fadd double %tmp18, %tmp12
  %tmp20 = fcmp olt double %tmp6, 2.323450e+01
  br i1 %tmp20, label %bb8, label %bb21

bb21:                                             ; preds = %bb17, %bb5
  %tmp22 = phi double [ %tmp, %bb5 ], [ %tmp9, %bb17 ]
  %tmp23 = fadd double %tmp6, 1.000000e+00
  br label %bb5
}

; Don't move calls past loads: the call to @red must stay ahead of the load
; from @count even though its result is only used afterwards.

; CHECK-LABEL: no_stackify_call_past_load:
; CHECK: i32.call $0=, red
; CHECK: i32.const $push0=, 0
; CHECK: i32.load $1=, count($pop0)
@count = hidden global i32 0, align 4
define i32 @no_stackify_call_past_load() {
  %a = call i32 @red()
  %b = load i32, i32* @count, align 4
  call i32 @callee(i32 %a)              ; use of %a
  ret i32 %b
}

; Don't move stores past loads if there may be aliasing.

; CHECK-LABEL: no_stackify_store_past_load:
; CHECK: i32.store $[[L0:[0-9]+]]=, 0($1), $0
; CHECK: i32.load {{.*}}, 0($2)
; CHECK: i32.call {{.*}}, callee@FUNCTION, $[[L0]]{{$}}
define i32 @no_stackify_store_past_load(i32 %a, i32* %p1, i32* %p2) {
  store i32 %a, i32* %p1
  %b = load i32, i32* %p2, align 4
  call i32 @callee(i32 %a)
  ret i32 %b
}

; Can still stackify past invariant loads.

; CHECK-LABEL: store_past_invar_load:
; CHECK: i32.store $push{{.*}}, 0($1), $0
; CHECK: i32.call {{.*}}, callee@FUNCTION, $pop
; CHECK: i32.load $push{{.*}}, 0($2)
; CHECK: return $pop
define i32 @store_past_invar_load(i32 %a, i32* %p1, i32* dereferenceable(4) %p2) {
  store i32 %a, i32* %p1
  %b = load i32, i32* %p2, !invariant.load !0
  call i32 @callee(i32 %a)
  ret i32 %b
}

; A llvm.dbg.value call should be ignored: the only instruction expected after
; the function-begin label is the unreachable.

; CHECK-LABEL: ignore_dbg_value:
; CHECK-NEXT: .Lfunc_begin
; CHECK-NEXT: unreachable
declare void @llvm.dbg.value(metadata, i64, metadata, metadata)
define void @ignore_dbg_value() {
  call void @llvm.dbg.value(metadata i32 0, i64 0, metadata !7, metadata !9), !dbg !10
  unreachable
}

; Don't stackify an expression that might use the stack into a return, since we
; might insert an epilogue before the return.

; CHECK-LABEL: no_stackify_past_epilogue:
; CHECK: return ${{[0-9]+}}{{$}}
declare i32 @use_memory(i32*)
define i32 @no_stackify_past_epilogue() {
  %x = alloca i32
  %call = call i32 @use_memory(i32* %x)
  ret i32 %call
}

; Module flags and debug-info metadata. !7, !9 and !10 are referenced by
; @ignore_dbg_value; !0 is also used as the !invariant.load operand by @no1,
; @yes0 and @store_past_invar_load.
!llvm.module.flags = !{!0}
!llvm.dbg.cu = !{!1}

!0 = !{i32 2, !"Debug Info Version", i32 3}
!1 = distinct !DICompileUnit(language: DW_LANG_C99, file: !2, producer: "clang version 3.9.0 (trunk 266005) (llvm/trunk 266105)", isOptimized: false, runtimeVersion: 0, emissionKind: FullDebug, enums: !3)
!2 = !DIFile(filename: "test.c", directory: "/")
!3 = !{}
!5 = distinct !DISubprogram(name: "test", scope: !2, file: !2, line: 10, type: !6, isLocal: false, isDefinition: true, scopeLine: 11, flags: DIFlagPrototyped, isOptimized: true, unit: !1, variables: !3)
!6 = !DISubroutineType(types: !3)
!7 = !DILocalVariable(name: "nzcnt", scope: !5, file: !2, line: 15, type: !8)
!8 = !DIBasicType(name: "int", size: 32, align: 32, encoding: DW_ATE_signed)
!9 = !DIExpression()
!10 = !DILocation(line: 15, column: 6, scope: !5)