; RUN: llc -verify-machineinstrs -o - %s | FileCheck %s
; LiveRangeEdit::eliminateDeadDef did not update LiveInterval sub ranges
; properly.
; Module-level target configuration: the test is compiled for the amdgcn
; triple with the data layout string given below.
target datalayout = "e-p:32:32-p1:64:64-p2:64:64-p3:32:32-p4:64:64-p5:32:32-p24:64:64-i64:64-v16:16-v24:32-v32:32-v48:64-v96:128-v192:256-v256:256-v512:512-v1024:1024-v2048:2048-n32:64"
target triple = "amdgcn--"

; CHECK-LABEL: foobar:
; Output with subregister liveness disabled:
; CHECK: v_mov_b32_e32 v1, 1
; CHECK: v_mov_b32_e32 v0, 0
; CHECK: v_cmp_eq_i32_e32 vcc, s0, v0
; CHECK: v_cmp_eq_i32_e64 s[0:1], s0, v1
; CHECK: v_mov_b32_e32 v1, 3
; CHECK: v_mov_b32_e32 v0, 2
; CHECK: v_cmp_eq_i32_e64 s[2:3], s0, v0
; CHECK: v_cmp_eq_i32_e64 s[4:5], s0, v1
; CHECK: v_cndmask_b32_e64 v3, 0, -1, s[4:5]
; CHECK: v_cndmask_b32_e64 v2, 0, -1, s[2:3]
; CHECK: v_cndmask_b32_e64 v1, 0, -1, s[0:1]
; CHECK: v_cndmask_b32_e64 v0, 0, -1, vcc
; CHECK: v_cmp_ne_i32_e32 vcc, 0, v1
; CHECK: v_cndmask_b32_e64 v1, 0, v0, vcc
; CHECK: s_mov_b32 s3, 0xf000
; CHECK: s_mov_b32 s2, -1
; CHECK: buffer_store_dwordx2 v[0:1], s[0:3], 0
; CHECK: s_endpgm
; Output with subregister liveness enabled:
; XCHECK: v_mov_b32_e32 v1, 1
; XCHECK: v_mov_b32_e32 v0, 0
; XCHECK: v_cmp_eq_i32_e32 vcc, s0, v1
; XCHECK: v_mov_b32_e32 v1, 3
; XCHECK: v_mov_b32_e32 v0, 2
; XCHECK: v_cmp_eq_i32_e64 s[0:1], s0, v0
; XCHECK: v_cmp_eq_i32_e64 s[2:3], s0, v1
; XCHECK: v_cndmask_b32_e64 v3, 0, -1, s[2:3]
; XCHECK: v_cndmask_b32_e64 v2, 0, -1, s[0:1]
; XCHECK: v_cndmask_b32_e64 v1, 0, -1, vcc
; XCHECK: v_cmp_ne_i32_e32 vcc, 0, v1
; XCHECK: v_cndmask_b32_e64 v1, 0, v0, vcc
; XCHECK: s_mov_b32 s3, 0xf000
; XCHECK: s_mov_b32 s2, -1
; XCHECK: buffer_store_dwordx2 v[0:1], s[0:3], 0
; XCHECK: s_endpgm
; Reduced reproducer. A 4-lane compare is sign-extended to <4 x i32>, but only
; lane 1 of the result is ever read; the remaining lanes have no users in this
; function. NOTE(review): presumably those unused lanes are what drives the
; dead-def elimination on sub-registers that this test guards - confirm
; against the original commit.
define void @foobar() {
  ; Lane-wise equality of an undef vector against the constants <0, 1, 2, 3>.
  %v0 = icmp eq <4 x i32> undef, <i32 0, i32 1, i32 2, i32 3>
  ; Widen each i1 lane to i32 (true becomes -1, false becomes 0).
  %v3 = sext <4 x i1> %v0 to <4 x i32>
  ; Only lane 1 is extracted; lanes 0, 2 and 3 are never used.
  %v4 = extractelement <4 x i32> %v3, i32 1
  %v5 = icmp ne i32 %v4, 0
  ; Select between undef and 0 based on the lane-1 result.
  %v6 = select i1 %v5, i32 undef, i32 0
  ; Place the selected value in element 1 of a <2 x i32>; element 0 stays undef.
  %v15 = insertelement <2 x i32> undef, i32 %v6, i32 1
  ; Store through an undef addrspace(1) pointer so the value has a user.
  store <2 x i32> %v15, <2 x i32> addrspace(1)* undef, align 8
  ret void
}

; NOTE(review): nothing in the visible part of this file calls this intrinsic;
; it looks like a leftover from test-case reduction - confirm before removing.
declare double @llvm.fma.f64(double, double, double)