blob: 8296af2cc6a41e93aac25a2d09e21f91e1fcf9e4 [file] [log] [blame]
Matt Arsenault80edab92016-01-18 21:43:36 +00001; RUN: llc -march=amdgcn -mcpu=tahiti < %s | FileCheck -check-prefix=FAST64 -check-prefix=GCN %s
2; RUN: llc -march=amdgcn -mcpu=bonaire < %s | FileCheck -check-prefix=SLOW64 -check-prefix=GCN %s
3
4
5; lshr (i64 x), c: c > 32 => reg_sequence lshr (i32 hi_32(x)), (c - 32), 0
6; GCN-LABEL: {{^}}lshr_i64_35:
7; GCN: buffer_load_dword [[VAL:v[0-9]+]]
8; GCN: v_lshrrev_b32_e32 v[[LO:[0-9]+]], 3, [[VAL]]
9; GCN: v_mov_b32_e32 v[[HI:[0-9]+]], 0{{$}}
10; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
11define void @lshr_i64_35(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
12 %val = load i64, i64 addrspace(1)* %in
13 %shl = lshr i64 %val, 35
14 store i64 %shl, i64 addrspace(1)* %out
15 ret void
16}
17
18; GCN-LABEL: {{^}}lshr_i64_63:
19; GCN: buffer_load_dword [[VAL:v[0-9]+]]
20; GCN: v_lshrrev_b32_e32 v[[LO:[0-9]+]], 31, [[VAL]]
21; GCN: v_mov_b32_e32 v[[HI:[0-9]+]], 0{{$}}
22; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
23define void @lshr_i64_63(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
24 %val = load i64, i64 addrspace(1)* %in
25 %shl = lshr i64 %val, 63
26 store i64 %shl, i64 addrspace(1)* %out
27 ret void
28}
29
30; GCN-LABEL: {{^}}lshr_i64_33:
31; GCN: buffer_load_dword [[VAL:v[0-9]+]]
32; GCN: v_lshrrev_b32_e32 v[[LO:[0-9]+]], 1, [[VAL]]
33; GCN: v_mov_b32_e32 v[[HI:[0-9]+]], 0{{$}}
34; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
35define void @lshr_i64_33(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
36 %val = load i64, i64 addrspace(1)* %in
37 %shl = lshr i64 %val, 33
38 store i64 %shl, i64 addrspace(1)* %out
39 ret void
40}
41
42; GCN-LABEL: {{^}}lshr_i64_32:
43; GCN: buffer_load_dword v[[LO:[0-9]+]]
44; GCN: v_mov_b32_e32 v[[HI:[0-9]+]], 0{{$}}
45; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
46define void @lshr_i64_32(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
47 %val = load i64, i64 addrspace(1)* %in
48 %shl = lshr i64 %val, 32
49 store i64 %shl, i64 addrspace(1)* %out
50 ret void
51}
52
53; GCN-LABEL: {{^}}lshr_and_i64_35:
54; XGCN: buffer_load_dword [[VAL:v[0-9]+]]
55; XGCN: v_lshlrev_b32_e32 v[[LO:[0-9]+]], 3, [[VAL]]
56; XGCN: v_mov_b32_e32 v[[HI:[0-9]+]], 0{{$}}
57; XGCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
58define void @lshr_and_i64_35(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
59 %val = load i64, i64 addrspace(1)* %in
60 %and = and i64 %val, 2147483647 ; 0x7fffffff
61 %shl = lshr i64 %and, 35
62 store i64 %shl, i64 addrspace(1)* %out
63 ret void
64}
Matt Arsenault3cbbc102016-01-18 21:55:14 +000065
66; lshl (i64 x), c: c > 32 => reg_sequence lshl 0, (i32 lo_32(x)), (c - 32)
67
68; GCN-LABEL: {{^}}shl_i64_const_35:
69; GCN: buffer_load_dword [[VAL:v[0-9]+]]
70; GCN: v_lshlrev_b32_e32 v[[HI:[0-9]+]], 3, [[VAL]]
71; GCN: v_mov_b32_e32 v[[LO:[0-9]+]], 0{{$}}
72; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
73define void @shl_i64_const_35(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
74 %val = load i64, i64 addrspace(1)* %in
75 %shl = shl i64 %val, 35
76 store i64 %shl, i64 addrspace(1)* %out
77 ret void
78}
79
80; GCN-LABEL: {{^}}shl_i64_const_32:
81; GCN: buffer_load_dword v[[HI:[0-9]+]]
82; GCN: v_mov_b32_e32 v[[LO:[0-9]+]], 0{{$}}
83; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
84define void @shl_i64_const_32(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
85 %val = load i64, i64 addrspace(1)* %in
86 %shl = shl i64 %val, 32
87 store i64 %shl, i64 addrspace(1)* %out
88 ret void
89}
90
91; GCN-LABEL: {{^}}shl_i64_const_63:
92; GCN: buffer_load_dword [[VAL:v[0-9]+]]
93; GCN: v_lshlrev_b32_e32 v[[HI:[0-9]+]], 31, [[VAL]]
94; GCN: v_mov_b32_e32 v[[LO:[0-9]+]], 0{{$}}
95; GCN: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
96define void @shl_i64_const_63(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
97 %val = load i64, i64 addrspace(1)* %in
98 %shl = shl i64 %val, 63
99 store i64 %shl, i64 addrspace(1)* %out
100 ret void
101}
102
103; ashr (i64 x), 63 => (ashr lo(x), 31), lo(x)
104
105; GCN-LABEL: {{^}}ashr_i64_const_gt_32:
106define void @ashr_i64_const_gt_32(i64 addrspace(1)* %out, i64 addrspace(1)* %in) {
107 %val = load i64, i64 addrspace(1)* %in
108 %shl = ashr i64 %val, 35
109 store i64 %shl, i64 addrspace(1)* %out
110 ret void
111}