blob: add90e9c2f3a98994abd568e95708e8321153367 [file] [log] [blame]
Matt Arsenault2920f622016-12-22 03:21:45 +00001; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=FUNC %s
2; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck -check-prefix=R600 -check-prefix=FUNC %s
Matt Arsenault8596f712014-11-28 22:51:38 +00003
4declare i32 @llvm.r600.read.tidig.x() nounwind readnone
Tom Stellard75aadc22012-12-11 21:25:42 +00005
Tom Stellard79243d92014-10-01 17:15:17 +00006; FUNC-LABEL: {{^}}setcc_v2i32:
Tom Stellardc0845332013-11-22 23:07:58 +00007; R600-DAG: SETE_INT * T{{[0-9]+\.[XYZW]}}, KC0[3].X, KC0[3].Z
8; R600-DAG: SETE_INT * T{{[0-9]+\.[XYZW]}}, KC0[2].W, KC0[3].Y
Aaron Watry91d28862013-06-25 13:55:49 +00009
Matt Arsenault2920f622016-12-22 03:21:45 +000010; GCN-DAG: v_cmp_eq_u32_e32
11; GCN-DAG: v_cmp_eq_u32_e64
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000012define amdgpu_kernel void @setcc_v2i32(<2 x i32> addrspace(1)* %out, <2 x i32> %a, <2 x i32> %b) #0 {
Aaron Watry91d28862013-06-25 13:55:49 +000013 %result = icmp eq <2 x i32> %a, %b
14 %sext = sext <2 x i1> %result to <2 x i32>
15 store <2 x i32> %sext, <2 x i32> addrspace(1)* %out
16 ret void
17}
18
Tom Stellard79243d92014-10-01 17:15:17 +000019; FUNC-LABEL: {{^}}setcc_v4i32:
Tom Stellardc0845332013-11-22 23:07:58 +000020; R600-DAG: SETE_INT * T{{[0-9]+\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
21; R600-DAG: SETE_INT * T{{[0-9]+\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
22; R600-DAG: SETE_INT * T{{[0-9]+\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
23; R600-DAG: SETE_INT * T{{[0-9]+\.[XYZW], T[0-9]+\.[XYZW], T[0-9]+\.[XYZW]}}
Aaron Watry91d28862013-06-25 13:55:49 +000024
Matt Arsenault2920f622016-12-22 03:21:45 +000025; GCN: v_cmp_eq_u32_e32
26; GCN: v_cmp_eq_u32_e64
27; GCN: v_cmp_eq_u32_e64
28; GCN: v_cmp_eq_u32_e64
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000029define amdgpu_kernel void @setcc_v4i32(<4 x i32> addrspace(1)* %out, <4 x i32> addrspace(1)* %in) #0 {
David Blaikie79e6c742015-02-27 19:29:02 +000030 %b_ptr = getelementptr <4 x i32>, <4 x i32> addrspace(1)* %in, i32 1
Matt Arsenault2920f622016-12-22 03:21:45 +000031 %a = load <4 x i32>, <4 x i32> addrspace(1)* %in
32 %b = load <4 x i32>, <4 x i32> addrspace(1)* %b_ptr
Tom Stellard75aadc22012-12-11 21:25:42 +000033 %result = icmp eq <4 x i32> %a, %b
34 %sext = sext <4 x i1> %result to <4 x i32>
35 store <4 x i32> %sext, <4 x i32> addrspace(1)* %out
36 ret void
37}
Tom Stellardc0845332013-11-22 23:07:58 +000038
39;;;==========================================================================;;;
40;; Float comparisons
41;;;==========================================================================;;;
42
Tom Stellard79243d92014-10-01 17:15:17 +000043; FUNC-LABEL: {{^}}f32_oeq:
Tom Stellardc0845332013-11-22 23:07:58 +000044; R600: SETE_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +000045; GCN: v_cmp_eq_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000046define amdgpu_kernel void @f32_oeq(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +000047entry:
48 %0 = fcmp oeq float %a, %b
49 %1 = sext i1 %0 to i32
50 store i32 %1, i32 addrspace(1)* %out
51 ret void
52}
53
Tom Stellard79243d92014-10-01 17:15:17 +000054; FUNC-LABEL: {{^}}f32_ogt:
Tom Stellardc0845332013-11-22 23:07:58 +000055; R600: SETGT_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +000056; GCN: v_cmp_gt_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000057define amdgpu_kernel void @f32_ogt(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +000058entry:
59 %0 = fcmp ogt float %a, %b
60 %1 = sext i1 %0 to i32
61 store i32 %1, i32 addrspace(1)* %out
62 ret void
63}
64
Tom Stellard79243d92014-10-01 17:15:17 +000065; FUNC-LABEL: {{^}}f32_oge:
Tom Stellardc0845332013-11-22 23:07:58 +000066; R600: SETGE_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +000067; GCN: v_cmp_ge_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000068define amdgpu_kernel void @f32_oge(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +000069entry:
70 %0 = fcmp oge float %a, %b
71 %1 = sext i1 %0 to i32
72 store i32 %1, i32 addrspace(1)* %out
73 ret void
74}
75
Tom Stellard79243d92014-10-01 17:15:17 +000076; FUNC-LABEL: {{^}}f32_olt:
Tom Stellardc0845332013-11-22 23:07:58 +000077; R600: SETGT_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +000078; GCN: v_cmp_lt_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000079define amdgpu_kernel void @f32_olt(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +000080entry:
81 %0 = fcmp olt float %a, %b
82 %1 = sext i1 %0 to i32
83 store i32 %1, i32 addrspace(1)* %out
84 ret void
85}
86
Tom Stellard79243d92014-10-01 17:15:17 +000087; FUNC-LABEL: {{^}}f32_ole:
Tom Stellardc0845332013-11-22 23:07:58 +000088; R600: SETGE_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +000089; GCN: v_cmp_le_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +000090define amdgpu_kernel void @f32_ole(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +000091entry:
92 %0 = fcmp ole float %a, %b
93 %1 = sext i1 %0 to i32
94 store i32 %1, i32 addrspace(1)* %out
95 ret void
96}
97
Tom Stellard79243d92014-10-01 17:15:17 +000098; FUNC-LABEL: {{^}}f32_one:
Tom Stellardc0845332013-11-22 23:07:58 +000099; R600-DAG: SETE_DX10
100; R600-DAG: SETE_DX10
101; R600-DAG: AND_INT
102; R600-DAG: SETNE_DX10
103; R600-DAG: AND_INT
104; R600-DAG: SETNE_INT
Matt Arsenaultbecd6562014-12-03 05:22:35 +0000105
Matt Arsenault2920f622016-12-22 03:21:45 +0000106; GCN: v_cmp_lg_f32_e32 vcc
107; GCN-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000108define amdgpu_kernel void @f32_one(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000109entry:
110 %0 = fcmp one float %a, %b
111 %1 = sext i1 %0 to i32
112 store i32 %1, i32 addrspace(1)* %out
113 ret void
114}
115
Tom Stellard79243d92014-10-01 17:15:17 +0000116; FUNC-LABEL: {{^}}f32_ord:
Tom Stellardc0845332013-11-22 23:07:58 +0000117; R600-DAG: SETE_DX10
118; R600-DAG: SETE_DX10
119; R600-DAG: AND_INT
120; R600-DAG: SETNE_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000121; GCN: v_cmp_o_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000122define amdgpu_kernel void @f32_ord(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000123entry:
124 %0 = fcmp ord float %a, %b
125 %1 = sext i1 %0 to i32
126 store i32 %1, i32 addrspace(1)* %out
127 ret void
128}
129
Tom Stellard79243d92014-10-01 17:15:17 +0000130; FUNC-LABEL: {{^}}f32_ueq:
Tom Stellardc0845332013-11-22 23:07:58 +0000131; R600-DAG: SETNE_DX10
132; R600-DAG: SETNE_DX10
133; R600-DAG: OR_INT
134; R600-DAG: SETE_DX10
135; R600-DAG: OR_INT
136; R600-DAG: SETNE_INT
Matt Arsenaultbecd6562014-12-03 05:22:35 +0000137
Matt Arsenault2920f622016-12-22 03:21:45 +0000138; GCN: v_cmp_nlg_f32_e32 vcc
139; GCN-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000140define amdgpu_kernel void @f32_ueq(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000141entry:
142 %0 = fcmp ueq float %a, %b
143 %1 = sext i1 %0 to i32
144 store i32 %1, i32 addrspace(1)* %out
145 ret void
146}
147
Tom Stellard79243d92014-10-01 17:15:17 +0000148; FUNC-LABEL: {{^}}f32_ugt:
Tom Stellardc0845332013-11-22 23:07:58 +0000149; R600: SETGE
150; R600: SETE_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +0000151; GCN: v_cmp_nle_f32_e32 vcc
152; GCN-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000153define amdgpu_kernel void @f32_ugt(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000154entry:
155 %0 = fcmp ugt float %a, %b
156 %1 = sext i1 %0 to i32
157 store i32 %1, i32 addrspace(1)* %out
158 ret void
159}
160
Tom Stellard79243d92014-10-01 17:15:17 +0000161; FUNC-LABEL: {{^}}f32_uge:
Tom Stellardc0845332013-11-22 23:07:58 +0000162; R600: SETGT
163; R600: SETE_DX10
Matt Arsenault8b989ef2014-12-11 22:15:39 +0000164
Matt Arsenault2920f622016-12-22 03:21:45 +0000165; GCN: v_cmp_nlt_f32_e32 vcc
166; GCN-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000167define amdgpu_kernel void @f32_uge(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000168entry:
169 %0 = fcmp uge float %a, %b
170 %1 = sext i1 %0 to i32
171 store i32 %1, i32 addrspace(1)* %out
172 ret void
173}
174
Tom Stellard79243d92014-10-01 17:15:17 +0000175; FUNC-LABEL: {{^}}f32_ult:
Tom Stellardc0845332013-11-22 23:07:58 +0000176; R600: SETGE
177; R600: SETE_DX10
Matt Arsenault8b989ef2014-12-11 22:15:39 +0000178
Matt Arsenault2920f622016-12-22 03:21:45 +0000179; GCN: v_cmp_nge_f32_e32 vcc
180; GCN-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000181define amdgpu_kernel void @f32_ult(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000182entry:
183 %0 = fcmp ult float %a, %b
184 %1 = sext i1 %0 to i32
185 store i32 %1, i32 addrspace(1)* %out
186 ret void
187}
188
Tom Stellard79243d92014-10-01 17:15:17 +0000189; FUNC-LABEL: {{^}}f32_ule:
Tom Stellardc0845332013-11-22 23:07:58 +0000190; R600: SETGT
191; R600: SETE_DX10
Matt Arsenault8b989ef2014-12-11 22:15:39 +0000192
Matt Arsenault2920f622016-12-22 03:21:45 +0000193; GCN: v_cmp_ngt_f32_e32 vcc
194; GCN-NEXT: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1, vcc
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000195define amdgpu_kernel void @f32_ule(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000196entry:
197 %0 = fcmp ule float %a, %b
198 %1 = sext i1 %0 to i32
199 store i32 %1, i32 addrspace(1)* %out
200 ret void
201}
202
Tom Stellard79243d92014-10-01 17:15:17 +0000203; FUNC-LABEL: {{^}}f32_une:
Tom Stellardc0845332013-11-22 23:07:58 +0000204; R600: SETNE_DX10
Matt Arsenault2920f622016-12-22 03:21:45 +0000205; GCN: v_cmp_neq_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000206define amdgpu_kernel void @f32_une(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000207entry:
208 %0 = fcmp une float %a, %b
209 %1 = sext i1 %0 to i32
210 store i32 %1, i32 addrspace(1)* %out
211 ret void
212}
213
Tom Stellard79243d92014-10-01 17:15:17 +0000214; FUNC-LABEL: {{^}}f32_uno:
Tom Stellardc0845332013-11-22 23:07:58 +0000215; R600: SETNE_DX10
216; R600: SETNE_DX10
217; R600: OR_INT
218; R600: SETNE_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000219; GCN: v_cmp_u_f32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000220define amdgpu_kernel void @f32_uno(i32 addrspace(1)* %out, float %a, float %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000221entry:
222 %0 = fcmp uno float %a, %b
223 %1 = sext i1 %0 to i32
224 store i32 %1, i32 addrspace(1)* %out
225 ret void
226}
227
228;;;==========================================================================;;;
229;; 32-bit integer comparisons
230;;;==========================================================================;;;
231
Tom Stellard79243d92014-10-01 17:15:17 +0000232; FUNC-LABEL: {{^}}i32_eq:
Tom Stellardc0845332013-11-22 23:07:58 +0000233; R600: SETE_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000234; GCN: v_cmp_eq_u32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000235define amdgpu_kernel void @i32_eq(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000236entry:
237 %0 = icmp eq i32 %a, %b
238 %1 = sext i1 %0 to i32
239 store i32 %1, i32 addrspace(1)* %out
240 ret void
241}
242
Tom Stellard79243d92014-10-01 17:15:17 +0000243; FUNC-LABEL: {{^}}i32_ne:
Tom Stellardc0845332013-11-22 23:07:58 +0000244; R600: SETNE_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000245; GCN: v_cmp_ne_u32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000246define amdgpu_kernel void @i32_ne(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000247entry:
248 %0 = icmp ne i32 %a, %b
249 %1 = sext i1 %0 to i32
250 store i32 %1, i32 addrspace(1)* %out
251 ret void
252}
253
Tom Stellard79243d92014-10-01 17:15:17 +0000254; FUNC-LABEL: {{^}}i32_ugt:
Tom Stellardc0845332013-11-22 23:07:58 +0000255; R600: SETGT_UINT
Matt Arsenault2920f622016-12-22 03:21:45 +0000256; GCN: v_cmp_gt_u32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000257define amdgpu_kernel void @i32_ugt(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000258entry:
259 %0 = icmp ugt i32 %a, %b
260 %1 = sext i1 %0 to i32
261 store i32 %1, i32 addrspace(1)* %out
262 ret void
263}
264
Tom Stellard79243d92014-10-01 17:15:17 +0000265; FUNC-LABEL: {{^}}i32_uge:
Tom Stellardc0845332013-11-22 23:07:58 +0000266; R600: SETGE_UINT
Matt Arsenault2920f622016-12-22 03:21:45 +0000267; GCN: v_cmp_ge_u32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000268define amdgpu_kernel void @i32_uge(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000269entry:
270 %0 = icmp uge i32 %a, %b
271 %1 = sext i1 %0 to i32
272 store i32 %1, i32 addrspace(1)* %out
273 ret void
274}
275
Tom Stellard79243d92014-10-01 17:15:17 +0000276; FUNC-LABEL: {{^}}i32_ult:
Tom Stellardc0845332013-11-22 23:07:58 +0000277; R600: SETGT_UINT
Matt Arsenault2920f622016-12-22 03:21:45 +0000278; GCN: v_cmp_lt_u32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000279define amdgpu_kernel void @i32_ult(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000280entry:
281 %0 = icmp ult i32 %a, %b
282 %1 = sext i1 %0 to i32
283 store i32 %1, i32 addrspace(1)* %out
284 ret void
285}
286
Tom Stellard79243d92014-10-01 17:15:17 +0000287; FUNC-LABEL: {{^}}i32_ule:
Tom Stellardc0845332013-11-22 23:07:58 +0000288; R600: SETGE_UINT
Matt Arsenault2920f622016-12-22 03:21:45 +0000289; GCN: v_cmp_le_u32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000290define amdgpu_kernel void @i32_ule(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000291entry:
292 %0 = icmp ule i32 %a, %b
293 %1 = sext i1 %0 to i32
294 store i32 %1, i32 addrspace(1)* %out
295 ret void
296}
297
Tom Stellard79243d92014-10-01 17:15:17 +0000298; FUNC-LABEL: {{^}}i32_sgt:
Tom Stellardc0845332013-11-22 23:07:58 +0000299; R600: SETGT_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000300; GCN: v_cmp_gt_i32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000301define amdgpu_kernel void @i32_sgt(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000302entry:
303 %0 = icmp sgt i32 %a, %b
304 %1 = sext i1 %0 to i32
305 store i32 %1, i32 addrspace(1)* %out
306 ret void
307}
308
Tom Stellard79243d92014-10-01 17:15:17 +0000309; FUNC-LABEL: {{^}}i32_sge:
Tom Stellardc0845332013-11-22 23:07:58 +0000310; R600: SETGE_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000311; GCN: v_cmp_ge_i32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000312define amdgpu_kernel void @i32_sge(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000313entry:
314 %0 = icmp sge i32 %a, %b
315 %1 = sext i1 %0 to i32
316 store i32 %1, i32 addrspace(1)* %out
317 ret void
318}
319
Tom Stellard79243d92014-10-01 17:15:17 +0000320; FUNC-LABEL: {{^}}i32_slt:
Tom Stellardc0845332013-11-22 23:07:58 +0000321; R600: SETGT_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000322; GCN: v_cmp_lt_i32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000323define amdgpu_kernel void @i32_slt(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000324entry:
325 %0 = icmp slt i32 %a, %b
326 %1 = sext i1 %0 to i32
327 store i32 %1, i32 addrspace(1)* %out
328 ret void
329}
330
Tom Stellard79243d92014-10-01 17:15:17 +0000331; FUNC-LABEL: {{^}}i32_sle:
Tom Stellardc0845332013-11-22 23:07:58 +0000332; R600: SETGE_INT
Matt Arsenault2920f622016-12-22 03:21:45 +0000333; GCN: v_cmp_le_i32
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000334define amdgpu_kernel void @i32_sle(i32 addrspace(1)* %out, i32 %a, i32 %b) #0 {
Tom Stellardc0845332013-11-22 23:07:58 +0000335entry:
336 %0 = icmp sle i32 %a, %b
337 %1 = sext i1 %0 to i32
338 store i32 %1, i32 addrspace(1)* %out
339 ret void
340}
Matt Arsenault8596f712014-11-28 22:51:38 +0000341
342; FIXME: This does 4 compares
343; FUNC-LABEL: {{^}}v3i32_eq:
Matt Arsenault2920f622016-12-22 03:21:45 +0000344; GCN-DAG: v_cmp_eq_u32
345; GCN-DAG: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1,
346; GCN-DAG: v_cmp_eq_u32
347; GCN-DAG: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1,
348; GCN-DAG: v_cmp_eq_u32
349; GCN-DAG: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1,
350; GCN: s_endpgm
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000351define amdgpu_kernel void @v3i32_eq(<3 x i32> addrspace(1)* %out, <3 x i32> addrspace(1)* %ptra, <3 x i32> addrspace(1)* %ptrb) #0 {
Matt Arsenault8596f712014-11-28 22:51:38 +0000352 %tid = call i32 @llvm.r600.read.tidig.x() nounwind readnone
David Blaikie79e6c742015-02-27 19:29:02 +0000353 %gep.a = getelementptr <3 x i32>, <3 x i32> addrspace(1)* %ptra, i32 %tid
354 %gep.b = getelementptr <3 x i32>, <3 x i32> addrspace(1)* %ptrb, i32 %tid
355 %gep.out = getelementptr <3 x i32>, <3 x i32> addrspace(1)* %out, i32 %tid
David Blaikiea79ac142015-02-27 21:17:42 +0000356 %a = load <3 x i32>, <3 x i32> addrspace(1)* %gep.a
357 %b = load <3 x i32>, <3 x i32> addrspace(1)* %gep.b
Matt Arsenault8596f712014-11-28 22:51:38 +0000358 %cmp = icmp eq <3 x i32> %a, %b
359 %ext = sext <3 x i1> %cmp to <3 x i32>
360 store <3 x i32> %ext, <3 x i32> addrspace(1)* %gep.out
361 ret void
362}
363
364; FUNC-LABEL: {{^}}v3i8_eq:
Matt Arsenault2920f622016-12-22 03:21:45 +0000365; GCN-DAG: v_cmp_eq_u32
366; GCN-DAG: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1,
367; GCN-DAG: v_cmp_eq_u32
368; GCN-DAG: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1,
369; GCN-DAG: v_cmp_eq_u32
370; GCN-DAG: v_cndmask_b32_e64 {{v[0-9]+}}, 0, -1,
371; GCN: s_endpgm
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000372define amdgpu_kernel void @v3i8_eq(<3 x i8> addrspace(1)* %out, <3 x i8> addrspace(1)* %ptra, <3 x i8> addrspace(1)* %ptrb) #0 {
Matt Arsenault8596f712014-11-28 22:51:38 +0000373 %tid = call i32 @llvm.r600.read.tidig.x() nounwind readnone
David Blaikie79e6c742015-02-27 19:29:02 +0000374 %gep.a = getelementptr <3 x i8>, <3 x i8> addrspace(1)* %ptra, i32 %tid
375 %gep.b = getelementptr <3 x i8>, <3 x i8> addrspace(1)* %ptrb, i32 %tid
376 %gep.out = getelementptr <3 x i8>, <3 x i8> addrspace(1)* %out, i32 %tid
David Blaikiea79ac142015-02-27 21:17:42 +0000377 %a = load <3 x i8>, <3 x i8> addrspace(1)* %gep.a
378 %b = load <3 x i8>, <3 x i8> addrspace(1)* %gep.b
Matt Arsenault8596f712014-11-28 22:51:38 +0000379 %cmp = icmp eq <3 x i8> %a, %b
380 %ext = sext <3 x i1> %cmp to <3 x i8>
381 store <3 x i8> %ext, <3 x i8> addrspace(1)* %gep.out
382 ret void
383}
Tom Stellard2e045bb2016-01-20 00:13:22 +0000384
385; Make sure we don't try to emit i1 setcc ops
386; FUNC-LABEL: setcc-i1
Matt Arsenault2920f622016-12-22 03:21:45 +0000387; GCN: s_and_b32 [[AND:s[0-9]+]], s{{[0-9]+}}, 1
388; GCN: s_cmp_eq_u32 [[AND]], 0
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000389define amdgpu_kernel void @setcc-i1(i32 %in) #0 {
Tom Stellard2e045bb2016-01-20 00:13:22 +0000390 %and = and i32 %in, 1
391 %cmp = icmp eq i32 %and, 0
392 br i1 %cmp, label %endif, label %if
393if:
394 unreachable
395endif:
396 ret void
397}
Tom Stellardd1efda82016-01-20 21:48:24 +0000398
399; FUNC-LABEL: setcc-i1-and-xor
Matt Arsenault2920f622016-12-22 03:21:45 +0000400; GCN-DAG: v_cmp_ge_f32_e64 [[A:s\[[0-9]+:[0-9]+\]]], s{{[0-9]+}}, 0{{$}}
401; GCN-DAG: v_cmp_le_f32_e64 [[B:s\[[0-9]+:[0-9]+\]]], s{{[0-9]+}}, 1.0
402; GCN: s_and_b64 s[2:3], [[A]], [[B]]
Matt Arsenault3dbeefa2017-03-21 21:39:51 +0000403define amdgpu_kernel void @setcc-i1-and-xor(i32 addrspace(1)* %out, float %cond) #0 {
Tom Stellardd1efda82016-01-20 21:48:24 +0000404bb0:
405 %tmp5 = fcmp oge float %cond, 0.000000e+00
406 %tmp7 = fcmp ole float %cond, 1.000000e+00
407 %tmp9 = and i1 %tmp5, %tmp7
408 %tmp11 = xor i1 %tmp9, 1
409 br i1 %tmp11, label %bb2, label %bb1
410
411bb1:
412 store i32 0, i32 addrspace(1)* %out
413 br label %bb2
414
415bb2:
416 ret void
417}
Matt Arsenault2920f622016-12-22 03:21:45 +0000418
419attributes #0 = { nounwind }