; RUN: llc -march=amdgcn -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-NOHSA -check-prefix=FUNC %s
; RUN: llc -mtriple=amdgcn--amdhsa -mcpu=kaveri -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-HSA -check-prefix=FUNC %s
; RUN: llc -march=amdgcn -mcpu=tonga -verify-machineinstrs < %s | FileCheck -check-prefix=GCN -check-prefix=GCN-NOHSA -check-prefix=FUNC %s
; RUN: llc -march=r600 -mcpu=redwood < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
; RUN: llc -march=r600 -mcpu=cayman < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s


; Scalar i8 load from addrspace(1), stored back unchanged.
; Checks for a byte-sized load instruction on each target.
; FUNC-LABEL: {{^}}global_load_i8:
; GCN-NOHSA: buffer_load_ubyte v{{[0-9]+}}
; GCN-HSA: flat_load_ubyte

; EG: VTX_READ_8 T{{[0-9]+}}.X, T{{[0-9]+}}.X, 0
define void @global_load_i8(i8 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
entry:
  %ld = load i8, i8 addrspace(1)* %in
  store i8 %ld, i8 addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1), stored back unchanged.
; Checks that the two bytes are fetched with one 16-bit load.
; FUNC-LABEL: {{^}}global_load_v2i8:
; GCN-NOHSA: buffer_load_ushort v
; GCN-HSA: flat_load_ushort v

; EG: VTX_READ_16
define void @global_load_v2i8(<2 x i8> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <2 x i8>, <2 x i8> addrspace(1)* %in
  store <2 x i8> %ld, <2 x i8> addrspace(1)* %out
  ret void
}

; <3 x i8> load from addrspace(1), stored back unchanged.
; Checks that the odd-sized vector is fetched with a 32-bit load.
; FUNC-LABEL: {{^}}global_load_v3i8:
; GCN-NOHSA: buffer_load_dword v
; GCN-HSA: flat_load_dword v

; EG-DAG: VTX_READ_32
define void @global_load_v3i8(<3 x i8> addrspace(1)* %out, <3 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <3 x i8>, <3 x i8> addrspace(1)* %in
  store <3 x i8> %ld, <3 x i8> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1), stored back unchanged.
; Checks that the four bytes are fetched with one 32-bit load.
; FUNC-LABEL: {{^}}global_load_v4i8:
; GCN-NOHSA: buffer_load_dword v
; GCN-HSA: flat_load_dword v

; EG: VTX_READ_32
define void @global_load_v4i8(<4 x i8> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <4 x i8>, <4 x i8> addrspace(1)* %in
  store <4 x i8> %ld, <4 x i8> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1), stored back unchanged.
; Checks that the eight bytes are fetched with one 64-bit load.
; FUNC-LABEL: {{^}}global_load_v8i8:
; GCN-NOHSA: buffer_load_dwordx2
; GCN-HSA: flat_load_dwordx2

; EG: VTX_READ_64
define void @global_load_v8i8(<8 x i8> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <8 x i8>, <8 x i8> addrspace(1)* %in
  store <8 x i8> %ld, <8 x i8> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1), stored back unchanged.
; Checks that the sixteen bytes are fetched with one 128-bit load.
; FUNC-LABEL: {{^}}global_load_v16i8:
; GCN-NOHSA: buffer_load_dwordx4

; GCN-HSA: flat_load_dwordx4

; EG: VTX_READ_128
define void @global_load_v16i8(<16 x i8> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <16 x i8>, <16 x i8> addrspace(1)* %in
  store <16 x i8> %ld, <16 x i8> addrspace(1)* %out
  ret void
}

; i8 load from addrspace(1) zero-extended to i32.
; Checks that an unsigned byte load is selected.
; FUNC-LABEL: {{^}}global_zextload_i8_to_i32:
; GCN-NOHSA: buffer_load_ubyte v{{[0-9]+}},
; GCN-HSA: flat_load_ubyte

; EG: VTX_READ_8 T{{[0-9]+\.X, T[0-9]+\.X}}
define void @global_zextload_i8_to_i32(i32 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
  %a = load i8, i8 addrspace(1)* %in
  %ext = zext i8 %a to i32
  store i32 %ext, i32 addrspace(1)* %out
  ret void
}

; i8 load from addrspace(1) sign-extended to i32.
; The amdgcn runs expect a signed byte load; the r600 runs expect a byte read
; whose result feeds a BFE_INT with a literal operand of 8.
; The register regex escapes '.' so it only matches a real "T<n>.<chan>" name.
; FUNC-LABEL: {{^}}global_sextload_i8_to_i32:
; GCN-NOHSA: buffer_load_sbyte
; GCN-HSA: flat_load_sbyte

; EG: VTX_READ_8 [[DST:T[0-9]\.[XYZW]]], [[DST]]
; EG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST]], 0.0, literal
; EG: 8
define void @global_sextload_i8_to_i32(i32 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
  %ld = load i8, i8 addrspace(1)* %in
  %ext = sext i8 %ld to i32
  store i32 %ext, i32 addrspace(1)* %out
  ret void
}

; <1 x i8> load from addrspace(1) zero-extended to <1 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v1i8_to_v1i32:
define void @global_zextload_v1i8_to_v1i32(<1 x i32> addrspace(1)* %out, <1 x i8> addrspace(1)* %in) #0 {
  %load = load <1 x i8>, <1 x i8> addrspace(1)* %in
  %ext = zext <1 x i8> %load to <1 x i32>
  store <1 x i32> %ext, <1 x i32> addrspace(1)* %out
  ret void
}

; <1 x i8> load from addrspace(1) sign-extended to <1 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v1i8_to_v1i32:
define void @global_sextload_v1i8_to_v1i32(<1 x i32> addrspace(1)* %out, <1 x i8> addrspace(1)* %in) #0 {
  %load = load <1 x i8>, <1 x i8> addrspace(1)* %in
  %ext = sext <1 x i8> %load to <1 x i32>
  store <1 x i32> %ext, <1 x i32> addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1) zero-extended to <2 x i32>.
; The amdgcn runs expect one 16-bit load; the r600 runs expect two byte reads.
; FUNC-LABEL: {{^}}global_zextload_v2i8_to_v2i32:
; GCN-NOHSA: buffer_load_ushort
; GCN-HSA: flat_load_ushort

; EG: VTX_READ_8
; EG: VTX_READ_8
define void @global_zextload_v2i8_to_v2i32(<2 x i32> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
  %load = load <2 x i8>, <2 x i8> addrspace(1)* %in
  %ext = zext <2 x i8> %load to <2 x i32>
  store <2 x i32> %ext, <2 x i32> addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1) sign-extended to <2 x i32>.
; The amdgcn runs expect one 16-bit load; the r600 runs expect, in any order,
; two byte reads each feeding a BFE_INT with a literal operand of 8.
; The register regex escapes '.' so it only matches a real "T<n>.<chan>" name.
; FUNC-LABEL: {{^}}global_sextload_v2i8_to_v2i32:
; GCN-NOHSA: buffer_load_ushort
; GCN-HSA: flat_load_ushort

; EG-DAG: VTX_READ_8 [[DST_X:T[0-9]\.[XYZW]]], [[DST_X]]
; EG-DAG: VTX_READ_8 [[DST_Y:T[0-9]\.[XYZW]]], [[DST_Y]]
; EG-DAG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST_X]], 0.0, literal
; EG-DAG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST_Y]], 0.0, literal
; EG-DAG: 8
; EG-DAG: 8
define void @global_sextload_v2i8_to_v2i32(<2 x i32> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
  %load = load <2 x i8>, <2 x i8> addrspace(1)* %in
  %ext = sext <2 x i8> %load to <2 x i32>
  store <2 x i32> %ext, <2 x i32> addrspace(1)* %out
  ret void
}

; <3 x i8> load from addrspace(1) zero-extended to <3 x i32>.
; The amdgcn runs expect one 32-bit load, then unsigned bitfield extracts at
; offsets 8 and 16 plus an 0xff mask for the low byte. No r600 checks.
; FUNC-LABEL: {{^}}global_zextload_v3i8_to_v3i32:
; GCN-NOHSA: buffer_load_dword v
; GCN-HSA: flat_load_dword v

; GCN-DAG: v_bfe_u32 v{{[0-9]+}}, v{{[0-9]+}}, 8, 8
; GCN-DAG: v_bfe_u32 v{{[0-9]+}}, v{{[0-9]+}}, 16, 8
; GCN-DAG: v_and_b32_e32 v{{[0-9]+}}, 0xff,
define void @global_zextload_v3i8_to_v3i32(<3 x i32> addrspace(1)* %out, <3 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <3 x i8>, <3 x i8> addrspace(1)* %in
  %ext = zext <3 x i8> %ld to <3 x i32>
  store <3 x i32> %ext, <3 x i32> addrspace(1)* %out
  ret void
}

; <3 x i8> load from addrspace(1) sign-extended to <3 x i32>.
; The amdgcn runs expect one 32-bit load, then signed bitfield extracts at
; offsets 0, 8 and 16 (width 8 each). No r600 checks.
; FUNC-LABEL: {{^}}global_sextload_v3i8_to_v3i32:
; GCN-NOHSA: buffer_load_dword v
; GCN-HSA: flat_load_dword v

; GCN-DAG: v_bfe_i32 v{{[0-9]+}}, v{{[0-9]+}}, 8, 8
; GCN-DAG: v_bfe_i32 v{{[0-9]+}}, v{{[0-9]+}}, 0, 8
; GCN-DAG: v_bfe_i32 v{{[0-9]+}}, v{{[0-9]+}}, 16, 8
define void @global_sextload_v3i8_to_v3i32(<3 x i32> addrspace(1)* %out, <3 x i8> addrspace(1)* %in) #0 {
entry:
  %ld = load <3 x i8>, <3 x i8> addrspace(1)* %in
  %ext = sext <3 x i8> %ld to <3 x i32>
  store <3 x i32> %ext, <3 x i32> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1) zero-extended to <4 x i32>.
; The amdgcn runs expect one 32-bit load; the r600 runs expect four byte reads.
; FUNC-LABEL: {{^}}global_zextload_v4i8_to_v4i32:
; GCN-NOHSA: buffer_load_dword
; GCN-HSA: flat_load_dword

; EG: VTX_READ_8
; EG: VTX_READ_8
; EG: VTX_READ_8
; EG: VTX_READ_8
define void @global_zextload_v4i8_to_v4i32(<4 x i32> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
  %load = load <4 x i8>, <4 x i8> addrspace(1)* %in
  %ext = zext <4 x i8> %load to <4 x i32>
  store <4 x i32> %ext, <4 x i32> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1) sign-extended to <4 x i32>.
; The amdgcn runs expect one 32-bit load; the r600 runs expect, in any order,
; four byte reads each feeding a BFE_INT with a literal operand of 8.
; The register regex escapes '.' so it only matches a real "T<n>.<chan>" name.
; FUNC-LABEL: {{^}}global_sextload_v4i8_to_v4i32:
; GCN-NOHSA: buffer_load_dword
; GCN-HSA: flat_load_dword

; EG-DAG: VTX_READ_8 [[DST_X:T[0-9]\.[XYZW]]], [[DST_X]]
; EG-DAG: VTX_READ_8 [[DST_Y:T[0-9]\.[XYZW]]], [[DST_Y]]
; EG-DAG: VTX_READ_8 [[DST_Z:T[0-9]\.[XYZW]]], [[DST_Z]]
; EG-DAG: VTX_READ_8 [[DST_W:T[0-9]\.[XYZW]]], [[DST_W]]
; EG-DAG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST_X]], 0.0, literal
; EG-DAG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST_Y]], 0.0, literal
; EG-DAG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST_Z]], 0.0, literal
; EG-DAG: BFE_INT {{[* ]*}}T{{[0-9]\.[XYZW]}}, [[DST_W]], 0.0, literal
; EG-DAG: 8
; EG-DAG: 8
; EG-DAG: 8
; EG-DAG: 8
define void @global_sextload_v4i8_to_v4i32(<4 x i32> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
  %load = load <4 x i8>, <4 x i8> addrspace(1)* %in
  %ext = sext <4 x i8> %load to <4 x i32>
  store <4 x i32> %ext, <4 x i32> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1) zero-extended to <8 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v8i8_to_v8i32:
define void @global_zextload_v8i8_to_v8i32(<8 x i32> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
  %load = load <8 x i8>, <8 x i8> addrspace(1)* %in
  %ext = zext <8 x i8> %load to <8 x i32>
  store <8 x i32> %ext, <8 x i32> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1) sign-extended to <8 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v8i8_to_v8i32:
define void @global_sextload_v8i8_to_v8i32(<8 x i32> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
  %load = load <8 x i8>, <8 x i8> addrspace(1)* %in
  %ext = sext <8 x i8> %load to <8 x i32>
  store <8 x i32> %ext, <8 x i32> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1) zero-extended to <16 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v16i8_to_v16i32:
define void @global_zextload_v16i8_to_v16i32(<16 x i32> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
  %load = load <16 x i8>, <16 x i8> addrspace(1)* %in
  %ext = zext <16 x i8> %load to <16 x i32>
  store <16 x i32> %ext, <16 x i32> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1) sign-extended to <16 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v16i8_to_v16i32:
define void @global_sextload_v16i8_to_v16i32(<16 x i32> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
  %load = load <16 x i8>, <16 x i8> addrspace(1)* %in
  %ext = sext <16 x i8> %load to <16 x i32>
  store <16 x i32> %ext, <16 x i32> addrspace(1)* %out
  ret void
}

; <32 x i8> load from addrspace(1) zero-extended to <32 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v32i8_to_v32i32:
define void @global_zextload_v32i8_to_v32i32(<32 x i32> addrspace(1)* %out, <32 x i8> addrspace(1)* %in) #0 {
  %load = load <32 x i8>, <32 x i8> addrspace(1)* %in
  %ext = zext <32 x i8> %load to <32 x i32>
  store <32 x i32> %ext, <32 x i32> addrspace(1)* %out
  ret void
}

; <32 x i8> load from addrspace(1) sign-extended to <32 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v32i8_to_v32i32:
define void @global_sextload_v32i8_to_v32i32(<32 x i32> addrspace(1)* %out, <32 x i8> addrspace(1)* %in) #0 {
  %load = load <32 x i8>, <32 x i8> addrspace(1)* %in
  %ext = sext <32 x i8> %load to <32 x i32>
  store <32 x i32> %ext, <32 x i32> addrspace(1)* %out
  ret void
}

; <64 x i8> load from addrspace(1) zero-extended to <64 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v64i8_to_v64i32:
define void @global_zextload_v64i8_to_v64i32(<64 x i32> addrspace(1)* %out, <64 x i8> addrspace(1)* %in) #0 {
  %load = load <64 x i8>, <64 x i8> addrspace(1)* %in
  %ext = zext <64 x i8> %load to <64 x i32>
  store <64 x i32> %ext, <64 x i32> addrspace(1)* %out
  ret void
}

; <64 x i8> load from addrspace(1) sign-extended to <64 x i32>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v64i8_to_v64i32:
define void @global_sextload_v64i8_to_v64i32(<64 x i32> addrspace(1)* %out, <64 x i8> addrspace(1)* %in) #0 {
  %load = load <64 x i8>, <64 x i8> addrspace(1)* %in
  %ext = sext <64 x i8> %load to <64 x i32>
  store <64 x i32> %ext, <64 x i32> addrspace(1)* %out
  ret void
}

; i8 load from addrspace(1) zero-extended to i64.
; Checks that the low half comes from an unsigned byte load, the high half is
; a constant 0, and both registers form the 64-bit store operand.
; The closing bracket is written as {{\]}} to match the sext variant's style.
; FUNC-LABEL: {{^}}global_zextload_i8_to_i64:
; GCN-DAG: v_mov_b32_e32 v[[HI:[0-9]+]], 0{{$}}

; GCN-NOHSA-DAG: buffer_load_ubyte v[[LO:[0-9]+]],
; GCN-NOHSA: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}

; GCN-HSA-DAG: flat_load_ubyte v[[LO:[0-9]+]],
; GCN-HSA: flat_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, v{{\[}}[[LO]]:[[HI]]{{\]}}
define void @global_zextload_i8_to_i64(i64 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
  %a = load i8, i8 addrspace(1)* %in
  %ext = zext i8 %a to i64
  store i64 %ext, i64 addrspace(1)* %out
  ret void
}

; i8 load from addrspace(1) sign-extended to i64.
; Checks that the low half comes from a signed byte load, the high half is the
; low half arithmetically shifted right by 31, and both form the 64-bit store.
; FUNC-LABEL: {{^}}global_sextload_i8_to_i64:
; GCN-NOHSA: buffer_load_sbyte v[[LO:[0-9]+]],
; GCN-HSA: flat_load_sbyte v[[LO:[0-9]+]],
; GCN: v_ashrrev_i32_e32 v[[HI:[0-9]+]], 31, v[[LO]]

; GCN-NOHSA: buffer_store_dwordx2 v{{\[}}[[LO]]:[[HI]]{{\]}}
; GCN-HSA: flat_store_dwordx2 v{{\[[0-9]+:[0-9]+\]}}, v{{\[}}[[LO]]:[[HI]]{{\]}}
define void @global_sextload_i8_to_i64(i64 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
  %a = load i8, i8 addrspace(1)* %in
  %ext = sext i8 %a to i64
  store i64 %ext, i64 addrspace(1)* %out
  ret void
}

; <1 x i8> load from addrspace(1) zero-extended to <1 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v1i8_to_v1i64:
define void @global_zextload_v1i8_to_v1i64(<1 x i64> addrspace(1)* %out, <1 x i8> addrspace(1)* %in) #0 {
  %load = load <1 x i8>, <1 x i8> addrspace(1)* %in
  %ext = zext <1 x i8> %load to <1 x i64>
  store <1 x i64> %ext, <1 x i64> addrspace(1)* %out
  ret void
}

; <1 x i8> load from addrspace(1) sign-extended to <1 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v1i8_to_v1i64:
define void @global_sextload_v1i8_to_v1i64(<1 x i64> addrspace(1)* %out, <1 x i8> addrspace(1)* %in) #0 {
  %load = load <1 x i8>, <1 x i8> addrspace(1)* %in
  %ext = sext <1 x i8> %load to <1 x i64>
  store <1 x i64> %ext, <1 x i64> addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1) zero-extended to <2 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v2i8_to_v2i64:
define void @global_zextload_v2i8_to_v2i64(<2 x i64> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
  %load = load <2 x i8>, <2 x i8> addrspace(1)* %in
  %ext = zext <2 x i8> %load to <2 x i64>
  store <2 x i64> %ext, <2 x i64> addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1) sign-extended to <2 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v2i8_to_v2i64:
define void @global_sextload_v2i8_to_v2i64(<2 x i64> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
  %load = load <2 x i8>, <2 x i8> addrspace(1)* %in
  %ext = sext <2 x i8> %load to <2 x i64>
  store <2 x i64> %ext, <2 x i64> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1) zero-extended to <4 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v4i8_to_v4i64:
define void @global_zextload_v4i8_to_v4i64(<4 x i64> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
  %load = load <4 x i8>, <4 x i8> addrspace(1)* %in
  %ext = zext <4 x i8> %load to <4 x i64>
  store <4 x i64> %ext, <4 x i64> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1) sign-extended to <4 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v4i8_to_v4i64:
define void @global_sextload_v4i8_to_v4i64(<4 x i64> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
  %load = load <4 x i8>, <4 x i8> addrspace(1)* %in
  %ext = sext <4 x i8> %load to <4 x i64>
  store <4 x i64> %ext, <4 x i64> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1) zero-extended to <8 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v8i8_to_v8i64:
define void @global_zextload_v8i8_to_v8i64(<8 x i64> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
  %load = load <8 x i8>, <8 x i8> addrspace(1)* %in
  %ext = zext <8 x i8> %load to <8 x i64>
  store <8 x i64> %ext, <8 x i64> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1) sign-extended to <8 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v8i8_to_v8i64:
define void @global_sextload_v8i8_to_v8i64(<8 x i64> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
  %load = load <8 x i8>, <8 x i8> addrspace(1)* %in
  %ext = sext <8 x i8> %load to <8 x i64>
  store <8 x i64> %ext, <8 x i64> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1) zero-extended to <16 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v16i8_to_v16i64:
define void @global_zextload_v16i8_to_v16i64(<16 x i64> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
  %load = load <16 x i8>, <16 x i8> addrspace(1)* %in
  %ext = zext <16 x i8> %load to <16 x i64>
  store <16 x i64> %ext, <16 x i64> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1) sign-extended to <16 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v16i8_to_v16i64:
define void @global_sextload_v16i8_to_v16i64(<16 x i64> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
  %load = load <16 x i8>, <16 x i8> addrspace(1)* %in
  %ext = sext <16 x i8> %load to <16 x i64>
  store <16 x i64> %ext, <16 x i64> addrspace(1)* %out
  ret void
}

; <32 x i8> load from addrspace(1) zero-extended to <32 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v32i8_to_v32i64:
define void @global_zextload_v32i8_to_v32i64(<32 x i64> addrspace(1)* %out, <32 x i8> addrspace(1)* %in) #0 {
  %load = load <32 x i8>, <32 x i8> addrspace(1)* %in
  %ext = zext <32 x i8> %load to <32 x i64>
  store <32 x i64> %ext, <32 x i64> addrspace(1)* %out
  ret void
}

; <32 x i8> load from addrspace(1) sign-extended to <32 x i64>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v32i8_to_v32i64:
define void @global_sextload_v32i8_to_v32i64(<32 x i64> addrspace(1)* %out, <32 x i8> addrspace(1)* %in) #0 {
  %load = load <32 x i8>, <32 x i8> addrspace(1)* %in
  %ext = sext <32 x i8> %load to <32 x i64>
  store <32 x i64> %ext, <32 x i64> addrspace(1)* %out
  ret void
}

; XFUNC-LABEL: {{^}}global_zextload_v64i8_to_v64i64:
; define void @global_zextload_v64i8_to_v64i64(<64 x i64> addrspace(1)* %out, <64 x i8> addrspace(1)* %in) #0 {
;   %load = load <64 x i8>, <64 x i8> addrspace(1)* %in
;   %ext = zext <64 x i8> %load to <64 x i64>
;   store <64 x i64> %ext, <64 x i64> addrspace(1)* %out
;   ret void
; }

; XFUNC-LABEL: {{^}}global_sextload_v64i8_to_v64i64:
; define void @global_sextload_v64i8_to_v64i64(<64 x i64> addrspace(1)* %out, <64 x i8> addrspace(1)* %in) #0 {
;   %load = load <64 x i8>, <64 x i8> addrspace(1)* %in
;   %ext = sext <64 x i8> %load to <64 x i64>
;   store <64 x i64> %ext, <64 x i64> addrspace(1)* %out
;   ret void
; }

; i8 load from addrspace(1) zero-extended to i16.
; Checks that the unsigned byte load result is stored directly as a short,
; i.e. the store uses the same register the load defined. No r600 checks.
; FUNC-LABEL: {{^}}global_zextload_i8_to_i16:
; GCN-NOHSA: buffer_load_ubyte v[[VAL:[0-9]+]],
; GCN-NOHSA: buffer_store_short v[[VAL]]

; GCN-HSA: flat_load_ubyte v[[VAL:[0-9]+]],
; GCN-HSA: flat_store_short v{{\[[0-9]+:[0-9]+\]}}, v[[VAL]]
define void @global_zextload_i8_to_i16(i16 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
  %a = load i8, i8 addrspace(1)* %in
  %ext = zext i8 %a to i16
  store i16 %ext, i16 addrspace(1)* %out
  ret void
}

; i8 load from addrspace(1) sign-extended to i16.
; Checks that the signed byte load result is stored directly as a short,
; i.e. the store uses the same register the load defined. No r600 checks.
; FUNC-LABEL: {{^}}global_sextload_i8_to_i16:
; GCN-NOHSA: buffer_load_sbyte v[[VAL:[0-9]+]],
; GCN-HSA: flat_load_sbyte v[[VAL:[0-9]+]],

; GCN-NOHSA: buffer_store_short v[[VAL]]
; GCN-HSA: flat_store_short v{{\[[0-9]+:[0-9]+\]}}, v[[VAL]]
define void @global_sextload_i8_to_i16(i16 addrspace(1)* %out, i8 addrspace(1)* %in) #0 {
  %a = load i8, i8 addrspace(1)* %in
  %ext = sext i8 %a to i16
  store i16 %ext, i16 addrspace(1)* %out
  ret void
}

; <1 x i8> load from addrspace(1) zero-extended to <1 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v1i8_to_v1i16:
define void @global_zextload_v1i8_to_v1i16(<1 x i16> addrspace(1)* %out, <1 x i8> addrspace(1)* %in) #0 {
  %load = load <1 x i8>, <1 x i8> addrspace(1)* %in
  %ext = zext <1 x i8> %load to <1 x i16>
  store <1 x i16> %ext, <1 x i16> addrspace(1)* %out
  ret void
}

; <1 x i8> load from addrspace(1) sign-extended to <1 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v1i8_to_v1i16:
define void @global_sextload_v1i8_to_v1i16(<1 x i16> addrspace(1)* %out, <1 x i8> addrspace(1)* %in) #0 {
  %load = load <1 x i8>, <1 x i8> addrspace(1)* %in
  %ext = sext <1 x i8> %load to <1 x i16>
  store <1 x i16> %ext, <1 x i16> addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1) zero-extended to <2 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v2i8_to_v2i16:
define void @global_zextload_v2i8_to_v2i16(<2 x i16> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
  %load = load <2 x i8>, <2 x i8> addrspace(1)* %in
  %ext = zext <2 x i8> %load to <2 x i16>
  store <2 x i16> %ext, <2 x i16> addrspace(1)* %out
  ret void
}

; <2 x i8> load from addrspace(1) sign-extended to <2 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v2i8_to_v2i16:
define void @global_sextload_v2i8_to_v2i16(<2 x i16> addrspace(1)* %out, <2 x i8> addrspace(1)* %in) #0 {
  %load = load <2 x i8>, <2 x i8> addrspace(1)* %in
  %ext = sext <2 x i8> %load to <2 x i16>
  store <2 x i16> %ext, <2 x i16> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1) zero-extended to <4 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v4i8_to_v4i16:
define void @global_zextload_v4i8_to_v4i16(<4 x i16> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
  %load = load <4 x i8>, <4 x i8> addrspace(1)* %in
  %ext = zext <4 x i8> %load to <4 x i16>
  store <4 x i16> %ext, <4 x i16> addrspace(1)* %out
  ret void
}

; <4 x i8> load from addrspace(1) sign-extended to <4 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v4i8_to_v4i16:
define void @global_sextload_v4i8_to_v4i16(<4 x i16> addrspace(1)* %out, <4 x i8> addrspace(1)* %in) #0 {
  %load = load <4 x i8>, <4 x i8> addrspace(1)* %in
  %ext = sext <4 x i8> %load to <4 x i16>
  store <4 x i16> %ext, <4 x i16> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1) zero-extended to <8 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v8i8_to_v8i16:
define void @global_zextload_v8i8_to_v8i16(<8 x i16> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
  %load = load <8 x i8>, <8 x i8> addrspace(1)* %in
  %ext = zext <8 x i8> %load to <8 x i16>
  store <8 x i16> %ext, <8 x i16> addrspace(1)* %out
  ret void
}

; <8 x i8> load from addrspace(1) sign-extended to <8 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v8i8_to_v8i16:
define void @global_sextload_v8i8_to_v8i16(<8 x i16> addrspace(1)* %out, <8 x i8> addrspace(1)* %in) #0 {
  %load = load <8 x i8>, <8 x i8> addrspace(1)* %in
  %ext = sext <8 x i8> %load to <8 x i16>
  store <8 x i16> %ext, <8 x i16> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1) zero-extended to <16 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v16i8_to_v16i16:
define void @global_zextload_v16i8_to_v16i16(<16 x i16> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
  %load = load <16 x i8>, <16 x i8> addrspace(1)* %in
  %ext = zext <16 x i8> %load to <16 x i16>
  store <16 x i16> %ext, <16 x i16> addrspace(1)* %out
  ret void
}

; <16 x i8> load from addrspace(1) sign-extended to <16 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v16i8_to_v16i16:
define void @global_sextload_v16i8_to_v16i16(<16 x i16> addrspace(1)* %out, <16 x i8> addrspace(1)* %in) #0 {
  %load = load <16 x i8>, <16 x i8> addrspace(1)* %in
  %ext = sext <16 x i8> %load to <16 x i16>
  store <16 x i16> %ext, <16 x i16> addrspace(1)* %out
  ret void
}

; <32 x i8> load from addrspace(1) zero-extended to <32 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_zextload_v32i8_to_v32i16:
define void @global_zextload_v32i8_to_v32i16(<32 x i16> addrspace(1)* %out, <32 x i8> addrspace(1)* %in) #0 {
  %load = load <32 x i8>, <32 x i8> addrspace(1)* %in
  %ext = zext <32 x i8> %load to <32 x i16>
  store <32 x i16> %ext, <32 x i16> addrspace(1)* %out
  ret void
}

; <32 x i8> load from addrspace(1) sign-extended to <32 x i16>.
; Label-only test: no instruction patterns are checked.
; FUNC-LABEL: {{^}}global_sextload_v32i8_to_v32i16:
define void @global_sextload_v32i8_to_v32i16(<32 x i16> addrspace(1)* %out, <32 x i8> addrspace(1)* %in) #0 {
  %load = load <32 x i8>, <32 x i8> addrspace(1)* %in
  %ext = sext <32 x i8> %load to <32 x i16>
  store <32 x i16> %ext, <32 x i16> addrspace(1)* %out
  ret void
}

; XFUNC-LABEL: {{^}}global_zextload_v64i8_to_v64i16:
; define void @global_zextload_v64i8_to_v64i16(<64 x i16> addrspace(1)* %out, <64 x i8> addrspace(1)* %in) #0 {
;   %load = load <64 x i8>, <64 x i8> addrspace(1)* %in
;   %ext = zext <64 x i8> %load to <64 x i16>
;   store <64 x i16> %ext, <64 x i16> addrspace(1)* %out
;   ret void
; }

; XFUNC-LABEL: {{^}}global_sextload_v64i8_to_v64i16:
; define void @global_sextload_v64i8_to_v64i16(<64 x i16> addrspace(1)* %out, <64 x i8> addrspace(1)* %in) #0 {
;   %load = load <64 x i8>, <64 x i8> addrspace(1)* %in
;   %ext = sext <64 x i8> %load to <64 x i16>
;   store <64 x i16> %ext, <64 x i16> addrspace(1)* %out
;   ret void
; }

; Attribute group referenced as #0 by every function definition in this file.
attributes #0 = { nounwind }