blob: dc056e0ecdd5c149ed9340af2d3b67f79d1d3355 [file] [log] [blame]
; RUN: llc -march=r600 -mcpu=cypress < %s | FileCheck -check-prefix=EG -check-prefix=FUNC %s
; RUN: llc -march=r600 -mcpu=SI -verify-machineinstrs< %s | FileCheck -check-prefix=SI -check-prefix=FUNC %s
Matt Arsenault00a0d6f2013-11-13 02:39:07 +00003
; Reinterprets %src as a pointer to i32 in addrspace(1), loads one i32 with
; align 1, and stores the same 32 bits to %out viewed as <4 x i8>, again with
; align 1. The cypress checks below expect an AND_INT and the literal 255.
; NOTE(review): the mask presumably comes from byte-wise handling of the
; under-aligned access; confirm against the backend lowering.
; FUNC-LABEL: @anyext_load_i8:
; EG: AND_INT
; EG: 255
define void @anyext_load_i8(i8 addrspace(1)* nocapture noalias %out, i8 addrspace(1)* nocapture noalias %src) nounwind {
  %src.word = bitcast i8 addrspace(1)* %src to i32 addrspace(1)*
  %word = load i32 addrspace(1)* %src.word, align 1
  %bytes = bitcast i32 %word to <4 x i8>
  %out.vec = bitcast i8 addrspace(1)* %out to <4 x i8> addrspace(1)*
  store <4 x i8> %bytes, <4 x i8> addrspace(1)* %out.vec, align 1
  ret void
}
15
; Reinterprets %src as a pointer to i32 in addrspace(1), loads one i32 with
; align 1, and stores the same 32 bits to %out viewed as <2 x i16>, again with
; align 1. The cypress checks below expect two AND_INT instructions plus the
; literals 65535 and -65536, the latter two in either order.
; NOTE(review): the two masks presumably select the low and high halfwords;
; confirm against the backend lowering.
; FUNC-LABEL: @anyext_load_i16:
; EG: AND_INT
; EG: AND_INT
; EG-DAG: 65535
; EG-DAG: -65536
define void @anyext_load_i16(i16 addrspace(1)* nocapture noalias %out, i16 addrspace(1)* nocapture noalias %src) nounwind {
  %src.word = bitcast i16 addrspace(1)* %src to i32 addrspace(1)*
  %word = load i32 addrspace(1)* %src.word, align 1
  %halves = bitcast i32 %word to <2 x i16>
  %out.vec = bitcast i16 addrspace(1)* %out to <2 x i16> addrspace(1)*
  store <2 x i16> %halves, <2 x i16> addrspace(1)* %out.vec, align 1
  ret void
}
29
; Same shape as an i32 load / <4 x i8> store pair, but both pointers live in
; addrspace(3) (the "lds" of the test name): %src is reinterpreted as a
; pointer to i32, one i32 is loaded with align 1, and the same 32 bits are
; stored to %out viewed as <4 x i8> with align 1.
; The cypress checks below expect an AND_INT and the literal 255.
; FUNC-LABEL: @anyext_load_lds_i8:
; EG: AND_INT
; EG: 255
define void @anyext_load_lds_i8(i8 addrspace(3)* nocapture noalias %out, i8 addrspace(3)* nocapture noalias %src) nounwind {
  %src.word = bitcast i8 addrspace(3)* %src to i32 addrspace(3)*
  %word = load i32 addrspace(3)* %src.word, align 1
  %bytes = bitcast i32 %word to <4 x i8>
  %out.vec = bitcast i8 addrspace(3)* %out to <4 x i8> addrspace(3)*
  store <4 x i8> %bytes, <4 x i8> addrspace(3)* %out.vec, align 1
  ret void
}
41
; Both pointers live in addrspace(3) (the "lds" of the test name): %src is
; reinterpreted as a pointer to i32, one i32 is loaded with align 1, and the
; same 32 bits are stored to %out viewed as <2 x i16> with align 1.
; The cypress checks below expect two AND_INT instructions plus the literals
; 65535 and -65536, the latter two in either order.
; FUNC-LABEL: @anyext_load_lds_i16:
; EG: AND_INT
; EG: AND_INT
; EG-DAG: 65535
; EG-DAG: -65536
define void @anyext_load_lds_i16(i16 addrspace(3)* nocapture noalias %out, i16 addrspace(3)* nocapture noalias %src) nounwind {
  %src.word = bitcast i16 addrspace(3)* %src to i32 addrspace(3)*
  %word = load i32 addrspace(3)* %src.word, align 1
  %halves = bitcast i32 %word to <2 x i16>
  %out.vec = bitcast i16 addrspace(3)* %out to <2 x i16> addrspace(3)*
  store <2 x i16> %halves, <2 x i16> addrspace(3)* %out.vec, align 1
  ret void
}
Matt Arsenaultf9a995d2014-03-06 17:34:12 +000055
; Loads an i8 from %in (addrspace(1), align 8 as written), sign-extends it to
; i64, and stores the result to %out.
; The Southern Islands checks below expect a BUFFER_LOAD_SBYTE into a
; v-register, a V_ASHRREV_I32_e32 by 31 of that same register, and then a
; BUFFER_STORE_DWORDX2.
; NOTE(review): the shift presumably materializes the high 32 bits of the
; extended value; confirm.
; FUNC-LABEL: @sextload_global_i8_to_i64
; SI: BUFFER_LOAD_SBYTE [[LOAD:v[0-9]+]],
; SI: V_ASHRREV_I32_e32 v{{[0-9]+}}, 31, [[LOAD]]
; SI: BUFFER_STORE_DWORDX2
define void @sextload_global_i8_to_i64(i64 addrspace(1)* %out, i8 addrspace(1)* %in) nounwind {
  %narrow = load i8 addrspace(1)* %in, align 8
  %wide = sext i8 %narrow to i64
  store i64 %wide, i64 addrspace(1)* %out, align 8
  ret void
}
66
; Loads an i16 from %in (addrspace(1), align 8 as written), sign-extends it to
; i64, and stores the result to %out.
; The Southern Islands checks below expect a BUFFER_LOAD_SSHORT into a
; v-register, a V_ASHRREV_I32_e32 by 31 of that same register, and then a
; BUFFER_STORE_DWORDX2.
; NOTE(review): the shift presumably materializes the high 32 bits of the
; extended value; confirm.
; FUNC-LABEL: @sextload_global_i16_to_i64
; SI: BUFFER_LOAD_SSHORT [[LOAD:v[0-9]+]],
; SI: V_ASHRREV_I32_e32 v{{[0-9]+}}, 31, [[LOAD]]
; SI: BUFFER_STORE_DWORDX2
define void @sextload_global_i16_to_i64(i64 addrspace(1)* %out, i16 addrspace(1)* %in) nounwind {
  %narrow = load i16 addrspace(1)* %in, align 8
  %wide = sext i16 %narrow to i64
  store i64 %wide, i64 addrspace(1)* %out, align 8
  ret void
}
77
; Loads an i32 from %in (addrspace(1), align 8 as written), sign-extends it to
; i64, and stores the result to %out.
; The Southern Islands checks below expect a BUFFER_LOAD_DWORD into a
; v-register, a V_ASHRREV_I32_e32 by 31 of that same register, and then a
; BUFFER_STORE_DWORDX2.
; NOTE(review): the shift presumably materializes the high 32 bits of the
; extended value; confirm.
; FUNC-LABEL: @sextload_global_i32_to_i64
; SI: BUFFER_LOAD_DWORD [[LOAD:v[0-9]+]],
; SI: V_ASHRREV_I32_e32 v{{[0-9]+}}, 31, [[LOAD]]
; SI: BUFFER_STORE_DWORDX2
define void @sextload_global_i32_to_i64(i64 addrspace(1)* %out, i32 addrspace(1)* %in) nounwind {
  %narrow = load i32 addrspace(1)* %in, align 8
  %wide = sext i32 %narrow to i64
  store i64 %wide, i64 addrspace(1)* %out, align 8
  ret void
}
88
; Loads an i8 from %in (addrspace(1), align 8 as written), zero-extends it to
; i64, and stores the result to %out.
; The Southern Islands checks below expect, in order, an S_MOV_B32 of 0 into
; an s-register, a BUFFER_LOAD_UBYTE, a V_MOV_B32_e32 copying that s-register
; into a v-register, and a BUFFER_STORE_DWORDX2. The load destination is
; captured as LOAD but no later check refers to it.
; FUNC-LABEL: @zextload_global_i8_to_i64
; SI: S_MOV_B32 [[ZERO:s[0-9]+]], 0
; SI: BUFFER_LOAD_UBYTE [[LOAD:v[0-9]+]],
; SI: V_MOV_B32_e32 {{v[0-9]+}}, [[ZERO]]
; SI: BUFFER_STORE_DWORDX2
define void @zextload_global_i8_to_i64(i64 addrspace(1)* %out, i8 addrspace(1)* %in) nounwind {
  %narrow = load i8 addrspace(1)* %in, align 8
  %wide = zext i8 %narrow to i64
  store i64 %wide, i64 addrspace(1)* %out, align 8
  ret void
}
100
; Loads an i16 from %in (addrspace(1), align 8 as written), zero-extends it to
; i64, and stores the result to %out.
; The Southern Islands checks below expect, in order, an S_MOV_B32 of 0 into
; an s-register, a BUFFER_LOAD_USHORT, a V_MOV_B32_e32 copying that s-register
; into a v-register, and a BUFFER_STORE_DWORDX2. The load destination is
; captured as LOAD but no later check refers to it.
; FUNC-LABEL: @zextload_global_i16_to_i64
; SI: S_MOV_B32 [[ZERO:s[0-9]+]], 0
; SI: BUFFER_LOAD_USHORT [[LOAD:v[0-9]+]],
; SI: V_MOV_B32_e32 {{v[0-9]+}}, [[ZERO]]
; SI: BUFFER_STORE_DWORDX2
define void @zextload_global_i16_to_i64(i64 addrspace(1)* %out, i16 addrspace(1)* %in) nounwind {
  %narrow = load i16 addrspace(1)* %in, align 8
  %wide = zext i16 %narrow to i64
  store i64 %wide, i64 addrspace(1)* %out, align 8
  ret void
}
112
; Loads an i32 from %in (addrspace(1), align 8 as written), zero-extends it to
; i64, and stores the result to %out.
; The Southern Islands checks below expect, in order, an S_MOV_B32 of 0 into
; an s-register, a BUFFER_LOAD_DWORD, a V_MOV_B32_e32 copying that s-register
; into a v-register, and a BUFFER_STORE_DWORDX2. The load destination is
; captured as LOAD but no later check refers to it.
; FUNC-LABEL: @zextload_global_i32_to_i64
; SI: S_MOV_B32 [[ZERO:s[0-9]+]], 0
; SI: BUFFER_LOAD_DWORD [[LOAD:v[0-9]+]],
; SI: V_MOV_B32_e32 {{v[0-9]+}}, [[ZERO]]
; SI: BUFFER_STORE_DWORDX2
define void @zextload_global_i32_to_i64(i64 addrspace(1)* %out, i32 addrspace(1)* %in) nounwind {
  %narrow = load i32 addrspace(1)* %in, align 8
  %wide = zext i32 %narrow to i64
  store i64 %wide, i64 addrspace(1)* %out, align 8
  ret void
}