blob: 48fd388e9a4cebcc2d5ba03c94bc617884653a20 [file] [log] [blame]
Bob Wilsone76c5942009-10-08 23:33:03 +00001; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilsone60fee02009-06-22 23:27:02 +00002
3define <8 x i8> @vrshls8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +00004;CHECK: vrshls8:
5;CHECK: vrshl.s8
Bob Wilsone60fee02009-06-22 23:27:02 +00006 %tmp1 = load <8 x i8>* %A
7 %tmp2 = load <8 x i8>* %B
8 %tmp3 = call <8 x i8> @llvm.arm.neon.vrshifts.v8i8(<8 x i8> %tmp1, <8 x i8> %tmp2)
9 ret <8 x i8> %tmp3
10}
11
12define <4 x i16> @vrshls16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000013;CHECK: vrshls16:
14;CHECK: vrshl.s16
Bob Wilsone60fee02009-06-22 23:27:02 +000015 %tmp1 = load <4 x i16>* %A
16 %tmp2 = load <4 x i16>* %B
17 %tmp3 = call <4 x i16> @llvm.arm.neon.vrshifts.v4i16(<4 x i16> %tmp1, <4 x i16> %tmp2)
18 ret <4 x i16> %tmp3
19}
20
21define <2 x i32> @vrshls32(<2 x i32>* %A, <2 x i32>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000022;CHECK: vrshls32:
23;CHECK: vrshl.s32
Bob Wilsone60fee02009-06-22 23:27:02 +000024 %tmp1 = load <2 x i32>* %A
25 %tmp2 = load <2 x i32>* %B
26 %tmp3 = call <2 x i32> @llvm.arm.neon.vrshifts.v2i32(<2 x i32> %tmp1, <2 x i32> %tmp2)
27 ret <2 x i32> %tmp3
28}
29
30define <1 x i64> @vrshls64(<1 x i64>* %A, <1 x i64>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000031;CHECK: vrshls64:
32;CHECK: vrshl.s64
Bob Wilsone60fee02009-06-22 23:27:02 +000033 %tmp1 = load <1 x i64>* %A
34 %tmp2 = load <1 x i64>* %B
35 %tmp3 = call <1 x i64> @llvm.arm.neon.vrshifts.v1i64(<1 x i64> %tmp1, <1 x i64> %tmp2)
36 ret <1 x i64> %tmp3
37}
38
39define <8 x i8> @vrshlu8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000040;CHECK: vrshlu8:
41;CHECK: vrshl.u8
Bob Wilsone60fee02009-06-22 23:27:02 +000042 %tmp1 = load <8 x i8>* %A
43 %tmp2 = load <8 x i8>* %B
44 %tmp3 = call <8 x i8> @llvm.arm.neon.vrshiftu.v8i8(<8 x i8> %tmp1, <8 x i8> %tmp2)
45 ret <8 x i8> %tmp3
46}
47
48define <4 x i16> @vrshlu16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000049;CHECK: vrshlu16:
50;CHECK: vrshl.u16
Bob Wilsone60fee02009-06-22 23:27:02 +000051 %tmp1 = load <4 x i16>* %A
52 %tmp2 = load <4 x i16>* %B
53 %tmp3 = call <4 x i16> @llvm.arm.neon.vrshiftu.v4i16(<4 x i16> %tmp1, <4 x i16> %tmp2)
54 ret <4 x i16> %tmp3
55}
56
57define <2 x i32> @vrshlu32(<2 x i32>* %A, <2 x i32>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000058;CHECK: vrshlu32:
59;CHECK: vrshl.u32
Bob Wilsone60fee02009-06-22 23:27:02 +000060 %tmp1 = load <2 x i32>* %A
61 %tmp2 = load <2 x i32>* %B
62 %tmp3 = call <2 x i32> @llvm.arm.neon.vrshiftu.v2i32(<2 x i32> %tmp1, <2 x i32> %tmp2)
63 ret <2 x i32> %tmp3
64}
65
66define <1 x i64> @vrshlu64(<1 x i64>* %A, <1 x i64>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000067;CHECK: vrshlu64:
68;CHECK: vrshl.u64
Bob Wilsone60fee02009-06-22 23:27:02 +000069 %tmp1 = load <1 x i64>* %A
70 %tmp2 = load <1 x i64>* %B
71 %tmp3 = call <1 x i64> @llvm.arm.neon.vrshiftu.v1i64(<1 x i64> %tmp1, <1 x i64> %tmp2)
72 ret <1 x i64> %tmp3
73}
74
75define <16 x i8> @vrshlQs8(<16 x i8>* %A, <16 x i8>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000076;CHECK: vrshlQs8:
77;CHECK: vrshl.s8
Bob Wilsone60fee02009-06-22 23:27:02 +000078 %tmp1 = load <16 x i8>* %A
79 %tmp2 = load <16 x i8>* %B
80 %tmp3 = call <16 x i8> @llvm.arm.neon.vrshifts.v16i8(<16 x i8> %tmp1, <16 x i8> %tmp2)
81 ret <16 x i8> %tmp3
82}
83
84define <8 x i16> @vrshlQs16(<8 x i16>* %A, <8 x i16>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000085;CHECK: vrshlQs16:
86;CHECK: vrshl.s16
Bob Wilsone60fee02009-06-22 23:27:02 +000087 %tmp1 = load <8 x i16>* %A
88 %tmp2 = load <8 x i16>* %B
89 %tmp3 = call <8 x i16> @llvm.arm.neon.vrshifts.v8i16(<8 x i16> %tmp1, <8 x i16> %tmp2)
90 ret <8 x i16> %tmp3
91}
92
93define <4 x i32> @vrshlQs32(<4 x i32>* %A, <4 x i32>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +000094;CHECK: vrshlQs32:
95;CHECK: vrshl.s32
Bob Wilsone60fee02009-06-22 23:27:02 +000096 %tmp1 = load <4 x i32>* %A
97 %tmp2 = load <4 x i32>* %B
98 %tmp3 = call <4 x i32> @llvm.arm.neon.vrshifts.v4i32(<4 x i32> %tmp1, <4 x i32> %tmp2)
99 ret <4 x i32> %tmp3
100}
101
102define <2 x i64> @vrshlQs64(<2 x i64>* %A, <2 x i64>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000103;CHECK: vrshlQs64:
104;CHECK: vrshl.s64
Bob Wilsone60fee02009-06-22 23:27:02 +0000105 %tmp1 = load <2 x i64>* %A
106 %tmp2 = load <2 x i64>* %B
107 %tmp3 = call <2 x i64> @llvm.arm.neon.vrshifts.v2i64(<2 x i64> %tmp1, <2 x i64> %tmp2)
108 ret <2 x i64> %tmp3
109}
110
111define <16 x i8> @vrshlQu8(<16 x i8>* %A, <16 x i8>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000112;CHECK: vrshlQu8:
113;CHECK: vrshl.u8
Bob Wilsone60fee02009-06-22 23:27:02 +0000114 %tmp1 = load <16 x i8>* %A
115 %tmp2 = load <16 x i8>* %B
116 %tmp3 = call <16 x i8> @llvm.arm.neon.vrshiftu.v16i8(<16 x i8> %tmp1, <16 x i8> %tmp2)
117 ret <16 x i8> %tmp3
118}
119
120define <8 x i16> @vrshlQu16(<8 x i16>* %A, <8 x i16>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000121;CHECK: vrshlQu16:
122;CHECK: vrshl.u16
Bob Wilsone60fee02009-06-22 23:27:02 +0000123 %tmp1 = load <8 x i16>* %A
124 %tmp2 = load <8 x i16>* %B
125 %tmp3 = call <8 x i16> @llvm.arm.neon.vrshiftu.v8i16(<8 x i16> %tmp1, <8 x i16> %tmp2)
126 ret <8 x i16> %tmp3
127}
128
129define <4 x i32> @vrshlQu32(<4 x i32>* %A, <4 x i32>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000130;CHECK: vrshlQu32:
131;CHECK: vrshl.u32
Bob Wilsone60fee02009-06-22 23:27:02 +0000132 %tmp1 = load <4 x i32>* %A
133 %tmp2 = load <4 x i32>* %B
134 %tmp3 = call <4 x i32> @llvm.arm.neon.vrshiftu.v4i32(<4 x i32> %tmp1, <4 x i32> %tmp2)
135 ret <4 x i32> %tmp3
136}
137
138define <2 x i64> @vrshlQu64(<2 x i64>* %A, <2 x i64>* %B) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000139;CHECK: vrshlQu64:
140;CHECK: vrshl.u64
Bob Wilsone60fee02009-06-22 23:27:02 +0000141 %tmp1 = load <2 x i64>* %A
142 %tmp2 = load <2 x i64>* %B
143 %tmp3 = call <2 x i64> @llvm.arm.neon.vrshiftu.v2i64(<2 x i64> %tmp1, <2 x i64> %tmp2)
144 ret <2 x i64> %tmp3
145}
146
147define <8 x i8> @vrshrs8(<8 x i8>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000148;CHECK: vrshrs8:
149;CHECK: vrshr.s8
Bob Wilsone60fee02009-06-22 23:27:02 +0000150 %tmp1 = load <8 x i8>* %A
151 %tmp2 = call <8 x i8> @llvm.arm.neon.vrshifts.v8i8(<8 x i8> %tmp1, <8 x i8> < i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8 >)
152 ret <8 x i8> %tmp2
153}
154
155define <4 x i16> @vrshrs16(<4 x i16>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000156;CHECK: vrshrs16:
157;CHECK: vrshr.s16
Bob Wilsone60fee02009-06-22 23:27:02 +0000158 %tmp1 = load <4 x i16>* %A
159 %tmp2 = call <4 x i16> @llvm.arm.neon.vrshifts.v4i16(<4 x i16> %tmp1, <4 x i16> < i16 -16, i16 -16, i16 -16, i16 -16 >)
160 ret <4 x i16> %tmp2
161}
162
163define <2 x i32> @vrshrs32(<2 x i32>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000164;CHECK: vrshrs32:
165;CHECK: vrshr.s32
Bob Wilsone60fee02009-06-22 23:27:02 +0000166 %tmp1 = load <2 x i32>* %A
167 %tmp2 = call <2 x i32> @llvm.arm.neon.vrshifts.v2i32(<2 x i32> %tmp1, <2 x i32> < i32 -32, i32 -32 >)
168 ret <2 x i32> %tmp2
169}
170
171define <1 x i64> @vrshrs64(<1 x i64>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000172;CHECK: vrshrs64:
173;CHECK: vrshr.s64
Bob Wilsone60fee02009-06-22 23:27:02 +0000174 %tmp1 = load <1 x i64>* %A
175 %tmp2 = call <1 x i64> @llvm.arm.neon.vrshifts.v1i64(<1 x i64> %tmp1, <1 x i64> < i64 -64 >)
176 ret <1 x i64> %tmp2
177}
178
179define <8 x i8> @vrshru8(<8 x i8>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000180;CHECK: vrshru8:
181;CHECK: vrshr.u8
Bob Wilsone60fee02009-06-22 23:27:02 +0000182 %tmp1 = load <8 x i8>* %A
183 %tmp2 = call <8 x i8> @llvm.arm.neon.vrshiftu.v8i8(<8 x i8> %tmp1, <8 x i8> < i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8 >)
184 ret <8 x i8> %tmp2
185}
186
187define <4 x i16> @vrshru16(<4 x i16>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000188;CHECK: vrshru16:
189;CHECK: vrshr.u16
Bob Wilsone60fee02009-06-22 23:27:02 +0000190 %tmp1 = load <4 x i16>* %A
191 %tmp2 = call <4 x i16> @llvm.arm.neon.vrshiftu.v4i16(<4 x i16> %tmp1, <4 x i16> < i16 -16, i16 -16, i16 -16, i16 -16 >)
192 ret <4 x i16> %tmp2
193}
194
195define <2 x i32> @vrshru32(<2 x i32>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000196;CHECK: vrshru32:
197;CHECK: vrshr.u32
Bob Wilsone60fee02009-06-22 23:27:02 +0000198 %tmp1 = load <2 x i32>* %A
199 %tmp2 = call <2 x i32> @llvm.arm.neon.vrshiftu.v2i32(<2 x i32> %tmp1, <2 x i32> < i32 -32, i32 -32 >)
200 ret <2 x i32> %tmp2
201}
202
203define <1 x i64> @vrshru64(<1 x i64>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000204;CHECK: vrshru64:
205;CHECK: vrshr.u64
Bob Wilsone60fee02009-06-22 23:27:02 +0000206 %tmp1 = load <1 x i64>* %A
207 %tmp2 = call <1 x i64> @llvm.arm.neon.vrshiftu.v1i64(<1 x i64> %tmp1, <1 x i64> < i64 -64 >)
208 ret <1 x i64> %tmp2
209}
210
211define <16 x i8> @vrshrQs8(<16 x i8>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000212;CHECK: vrshrQs8:
213;CHECK: vrshr.s8
Bob Wilsone60fee02009-06-22 23:27:02 +0000214 %tmp1 = load <16 x i8>* %A
215 %tmp2 = call <16 x i8> @llvm.arm.neon.vrshifts.v16i8(<16 x i8> %tmp1, <16 x i8> < i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8 >)
216 ret <16 x i8> %tmp2
217}
218
219define <8 x i16> @vrshrQs16(<8 x i16>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000220;CHECK: vrshrQs16:
221;CHECK: vrshr.s16
Bob Wilsone60fee02009-06-22 23:27:02 +0000222 %tmp1 = load <8 x i16>* %A
223 %tmp2 = call <8 x i16> @llvm.arm.neon.vrshifts.v8i16(<8 x i16> %tmp1, <8 x i16> < i16 -16, i16 -16, i16 -16, i16 -16, i16 -16, i16 -16, i16 -16, i16 -16 >)
224 ret <8 x i16> %tmp2
225}
226
227define <4 x i32> @vrshrQs32(<4 x i32>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000228;CHECK: vrshrQs32:
229;CHECK: vrshr.s32
Bob Wilsone60fee02009-06-22 23:27:02 +0000230 %tmp1 = load <4 x i32>* %A
231 %tmp2 = call <4 x i32> @llvm.arm.neon.vrshifts.v4i32(<4 x i32> %tmp1, <4 x i32> < i32 -32, i32 -32, i32 -32, i32 -32 >)
232 ret <4 x i32> %tmp2
233}
234
235define <2 x i64> @vrshrQs64(<2 x i64>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000236;CHECK: vrshrQs64:
237;CHECK: vrshr.s64
Bob Wilsone60fee02009-06-22 23:27:02 +0000238 %tmp1 = load <2 x i64>* %A
239 %tmp2 = call <2 x i64> @llvm.arm.neon.vrshifts.v2i64(<2 x i64> %tmp1, <2 x i64> < i64 -64, i64 -64 >)
240 ret <2 x i64> %tmp2
241}
242
243define <16 x i8> @vrshrQu8(<16 x i8>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000244;CHECK: vrshrQu8:
245;CHECK: vrshr.u8
Bob Wilsone60fee02009-06-22 23:27:02 +0000246 %tmp1 = load <16 x i8>* %A
247 %tmp2 = call <16 x i8> @llvm.arm.neon.vrshiftu.v16i8(<16 x i8> %tmp1, <16 x i8> < i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8, i8 -8 >)
248 ret <16 x i8> %tmp2
249}
250
251define <8 x i16> @vrshrQu16(<8 x i16>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000252;CHECK: vrshrQu16:
253;CHECK: vrshr.u16
Bob Wilsone60fee02009-06-22 23:27:02 +0000254 %tmp1 = load <8 x i16>* %A
255 %tmp2 = call <8 x i16> @llvm.arm.neon.vrshiftu.v8i16(<8 x i16> %tmp1, <8 x i16> < i16 -16, i16 -16, i16 -16, i16 -16, i16 -16, i16 -16, i16 -16, i16 -16 >)
256 ret <8 x i16> %tmp2
257}
258
259define <4 x i32> @vrshrQu32(<4 x i32>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000260;CHECK: vrshrQu32:
261;CHECK: vrshr.u32
Bob Wilsone60fee02009-06-22 23:27:02 +0000262 %tmp1 = load <4 x i32>* %A
263 %tmp2 = call <4 x i32> @llvm.arm.neon.vrshiftu.v4i32(<4 x i32> %tmp1, <4 x i32> < i32 -32, i32 -32, i32 -32, i32 -32 >)
264 ret <4 x i32> %tmp2
265}
266
267define <2 x i64> @vrshrQu64(<2 x i64>* %A) nounwind {
Bob Wilsone76c5942009-10-08 23:33:03 +0000268;CHECK: vrshrQu64:
269;CHECK: vrshr.u64
Bob Wilsone60fee02009-06-22 23:27:02 +0000270 %tmp1 = load <2 x i64>* %A
271 %tmp2 = call <2 x i64> @llvm.arm.neon.vrshiftu.v2i64(<2 x i64> %tmp1, <2 x i64> < i64 -64, i64 -64 >)
272 ret <2 x i64> %tmp2
273}
274
275declare <8 x i8> @llvm.arm.neon.vrshifts.v8i8(<8 x i8>, <8 x i8>) nounwind readnone
276declare <4 x i16> @llvm.arm.neon.vrshifts.v4i16(<4 x i16>, <4 x i16>) nounwind readnone
277declare <2 x i32> @llvm.arm.neon.vrshifts.v2i32(<2 x i32>, <2 x i32>) nounwind readnone
278declare <1 x i64> @llvm.arm.neon.vrshifts.v1i64(<1 x i64>, <1 x i64>) nounwind readnone
279
280declare <8 x i8> @llvm.arm.neon.vrshiftu.v8i8(<8 x i8>, <8 x i8>) nounwind readnone
281declare <4 x i16> @llvm.arm.neon.vrshiftu.v4i16(<4 x i16>, <4 x i16>) nounwind readnone
282declare <2 x i32> @llvm.arm.neon.vrshiftu.v2i32(<2 x i32>, <2 x i32>) nounwind readnone
283declare <1 x i64> @llvm.arm.neon.vrshiftu.v1i64(<1 x i64>, <1 x i64>) nounwind readnone
284
285declare <16 x i8> @llvm.arm.neon.vrshifts.v16i8(<16 x i8>, <16 x i8>) nounwind readnone
286declare <8 x i16> @llvm.arm.neon.vrshifts.v8i16(<8 x i16>, <8 x i16>) nounwind readnone
287declare <4 x i32> @llvm.arm.neon.vrshifts.v4i32(<4 x i32>, <4 x i32>) nounwind readnone
288declare <2 x i64> @llvm.arm.neon.vrshifts.v2i64(<2 x i64>, <2 x i64>) nounwind readnone
289
290declare <16 x i8> @llvm.arm.neon.vrshiftu.v16i8(<16 x i8>, <16 x i8>) nounwind readnone
291declare <8 x i16> @llvm.arm.neon.vrshiftu.v8i16(<8 x i16>, <8 x i16>) nounwind readnone
292declare <4 x i32> @llvm.arm.neon.vrshiftu.v4i32(<4 x i32>, <4 x i32>) nounwind readnone
293declare <2 x i64> @llvm.arm.neon.vrshiftu.v2i64(<2 x i64>, <2 x i64>) nounwind readnone