blob: 5e872ab6d0b258a7453e5fe935cc5d7ed7ebd77f [file] [log] [blame]
Bob Wilsonfe27c512009-10-07 23:47:21 +00001; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilson5bafff32009-06-22 23:27:02 +00002
3define <8 x i8> @v_movi8() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +00004;CHECK: v_movi8:
Bob Wilsone45f72c2010-07-02 17:23:44 +00005;CHECK: vmov.i8 d0, #0x8
Bob Wilson5bafff32009-06-22 23:27:02 +00006 ret <8 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 >
7}
8
9define <4 x i16> @v_movi16a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000010;CHECK: v_movi16a:
Bob Wilsone45f72c2010-07-02 17:23:44 +000011;CHECK: vmov.i16 d0, #0x10
Bob Wilson5bafff32009-06-22 23:27:02 +000012 ret <4 x i16> < i16 16, i16 16, i16 16, i16 16 >
13}
14
Bob Wilson5bafff32009-06-22 23:27:02 +000015define <4 x i16> @v_movi16b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000016;CHECK: v_movi16b:
Bob Wilsone45f72c2010-07-02 17:23:44 +000017;CHECK: vmov.i16 d0, #0x1000
Bob Wilson5bafff32009-06-22 23:27:02 +000018 ret <4 x i16> < i16 4096, i16 4096, i16 4096, i16 4096 >
19}
20
Bob Wilson7e3f0d22010-07-14 06:31:50 +000021define <4 x i16> @v_mvni16a() nounwind {
22;CHECK: v_mvni16a:
23;CHECK: vmvn.i16 d0, #0x10
24 ret <4 x i16> < i16 65519, i16 65519, i16 65519, i16 65519 >
25}
26
27define <4 x i16> @v_mvni16b() nounwind {
28;CHECK: v_mvni16b:
29;CHECK: vmvn.i16 d0, #0x1000
30 ret <4 x i16> < i16 61439, i16 61439, i16 61439, i16 61439 >
31}
32
Bob Wilson5bafff32009-06-22 23:27:02 +000033define <2 x i32> @v_movi32a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000034;CHECK: v_movi32a:
Bob Wilsone45f72c2010-07-02 17:23:44 +000035;CHECK: vmov.i32 d0, #0x20
Bob Wilson5bafff32009-06-22 23:27:02 +000036 ret <2 x i32> < i32 32, i32 32 >
37}
38
Bob Wilson5bafff32009-06-22 23:27:02 +000039define <2 x i32> @v_movi32b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000040;CHECK: v_movi32b:
Bob Wilsone45f72c2010-07-02 17:23:44 +000041;CHECK: vmov.i32 d0, #0x2000
Bob Wilson5bafff32009-06-22 23:27:02 +000042 ret <2 x i32> < i32 8192, i32 8192 >
43}
44
Bob Wilson5bafff32009-06-22 23:27:02 +000045define <2 x i32> @v_movi32c() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000046;CHECK: v_movi32c:
Bob Wilsone45f72c2010-07-02 17:23:44 +000047;CHECK: vmov.i32 d0, #0x200000
Bob Wilson5bafff32009-06-22 23:27:02 +000048 ret <2 x i32> < i32 2097152, i32 2097152 >
49}
50
Bob Wilson5bafff32009-06-22 23:27:02 +000051define <2 x i32> @v_movi32d() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000052;CHECK: v_movi32d:
Bob Wilsone45f72c2010-07-02 17:23:44 +000053;CHECK: vmov.i32 d0, #0x20000000
Bob Wilson5bafff32009-06-22 23:27:02 +000054 ret <2 x i32> < i32 536870912, i32 536870912 >
55}
56
Bob Wilson5bafff32009-06-22 23:27:02 +000057define <2 x i32> @v_movi32e() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000058;CHECK: v_movi32e:
Bob Wilsone45f72c2010-07-02 17:23:44 +000059;CHECK: vmov.i32 d0, #0x20FF
Bob Wilson5bafff32009-06-22 23:27:02 +000060 ret <2 x i32> < i32 8447, i32 8447 >
61}
62
Bob Wilson5bafff32009-06-22 23:27:02 +000063define <2 x i32> @v_movi32f() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000064;CHECK: v_movi32f:
Bob Wilsone45f72c2010-07-02 17:23:44 +000065;CHECK: vmov.i32 d0, #0x20FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +000066 ret <2 x i32> < i32 2162687, i32 2162687 >
67}
68
Bob Wilson7e3f0d22010-07-14 06:31:50 +000069define <2 x i32> @v_mvni32a() nounwind {
70;CHECK: v_mvni32a:
71;CHECK: vmvn.i32 d0, #0x20
72 ret <2 x i32> < i32 4294967263, i32 4294967263 >
73}
74
75define <2 x i32> @v_mvni32b() nounwind {
76;CHECK: v_mvni32b:
77;CHECK: vmvn.i32 d0, #0x2000
78 ret <2 x i32> < i32 4294959103, i32 4294959103 >
79}
80
81define <2 x i32> @v_mvni32c() nounwind {
82;CHECK: v_mvni32c:
83;CHECK: vmvn.i32 d0, #0x200000
84 ret <2 x i32> < i32 4292870143, i32 4292870143 >
85}
86
87define <2 x i32> @v_mvni32d() nounwind {
88;CHECK: v_mvni32d:
89;CHECK: vmvn.i32 d0, #0x20000000
90 ret <2 x i32> < i32 3758096383, i32 3758096383 >
91}
92
93define <2 x i32> @v_mvni32e() nounwind {
94;CHECK: v_mvni32e:
95;CHECK: vmvn.i32 d0, #0x20FF
96 ret <2 x i32> < i32 4294958848, i32 4294958848 >
97}
98
99define <2 x i32> @v_mvni32f() nounwind {
100;CHECK: v_mvni32f:
101;CHECK: vmvn.i32 d0, #0x20FFFF
102 ret <2 x i32> < i32 4292804608, i32 4292804608 >
103}
104
Bob Wilson5bafff32009-06-22 23:27:02 +0000105define <1 x i64> @v_movi64() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000106;CHECK: v_movi64:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000107;CHECK: vmov.i64 d0, #0xFF0000FF0000FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +0000108 ret <1 x i64> < i64 18374687574888349695 >
109}
110
111define <16 x i8> @v_movQi8() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000112;CHECK: v_movQi8:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000113;CHECK: vmov.i8 q0, #0x8
Bob Wilson5bafff32009-06-22 23:27:02 +0000114 ret <16 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 >
115}
116
117define <8 x i16> @v_movQi16a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000118;CHECK: v_movQi16a:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000119;CHECK: vmov.i16 q0, #0x10
Bob Wilson5bafff32009-06-22 23:27:02 +0000120 ret <8 x i16> < i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16 >
121}
122
Bob Wilson5bafff32009-06-22 23:27:02 +0000123define <8 x i16> @v_movQi16b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000124;CHECK: v_movQi16b:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000125;CHECK: vmov.i16 q0, #0x1000
Bob Wilson5bafff32009-06-22 23:27:02 +0000126 ret <8 x i16> < i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096 >
127}
128
129define <4 x i32> @v_movQi32a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000130;CHECK: v_movQi32a:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000131;CHECK: vmov.i32 q0, #0x20
Bob Wilson5bafff32009-06-22 23:27:02 +0000132 ret <4 x i32> < i32 32, i32 32, i32 32, i32 32 >
133}
134
Bob Wilson5bafff32009-06-22 23:27:02 +0000135define <4 x i32> @v_movQi32b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000136;CHECK: v_movQi32b:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000137;CHECK: vmov.i32 q0, #0x2000
Bob Wilson5bafff32009-06-22 23:27:02 +0000138 ret <4 x i32> < i32 8192, i32 8192, i32 8192, i32 8192 >
139}
140
Bob Wilson5bafff32009-06-22 23:27:02 +0000141define <4 x i32> @v_movQi32c() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000142;CHECK: v_movQi32c:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000143;CHECK: vmov.i32 q0, #0x200000
Bob Wilson5bafff32009-06-22 23:27:02 +0000144 ret <4 x i32> < i32 2097152, i32 2097152, i32 2097152, i32 2097152 >
145}
146
Bob Wilson5bafff32009-06-22 23:27:02 +0000147define <4 x i32> @v_movQi32d() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000148;CHECK: v_movQi32d:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000149;CHECK: vmov.i32 q0, #0x20000000
Bob Wilson5bafff32009-06-22 23:27:02 +0000150 ret <4 x i32> < i32 536870912, i32 536870912, i32 536870912, i32 536870912 >
151}
152
Bob Wilson5bafff32009-06-22 23:27:02 +0000153define <4 x i32> @v_movQi32e() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000154;CHECK: v_movQi32e:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000155;CHECK: vmov.i32 q0, #0x20FF
Bob Wilson5bafff32009-06-22 23:27:02 +0000156 ret <4 x i32> < i32 8447, i32 8447, i32 8447, i32 8447 >
157}
158
Bob Wilson5bafff32009-06-22 23:27:02 +0000159define <4 x i32> @v_movQi32f() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000160;CHECK: v_movQi32f:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000161;CHECK: vmov.i32 q0, #0x20FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +0000162 ret <4 x i32> < i32 2162687, i32 2162687, i32 2162687, i32 2162687 >
163}
164
Bob Wilson5bafff32009-06-22 23:27:02 +0000165define <2 x i64> @v_movQi64() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000166;CHECK: v_movQi64:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000167;CHECK: vmov.i64 q0, #0xFF0000FF0000FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +0000168 ret <2 x i64> < i64 18374687574888349695, i64 18374687574888349695 >
169}
Bob Wilson83815ae2009-10-09 20:20:54 +0000170
Bob Wilson54c78ef2009-11-06 23:33:28 +0000171; Check for correct assembler printing for immediate values.
172%struct.int8x8_t = type { <8 x i8> }
Rafael Espindola1e819662010-06-17 15:18:27 +0000173define void @vdupn128(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
Bob Wilson54c78ef2009-11-06 23:33:28 +0000174entry:
175;CHECK: vdupn128:
176;CHECK: vmov.i8 d0, #0x80
177 %0 = getelementptr inbounds %struct.int8x8_t* %agg.result, i32 0, i32 0 ; <<8 x i8>*> [#uses=1]
178 store <8 x i8> <i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128>, <8 x i8>* %0, align 8
179 ret void
180}
181
Rafael Espindola1e819662010-06-17 15:18:27 +0000182define void @vdupnneg75(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
Bob Wilson54c78ef2009-11-06 23:33:28 +0000183entry:
184;CHECK: vdupnneg75:
185;CHECK: vmov.i8 d0, #0xB5
186 %0 = getelementptr inbounds %struct.int8x8_t* %agg.result, i32 0, i32 0 ; <<8 x i8>*> [#uses=1]
187 store <8 x i8> <i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75>, <8 x i8>* %0, align 8
188 ret void
189}
190
Bob Wilson83815ae2009-10-09 20:20:54 +0000191define <8 x i16> @vmovls8(<8 x i8>* %A) nounwind {
192;CHECK: vmovls8:
193;CHECK: vmovl.s8
194 %tmp1 = load <8 x i8>* %A
195 %tmp2 = call <8 x i16> @llvm.arm.neon.vmovls.v8i16(<8 x i8> %tmp1)
196 ret <8 x i16> %tmp2
197}
198
199define <4 x i32> @vmovls16(<4 x i16>* %A) nounwind {
200;CHECK: vmovls16:
201;CHECK: vmovl.s16
202 %tmp1 = load <4 x i16>* %A
203 %tmp2 = call <4 x i32> @llvm.arm.neon.vmovls.v4i32(<4 x i16> %tmp1)
204 ret <4 x i32> %tmp2
205}
206
207define <2 x i64> @vmovls32(<2 x i32>* %A) nounwind {
208;CHECK: vmovls32:
209;CHECK: vmovl.s32
210 %tmp1 = load <2 x i32>* %A
211 %tmp2 = call <2 x i64> @llvm.arm.neon.vmovls.v2i64(<2 x i32> %tmp1)
212 ret <2 x i64> %tmp2
213}
214
215define <8 x i16> @vmovlu8(<8 x i8>* %A) nounwind {
216;CHECK: vmovlu8:
217;CHECK: vmovl.u8
218 %tmp1 = load <8 x i8>* %A
219 %tmp2 = call <8 x i16> @llvm.arm.neon.vmovlu.v8i16(<8 x i8> %tmp1)
220 ret <8 x i16> %tmp2
221}
222
223define <4 x i32> @vmovlu16(<4 x i16>* %A) nounwind {
224;CHECK: vmovlu16:
225;CHECK: vmovl.u16
226 %tmp1 = load <4 x i16>* %A
227 %tmp2 = call <4 x i32> @llvm.arm.neon.vmovlu.v4i32(<4 x i16> %tmp1)
228 ret <4 x i32> %tmp2
229}
230
231define <2 x i64> @vmovlu32(<2 x i32>* %A) nounwind {
232;CHECK: vmovlu32:
233;CHECK: vmovl.u32
234 %tmp1 = load <2 x i32>* %A
235 %tmp2 = call <2 x i64> @llvm.arm.neon.vmovlu.v2i64(<2 x i32> %tmp1)
236 ret <2 x i64> %tmp2
237}
238
239declare <8 x i16> @llvm.arm.neon.vmovls.v8i16(<8 x i8>) nounwind readnone
240declare <4 x i32> @llvm.arm.neon.vmovls.v4i32(<4 x i16>) nounwind readnone
241declare <2 x i64> @llvm.arm.neon.vmovls.v2i64(<2 x i32>) nounwind readnone
242
243declare <8 x i16> @llvm.arm.neon.vmovlu.v8i16(<8 x i8>) nounwind readnone
244declare <4 x i32> @llvm.arm.neon.vmovlu.v4i32(<4 x i16>) nounwind readnone
245declare <2 x i64> @llvm.arm.neon.vmovlu.v2i64(<2 x i32>) nounwind readnone
246
247define <8 x i8> @vmovni16(<8 x i16>* %A) nounwind {
248;CHECK: vmovni16:
249;CHECK: vmovn.i16
250 %tmp1 = load <8 x i16>* %A
251 %tmp2 = call <8 x i8> @llvm.arm.neon.vmovn.v8i8(<8 x i16> %tmp1)
252 ret <8 x i8> %tmp2
253}
254
255define <4 x i16> @vmovni32(<4 x i32>* %A) nounwind {
256;CHECK: vmovni32:
257;CHECK: vmovn.i32
258 %tmp1 = load <4 x i32>* %A
259 %tmp2 = call <4 x i16> @llvm.arm.neon.vmovn.v4i16(<4 x i32> %tmp1)
260 ret <4 x i16> %tmp2
261}
262
263define <2 x i32> @vmovni64(<2 x i64>* %A) nounwind {
264;CHECK: vmovni64:
265;CHECK: vmovn.i64
266 %tmp1 = load <2 x i64>* %A
267 %tmp2 = call <2 x i32> @llvm.arm.neon.vmovn.v2i32(<2 x i64> %tmp1)
268 ret <2 x i32> %tmp2
269}
270
271declare <8 x i8> @llvm.arm.neon.vmovn.v8i8(<8 x i16>) nounwind readnone
272declare <4 x i16> @llvm.arm.neon.vmovn.v4i16(<4 x i32>) nounwind readnone
273declare <2 x i32> @llvm.arm.neon.vmovn.v2i32(<2 x i64>) nounwind readnone
274
275define <8 x i8> @vqmovns16(<8 x i16>* %A) nounwind {
276;CHECK: vqmovns16:
277;CHECK: vqmovn.s16
278 %tmp1 = load <8 x i16>* %A
279 %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovns.v8i8(<8 x i16> %tmp1)
280 ret <8 x i8> %tmp2
281}
282
283define <4 x i16> @vqmovns32(<4 x i32>* %A) nounwind {
284;CHECK: vqmovns32:
285;CHECK: vqmovn.s32
286 %tmp1 = load <4 x i32>* %A
287 %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32> %tmp1)
288 ret <4 x i16> %tmp2
289}
290
291define <2 x i32> @vqmovns64(<2 x i64>* %A) nounwind {
292;CHECK: vqmovns64:
293;CHECK: vqmovn.s64
294 %tmp1 = load <2 x i64>* %A
295 %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64> %tmp1)
296 ret <2 x i32> %tmp2
297}
298
299define <8 x i8> @vqmovnu16(<8 x i16>* %A) nounwind {
300;CHECK: vqmovnu16:
301;CHECK: vqmovn.u16
302 %tmp1 = load <8 x i16>* %A
303 %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnu.v8i8(<8 x i16> %tmp1)
304 ret <8 x i8> %tmp2
305}
306
307define <4 x i16> @vqmovnu32(<4 x i32>* %A) nounwind {
308;CHECK: vqmovnu32:
309;CHECK: vqmovn.u32
310 %tmp1 = load <4 x i32>* %A
311 %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32> %tmp1)
312 ret <4 x i16> %tmp2
313}
314
315define <2 x i32> @vqmovnu64(<2 x i64>* %A) nounwind {
316;CHECK: vqmovnu64:
317;CHECK: vqmovn.u64
318 %tmp1 = load <2 x i64>* %A
319 %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64> %tmp1)
320 ret <2 x i32> %tmp2
321}
322
323define <8 x i8> @vqmovuns16(<8 x i16>* %A) nounwind {
324;CHECK: vqmovuns16:
325;CHECK: vqmovun.s16
326 %tmp1 = load <8 x i16>* %A
327 %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16> %tmp1)
328 ret <8 x i8> %tmp2
329}
330
331define <4 x i16> @vqmovuns32(<4 x i32>* %A) nounwind {
332;CHECK: vqmovuns32:
333;CHECK: vqmovun.s32
334 %tmp1 = load <4 x i32>* %A
335 %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32> %tmp1)
336 ret <4 x i16> %tmp2
337}
338
339define <2 x i32> @vqmovuns64(<2 x i64>* %A) nounwind {
340;CHECK: vqmovuns64:
341;CHECK: vqmovun.s64
342 %tmp1 = load <2 x i64>* %A
343 %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64> %tmp1)
344 ret <2 x i32> %tmp2
345}
346
347declare <8 x i8> @llvm.arm.neon.vqmovns.v8i8(<8 x i16>) nounwind readnone
348declare <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32>) nounwind readnone
349declare <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64>) nounwind readnone
350
351declare <8 x i8> @llvm.arm.neon.vqmovnu.v8i8(<8 x i16>) nounwind readnone
352declare <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32>) nounwind readnone
353declare <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64>) nounwind readnone
354
355declare <8 x i8> @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16>) nounwind readnone
356declare <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32>) nounwind readnone
357declare <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64>) nounwind readnone