blob: f80301863d7b9aa17e813a19801886c92cc21dbd [file] [log] [blame]
Bob Wilsonfe27c512009-10-07 23:47:21 +00001; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilson5bafff32009-06-22 23:27:02 +00002
3define <8 x i8> @v_movi8() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +00004;CHECK: v_movi8:
Bob Wilsone45f72c2010-07-02 17:23:44 +00005;CHECK: vmov.i8 d0, #0x8
Bob Wilson5bafff32009-06-22 23:27:02 +00006 ret <8 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 >
7}
8
9define <4 x i16> @v_movi16a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000010;CHECK: v_movi16a:
Bob Wilsone45f72c2010-07-02 17:23:44 +000011;CHECK: vmov.i16 d0, #0x10
Bob Wilson5bafff32009-06-22 23:27:02 +000012 ret <4 x i16> < i16 16, i16 16, i16 16, i16 16 >
13}
14
Bob Wilson5bafff32009-06-22 23:27:02 +000015define <4 x i16> @v_movi16b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000016;CHECK: v_movi16b:
Bob Wilsone45f72c2010-07-02 17:23:44 +000017;CHECK: vmov.i16 d0, #0x1000
Bob Wilson5bafff32009-06-22 23:27:02 +000018 ret <4 x i16> < i16 4096, i16 4096, i16 4096, i16 4096 >
19}
20
21define <2 x i32> @v_movi32a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000022;CHECK: v_movi32a:
Bob Wilsone45f72c2010-07-02 17:23:44 +000023;CHECK: vmov.i32 d0, #0x20
Bob Wilson5bafff32009-06-22 23:27:02 +000024 ret <2 x i32> < i32 32, i32 32 >
25}
26
Bob Wilson5bafff32009-06-22 23:27:02 +000027define <2 x i32> @v_movi32b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000028;CHECK: v_movi32b:
Bob Wilsone45f72c2010-07-02 17:23:44 +000029;CHECK: vmov.i32 d0, #0x2000
Bob Wilson5bafff32009-06-22 23:27:02 +000030 ret <2 x i32> < i32 8192, i32 8192 >
31}
32
Bob Wilson5bafff32009-06-22 23:27:02 +000033define <2 x i32> @v_movi32c() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000034;CHECK: v_movi32c:
Bob Wilsone45f72c2010-07-02 17:23:44 +000035;CHECK: vmov.i32 d0, #0x200000
Bob Wilson5bafff32009-06-22 23:27:02 +000036 ret <2 x i32> < i32 2097152, i32 2097152 >
37}
38
Bob Wilson5bafff32009-06-22 23:27:02 +000039define <2 x i32> @v_movi32d() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000040;CHECK: v_movi32d:
Bob Wilsone45f72c2010-07-02 17:23:44 +000041;CHECK: vmov.i32 d0, #0x20000000
Bob Wilson5bafff32009-06-22 23:27:02 +000042 ret <2 x i32> < i32 536870912, i32 536870912 >
43}
44
Bob Wilson5bafff32009-06-22 23:27:02 +000045define <2 x i32> @v_movi32e() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000046;CHECK: v_movi32e:
Bob Wilsone45f72c2010-07-02 17:23:44 +000047;CHECK: vmov.i32 d0, #0x20FF
Bob Wilson5bafff32009-06-22 23:27:02 +000048 ret <2 x i32> < i32 8447, i32 8447 >
49}
50
Bob Wilson5bafff32009-06-22 23:27:02 +000051define <2 x i32> @v_movi32f() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000052;CHECK: v_movi32f:
Bob Wilsone45f72c2010-07-02 17:23:44 +000053;CHECK: vmov.i32 d0, #0x20FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +000054 ret <2 x i32> < i32 2162687, i32 2162687 >
55}
56
Bob Wilson5bafff32009-06-22 23:27:02 +000057define <1 x i64> @v_movi64() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000058;CHECK: v_movi64:
Bob Wilsone45f72c2010-07-02 17:23:44 +000059;CHECK: vmov.i64 d0, #0xFF0000FF0000FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +000060 ret <1 x i64> < i64 18374687574888349695 >
61}
62
63define <16 x i8> @v_movQi8() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000064;CHECK: v_movQi8:
Bob Wilsone45f72c2010-07-02 17:23:44 +000065;CHECK: vmov.i8 q0, #0x8
Bob Wilson5bafff32009-06-22 23:27:02 +000066 ret <16 x i8> < i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8, i8 8 >
67}
68
69define <8 x i16> @v_movQi16a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000070;CHECK: v_movQi16a:
Bob Wilsone45f72c2010-07-02 17:23:44 +000071;CHECK: vmov.i16 q0, #0x10
Bob Wilson5bafff32009-06-22 23:27:02 +000072 ret <8 x i16> < i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16, i16 16 >
73}
74
Bob Wilson5bafff32009-06-22 23:27:02 +000075define <8 x i16> @v_movQi16b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000076;CHECK: v_movQi16b:
Bob Wilsone45f72c2010-07-02 17:23:44 +000077;CHECK: vmov.i16 q0, #0x1000
Bob Wilson5bafff32009-06-22 23:27:02 +000078 ret <8 x i16> < i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096, i16 4096 >
79}
80
81define <4 x i32> @v_movQi32a() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000082;CHECK: v_movQi32a:
Bob Wilsone45f72c2010-07-02 17:23:44 +000083;CHECK: vmov.i32 q0, #0x20
Bob Wilson5bafff32009-06-22 23:27:02 +000084 ret <4 x i32> < i32 32, i32 32, i32 32, i32 32 >
85}
86
Bob Wilson5bafff32009-06-22 23:27:02 +000087define <4 x i32> @v_movQi32b() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000088;CHECK: v_movQi32b:
Bob Wilsone45f72c2010-07-02 17:23:44 +000089;CHECK: vmov.i32 q0, #0x2000
Bob Wilson5bafff32009-06-22 23:27:02 +000090 ret <4 x i32> < i32 8192, i32 8192, i32 8192, i32 8192 >
91}
92
Bob Wilson5bafff32009-06-22 23:27:02 +000093define <4 x i32> @v_movQi32c() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +000094;CHECK: v_movQi32c:
Bob Wilsone45f72c2010-07-02 17:23:44 +000095;CHECK: vmov.i32 q0, #0x200000
Bob Wilson5bafff32009-06-22 23:27:02 +000096 ret <4 x i32> < i32 2097152, i32 2097152, i32 2097152, i32 2097152 >
97}
98
Bob Wilson5bafff32009-06-22 23:27:02 +000099define <4 x i32> @v_movQi32d() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000100;CHECK: v_movQi32d:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000101;CHECK: vmov.i32 q0, #0x20000000
Bob Wilson5bafff32009-06-22 23:27:02 +0000102 ret <4 x i32> < i32 536870912, i32 536870912, i32 536870912, i32 536870912 >
103}
104
Bob Wilson5bafff32009-06-22 23:27:02 +0000105define <4 x i32> @v_movQi32e() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000106;CHECK: v_movQi32e:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000107;CHECK: vmov.i32 q0, #0x20FF
Bob Wilson5bafff32009-06-22 23:27:02 +0000108 ret <4 x i32> < i32 8447, i32 8447, i32 8447, i32 8447 >
109}
110
Bob Wilson5bafff32009-06-22 23:27:02 +0000111define <4 x i32> @v_movQi32f() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000112;CHECK: v_movQi32f:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000113;CHECK: vmov.i32 q0, #0x20FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +0000114 ret <4 x i32> < i32 2162687, i32 2162687, i32 2162687, i32 2162687 >
115}
116
Bob Wilson5bafff32009-06-22 23:27:02 +0000117define <2 x i64> @v_movQi64() nounwind {
Bob Wilsonfe27c512009-10-07 23:47:21 +0000118;CHECK: v_movQi64:
Bob Wilsone45f72c2010-07-02 17:23:44 +0000119;CHECK: vmov.i64 q0, #0xFF0000FF0000FFFF
Bob Wilson5bafff32009-06-22 23:27:02 +0000120 ret <2 x i64> < i64 18374687574888349695, i64 18374687574888349695 >
121}
Bob Wilson83815ae2009-10-09 20:20:54 +0000122
Bob Wilson54c78ef2009-11-06 23:33:28 +0000123; Check for correct assembler printing for immediate values.
124%struct.int8x8_t = type { <8 x i8> }
Rafael Espindola1e819662010-06-17 15:18:27 +0000125define void @vdupn128(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
Bob Wilson54c78ef2009-11-06 23:33:28 +0000126entry:
127;CHECK: vdupn128:
128;CHECK: vmov.i8 d0, #0x80
129 %0 = getelementptr inbounds %struct.int8x8_t* %agg.result, i32 0, i32 0 ; <<8 x i8>*> [#uses=1]
130 store <8 x i8> <i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128, i8 -128>, <8 x i8>* %0, align 8
131 ret void
132}
133
Rafael Espindola1e819662010-06-17 15:18:27 +0000134define void @vdupnneg75(%struct.int8x8_t* noalias nocapture sret %agg.result) nounwind {
Bob Wilson54c78ef2009-11-06 23:33:28 +0000135entry:
136;CHECK: vdupnneg75:
137;CHECK: vmov.i8 d0, #0xB5
138 %0 = getelementptr inbounds %struct.int8x8_t* %agg.result, i32 0, i32 0 ; <<8 x i8>*> [#uses=1]
139 store <8 x i8> <i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75, i8 -75>, <8 x i8>* %0, align 8
140 ret void
141}
142
Bob Wilson83815ae2009-10-09 20:20:54 +0000143define <8 x i16> @vmovls8(<8 x i8>* %A) nounwind {
144;CHECK: vmovls8:
145;CHECK: vmovl.s8
146 %tmp1 = load <8 x i8>* %A
147 %tmp2 = call <8 x i16> @llvm.arm.neon.vmovls.v8i16(<8 x i8> %tmp1)
148 ret <8 x i16> %tmp2
149}
150
151define <4 x i32> @vmovls16(<4 x i16>* %A) nounwind {
152;CHECK: vmovls16:
153;CHECK: vmovl.s16
154 %tmp1 = load <4 x i16>* %A
155 %tmp2 = call <4 x i32> @llvm.arm.neon.vmovls.v4i32(<4 x i16> %tmp1)
156 ret <4 x i32> %tmp2
157}
158
159define <2 x i64> @vmovls32(<2 x i32>* %A) nounwind {
160;CHECK: vmovls32:
161;CHECK: vmovl.s32
162 %tmp1 = load <2 x i32>* %A
163 %tmp2 = call <2 x i64> @llvm.arm.neon.vmovls.v2i64(<2 x i32> %tmp1)
164 ret <2 x i64> %tmp2
165}
166
167define <8 x i16> @vmovlu8(<8 x i8>* %A) nounwind {
168;CHECK: vmovlu8:
169;CHECK: vmovl.u8
170 %tmp1 = load <8 x i8>* %A
171 %tmp2 = call <8 x i16> @llvm.arm.neon.vmovlu.v8i16(<8 x i8> %tmp1)
172 ret <8 x i16> %tmp2
173}
174
175define <4 x i32> @vmovlu16(<4 x i16>* %A) nounwind {
176;CHECK: vmovlu16:
177;CHECK: vmovl.u16
178 %tmp1 = load <4 x i16>* %A
179 %tmp2 = call <4 x i32> @llvm.arm.neon.vmovlu.v4i32(<4 x i16> %tmp1)
180 ret <4 x i32> %tmp2
181}
182
183define <2 x i64> @vmovlu32(<2 x i32>* %A) nounwind {
184;CHECK: vmovlu32:
185;CHECK: vmovl.u32
186 %tmp1 = load <2 x i32>* %A
187 %tmp2 = call <2 x i64> @llvm.arm.neon.vmovlu.v2i64(<2 x i32> %tmp1)
188 ret <2 x i64> %tmp2
189}
190
191declare <8 x i16> @llvm.arm.neon.vmovls.v8i16(<8 x i8>) nounwind readnone
192declare <4 x i32> @llvm.arm.neon.vmovls.v4i32(<4 x i16>) nounwind readnone
193declare <2 x i64> @llvm.arm.neon.vmovls.v2i64(<2 x i32>) nounwind readnone
194
195declare <8 x i16> @llvm.arm.neon.vmovlu.v8i16(<8 x i8>) nounwind readnone
196declare <4 x i32> @llvm.arm.neon.vmovlu.v4i32(<4 x i16>) nounwind readnone
197declare <2 x i64> @llvm.arm.neon.vmovlu.v2i64(<2 x i32>) nounwind readnone
198
199define <8 x i8> @vmovni16(<8 x i16>* %A) nounwind {
200;CHECK: vmovni16:
201;CHECK: vmovn.i16
202 %tmp1 = load <8 x i16>* %A
203 %tmp2 = call <8 x i8> @llvm.arm.neon.vmovn.v8i8(<8 x i16> %tmp1)
204 ret <8 x i8> %tmp2
205}
206
207define <4 x i16> @vmovni32(<4 x i32>* %A) nounwind {
208;CHECK: vmovni32:
209;CHECK: vmovn.i32
210 %tmp1 = load <4 x i32>* %A
211 %tmp2 = call <4 x i16> @llvm.arm.neon.vmovn.v4i16(<4 x i32> %tmp1)
212 ret <4 x i16> %tmp2
213}
214
215define <2 x i32> @vmovni64(<2 x i64>* %A) nounwind {
216;CHECK: vmovni64:
217;CHECK: vmovn.i64
218 %tmp1 = load <2 x i64>* %A
219 %tmp2 = call <2 x i32> @llvm.arm.neon.vmovn.v2i32(<2 x i64> %tmp1)
220 ret <2 x i32> %tmp2
221}
222
223declare <8 x i8> @llvm.arm.neon.vmovn.v8i8(<8 x i16>) nounwind readnone
224declare <4 x i16> @llvm.arm.neon.vmovn.v4i16(<4 x i32>) nounwind readnone
225declare <2 x i32> @llvm.arm.neon.vmovn.v2i32(<2 x i64>) nounwind readnone
226
227define <8 x i8> @vqmovns16(<8 x i16>* %A) nounwind {
228;CHECK: vqmovns16:
229;CHECK: vqmovn.s16
230 %tmp1 = load <8 x i16>* %A
231 %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovns.v8i8(<8 x i16> %tmp1)
232 ret <8 x i8> %tmp2
233}
234
235define <4 x i16> @vqmovns32(<4 x i32>* %A) nounwind {
236;CHECK: vqmovns32:
237;CHECK: vqmovn.s32
238 %tmp1 = load <4 x i32>* %A
239 %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32> %tmp1)
240 ret <4 x i16> %tmp2
241}
242
243define <2 x i32> @vqmovns64(<2 x i64>* %A) nounwind {
244;CHECK: vqmovns64:
245;CHECK: vqmovn.s64
246 %tmp1 = load <2 x i64>* %A
247 %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64> %tmp1)
248 ret <2 x i32> %tmp2
249}
250
251define <8 x i8> @vqmovnu16(<8 x i16>* %A) nounwind {
252;CHECK: vqmovnu16:
253;CHECK: vqmovn.u16
254 %tmp1 = load <8 x i16>* %A
255 %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnu.v8i8(<8 x i16> %tmp1)
256 ret <8 x i8> %tmp2
257}
258
259define <4 x i16> @vqmovnu32(<4 x i32>* %A) nounwind {
260;CHECK: vqmovnu32:
261;CHECK: vqmovn.u32
262 %tmp1 = load <4 x i32>* %A
263 %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32> %tmp1)
264 ret <4 x i16> %tmp2
265}
266
267define <2 x i32> @vqmovnu64(<2 x i64>* %A) nounwind {
268;CHECK: vqmovnu64:
269;CHECK: vqmovn.u64
270 %tmp1 = load <2 x i64>* %A
271 %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64> %tmp1)
272 ret <2 x i32> %tmp2
273}
274
275define <8 x i8> @vqmovuns16(<8 x i16>* %A) nounwind {
276;CHECK: vqmovuns16:
277;CHECK: vqmovun.s16
278 %tmp1 = load <8 x i16>* %A
279 %tmp2 = call <8 x i8> @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16> %tmp1)
280 ret <8 x i8> %tmp2
281}
282
283define <4 x i16> @vqmovuns32(<4 x i32>* %A) nounwind {
284;CHECK: vqmovuns32:
285;CHECK: vqmovun.s32
286 %tmp1 = load <4 x i32>* %A
287 %tmp2 = call <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32> %tmp1)
288 ret <4 x i16> %tmp2
289}
290
291define <2 x i32> @vqmovuns64(<2 x i64>* %A) nounwind {
292;CHECK: vqmovuns64:
293;CHECK: vqmovun.s64
294 %tmp1 = load <2 x i64>* %A
295 %tmp2 = call <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64> %tmp1)
296 ret <2 x i32> %tmp2
297}
298
299declare <8 x i8> @llvm.arm.neon.vqmovns.v8i8(<8 x i16>) nounwind readnone
300declare <4 x i16> @llvm.arm.neon.vqmovns.v4i16(<4 x i32>) nounwind readnone
301declare <2 x i32> @llvm.arm.neon.vqmovns.v2i32(<2 x i64>) nounwind readnone
302
303declare <8 x i8> @llvm.arm.neon.vqmovnu.v8i8(<8 x i16>) nounwind readnone
304declare <4 x i16> @llvm.arm.neon.vqmovnu.v4i16(<4 x i32>) nounwind readnone
305declare <2 x i32> @llvm.arm.neon.vqmovnu.v2i32(<2 x i64>) nounwind readnone
306
307declare <8 x i8> @llvm.arm.neon.vqmovnsu.v8i8(<8 x i16>) nounwind readnone
308declare <4 x i16> @llvm.arm.neon.vqmovnsu.v4i16(<4 x i32>) nounwind readnone
309declare <2 x i32> @llvm.arm.neon.vqmovnsu.v2i32(<2 x i64>) nounwind readnone