blob: 44c4e30f1ecca1fd2f0579aeb104318b23d53ee8 [file] [log] [blame]
Bob Wilson1c70c0a2009-10-08 06:02:10 +00001; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilsone60fee02009-06-22 23:27:02 +00002
3define <4 x i16> @vpaddls8(<8 x i8>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +00004;CHECK: vpaddls8:
5;CHECK: vpaddl.s8
Bob Wilsone60fee02009-06-22 23:27:02 +00006 %tmp1 = load <8 x i8>* %A
7 %tmp2 = call <4 x i16> @llvm.arm.neon.vpaddls.v4i16.v8i8(<8 x i8> %tmp1)
8 ret <4 x i16> %tmp2
9}
10
11define <2 x i32> @vpaddls16(<4 x i16>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000012;CHECK: vpaddls16:
13;CHECK: vpaddl.s16
Bob Wilsone60fee02009-06-22 23:27:02 +000014 %tmp1 = load <4 x i16>* %A
15 %tmp2 = call <2 x i32> @llvm.arm.neon.vpaddls.v2i32.v4i16(<4 x i16> %tmp1)
16 ret <2 x i32> %tmp2
17}
18
19define <1 x i64> @vpaddls32(<2 x i32>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000020;CHECK: vpaddls32:
21;CHECK: vpaddl.s32
Bob Wilsone60fee02009-06-22 23:27:02 +000022 %tmp1 = load <2 x i32>* %A
23 %tmp2 = call <1 x i64> @llvm.arm.neon.vpaddls.v1i64.v2i32(<2 x i32> %tmp1)
24 ret <1 x i64> %tmp2
25}
26
27define <4 x i16> @vpaddlu8(<8 x i8>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000028;CHECK: vpaddlu8:
29;CHECK: vpaddl.u8
Bob Wilsone60fee02009-06-22 23:27:02 +000030 %tmp1 = load <8 x i8>* %A
31 %tmp2 = call <4 x i16> @llvm.arm.neon.vpaddlu.v4i16.v8i8(<8 x i8> %tmp1)
32 ret <4 x i16> %tmp2
33}
34
35define <2 x i32> @vpaddlu16(<4 x i16>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000036;CHECK: vpaddlu16:
37;CHECK: vpaddl.u16
Bob Wilsone60fee02009-06-22 23:27:02 +000038 %tmp1 = load <4 x i16>* %A
39 %tmp2 = call <2 x i32> @llvm.arm.neon.vpaddlu.v2i32.v4i16(<4 x i16> %tmp1)
40 ret <2 x i32> %tmp2
41}
42
43define <1 x i64> @vpaddlu32(<2 x i32>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000044;CHECK: vpaddlu32:
45;CHECK: vpaddl.u32
Bob Wilsone60fee02009-06-22 23:27:02 +000046 %tmp1 = load <2 x i32>* %A
47 %tmp2 = call <1 x i64> @llvm.arm.neon.vpaddlu.v1i64.v2i32(<2 x i32> %tmp1)
48 ret <1 x i64> %tmp2
49}
50
51define <8 x i16> @vpaddlQs8(<16 x i8>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000052;CHECK: vpaddlQs8:
53;CHECK: vpaddl.s8
Bob Wilsone60fee02009-06-22 23:27:02 +000054 %tmp1 = load <16 x i8>* %A
55 %tmp2 = call <8 x i16> @llvm.arm.neon.vpaddls.v8i16.v16i8(<16 x i8> %tmp1)
56 ret <8 x i16> %tmp2
57}
58
59define <4 x i32> @vpaddlQs16(<8 x i16>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000060;CHECK: vpaddlQs16:
61;CHECK: vpaddl.s16
Bob Wilsone60fee02009-06-22 23:27:02 +000062 %tmp1 = load <8 x i16>* %A
63 %tmp2 = call <4 x i32> @llvm.arm.neon.vpaddls.v4i32.v8i16(<8 x i16> %tmp1)
64 ret <4 x i32> %tmp2
65}
66
67define <2 x i64> @vpaddlQs32(<4 x i32>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000068;CHECK: vpaddlQs32:
69;CHECK: vpaddl.s32
Bob Wilsone60fee02009-06-22 23:27:02 +000070 %tmp1 = load <4 x i32>* %A
71 %tmp2 = call <2 x i64> @llvm.arm.neon.vpaddls.v2i64.v4i32(<4 x i32> %tmp1)
72 ret <2 x i64> %tmp2
73}
74
75define <8 x i16> @vpaddlQu8(<16 x i8>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000076;CHECK: vpaddlQu8:
77;CHECK: vpaddl.u8
Bob Wilsone60fee02009-06-22 23:27:02 +000078 %tmp1 = load <16 x i8>* %A
79 %tmp2 = call <8 x i16> @llvm.arm.neon.vpaddlu.v8i16.v16i8(<16 x i8> %tmp1)
80 ret <8 x i16> %tmp2
81}
82
83define <4 x i32> @vpaddlQu16(<8 x i16>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000084;CHECK: vpaddlQu16:
85;CHECK: vpaddl.u16
Bob Wilsone60fee02009-06-22 23:27:02 +000086 %tmp1 = load <8 x i16>* %A
87 %tmp2 = call <4 x i32> @llvm.arm.neon.vpaddlu.v4i32.v8i16(<8 x i16> %tmp1)
88 ret <4 x i32> %tmp2
89}
90
91define <2 x i64> @vpaddlQu32(<4 x i32>* %A) nounwind {
Bob Wilson1c70c0a2009-10-08 06:02:10 +000092;CHECK: vpaddlQu32:
93;CHECK: vpaddl.u32
Bob Wilsone60fee02009-06-22 23:27:02 +000094 %tmp1 = load <4 x i32>* %A
95 %tmp2 = call <2 x i64> @llvm.arm.neon.vpaddlu.v2i64.v4i32(<4 x i32> %tmp1)
96 ret <2 x i64> %tmp2
97}
98
99declare <4 x i16> @llvm.arm.neon.vpaddls.v4i16.v8i8(<8 x i8>) nounwind readnone
100declare <2 x i32> @llvm.arm.neon.vpaddls.v2i32.v4i16(<4 x i16>) nounwind readnone
101declare <1 x i64> @llvm.arm.neon.vpaddls.v1i64.v2i32(<2 x i32>) nounwind readnone
102
103declare <4 x i16> @llvm.arm.neon.vpaddlu.v4i16.v8i8(<8 x i8>) nounwind readnone
104declare <2 x i32> @llvm.arm.neon.vpaddlu.v2i32.v4i16(<4 x i16>) nounwind readnone
105declare <1 x i64> @llvm.arm.neon.vpaddlu.v1i64.v2i32(<2 x i32>) nounwind readnone
106
107declare <8 x i16> @llvm.arm.neon.vpaddls.v8i16.v16i8(<16 x i8>) nounwind readnone
108declare <4 x i32> @llvm.arm.neon.vpaddls.v4i32.v8i16(<8 x i16>) nounwind readnone
109declare <2 x i64> @llvm.arm.neon.vpaddls.v2i64.v4i32(<4 x i32>) nounwind readnone
110
111declare <8 x i16> @llvm.arm.neon.vpaddlu.v8i16.v16i8(<16 x i8>) nounwind readnone
112declare <4 x i32> @llvm.arm.neon.vpaddlu.v4i32.v8i16(<8 x i16>) nounwind readnone
113declare <2 x i64> @llvm.arm.neon.vpaddlu.v2i64.v4i32(<4 x i32>) nounwind readnone