blob: 0624f2977ea46280729be08e3afb63dbf691ea53 [file] [log] [blame]
Dan Gohmanfce288f2009-09-09 00:09:15 +00001; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilson9b600c62009-08-06 00:38:31 +00002
Bob Wilsonec1d81c2009-10-06 21:16:19 +00003%struct.__neon_int8x8x4_t = type { <8 x i8>, <8 x i8>, <8 x i8>, <8 x i8> }
4%struct.__neon_int16x4x4_t = type { <4 x i16>, <4 x i16>, <4 x i16>, <4 x i16> }
5%struct.__neon_int32x2x4_t = type { <2 x i32>, <2 x i32>, <2 x i32>, <2 x i32> }
6%struct.__neon_float32x2x4_t = type { <2 x float>, <2 x float>, <2 x float>, <2 x float> }
Bob Wilson0ea38bb2009-10-07 23:54:04 +00007%struct.__neon_int64x1x4_t = type { <1 x i64>, <1 x i64>, <1 x i64>, <1 x i64> }
Bob Wilson9b600c62009-08-06 00:38:31 +00008
Bob Wilson7708c222009-10-07 18:09:32 +00009%struct.__neon_int8x16x4_t = type { <16 x i8>, <16 x i8>, <16 x i8>, <16 x i8> }
10%struct.__neon_int16x8x4_t = type { <8 x i16>, <8 x i16>, <8 x i16>, <8 x i16> }
11%struct.__neon_int32x4x4_t = type { <4 x i32>, <4 x i32>, <4 x i32>, <4 x i32> }
12%struct.__neon_float32x4x4_t = type { <4 x float>, <4 x float>, <4 x float>, <4 x float> }
13
Bob Wilson9b600c62009-08-06 00:38:31 +000014define <8 x i8> @vld4i8(i8* %A) nounwind {
15;CHECK: vld4i8:
16;CHECK: vld4.8
Bob Wilsonec1d81c2009-10-06 21:16:19 +000017 %tmp1 = call %struct.__neon_int8x8x4_t @llvm.arm.neon.vld4.v8i8(i8* %A)
18 %tmp2 = extractvalue %struct.__neon_int8x8x4_t %tmp1, 0
19 %tmp3 = extractvalue %struct.__neon_int8x8x4_t %tmp1, 2
Bob Wilson9b600c62009-08-06 00:38:31 +000020 %tmp4 = add <8 x i8> %tmp2, %tmp3
21 ret <8 x i8> %tmp4
22}
23
24define <4 x i16> @vld4i16(i16* %A) nounwind {
25;CHECK: vld4i16:
26;CHECK: vld4.16
Bob Wilsonec1d81c2009-10-06 21:16:19 +000027 %tmp1 = call %struct.__neon_int16x4x4_t @llvm.arm.neon.vld4.v4i16(i16* %A)
28 %tmp2 = extractvalue %struct.__neon_int16x4x4_t %tmp1, 0
29 %tmp3 = extractvalue %struct.__neon_int16x4x4_t %tmp1, 2
Bob Wilson9b600c62009-08-06 00:38:31 +000030 %tmp4 = add <4 x i16> %tmp2, %tmp3
31 ret <4 x i16> %tmp4
32}
33
34define <2 x i32> @vld4i32(i32* %A) nounwind {
35;CHECK: vld4i32:
36;CHECK: vld4.32
Bob Wilsonec1d81c2009-10-06 21:16:19 +000037 %tmp1 = call %struct.__neon_int32x2x4_t @llvm.arm.neon.vld4.v2i32(i32* %A)
38 %tmp2 = extractvalue %struct.__neon_int32x2x4_t %tmp1, 0
39 %tmp3 = extractvalue %struct.__neon_int32x2x4_t %tmp1, 2
Bob Wilson9b600c62009-08-06 00:38:31 +000040 %tmp4 = add <2 x i32> %tmp2, %tmp3
41 ret <2 x i32> %tmp4
42}
43
44define <2 x float> @vld4f(float* %A) nounwind {
45;CHECK: vld4f:
46;CHECK: vld4.32
Bob Wilsonec1d81c2009-10-06 21:16:19 +000047 %tmp1 = call %struct.__neon_float32x2x4_t @llvm.arm.neon.vld4.v2f32(float* %A)
48 %tmp2 = extractvalue %struct.__neon_float32x2x4_t %tmp1, 0
49 %tmp3 = extractvalue %struct.__neon_float32x2x4_t %tmp1, 2
Bob Wilson9b600c62009-08-06 00:38:31 +000050 %tmp4 = add <2 x float> %tmp2, %tmp3
51 ret <2 x float> %tmp4
52}
53
Bob Wilson0ea38bb2009-10-07 23:54:04 +000054define <1 x i64> @vld4i64(i64* %A) nounwind {
55;CHECK: vld4i64:
56;CHECK: vld1.64
57 %tmp1 = call %struct.__neon_int64x1x4_t @llvm.arm.neon.vld4.v1i64(i64* %A)
58 %tmp2 = extractvalue %struct.__neon_int64x1x4_t %tmp1, 0
59 %tmp3 = extractvalue %struct.__neon_int64x1x4_t %tmp1, 2
60 %tmp4 = add <1 x i64> %tmp2, %tmp3
61 ret <1 x i64> %tmp4
62}
63
Bob Wilson7708c222009-10-07 18:09:32 +000064define <16 x i8> @vld4Qi8(i8* %A) nounwind {
65;CHECK: vld4Qi8:
66;CHECK: vld4.8
67;CHECK: vld4.8
68 %tmp1 = call %struct.__neon_int8x16x4_t @llvm.arm.neon.vld4.v16i8(i8* %A)
69 %tmp2 = extractvalue %struct.__neon_int8x16x4_t %tmp1, 0
70 %tmp3 = extractvalue %struct.__neon_int8x16x4_t %tmp1, 2
71 %tmp4 = add <16 x i8> %tmp2, %tmp3
72 ret <16 x i8> %tmp4
73}
74
75define <8 x i16> @vld4Qi16(i16* %A) nounwind {
76;CHECK: vld4Qi16:
77;CHECK: vld4.16
78;CHECK: vld4.16
79 %tmp1 = call %struct.__neon_int16x8x4_t @llvm.arm.neon.vld4.v8i16(i16* %A)
80 %tmp2 = extractvalue %struct.__neon_int16x8x4_t %tmp1, 0
81 %tmp3 = extractvalue %struct.__neon_int16x8x4_t %tmp1, 2
82 %tmp4 = add <8 x i16> %tmp2, %tmp3
83 ret <8 x i16> %tmp4
84}
85
86define <4 x i32> @vld4Qi32(i32* %A) nounwind {
87;CHECK: vld4Qi32:
88;CHECK: vld4.32
89;CHECK: vld4.32
90 %tmp1 = call %struct.__neon_int32x4x4_t @llvm.arm.neon.vld4.v4i32(i32* %A)
91 %tmp2 = extractvalue %struct.__neon_int32x4x4_t %tmp1, 0
92 %tmp3 = extractvalue %struct.__neon_int32x4x4_t %tmp1, 2
93 %tmp4 = add <4 x i32> %tmp2, %tmp3
94 ret <4 x i32> %tmp4
95}
96
97define <4 x float> @vld4Qf(float* %A) nounwind {
98;CHECK: vld4Qf:
99;CHECK: vld4.32
100;CHECK: vld4.32
101 %tmp1 = call %struct.__neon_float32x4x4_t @llvm.arm.neon.vld4.v4f32(float* %A)
102 %tmp2 = extractvalue %struct.__neon_float32x4x4_t %tmp1, 0
103 %tmp3 = extractvalue %struct.__neon_float32x4x4_t %tmp1, 2
104 %tmp4 = add <4 x float> %tmp2, %tmp3
105 ret <4 x float> %tmp4
106}
107
Bob Wilsonec1d81c2009-10-06 21:16:19 +0000108declare %struct.__neon_int8x8x4_t @llvm.arm.neon.vld4.v8i8(i8*) nounwind readonly
109declare %struct.__neon_int16x4x4_t @llvm.arm.neon.vld4.v4i16(i8*) nounwind readonly
110declare %struct.__neon_int32x2x4_t @llvm.arm.neon.vld4.v2i32(i8*) nounwind readonly
111declare %struct.__neon_float32x2x4_t @llvm.arm.neon.vld4.v2f32(i8*) nounwind readonly
Bob Wilson0ea38bb2009-10-07 23:54:04 +0000112declare %struct.__neon_int64x1x4_t @llvm.arm.neon.vld4.v1i64(i8*) nounwind readonly
Bob Wilson7708c222009-10-07 18:09:32 +0000113
114declare %struct.__neon_int8x16x4_t @llvm.arm.neon.vld4.v16i8(i8*) nounwind readonly
115declare %struct.__neon_int16x8x4_t @llvm.arm.neon.vld4.v8i16(i8*) nounwind readonly
116declare %struct.__neon_int32x4x4_t @llvm.arm.neon.vld4.v4i32(i8*) nounwind readonly
117declare %struct.__neon_float32x4x4_t @llvm.arm.neon.vld4.v4f32(i8*) nounwind readonly