blob: 4ed53092c3f12bc9e6c988c0ba7348d5c48de0ac [file] [log] [blame]
; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilson9b600c62009-08-06 00:38:31 +00002
; Aggregate return types of the vld3 intrinsics used in this file: each is a
; struct holding three vectors of the same type.

; Three 64-bit vectors.
%struct.__neon_int8x8x3_t = type { <8 x i8>, <8 x i8>, <8 x i8> }
%struct.__neon_int16x4x3_t = type { <4 x i16>, <4 x i16>, <4 x i16> }
%struct.__neon_int32x2x3_t = type { <2 x i32>, <2 x i32>, <2 x i32> }
%struct.__neon_float32x2x3_t = type { <2 x float>, <2 x float>, <2 x float> }

; Three 128-bit vectors.
%struct.__neon_int8x16x3_t = type { <16 x i8>, <16 x i8>, <16 x i8> }
%struct.__neon_int16x8x3_t = type { <8 x i16>, <8 x i16>, <8 x i16> }
%struct.__neon_int32x4x3_t = type { <4 x i32>, <4 x i32>, <4 x i32> }
%struct.__neon_float32x4x3_t = type { <4 x float>, <4 x float>, <4 x float> }
12
; vld3 on <8 x i8>: calls @llvm.arm.neon.vld3.v8i8 on %A, adds fields 0 and 2
; of the returned struct and returns the sum. The checks below look for the
; function label followed by a vld3.8 in llc's output.
define <8 x i8> @vld3i8(i8* %A) nounwind {
;CHECK: vld3i8:
;CHECK: vld3.8
  %vecs = call %struct.__neon_int8x8x3_t @llvm.arm.neon.vld3.v8i8(i8* %A)
  %first = extractvalue %struct.__neon_int8x8x3_t %vecs, 0
  %third = extractvalue %struct.__neon_int8x8x3_t %vecs, 2
  ; Using two of the loaded vectors keeps the load result live.
  %sum = add <8 x i8> %first, %third
  ret <8 x i8> %sum
}
22
; vld3 on <4 x i16>: calls @llvm.arm.neon.vld3.v4i16 on %A, adds fields 0 and 2
; of the returned struct and returns the sum. The checks below look for the
; function label followed by a vld3.16 in llc's output.
define <4 x i16> @vld3i16(i16* %A) nounwind {
;CHECK: vld3i16:
;CHECK: vld3.16
  ; The intrinsic is declared with an i8* operand, so the typed pointer must
  ; be cast before the call for the call site to match the declaration.
  %tmp0 = bitcast i16* %A to i8*
  %tmp1 = call %struct.__neon_int16x4x3_t @llvm.arm.neon.vld3.v4i16(i8* %tmp0)
  %tmp2 = extractvalue %struct.__neon_int16x4x3_t %tmp1, 0
  %tmp3 = extractvalue %struct.__neon_int16x4x3_t %tmp1, 2
  %tmp4 = add <4 x i16> %tmp2, %tmp3
  ret <4 x i16> %tmp4
}
32
; vld3 on <2 x i32>: calls @llvm.arm.neon.vld3.v2i32 on %A, adds fields 0 and 2
; of the returned struct and returns the sum. The checks below look for the
; function label followed by a vld3.32 in llc's output.
define <2 x i32> @vld3i32(i32* %A) nounwind {
;CHECK: vld3i32:
;CHECK: vld3.32
  ; The intrinsic is declared with an i8* operand, so the typed pointer must
  ; be cast before the call for the call site to match the declaration.
  %tmp0 = bitcast i32* %A to i8*
  %tmp1 = call %struct.__neon_int32x2x3_t @llvm.arm.neon.vld3.v2i32(i8* %tmp0)
  %tmp2 = extractvalue %struct.__neon_int32x2x3_t %tmp1, 0
  %tmp3 = extractvalue %struct.__neon_int32x2x3_t %tmp1, 2
  %tmp4 = add <2 x i32> %tmp2, %tmp3
  ret <2 x i32> %tmp4
}
42
; vld3 on <2 x float>: calls @llvm.arm.neon.vld3.v2f32 on %A, adds fields 0 and
; 2 of the returned struct and returns the sum. The checks below look for the
; function label followed by a vld3.32 in llc's output.
define <2 x float> @vld3f(float* %A) nounwind {
;CHECK: vld3f:
;CHECK: vld3.32
  ; The intrinsic is declared with an i8* operand, so the typed pointer must
  ; be cast before the call for the call site to match the declaration.
  %tmp0 = bitcast float* %A to i8*
  %tmp1 = call %struct.__neon_float32x2x3_t @llvm.arm.neon.vld3.v2f32(i8* %tmp0)
  %tmp2 = extractvalue %struct.__neon_float32x2x3_t %tmp1, 0
  %tmp3 = extractvalue %struct.__neon_float32x2x3_t %tmp1, 2
  ; Floating-point vectors need fadd; plain add only accepts integer types.
  %tmp4 = fadd <2 x float> %tmp2, %tmp3
  ret <2 x float> %tmp4
}
52
; vld3 on <16 x i8>: calls @llvm.arm.neon.vld3.v16i8 on %A, adds fields 0 and 2
; of the returned struct and returns the sum. The checks below look for the
; function label followed by two vld3.8 matches in llc's output.
define <16 x i8> @vld3Qi8(i8* %A) nounwind {
;CHECK: vld3Qi8:
;CHECK: vld3.8
;CHECK: vld3.8
  %vecs = call %struct.__neon_int8x16x3_t @llvm.arm.neon.vld3.v16i8(i8* %A)
  %first = extractvalue %struct.__neon_int8x16x3_t %vecs, 0
  %third = extractvalue %struct.__neon_int8x16x3_t %vecs, 2
  ; Using two of the loaded vectors keeps the load result live.
  %sum = add <16 x i8> %first, %third
  ret <16 x i8> %sum
}
63
; vld3 on <8 x i16>: calls @llvm.arm.neon.vld3.v8i16 on %A, adds fields 0 and 2
; of the returned struct and returns the sum. The checks below look for the
; function label followed by two vld3.16 matches in llc's output.
define <8 x i16> @vld3Qi16(i16* %A) nounwind {
;CHECK: vld3Qi16:
;CHECK: vld3.16
;CHECK: vld3.16
  ; The intrinsic is declared with an i8* operand, so the typed pointer must
  ; be cast before the call for the call site to match the declaration.
  %tmp0 = bitcast i16* %A to i8*
  %tmp1 = call %struct.__neon_int16x8x3_t @llvm.arm.neon.vld3.v8i16(i8* %tmp0)
  %tmp2 = extractvalue %struct.__neon_int16x8x3_t %tmp1, 0
  %tmp3 = extractvalue %struct.__neon_int16x8x3_t %tmp1, 2
  %tmp4 = add <8 x i16> %tmp2, %tmp3
  ret <8 x i16> %tmp4
}
74
; vld3 on <4 x i32>: calls @llvm.arm.neon.vld3.v4i32 on %A, adds fields 0 and 2
; of the returned struct and returns the sum. The checks below look for the
; function label followed by two vld3.32 matches in llc's output.
define <4 x i32> @vld3Qi32(i32* %A) nounwind {
;CHECK: vld3Qi32:
;CHECK: vld3.32
;CHECK: vld3.32
  ; The intrinsic is declared with an i8* operand, so the typed pointer must
  ; be cast before the call for the call site to match the declaration.
  %tmp0 = bitcast i32* %A to i8*
  %tmp1 = call %struct.__neon_int32x4x3_t @llvm.arm.neon.vld3.v4i32(i8* %tmp0)
  %tmp2 = extractvalue %struct.__neon_int32x4x3_t %tmp1, 0
  %tmp3 = extractvalue %struct.__neon_int32x4x3_t %tmp1, 2
  %tmp4 = add <4 x i32> %tmp2, %tmp3
  ret <4 x i32> %tmp4
}
85
; vld3 on <4 x float>: calls @llvm.arm.neon.vld3.v4f32 on %A, adds fields 0 and
; 2 of the returned struct and returns the sum. The checks below look for the
; function label followed by two vld3.32 matches in llc's output.
define <4 x float> @vld3Qf(float* %A) nounwind {
;CHECK: vld3Qf:
;CHECK: vld3.32
;CHECK: vld3.32
  ; The intrinsic is declared with an i8* operand, so the typed pointer must
  ; be cast before the call for the call site to match the declaration.
  %tmp0 = bitcast float* %A to i8*
  %tmp1 = call %struct.__neon_float32x4x3_t @llvm.arm.neon.vld3.v4f32(i8* %tmp0)
  %tmp2 = extractvalue %struct.__neon_float32x4x3_t %tmp1, 0
  %tmp3 = extractvalue %struct.__neon_float32x4x3_t %tmp1, 2
  ; Floating-point vectors need fadd; plain add only accepts integer types.
  %tmp4 = fadd <4 x float> %tmp2, %tmp3
  ret <4 x float> %tmp4
}
96
; Declarations of the vld3 intrinsics called by the tests in this file. Every
; variant takes an i8* operand and returns a struct of three vectors.

; Variants returning 64-bit vectors.
declare %struct.__neon_int8x8x3_t @llvm.arm.neon.vld3.v8i8(i8*) nounwind readonly
declare %struct.__neon_int16x4x3_t @llvm.arm.neon.vld3.v4i16(i8*) nounwind readonly
declare %struct.__neon_int32x2x3_t @llvm.arm.neon.vld3.v2i32(i8*) nounwind readonly
declare %struct.__neon_float32x2x3_t @llvm.arm.neon.vld3.v2f32(i8*) nounwind readonly

; Variants returning 128-bit vectors.
declare %struct.__neon_int8x16x3_t @llvm.arm.neon.vld3.v16i8(i8*) nounwind readonly
declare %struct.__neon_int16x8x3_t @llvm.arm.neon.vld3.v8i16(i8*) nounwind readonly
declare %struct.__neon_int32x4x3_t @llvm.arm.neon.vld3.v4i32(i8*) nounwind readonly
declare %struct.__neon_float32x4x3_t @llvm.arm.neon.vld3.v4f32(i8*) nounwind readonly