blob: 56149dac30d9293c1e01b2c9ff2ead0f50c6fe55 [file] [log] [blame]
Bob Wilsond48ca592009-10-07 23:47:21 +00001; RUN: llc < %s -march=arm -mattr=+neon | FileCheck %s
Bob Wilsone60fee02009-06-22 23:27:02 +00002
3define <8 x i16> @vmulls8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +00004;CHECK: vmulls8:
5;CHECK: vmull.s8
Bob Wilsone60fee02009-06-22 23:27:02 +00006 %tmp1 = load <8 x i8>* %A
7 %tmp2 = load <8 x i8>* %B
8 %tmp3 = call <8 x i16> @llvm.arm.neon.vmulls.v8i16(<8 x i8> %tmp1, <8 x i8> %tmp2)
9 ret <8 x i16> %tmp3
10}
11
12define <4 x i32> @vmulls16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +000013;CHECK: vmulls16:
14;CHECK: vmull.s16
Bob Wilsone60fee02009-06-22 23:27:02 +000015 %tmp1 = load <4 x i16>* %A
16 %tmp2 = load <4 x i16>* %B
17 %tmp3 = call <4 x i32> @llvm.arm.neon.vmulls.v4i32(<4 x i16> %tmp1, <4 x i16> %tmp2)
18 ret <4 x i32> %tmp3
19}
20
21define <2 x i64> @vmulls32(<2 x i32>* %A, <2 x i32>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +000022;CHECK: vmulls32:
23;CHECK: vmull.s32
Bob Wilsone60fee02009-06-22 23:27:02 +000024 %tmp1 = load <2 x i32>* %A
25 %tmp2 = load <2 x i32>* %B
26 %tmp3 = call <2 x i64> @llvm.arm.neon.vmulls.v2i64(<2 x i32> %tmp1, <2 x i32> %tmp2)
27 ret <2 x i64> %tmp3
28}
29
30define <8 x i16> @vmullu8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +000031;CHECK: vmullu8:
32;CHECK: vmull.u8
Bob Wilsone60fee02009-06-22 23:27:02 +000033 %tmp1 = load <8 x i8>* %A
34 %tmp2 = load <8 x i8>* %B
35 %tmp3 = call <8 x i16> @llvm.arm.neon.vmullu.v8i16(<8 x i8> %tmp1, <8 x i8> %tmp2)
36 ret <8 x i16> %tmp3
37}
38
39define <4 x i32> @vmullu16(<4 x i16>* %A, <4 x i16>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +000040;CHECK: vmullu16:
41;CHECK: vmull.u16
Bob Wilsone60fee02009-06-22 23:27:02 +000042 %tmp1 = load <4 x i16>* %A
43 %tmp2 = load <4 x i16>* %B
44 %tmp3 = call <4 x i32> @llvm.arm.neon.vmullu.v4i32(<4 x i16> %tmp1, <4 x i16> %tmp2)
45 ret <4 x i32> %tmp3
46}
47
48define <2 x i64> @vmullu32(<2 x i32>* %A, <2 x i32>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +000049;CHECK: vmullu32:
50;CHECK: vmull.u32
Bob Wilsone60fee02009-06-22 23:27:02 +000051 %tmp1 = load <2 x i32>* %A
52 %tmp2 = load <2 x i32>* %B
53 %tmp3 = call <2 x i64> @llvm.arm.neon.vmullu.v2i64(<2 x i32> %tmp1, <2 x i32> %tmp2)
54 ret <2 x i64> %tmp3
55}
56
57define <8 x i16> @vmullp8(<8 x i8>* %A, <8 x i8>* %B) nounwind {
Bob Wilsond48ca592009-10-07 23:47:21 +000058;CHECK: vmullp8:
59;CHECK: vmull.p8
Bob Wilsone60fee02009-06-22 23:27:02 +000060 %tmp1 = load <8 x i8>* %A
61 %tmp2 = load <8 x i8>* %B
62 %tmp3 = call <8 x i16> @llvm.arm.neon.vmullp.v8i16(<8 x i8> %tmp1, <8 x i8> %tmp2)
63 ret <8 x i16> %tmp3
64}
65
66declare <8 x i16> @llvm.arm.neon.vmulls.v8i16(<8 x i8>, <8 x i8>) nounwind readnone
67declare <4 x i32> @llvm.arm.neon.vmulls.v4i32(<4 x i16>, <4 x i16>) nounwind readnone
68declare <2 x i64> @llvm.arm.neon.vmulls.v2i64(<2 x i32>, <2 x i32>) nounwind readnone
69
70declare <8 x i16> @llvm.arm.neon.vmullu.v8i16(<8 x i8>, <8 x i8>) nounwind readnone
71declare <4 x i32> @llvm.arm.neon.vmullu.v4i32(<4 x i16>, <4 x i16>) nounwind readnone
72declare <2 x i64> @llvm.arm.neon.vmullu.v2i64(<2 x i32>, <2 x i32>) nounwind readnone
73
74declare <8 x i16> @llvm.arm.neon.vmullp.v8i16(<8 x i8>, <8 x i8>) nounwind readnone