/*===---- tmmintrin.h - SSSE3 intrinsics -----------------------------------===
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 *
 *===-----------------------------------------------------------------------===
 */
23
24#ifndef __TMMINTRIN_H
25#define __TMMINTRIN_H
26
27#ifndef __SSSE3__
28#error "SSSE3 instruction set not enabled"
29#else
30
31#include <pmmintrin.h>
32
Chris Lattner1bddbcb2010-03-22 18:14:12 +000033static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000034_mm_abs_pi8(__m64 __a)
Anders Carlsson85b2a472009-02-17 03:05:04 +000035{
David Blaikie4f918ae2013-01-16 23:08:36 +000036 return (__m64)__builtin_ia32_pabsb((__v8qi)__a);
Anders Carlsson85b2a472009-02-17 03:05:04 +000037}
38
Chris Lattner1bddbcb2010-03-22 18:14:12 +000039static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000040_mm_abs_epi8(__m128i __a)
Anders Carlsson85b2a472009-02-17 03:05:04 +000041{
David Blaikie4f918ae2013-01-16 23:08:36 +000042 return (__m128i)__builtin_ia32_pabsb128((__v16qi)__a);
Anders Carlsson85b2a472009-02-17 03:05:04 +000043}
44
Chris Lattner1bddbcb2010-03-22 18:14:12 +000045static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000046_mm_abs_pi16(__m64 __a)
Anders Carlsson85b2a472009-02-17 03:05:04 +000047{
David Blaikie4f918ae2013-01-16 23:08:36 +000048 return (__m64)__builtin_ia32_pabsw((__v4hi)__a);
Anders Carlsson85b2a472009-02-17 03:05:04 +000049}
50
Chris Lattner1bddbcb2010-03-22 18:14:12 +000051static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000052_mm_abs_epi16(__m128i __a)
Anders Carlsson85b2a472009-02-17 03:05:04 +000053{
David Blaikie4f918ae2013-01-16 23:08:36 +000054 return (__m128i)__builtin_ia32_pabsw128((__v8hi)__a);
Anders Carlsson85b2a472009-02-17 03:05:04 +000055}
56
Chris Lattner1bddbcb2010-03-22 18:14:12 +000057static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000058_mm_abs_pi32(__m64 __a)
Anders Carlsson85b2a472009-02-17 03:05:04 +000059{
David Blaikie4f918ae2013-01-16 23:08:36 +000060 return (__m64)__builtin_ia32_pabsd((__v2si)__a);
Anders Carlsson85b2a472009-02-17 03:05:04 +000061}
62
Chris Lattner1bddbcb2010-03-22 18:14:12 +000063static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000064_mm_abs_epi32(__m128i __a)
Anders Carlsson85b2a472009-02-17 03:05:04 +000065{
David Blaikie4f918ae2013-01-16 23:08:36 +000066 return (__m128i)__builtin_ia32_pabsd128((__v4si)__a);
Anders Carlsson85b2a472009-02-17 03:05:04 +000067}
68
/* Byte-wise align-right (PALIGNR, 128-bit form): passes a, b and the byte
 * count n to the builtin and yields the result as __m128i.
 *
 * This is a macro rather than a function so that n reaches the builtin as a
 * literal expression (the instruction encodes it as an immediate).
 *
 * The arguments are cast in place instead of being copied into block-local
 * temporaries: locals named __a/__b would capture identically named
 * variables in the caller's argument expressions (e.g.
 * _mm_alignr_epi8(__b, __a, 4) would initialize the temporaries from
 * themselves). Each argument is still evaluated exactly once. */
#define _mm_alignr_epi8(a, b, n) __extension__ ({ \
  (__m128i)__builtin_ia32_palignr128((__v16qi)(__m128i)(a), \
                                     (__v16qi)(__m128i)(b), (n)); })
73
/* Byte-wise align-right (PALIGNR, 64-bit form): passes a, b and the byte
 * count n to the builtin and yields the result as __m64.
 *
 * This is a macro rather than a function so that n reaches the builtin as a
 * literal expression (the instruction encodes it as an immediate).
 *
 * The arguments are cast in place instead of being copied into block-local
 * temporaries: locals named __a/__b would capture identically named
 * variables in the caller's argument expressions (e.g.
 * _mm_alignr_pi8(__b, __a, 4) would initialize the temporaries from
 * themselves). Each argument is still evaluated exactly once. */
#define _mm_alignr_pi8(a, b, n) __extension__ ({ \
  (__m64)__builtin_ia32_palignr((__v8qi)(__m64)(a), \
                                (__v8qi)(__m64)(b), (n)); })
Anders Carlsson85b2a472009-02-17 03:05:04 +000078
Chris Lattner1bddbcb2010-03-22 18:14:12 +000079static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000080_mm_hadd_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +000081{
David Blaikie4f918ae2013-01-16 23:08:36 +000082 return (__m128i)__builtin_ia32_phaddw128((__v8hi)__a, (__v8hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +000083}
84
Chris Lattner1bddbcb2010-03-22 18:14:12 +000085static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000086_mm_hadd_epi32(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +000087{
David Blaikie4f918ae2013-01-16 23:08:36 +000088 return (__m128i)__builtin_ia32_phaddd128((__v4si)__a, (__v4si)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +000089}
90
Chris Lattner1bddbcb2010-03-22 18:14:12 +000091static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000092_mm_hadd_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +000093{
David Blaikie4f918ae2013-01-16 23:08:36 +000094 return (__m64)__builtin_ia32_phaddw((__v4hi)__a, (__v4hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +000095}
96
Chris Lattner1bddbcb2010-03-22 18:14:12 +000097static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +000098_mm_hadd_pi32(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +000099{
David Blaikie4f918ae2013-01-16 23:08:36 +0000100 return (__m64)__builtin_ia32_phaddd((__v2si)__a, (__v2si)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000101}
102
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000103static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000104_mm_hadds_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000105{
David Blaikie4f918ae2013-01-16 23:08:36 +0000106 return (__m128i)__builtin_ia32_phaddsw128((__v8hi)__a, (__v8hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000107}
108
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000109static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000110_mm_hadds_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000111{
David Blaikie4f918ae2013-01-16 23:08:36 +0000112 return (__m64)__builtin_ia32_phaddsw((__v4hi)__a, (__v4hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000113}
114
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000115static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000116_mm_hsub_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000117{
David Blaikie4f918ae2013-01-16 23:08:36 +0000118 return (__m128i)__builtin_ia32_phsubw128((__v8hi)__a, (__v8hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000119}
120
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000121static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000122_mm_hsub_epi32(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000123{
David Blaikie4f918ae2013-01-16 23:08:36 +0000124 return (__m128i)__builtin_ia32_phsubd128((__v4si)__a, (__v4si)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000125}
126
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000127static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000128_mm_hsub_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000129{
David Blaikie4f918ae2013-01-16 23:08:36 +0000130 return (__m64)__builtin_ia32_phsubw((__v4hi)__a, (__v4hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000131}
132
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000133static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000134_mm_hsub_pi32(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000135{
David Blaikie4f918ae2013-01-16 23:08:36 +0000136 return (__m64)__builtin_ia32_phsubd((__v2si)__a, (__v2si)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000137}
138
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000139static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000140_mm_hsubs_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000141{
David Blaikie4f918ae2013-01-16 23:08:36 +0000142 return (__m128i)__builtin_ia32_phsubsw128((__v8hi)__a, (__v8hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000143}
144
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000145static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000146_mm_hsubs_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000147{
David Blaikie4f918ae2013-01-16 23:08:36 +0000148 return (__m64)__builtin_ia32_phsubsw((__v4hi)__a, (__v4hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000149}
150
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000151static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000152_mm_maddubs_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000153{
David Blaikie4f918ae2013-01-16 23:08:36 +0000154 return (__m128i)__builtin_ia32_pmaddubsw128((__v16qi)__a, (__v16qi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000155}
156
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000157static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000158_mm_maddubs_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000159{
David Blaikie4f918ae2013-01-16 23:08:36 +0000160 return (__m64)__builtin_ia32_pmaddubsw((__v8qi)__a, (__v8qi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000161}
162
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000163static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000164_mm_mulhrs_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000165{
David Blaikie4f918ae2013-01-16 23:08:36 +0000166 return (__m128i)__builtin_ia32_pmulhrsw128((__v8hi)__a, (__v8hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000167}
168
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000169static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000170_mm_mulhrs_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000171{
David Blaikie4f918ae2013-01-16 23:08:36 +0000172 return (__m64)__builtin_ia32_pmulhrsw((__v4hi)__a, (__v4hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000173}
174
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000175static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000176_mm_shuffle_epi8(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000177{
David Blaikie4f918ae2013-01-16 23:08:36 +0000178 return (__m128i)__builtin_ia32_pshufb128((__v16qi)__a, (__v16qi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000179}
180
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000181static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000182_mm_shuffle_pi8(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000183{
David Blaikie4f918ae2013-01-16 23:08:36 +0000184 return (__m64)__builtin_ia32_pshufb((__v8qi)__a, (__v8qi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000185}
186
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000187static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000188_mm_sign_epi8(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000189{
David Blaikie4f918ae2013-01-16 23:08:36 +0000190 return (__m128i)__builtin_ia32_psignb128((__v16qi)__a, (__v16qi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000191}
192
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000193static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000194_mm_sign_epi16(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000195{
David Blaikie4f918ae2013-01-16 23:08:36 +0000196 return (__m128i)__builtin_ia32_psignw128((__v8hi)__a, (__v8hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000197}
198
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000199static __inline__ __m128i __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000200_mm_sign_epi32(__m128i __a, __m128i __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000201{
David Blaikie4f918ae2013-01-16 23:08:36 +0000202 return (__m128i)__builtin_ia32_psignd128((__v4si)__a, (__v4si)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000203}
204
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000205static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000206_mm_sign_pi8(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000207{
David Blaikie4f918ae2013-01-16 23:08:36 +0000208 return (__m64)__builtin_ia32_psignb((__v8qi)__a, (__v8qi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000209}
210
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000211static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000212_mm_sign_pi16(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000213{
David Blaikie4f918ae2013-01-16 23:08:36 +0000214 return (__m64)__builtin_ia32_psignw((__v4hi)__a, (__v4hi)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000215}
216
Chris Lattner1bddbcb2010-03-22 18:14:12 +0000217static __inline__ __m64 __attribute__((__always_inline__, __nodebug__))
David Blaikie4f918ae2013-01-16 23:08:36 +0000218_mm_sign_pi32(__m64 __a, __m64 __b)
Anders Carlsson85b2a472009-02-17 03:05:04 +0000219{
David Blaikie4f918ae2013-01-16 23:08:36 +0000220 return (__m64)__builtin_ia32_psignd((__v2si)__a, (__v2si)__b);
Anders Carlsson85b2a472009-02-17 03:05:04 +0000221}
222
223#endif /* __SSSE3__ */
224
225#endif /* __TMMINTRIN_H */