Craig Topper | 991d499 | 2015-11-03 06:16:31 +0000 | [diff] [blame] | 1 | /*===---- avx512erintrin.h - AVX512ER intrinsics ---------------------------=== |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 2 | * |
Chandler Carruth | 4cf5743 | 2019-04-08 20:51:30 +0000 | [diff] [blame] | 3 | * Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | * See https://llvm.org/LICENSE.txt for license information. |
| 5 | * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 6 | * |
| 7 | *===-----------------------------------------------------------------------=== |
| 8 | */ |
| 9 | #ifndef __IMMINTRIN_H |
| 10 | #error "Never use <avx512erintrin.h> directly; include <immintrin.h> instead." |
| 11 | #endif |
| 12 | |
| 13 | #ifndef __AVX512ERINTRIN_H |
| 14 | #define __AVX512ERINTRIN_H |
| 15 | |
Craig Topper | 73d1d40 | 2018-05-30 22:33:21 +0000 | [diff] [blame] | 16 | /* exp2a23 */ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 17 | #define _mm512_exp2a23_round_pd(A, R) \ |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 18 | (__m512d)__builtin_ia32_exp2pd_mask((__v8df)(__m512d)(A), \ |
| 19 | (__v8df)_mm512_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 20 | (__mmask8)-1, (int)(R)) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 21 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 22 | #define _mm512_mask_exp2a23_round_pd(S, M, A, R) \ |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 23 | (__m512d)__builtin_ia32_exp2pd_mask((__v8df)(__m512d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 24 | (__v8df)(__m512d)(S), (__mmask8)(M), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 25 | (int)(R)) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 26 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 27 | #define _mm512_maskz_exp2a23_round_pd(M, A, R) \ |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 28 | (__m512d)__builtin_ia32_exp2pd_mask((__v8df)(__m512d)(A), \ |
| 29 | (__v8df)_mm512_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 30 | (__mmask8)(M), (int)(R)) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 31 | |
| 32 | #define _mm512_exp2a23_pd(A) \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 33 | _mm512_exp2a23_round_pd((A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 34 | |
| 35 | #define _mm512_mask_exp2a23_pd(S, M, A) \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 36 | _mm512_mask_exp2a23_round_pd((S), (M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 37 | |
| 38 | #define _mm512_maskz_exp2a23_pd(M, A) \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 39 | _mm512_maskz_exp2a23_round_pd((M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 40 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 41 | #define _mm512_exp2a23_round_ps(A, R) \ |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 42 | (__m512)__builtin_ia32_exp2ps_mask((__v16sf)(__m512)(A), \ |
| 43 | (__v16sf)_mm512_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 44 | (__mmask16)-1, (int)(R)) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 45 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 46 | #define _mm512_mask_exp2a23_round_ps(S, M, A, R) \ |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 47 | (__m512)__builtin_ia32_exp2ps_mask((__v16sf)(__m512)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 48 | (__v16sf)(__m512)(S), (__mmask16)(M), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 49 | (int)(R)) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 50 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 51 | #define _mm512_maskz_exp2a23_round_ps(M, A, R) \ |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 52 | (__m512)__builtin_ia32_exp2ps_mask((__v16sf)(__m512)(A), \ |
| 53 | (__v16sf)_mm512_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 54 | (__mmask16)(M), (int)(R)) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 55 | |
| 56 | #define _mm512_exp2a23_ps(A) \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 57 | _mm512_exp2a23_round_ps((A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 58 | |
| 59 | #define _mm512_mask_exp2a23_ps(S, M, A) \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 60 | _mm512_mask_exp2a23_round_ps((S), (M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 61 | |
| 62 | #define _mm512_maskz_exp2a23_ps(M, A) \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 63 | _mm512_maskz_exp2a23_round_ps((M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | 2a898bf | 2015-02-01 21:34:11 +0000 | [diff] [blame] | 64 | |
Craig Topper | 73d1d40 | 2018-05-30 22:33:21 +0000 | [diff] [blame] | 65 | /* rsqrt28 */ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 66 | #define _mm512_rsqrt28_round_pd(A, R) \ |
Craig Topper | b01fc31 | 2015-02-01 08:05:12 +0000 | [diff] [blame] | 67 | (__m512d)__builtin_ia32_rsqrt28pd_mask((__v8df)(__m512d)(A), \ |
| 68 | (__v8df)_mm512_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 69 | (__mmask8)-1, (int)(R)) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 70 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 71 | #define _mm512_mask_rsqrt28_round_pd(S, M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 72 | (__m512d)__builtin_ia32_rsqrt28pd_mask((__v8df)(__m512d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 73 | (__v8df)(__m512d)(S), (__mmask8)(M), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 74 | (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 75 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 76 | #define _mm512_maskz_rsqrt28_round_pd(M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 77 | (__m512d)__builtin_ia32_rsqrt28pd_mask((__v8df)(__m512d)(A), \ |
| 78 | (__v8df)_mm512_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 79 | (__mmask8)(M), (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 80 | |
| 81 | #define _mm512_rsqrt28_pd(A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 82 | _mm512_rsqrt28_round_pd((A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 83 | |
| 84 | #define _mm512_mask_rsqrt28_pd(S, M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 85 | _mm512_mask_rsqrt28_round_pd((S), (M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 86 | |
| 87 | #define _mm512_maskz_rsqrt28_pd(M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 88 | _mm512_maskz_rsqrt28_round_pd((M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 89 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 90 | #define _mm512_rsqrt28_round_ps(A, R) \ |
Craig Topper | b01fc31 | 2015-02-01 08:05:12 +0000 | [diff] [blame] | 91 | (__m512)__builtin_ia32_rsqrt28ps_mask((__v16sf)(__m512)(A), \ |
| 92 | (__v16sf)_mm512_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 93 | (__mmask16)-1, (int)(R)) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 94 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 95 | #define _mm512_mask_rsqrt28_round_ps(S, M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 96 | (__m512)__builtin_ia32_rsqrt28ps_mask((__v16sf)(__m512)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 97 | (__v16sf)(__m512)(S), (__mmask16)(M), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 98 | (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 99 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 100 | #define _mm512_maskz_rsqrt28_round_ps(M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 101 | (__m512)__builtin_ia32_rsqrt28ps_mask((__v16sf)(__m512)(A), \ |
| 102 | (__v16sf)_mm512_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 103 | (__mmask16)(M), (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 104 | |
| 105 | #define _mm512_rsqrt28_ps(A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 106 | _mm512_rsqrt28_round_ps((A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 107 | |
| 108 | #define _mm512_mask_rsqrt28_ps(S, M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 109 | _mm512_mask_rsqrt28_round_ps((S), (M), A, _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 110 | |
| 111 | #define _mm512_maskz_rsqrt28_ps(M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 112 | _mm512_maskz_rsqrt28_round_ps((M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 113 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 114 | #define _mm_rsqrt28_round_ss(A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 115 | (__m128)__builtin_ia32_rsqrt28ss_round_mask((__v4sf)(__m128)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 116 | (__v4sf)(__m128)(B), \ |
| 117 | (__v4sf)_mm_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 118 | (__mmask8)-1, (int)(R)) |
Craig Topper | b01fc31 | 2015-02-01 08:05:12 +0000 | [diff] [blame] | 119 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 120 | #define _mm_mask_rsqrt28_round_ss(S, M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 121 | (__m128)__builtin_ia32_rsqrt28ss_round_mask((__v4sf)(__m128)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 122 | (__v4sf)(__m128)(B), \ |
| 123 | (__v4sf)(__m128)(S), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 124 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 125 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 126 | #define _mm_maskz_rsqrt28_round_ss(M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 127 | (__m128)__builtin_ia32_rsqrt28ss_round_mask((__v4sf)(__m128)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 128 | (__v4sf)(__m128)(B), \ |
| 129 | (__v4sf)_mm_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 130 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 131 | |
| 132 | #define _mm_rsqrt28_ss(A, B) \ |
| 133 | _mm_rsqrt28_round_ss((A), (B), _MM_FROUND_CUR_DIRECTION) |
| 134 | |
| 135 | #define _mm_mask_rsqrt28_ss(S, M, A, B) \ |
| 136 | _mm_mask_rsqrt28_round_ss((S), (M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
| 137 | |
| 138 | #define _mm_maskz_rsqrt28_ss(M, A, B) \ |
| 139 | _mm_maskz_rsqrt28_round_ss((M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
| 140 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 141 | #define _mm_rsqrt28_round_sd(A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 142 | (__m128d)__builtin_ia32_rsqrt28sd_round_mask((__v2df)(__m128d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 143 | (__v2df)(__m128d)(B), \ |
| 144 | (__v2df)_mm_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 145 | (__mmask8)-1, (int)(R)) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 146 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 147 | #define _mm_mask_rsqrt28_round_sd(S, M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 148 | (__m128d)__builtin_ia32_rsqrt28sd_round_mask((__v2df)(__m128d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 149 | (__v2df)(__m128d)(B), \ |
| 150 | (__v2df)(__m128d)(S), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 151 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 152 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 153 | #define _mm_maskz_rsqrt28_round_sd(M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 154 | (__m128d)__builtin_ia32_rsqrt28sd_round_mask((__v2df)(__m128d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 155 | (__v2df)(__m128d)(B), \ |
| 156 | (__v2df)_mm_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 157 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 158 | |
| 159 | #define _mm_rsqrt28_sd(A, B) \ |
| 160 | _mm_rsqrt28_round_sd((A), (B), _MM_FROUND_CUR_DIRECTION) |
| 161 | |
| 162 | #define _mm_mask_rsqrt28_sd(S, M, A, B) \ |
| 163 | _mm_mask_rsqrt28_round_sd((S), (M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
| 164 | |
| 165 | #define _mm_maskz_rsqrt28_sd(M, A, B) \ |
Michael Zuckerman | 1a7889f | 2016-06-05 15:57:49 +0000 | [diff] [blame] | 166 | _mm_maskz_rsqrt28_round_sd((M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 167 | |
Craig Topper | 73d1d40 | 2018-05-30 22:33:21 +0000 | [diff] [blame] | 168 | /* rcp28 */ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 169 | #define _mm512_rcp28_round_pd(A, R) \ |
Craig Topper | b01fc31 | 2015-02-01 08:05:12 +0000 | [diff] [blame] | 170 | (__m512d)__builtin_ia32_rcp28pd_mask((__v8df)(__m512d)(A), \ |
| 171 | (__v8df)_mm512_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 172 | (__mmask8)-1, (int)(R)) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 173 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 174 | #define _mm512_mask_rcp28_round_pd(S, M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 175 | (__m512d)__builtin_ia32_rcp28pd_mask((__v8df)(__m512d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 176 | (__v8df)(__m512d)(S), (__mmask8)(M), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 177 | (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 178 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 179 | #define _mm512_maskz_rcp28_round_pd(M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 180 | (__m512d)__builtin_ia32_rcp28pd_mask((__v8df)(__m512d)(A), \ |
| 181 | (__v8df)_mm512_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 182 | (__mmask8)(M), (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 183 | |
| 184 | #define _mm512_rcp28_pd(A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 185 | _mm512_rcp28_round_pd((A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 186 | |
| 187 | #define _mm512_mask_rcp28_pd(S, M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 188 | _mm512_mask_rcp28_round_pd((S), (M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 189 | |
| 190 | #define _mm512_maskz_rcp28_pd(M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 191 | _mm512_maskz_rcp28_round_pd((M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 192 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 193 | #define _mm512_rcp28_round_ps(A, R) \ |
Craig Topper | b01fc31 | 2015-02-01 08:05:12 +0000 | [diff] [blame] | 194 | (__m512)__builtin_ia32_rcp28ps_mask((__v16sf)(__m512)(A), \ |
| 195 | (__v16sf)_mm512_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 196 | (__mmask16)-1, (int)(R)) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 197 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 198 | #define _mm512_mask_rcp28_round_ps(S, M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 199 | (__m512)__builtin_ia32_rcp28ps_mask((__v16sf)(__m512)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 200 | (__v16sf)(__m512)(S), (__mmask16)(M), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 201 | (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 202 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 203 | #define _mm512_maskz_rcp28_round_ps(M, A, R) \ |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 204 | (__m512)__builtin_ia32_rcp28ps_mask((__v16sf)(__m512)(A), \ |
| 205 | (__v16sf)_mm512_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 206 | (__mmask16)(M), (int)(R)) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 207 | |
| 208 | #define _mm512_rcp28_ps(A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 209 | _mm512_rcp28_round_ps((A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 210 | |
| 211 | #define _mm512_mask_rcp28_ps(S, M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 212 | _mm512_mask_rcp28_round_ps((S), (M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 213 | |
| 214 | #define _mm512_maskz_rcp28_ps(M, A) \ |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 215 | _mm512_maskz_rcp28_round_ps((M), (A), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | c4b852a | 2015-02-01 08:52:55 +0000 | [diff] [blame] | 216 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 217 | #define _mm_rcp28_round_ss(A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 218 | (__m128)__builtin_ia32_rcp28ss_round_mask((__v4sf)(__m128)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 219 | (__v4sf)(__m128)(B), \ |
| 220 | (__v4sf)_mm_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 221 | (__mmask8)-1, (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 222 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 223 | #define _mm_mask_rcp28_round_ss(S, M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 224 | (__m128)__builtin_ia32_rcp28ss_round_mask((__v4sf)(__m128)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 225 | (__v4sf)(__m128)(B), \ |
| 226 | (__v4sf)(__m128)(S), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 227 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 228 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 229 | #define _mm_maskz_rcp28_round_ss(M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 230 | (__m128)__builtin_ia32_rcp28ss_round_mask((__v4sf)(__m128)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 231 | (__v4sf)(__m128)(B), \ |
| 232 | (__v4sf)_mm_setzero_ps(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 233 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 234 | |
| 235 | #define _mm_rcp28_ss(A, B) \ |
| 236 | _mm_rcp28_round_ss((A), (B), _MM_FROUND_CUR_DIRECTION) |
| 237 | |
| 238 | #define _mm_mask_rcp28_ss(S, M, A, B) \ |
| 239 | _mm_mask_rcp28_round_ss((S), (M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
| 240 | |
| 241 | #define _mm_maskz_rcp28_ss(M, A, B) \ |
| 242 | _mm_maskz_rcp28_round_ss((M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
Craig Topper | b01fc31 | 2015-02-01 08:05:12 +0000 | [diff] [blame] | 243 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 244 | #define _mm_rcp28_round_sd(A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 245 | (__m128d)__builtin_ia32_rcp28sd_round_mask((__v2df)(__m128d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 246 | (__v2df)(__m128d)(B), \ |
| 247 | (__v2df)_mm_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 248 | (__mmask8)-1, (int)(R)) |
Elena Demikhovsky | fcc6df3 | 2014-07-22 11:31:39 +0000 | [diff] [blame] | 249 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 250 | #define _mm_mask_rcp28_round_sd(S, M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 251 | (__m128d)__builtin_ia32_rcp28sd_round_mask((__v2df)(__m128d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 252 | (__v2df)(__m128d)(B), \ |
| 253 | (__v2df)(__m128d)(S), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 254 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 255 | |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 256 | #define _mm_maskz_rcp28_round_sd(M, A, B, R) \ |
Igor Breger | 9c2a0bf | 2016-02-08 12:36:48 +0000 | [diff] [blame] | 257 | (__m128d)__builtin_ia32_rcp28sd_round_mask((__v2df)(__m128d)(A), \ |
Craig Topper | 0bb4664 | 2016-05-17 04:41:38 +0000 | [diff] [blame] | 258 | (__v2df)(__m128d)(B), \ |
| 259 | (__v2df)_mm_setzero_pd(), \ |
Craig Topper | c633867 | 2018-05-31 00:51:20 +0000 | [diff] [blame] | 260 | (__mmask8)(M), (int)(R)) |
Craig Topper | da97c20 | 2015-02-01 10:15:11 +0000 | [diff] [blame] | 261 | |
| 262 | #define _mm_rcp28_sd(A, B) \ |
| 263 | _mm_rcp28_round_sd((A), (B), _MM_FROUND_CUR_DIRECTION) |
| 264 | |
| 265 | #define _mm_mask_rcp28_sd(S, M, A, B) \ |
| 266 | _mm_mask_rcp28_round_sd((S), (M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
| 267 | |
| 268 | #define _mm_maskz_rcp28_sd(M, A, B) \ |
| 269 | _mm_maskz_rcp28_round_sd((M), (A), (B), _MM_FROUND_CUR_DIRECTION) |
| 270 | |
Craig Topper | 73d1d40 | 2018-05-30 22:33:21 +0000 | [diff] [blame] | 271 | #endif /* __AVX512ERINTRIN_H */ |