Marat Dukhan | 9b474cf | 2021-05-25 16:37:48 -0700 | [diff] [blame] | 1 | # Copyright 2021 Google LLC |
| 2 | # |
| 3 | # This source code is licensed under the BSD-style license found in the |
| 4 | # LICENSE file in the root directory of this source tree. |
| 5 | |
Frank Barchard | 98af05c | 2021-06-30 12:15:04 -0700 | [diff] [blame] | 6 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16__aarch64_neon_mlal_lane_prfm_cortex_a53 |
| 7 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 8 | k-block: 8 |
| 9 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16__aarch64_neon_mlal_lane_cortex_a53 |
| 10 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 11 | k-block: 8 |
Frank Barchard | 1a0b276 | 2021-06-29 18:37:59 -0700 | [diff] [blame] | 12 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_cortex_a55 |
| 13 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 14 | k-block: 16 |
| 15 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_ld64 |
| 16 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 17 | k-block: 8 |
| 18 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c4__aarch64_neondot_ld128 |
| 19 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 20 | k-block: 16 |
Marat Dukhan | cf05585 | 2021-06-26 09:05:09 -0700 | [diff] [blame] | 21 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x16__neon_mlal_lane |
| 22 | init: xnn_init_qs8_conv_minmax_fp32_neon_params |
| 23 | k-block: 8 |
| 24 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16__neon_mlal_lane |
| 25 | init: xnn_init_qs8_conv_minmax_fp32_neon_params |
| 26 | k-block: 8 |
| 27 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x16__neonv8_mlal_lane |
| 28 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 29 | k-block: 8 |
| 30 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16__neonv8_mlal_lane |
| 31 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 32 | k-block: 8 |
| 33 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c8__neon_mlal_padal |
| 34 | init: xnn_init_qs8_conv_minmax_fp32_neon_params |
| 35 | k-block: 16 |
| 36 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c8__neon_mlal_padal |
| 37 | init: xnn_init_qs8_conv_minmax_fp32_neon_params |
| 38 | k-block: 16 |
| 39 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c8__neonv8_mlal_padal |
| 40 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 41 | k-block: 16 |
| 42 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c8__neonv8_mlal_padal |
| 43 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 44 | k-block: 16 |
Marat Dukhan | 18630de | 2021-06-02 22:20:01 -0700 | [diff] [blame] | 45 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c4__neondot |
| 46 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 47 | k-block: 8 |
| 48 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x8c4__neondot |
| 49 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 50 | k-block: 8 |
| 51 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_6x8c4__neondot |
| 52 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 53 | k-block: 8 |
| 54 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_8x8c4__neondot |
| 55 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 56 | k-block: 8 |
| 57 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x16c4__neondot |
| 58 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 59 | k-block: 8 |
| 60 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c4__neondot |
| 61 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 62 | k-block: 8 |
| 63 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_6x16c4__neondot |
| 64 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 65 | k-block: 8 |
| 66 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_8x16c4__neondot |
| 67 | init: xnn_init_qs8_conv_minmax_fp32_neonv8_params |
| 68 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 69 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 70 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 71 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 72 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 73 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 74 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 75 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 76 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 77 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 78 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 79 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 80 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 81 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 82 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 83 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 84 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 85 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 86 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 87 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 88 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 89 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 90 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 91 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 92 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 93 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 94 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 95 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 96 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 97 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 98 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 99 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 100 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 101 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 102 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 103 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 104 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 105 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 106 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 107 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 108 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 109 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 110 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 111 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 112 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 113 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 114 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 115 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 116 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 117 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 118 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 119 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 120 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 121 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 122 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 123 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 124 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 125 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 126 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 127 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 128 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 129 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 130 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 131 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 132 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 133 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 134 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 135 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 136 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 137 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 138 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 139 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 140 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 141 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 142 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 143 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 144 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 145 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 146 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 147 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 148 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 149 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 150 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 151 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 152 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 153 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 154 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 155 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 156 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 157 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 158 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 159 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 160 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 161 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 162 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 163 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 164 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 165 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 166 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 167 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 168 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 169 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 170 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 171 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse2_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 172 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 173 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 174 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__ssse3_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 175 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 176 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 177 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__ssse3_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 178 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 179 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 180 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__ssse3_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 181 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 182 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 183 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 184 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 185 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 186 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 187 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 188 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 189 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse41_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 190 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 191 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 192 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 193 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 194 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 195 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 196 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 197 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 198 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__avx_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 199 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 200 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 201 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 202 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 203 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 204 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 205 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 206 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 207 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__xop_ld64 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 208 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 209 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 210 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 211 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 212 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 213 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 214 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 215 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 216 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse2_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 217 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 218 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 219 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__ssse3_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 220 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 221 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 222 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__ssse3_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 223 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 224 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 225 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__ssse3_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 226 | init: xnn_init_qs8_conv_minmax_fp32_sse2_params |
| 227 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 228 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 229 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 230 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 231 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 232 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 233 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 234 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse41_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 235 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 236 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 237 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 238 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 239 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 240 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 241 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 242 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 243 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__avx_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 244 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 245 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 246 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 247 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 248 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 249 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 250 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 251 | k-block: 8 |
Marat Dukhan | 801d2c2 | 2021-06-02 21:25:05 -0700 | [diff] [blame] | 252 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__xop_ld128 |
Marat Dukhan | c46e671 | 2021-06-01 19:00:16 -0700 | [diff] [blame] | 253 | init: xnn_init_qs8_conv_minmax_fp32_sse4_params |
| 254 | k-block: 8 |
Marat Dukhan | 9b474cf | 2021-05-25 16:37:48 -0700 | [diff] [blame] | 255 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c8__avx2 |
| 256 | init: xnn_init_qs8_conv_minmax_fp32_avx2_params |
| 257 | k-block: 8 |
| 258 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c8__avx2 |
| 259 | init: xnn_init_qs8_conv_minmax_fp32_avx2_params |
| 260 | k-block: 8 |
| 261 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x8c8__avx2 |
| 262 | init: xnn_init_qs8_conv_minmax_fp32_avx2_params |
| 263 | k-block: 8 |
Marat Dukhan | 71855ee | 2021-05-25 19:05:06 -0700 | [diff] [blame] | 264 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x16c8__avx512skx |
| 265 | init: xnn_init_qs8_conv_minmax_fp32_avx512_params |
| 266 | k-block: 8 |
| 267 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x16c8__avx512skx |
| 268 | init: xnn_init_qs8_conv_minmax_fp32_avx512_params |
| 269 | k-block: 8 |
| 270 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx |
| 271 | init: xnn_init_qs8_conv_minmax_fp32_avx512_params |
| 272 | k-block: 8 |
| 273 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx |
| 274 | init: xnn_init_qs8_conv_minmax_fp32_avx512_params |
| 275 | k-block: 8 |
Marat Dukhan | 4741e41 | 2021-06-30 13:38:06 -0700 | [diff] [blame^] | 276 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__wasmsimd_ld64 |
| 277 | init: xnn_init_qs8_conv_minmax_fp32_wasmsimd_params |
| 278 | k-block: 8 |
| 279 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__wasmsimd_ld64 |
| 280 | init: xnn_init_qs8_conv_minmax_fp32_wasmsimd_params |
| 281 | k-block: 8 |
| 282 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__wasmsimd_ld64 |
| 283 | init: xnn_init_qs8_conv_minmax_fp32_wasmsimd_params |
| 284 | k-block: 8 |
| 285 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__wasmsimd_ld128 |
| 286 | init: xnn_init_qs8_conv_minmax_fp32_wasmsimd_params |
| 287 | k-block: 8 |
| 288 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__wasmsimd_ld128 |
| 289 | init: xnn_init_qs8_conv_minmax_fp32_wasmsimd_params |
| 290 | k-block: 8 |
| 291 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__wasmsimd_ld128 |
| 292 | init: xnn_init_qs8_conv_minmax_fp32_wasmsimd_params |
| 293 | k-block: 8 |
Marat Dukhan | 779b253 | 2021-06-29 14:14:13 -0700 | [diff] [blame] | 294 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x2__scalar_lrint |
| 295 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 296 | k-block: 1 |
| 297 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x2__scalar_lrint |
| 298 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 299 | k-block: 1 |
| 300 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x2__scalar_lrint |
| 301 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 302 | k-block: 1 |
| 303 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x2__scalar_lrint |
| 304 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 305 | k-block: 1 |
| 306 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4__scalar_lrint |
| 307 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 308 | k-block: 1 |
| 309 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4__scalar_lrint |
| 310 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 311 | k-block: 1 |
| 312 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4__scalar_lrint |
| 313 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 314 | k-block: 1 |
| 315 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4__scalar_lrint |
| 316 | init: xnn_init_qs8_conv_minmax_fp32_scalar_lrint_params |
| 317 | k-block: 1 |
| 318 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x2__scalar_magic |
| 319 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 320 | k-block: 1 |
| 321 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x2__scalar_magic |
| 322 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 323 | k-block: 1 |
| 324 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x2__scalar_magic |
| 325 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 326 | k-block: 1 |
| 327 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x2__scalar_magic |
| 328 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 329 | k-block: 1 |
| 330 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4__scalar_magic |
| 331 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 332 | k-block: 1 |
| 333 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4__scalar_magic |
| 334 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 335 | k-block: 1 |
| 336 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4__scalar_magic |
| 337 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 338 | k-block: 1 |
| 339 | - name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4__scalar_magic |
| 340 | init: xnn_init_qs8_conv_minmax_fp32_scalar_magic_params |
| 341 | k-block: 1 |