blob: 8f337f501d4db4684ab787e0ff7ec3731a919465 [file] [log] [blame]
Marat Dukhan9b474cf2021-05-25 16:37:48 -07001# Copyright 2021 Google LLC
2#
3# This source code is licensed under the BSD-style license found in the
4# LICENSE file in the root directory of this source tree.
5
Marat Dukhan18630de2021-06-02 22:20:01 -07006- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c4__neondot
7 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
8 k-block: 8
9- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x8c4__neondot
10 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
11 k-block: 8
12- name: xnn_qs8_igemm_minmax_fp32_ukernel_6x8c4__neondot
13 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
14 k-block: 8
15- name: xnn_qs8_igemm_minmax_fp32_ukernel_8x8c4__neondot
16 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
17 k-block: 8
18- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x16c4__neondot
19 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
20 k-block: 8
21- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c4__neondot
22 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
23 k-block: 8
24- name: xnn_qs8_igemm_minmax_fp32_ukernel_6x16c4__neondot
25 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
26 k-block: 8
27- name: xnn_qs8_igemm_minmax_fp32_ukernel_8x16c4__neondot
28 init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
29 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070030- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070031 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
32 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070033- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070034 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
35 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070036- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070037 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
38 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070039- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070040 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
41 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070042- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070043 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
44 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070045- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070046 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
47 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070048- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070049 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
50 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070051- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070052 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
53 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070054- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070055 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
56 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070057- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070058 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
59 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070060- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070061 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
62 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070063- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070064 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
65 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070066- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070067 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
68 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070069- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070070 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
71 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070072- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070073 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
74 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070075- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -070076 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
77 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070078- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070079 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
80 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070081- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070082 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
83 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070084- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070085 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
86 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070087- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070088 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
89 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070090- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070091 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
92 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070093- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070094 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
95 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070096- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -070097 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
98 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -070099- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700100 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
101 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700102- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700103 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
104 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700105- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700106 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
107 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700108- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700109 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
110 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700111- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700112 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
113 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700114- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c2__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700115 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
116 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700117- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c2__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700118 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
119 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700120- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c2__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700121 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
122 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700123- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x4c2__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700124 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
125 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700126- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700127 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
128 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700129- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700130 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
131 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700132- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse2_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700133 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
134 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700135- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__ssse3_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700136 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
137 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700138- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__ssse3_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700139 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
140 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700141- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__ssse3_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700142 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
143 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700144- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700145 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
146 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700147- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700148 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
149 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700150- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse41_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700151 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
152 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700153- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700154 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
155 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700156- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700157 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
158 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700159- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__avx_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700160 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
161 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700162- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700163 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
164 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700165- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700166 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
167 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700168- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__xop_ld64
Marat Dukhanc46e6712021-06-01 19:00:16 -0700169 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
170 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700171- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700172 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
173 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700174- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700175 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
176 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700177- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse2_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700178 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
179 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700180- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__ssse3_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700181 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
182 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700183- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__ssse3_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700184 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
185 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700186- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__ssse3_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700187 init: xnn_init_qs8_conv_minmax_fp32_sse2_params
188 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700189- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700190 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
191 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700192- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700193 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
194 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700195- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__sse41_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700196 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
197 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700198- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700199 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
200 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700201- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700202 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
203 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700204- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__avx_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700205 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
206 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700207- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x4c8__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700208 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
209 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700210- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x4c8__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700211 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
212 k-block: 8
Marat Dukhan801d2c22021-06-02 21:25:05 -0700213- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x4c8__xop_ld128
Marat Dukhanc46e6712021-06-01 19:00:16 -0700214 init: xnn_init_qs8_conv_minmax_fp32_sse4_params
215 k-block: 8
Marat Dukhan9b474cf2021-05-25 16:37:48 -0700216- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c8__avx2
217 init: xnn_init_qs8_conv_minmax_fp32_avx2_params
218 k-block: 8
219- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c8__avx2
220 init: xnn_init_qs8_conv_minmax_fp32_avx2_params
221 k-block: 8
222- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x8c8__avx2
223 init: xnn_init_qs8_conv_minmax_fp32_avx2_params
224 k-block: 8
Marat Dukhan71855ee2021-05-25 19:05:06 -0700225- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x16c8__avx512skx
226 init: xnn_init_qs8_conv_minmax_fp32_avx512_params
227 k-block: 8
228- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x16c8__avx512skx
229 init: xnn_init_qs8_conv_minmax_fp32_avx512_params
230 k-block: 8
231- name: xnn_qs8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx
232 init: xnn_init_qs8_conv_minmax_fp32_avx512_params
233 k-block: 8
234- name: xnn_qs8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx
235 init: xnn_init_qs8_conv_minmax_fp32_avx512_params
236 k-block: 8