blob: cb4670a12bcc8f56d2bda33f0eb745d79ddf365f [file] [log] [blame]
XNNPACK Teamb455b122019-09-27 18:10:33 -07001# Copyright 2019 Google LLC
2#
3# This source code is licensed under the BSD-style license found in the
4# LICENSE file in the root directory of this source tree.
Frank Barchard21be34f2019-10-09 19:32:19 -07005- name: xnn_f32_gemminc_ukernel_1x8__aarch64_neonfma_cortex_a53
6 k-block: 8
7 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -07008 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -07009- name: xnn_f32_gemminc_ukernel_1x8__aarch64_neonfma_cortex_a57
10 k-block: 8
11 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070012 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070013- name: xnn_f32_gemminc_ukernel_1x8__aarch64_neonfma_cortex_a75
14 k-block: 8
15 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070016 assembly: true
Frank Barchard46fb8072019-10-25 12:54:22 -070017- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a53
Frank Barchard0ecc2ab2019-11-14 10:57:48 -080018 k-block: 4
19 pipelined: true
Frank Barchard46fb8072019-10-25 12:54:22 -070020 assembly: true
Frank Barchard8fb90552020-03-16 11:36:09 -070021- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a55
22 k-block: 4
23 pipelined: true
24 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070025- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a57
26 k-block: 8
27 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070028 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070029- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a75
30 k-block: 8
31 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070032 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070033- name: xnn_f32_gemminc_ukernel_5x8__aarch64_neonfma_cortex_a75
34 k-block: 8
35 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070036 assembly: true
Frank Barcharda7fb8552019-10-23 17:14:17 -070037- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a53
Frank Barchard00bf68e2019-10-27 03:00:09 -070038 k-block: 4
Frank Barcharde64f91a2019-11-11 13:18:00 -080039 pipelined: true
Frank Barcharda7fb8552019-10-23 17:14:17 -070040 assembly: true
Frank Barchard91e19992020-03-09 18:46:14 -070041- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a55
42 k-block: 4
43 pipelined: true
44 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070045- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a57
Frank Barchardbd419712019-10-31 14:15:36 -070046 k-block: 4
Frank Barchard7e955972019-10-11 10:34:25 -070047 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070048- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a73
49 k-block: 8
50 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070051 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070052- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a75
53 k-block: 8
54 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070055 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070056- name: xnn_f32_gemminc_ukernel_1x12__aarch64_neonfma_cortex_a53
57 k-block: 4
58 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070059 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070060- name: xnn_f32_gemminc_ukernel_4x12__aarch64_neonfma_cortex_a53
61 k-block: 4
62 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070063 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070064- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_ld64
65 k-block: 2
Frank Barchard7e955972019-10-11 10:34:25 -070066 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070067- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_ld128
68 k-block: 4
Frank Barchard7e955972019-10-11 10:34:25 -070069 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070070- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_ld64
71 k-block: 2
Frank Barchard7e955972019-10-11 10:34:25 -070072 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070073- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_ld128
74 k-block: 4
Frank Barchard7e955972019-10-11 10:34:25 -070075 assembly: true
Frank Barchard91317c52019-11-22 10:54:35 -080076- name: xnn_f32_gemminc_ukernel_1x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070077 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080078- name: xnn_f32_gemminc_ukernel_4x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070079 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080080- name: xnn_f32_gemminc_ukernel_4x8__neon_lane_ld128
XNNPACK Teamb455b122019-09-27 18:10:33 -070081 k-block: 4
Frank Barchard91317c52019-11-22 10:54:35 -080082- name: xnn_f32_gemminc_ukernel_5x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070083 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080084- name: xnn_f32_gemminc_ukernel_6x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070085 k-block: 2
Frank Barchard69172d92019-11-26 16:22:39 -080086- name: xnn_f32_gemminc_ukernel_6x8__neon_lane_ld128
87 k-block: 4
Frank Barchard91317c52019-11-22 10:54:35 -080088- name: xnn_f32_gemminc_ukernel_1x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070089 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080090 arch:
91 - aarch64
92- name: xnn_f32_gemminc_ukernel_4x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070093 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080094 arch:
95 - aarch64
96- name: xnn_f32_gemminc_ukernel_4x8__neonfma_lane_ld128
XNNPACK Teamb455b122019-09-27 18:10:33 -070097 k-block: 4
Frank Barchard91317c52019-11-22 10:54:35 -080098 arch:
99 - aarch64
100- name: xnn_f32_gemminc_ukernel_5x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -0700101 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -0800102 arch:
103 - aarch64
104- name: xnn_f32_gemminc_ukernel_6x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -0700105 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -0800106 arch:
107 - aarch64
Frank Barchard69172d92019-11-26 16:22:39 -0800108- name: xnn_f32_gemminc_ukernel_6x8__neonfma_lane_ld128
109 k-block: 4
110 arch:
111 - aarch64
Frank Barchard5243bb02019-11-22 16:37:50 -0800112- name: xnn_f32_gemminc_ukernel_1x8__neon_dup_ld64
113 k-block: 2
114- name: xnn_f32_gemminc_ukernel_4x8__neon_dup_ld64
115 k-block: 2
116- name: xnn_f32_gemminc_ukernel_4x8__neon_dup_ld128
117 k-block: 4
118- name: xnn_f32_gemminc_ukernel_6x8__neon_dup_ld64
119 k-block: 2
Frank Barchard69172d92019-11-26 16:22:39 -0800120- name: xnn_f32_gemminc_ukernel_6x8__neon_dup_ld128
121 k-block: 4
Frank Barchard5243bb02019-11-22 16:37:50 -0800122- name: xnn_f32_gemminc_ukernel_1x8__neonfma_dup_ld64
123 k-block: 2
124- name: xnn_f32_gemminc_ukernel_4x8__neonfma_dup_ld64
125 k-block: 2
126- name: xnn_f32_gemminc_ukernel_4x8__neonfma_dup_ld128
127 k-block: 4
128- name: xnn_f32_gemminc_ukernel_6x8__neonfma_dup_ld64
129 k-block: 2
Frank Barchard69172d92019-11-26 16:22:39 -0800130- name: xnn_f32_gemminc_ukernel_6x8__neonfma_dup_ld128
131 k-block: 4
Frank Barchard5243bb02019-11-22 16:37:50 -0800132- name: xnn_f32_gemminc_ukernel_1x8s4__neon
133 k-block: 4
134- name: xnn_f32_gemminc_ukernel_4x8s4__neon
135 k-block: 4
136- name: xnn_f32_gemminc_ukernel_6x8s4__neon
137 k-block: 4
138- name: xnn_f32_gemminc_ukernel_8x8s4__neon
139 k-block: 4
Frank Barcharddf06d802019-11-20 15:53:46 -0800140- name: xnn_f32_gemminc_ukernel_1x8s4__neonfma
141 k-block: 4
142- name: xnn_f32_gemminc_ukernel_4x8s4__neonfma
143 k-block: 4
144- name: xnn_f32_gemminc_ukernel_6x8s4__neonfma
145 k-block: 4
146- name: xnn_f32_gemminc_ukernel_8x8s4__neonfma
147 k-block: 4
XNNPACK Teamb455b122019-09-27 18:10:33 -0700148- name: xnn_f32_gemminc_ukernel_1x8__sse_load1
149 k-block: 1
150- name: xnn_f32_gemminc_ukernel_4x8__sse_load1
151 k-block: 1
152- name: xnn_f32_gemminc_ukernel_1x8__sse_dup
153 k-block: 4
154- name: xnn_f32_gemminc_ukernel_4x8__sse_dup
155 k-block: 4
156- name: xnn_f32_gemminc_ukernel_1x8s4__sse
157 k-block: 4
158- name: xnn_f32_gemminc_ukernel_4x8s4__sse
159 k-block: 4
Marat Dukhanfda12b82019-11-21 12:27:59 -0800160- name: xnn_f32_gemminc_ukernel_1x8__avx_broadcast
161 k-block: 1
162- name: xnn_f32_gemminc_ukernel_4x8__avx_broadcast
163 k-block: 1
164- name: xnn_f32_gemminc_ukernel_5x8__avx_broadcast
165 k-block: 1
166- name: xnn_f32_gemminc_ukernel_6x8__avx_broadcast
167 k-block: 1
168- name: xnn_f32_gemminc_ukernel_7x8__avx_broadcast
169 k-block: 1
Marat Dukhan27121322019-12-09 14:57:40 -0800170- name: xnn_f32_gemminc_ukernel_1x16__avx_broadcast
171 k-block: 1
172- name: xnn_f32_gemminc_ukernel_3x16__avx_broadcast
173 k-block: 1
174- name: xnn_f32_gemminc_ukernel_4x16__avx_broadcast
175 k-block: 1
176- name: xnn_f32_gemminc_ukernel_5x16__avx_broadcast
177 k-block: 1
Marat Dukhanfda12b82019-11-21 12:27:59 -0800178- name: xnn_f32_gemminc_ukernel_1x8__fma3_broadcast
179 k-block: 1
180- name: xnn_f32_gemminc_ukernel_4x8__fma3_broadcast
181 k-block: 1
182- name: xnn_f32_gemminc_ukernel_5x8__fma3_broadcast
183 k-block: 1
184- name: xnn_f32_gemminc_ukernel_6x8__fma3_broadcast
185 k-block: 1
186- name: xnn_f32_gemminc_ukernel_7x8__fma3_broadcast
187 k-block: 1
188- name: xnn_f32_gemminc_ukernel_8x8__fma3_broadcast
189 k-block: 1
Marat Dukhan27121322019-12-09 14:57:40 -0800190- name: xnn_f32_gemminc_ukernel_1x16__fma3_broadcast
191 k-block: 1
192- name: xnn_f32_gemminc_ukernel_3x16__fma3_broadcast
193 k-block: 1
194- name: xnn_f32_gemminc_ukernel_4x16__fma3_broadcast
195 k-block: 1
196- name: xnn_f32_gemminc_ukernel_5x16__fma3_broadcast
197 k-block: 1
198- name: xnn_f32_gemminc_ukernel_1x16s4__fma3_broadcast
199 k-block: 4
200- name: xnn_f32_gemminc_ukernel_3x16s4__fma3_broadcast
201 k-block: 4
202- name: xnn_f32_gemminc_ukernel_4x16s4__fma3_broadcast
203 k-block: 4
204- name: xnn_f32_gemminc_ukernel_5x16s4__fma3_broadcast
205 k-block: 4
Marat Dukhan0f349c42019-11-27 11:58:54 -0800206- name: xnn_f32_gemminc_ukernel_1x16__avx512f_broadcast
207 k-block: 1
208- name: xnn_f32_gemminc_ukernel_4x16__avx512f_broadcast
209 k-block: 1
210- name: xnn_f32_gemminc_ukernel_5x16__avx512f_broadcast
211 k-block: 1
212- name: xnn_f32_gemminc_ukernel_6x16__avx512f_broadcast
213 k-block: 1
214- name: xnn_f32_gemminc_ukernel_7x16__avx512f_broadcast
215 k-block: 1
216- name: xnn_f32_gemminc_ukernel_8x16__avx512f_broadcast
217 k-block: 1
XNNPACK Teamb455b122019-09-27 18:10:33 -0700218- name: xnn_f32_gemminc_ukernel_1x8__psimd_loadsplat
219 k-block: 1
220- name: xnn_f32_gemminc_ukernel_4x8__psimd_loadsplat
221 k-block: 1
222- name: xnn_f32_gemminc_ukernel_6x8__psimd_loadsplat
223 k-block: 1
224- name: xnn_f32_gemminc_ukernel_1x8__psimd_splat
225 k-block: 4
226- name: xnn_f32_gemminc_ukernel_4x8__psimd_splat
227 k-block: 4
228- name: xnn_f32_gemminc_ukernel_6x8__psimd_splat
229 k-block: 4
230- name: xnn_f32_gemminc_ukernel_1x8s4__psimd
231 k-block: 4
232- name: xnn_f32_gemminc_ukernel_4x8s4__psimd
233 k-block: 4
234- name: xnn_f32_gemminc_ukernel_6x8s4__psimd
235 k-block: 4
Marat Dukhan436ebe62019-12-04 15:10:12 -0800236- name: xnn_f32_gemminc_ukernel_1x4__wasm
237 k-block: 1
238- name: xnn_f32_gemminc_ukernel_2x4__wasm
239 k-block: 1
240- name: xnn_f32_gemminc_ukernel_4x4__wasm
241 k-block: 1
XNNPACK Teamb455b122019-09-27 18:10:33 -0700242- name: xnn_f32_gemminc_ukernel_1x4__scalar
243 k-block: 1
244- name: xnn_f32_gemminc_ukernel_2x4__scalar
245 k-block: 1
246- name: xnn_f32_gemminc_ukernel_4x4__scalar
247 k-block: 1