blob: 08d7c5343ed3cc4f15d89ad83b9a0ab2e4e2f896 [file] [log] [blame]
XNNPACK Teamb455b122019-09-27 18:10:33 -07001# Copyright 2019 Google LLC
2#
3# This source code is licensed under the BSD-style license found in the
4# LICENSE file in the root directory of this source tree.
Frank Barchard21be34f2019-10-09 19:32:19 -07005- name: xnn_f32_gemminc_ukernel_1x8__aarch64_neonfma_cortex_a53
6 k-block: 8
7 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -07008 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -07009- name: xnn_f32_gemminc_ukernel_1x8__aarch64_neonfma_cortex_a57
10 k-block: 8
11 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070012 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070013- name: xnn_f32_gemminc_ukernel_1x8__aarch64_neonfma_cortex_a75
14 k-block: 8
15 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070016 assembly: true
Frank Barchard46fb8072019-10-25 12:54:22 -070017- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a53
Frank Barchard0ecc2ab2019-11-14 10:57:48 -080018 k-block: 4
19 pipelined: true
Frank Barchard46fb8072019-10-25 12:54:22 -070020 assembly: true
Frank Barchard8fb90552020-03-16 11:36:09 -070021- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a55
22 k-block: 4
23 pipelined: true
24 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070025- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a57
26 k-block: 8
27 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070028 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070029- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_cortex_a75
30 k-block: 8
31 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070032 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070033- name: xnn_f32_gemminc_ukernel_5x8__aarch64_neonfma_cortex_a75
34 k-block: 8
35 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070036 assembly: true
Frank Barcharda7fb8552019-10-23 17:14:17 -070037- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a53
Frank Barchard00bf68e2019-10-27 03:00:09 -070038 k-block: 4
Frank Barcharde64f91a2019-11-11 13:18:00 -080039 pipelined: true
Frank Barcharda7fb8552019-10-23 17:14:17 -070040 assembly: true
Frank Barchard91e19992020-03-09 18:46:14 -070041- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a55
42 k-block: 4
43 pipelined: true
44 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070045- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a57
Frank Barchardbd419712019-10-31 14:15:36 -070046 k-block: 4
Frank Barchard7e955972019-10-11 10:34:25 -070047 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070048- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a73
49 k-block: 8
50 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070051 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070052- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_cortex_a75
53 k-block: 8
54 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070055 assembly: true
Frank Barchard0d1052c2020-03-23 17:28:13 -070056- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_ios
57 k-block: 8
58 pipelined: true
59 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070060- name: xnn_f32_gemminc_ukernel_1x12__aarch64_neonfma_cortex_a53
61 k-block: 4
62 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070063 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070064- name: xnn_f32_gemminc_ukernel_4x12__aarch64_neonfma_cortex_a53
65 k-block: 4
66 pipelined: true
Frank Barchard7e955972019-10-11 10:34:25 -070067 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070068- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_ld64
69 k-block: 2
Frank Barchard7e955972019-10-11 10:34:25 -070070 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070071- name: xnn_f32_gemminc_ukernel_4x8__aarch64_neonfma_ld128
72 k-block: 4
Frank Barchard7e955972019-10-11 10:34:25 -070073 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070074- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_ld64
75 k-block: 2
Frank Barchard7e955972019-10-11 10:34:25 -070076 assembly: true
XNNPACK Teamb455b122019-09-27 18:10:33 -070077- name: xnn_f32_gemminc_ukernel_6x8__aarch64_neonfma_ld128
78 k-block: 4
Frank Barchard7e955972019-10-11 10:34:25 -070079 assembly: true
Frank Barchard91317c52019-11-22 10:54:35 -080080- name: xnn_f32_gemminc_ukernel_1x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070081 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080082- name: xnn_f32_gemminc_ukernel_4x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070083 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080084- name: xnn_f32_gemminc_ukernel_4x8__neon_lane_ld128
XNNPACK Teamb455b122019-09-27 18:10:33 -070085 k-block: 4
Frank Barchard91317c52019-11-22 10:54:35 -080086- name: xnn_f32_gemminc_ukernel_5x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070087 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080088- name: xnn_f32_gemminc_ukernel_6x8__neon_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070089 k-block: 2
Frank Barchard69172d92019-11-26 16:22:39 -080090- name: xnn_f32_gemminc_ukernel_6x8__neon_lane_ld128
91 k-block: 4
Frank Barchard91317c52019-11-22 10:54:35 -080092- name: xnn_f32_gemminc_ukernel_1x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070093 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080094 arch:
95 - aarch64
96- name: xnn_f32_gemminc_ukernel_4x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -070097 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -080098 arch:
99 - aarch64
100- name: xnn_f32_gemminc_ukernel_4x8__neonfma_lane_ld128
XNNPACK Teamb455b122019-09-27 18:10:33 -0700101 k-block: 4
Frank Barchard91317c52019-11-22 10:54:35 -0800102 arch:
103 - aarch64
104- name: xnn_f32_gemminc_ukernel_5x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -0700105 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -0800106 arch:
107 - aarch64
108- name: xnn_f32_gemminc_ukernel_6x8__neonfma_lane_ld64
XNNPACK Teamb455b122019-09-27 18:10:33 -0700109 k-block: 2
Frank Barchard91317c52019-11-22 10:54:35 -0800110 arch:
111 - aarch64
Frank Barchard69172d92019-11-26 16:22:39 -0800112- name: xnn_f32_gemminc_ukernel_6x8__neonfma_lane_ld128
113 k-block: 4
114 arch:
115 - aarch64
Frank Barchard5243bb02019-11-22 16:37:50 -0800116- name: xnn_f32_gemminc_ukernel_1x8__neon_dup_ld64
117 k-block: 2
118- name: xnn_f32_gemminc_ukernel_4x8__neon_dup_ld64
119 k-block: 2
120- name: xnn_f32_gemminc_ukernel_4x8__neon_dup_ld128
121 k-block: 4
122- name: xnn_f32_gemminc_ukernel_6x8__neon_dup_ld64
123 k-block: 2
Frank Barchard69172d92019-11-26 16:22:39 -0800124- name: xnn_f32_gemminc_ukernel_6x8__neon_dup_ld128
125 k-block: 4
Frank Barchard5243bb02019-11-22 16:37:50 -0800126- name: xnn_f32_gemminc_ukernel_1x8__neonfma_dup_ld64
127 k-block: 2
128- name: xnn_f32_gemminc_ukernel_4x8__neonfma_dup_ld64
129 k-block: 2
130- name: xnn_f32_gemminc_ukernel_4x8__neonfma_dup_ld128
131 k-block: 4
132- name: xnn_f32_gemminc_ukernel_6x8__neonfma_dup_ld64
133 k-block: 2
Frank Barchard69172d92019-11-26 16:22:39 -0800134- name: xnn_f32_gemminc_ukernel_6x8__neonfma_dup_ld128
135 k-block: 4
Frank Barchard5243bb02019-11-22 16:37:50 -0800136- name: xnn_f32_gemminc_ukernel_1x8s4__neon
137 k-block: 4
138- name: xnn_f32_gemminc_ukernel_4x8s4__neon
139 k-block: 4
140- name: xnn_f32_gemminc_ukernel_6x8s4__neon
141 k-block: 4
142- name: xnn_f32_gemminc_ukernel_8x8s4__neon
143 k-block: 4
Frank Barcharddf06d802019-11-20 15:53:46 -0800144- name: xnn_f32_gemminc_ukernel_1x8s4__neonfma
145 k-block: 4
146- name: xnn_f32_gemminc_ukernel_4x8s4__neonfma
147 k-block: 4
148- name: xnn_f32_gemminc_ukernel_6x8s4__neonfma
149 k-block: 4
150- name: xnn_f32_gemminc_ukernel_8x8s4__neonfma
151 k-block: 4
XNNPACK Teamb455b122019-09-27 18:10:33 -0700152- name: xnn_f32_gemminc_ukernel_1x8__sse_load1
153 k-block: 1
154- name: xnn_f32_gemminc_ukernel_4x8__sse_load1
155 k-block: 1
156- name: xnn_f32_gemminc_ukernel_1x8__sse_dup
157 k-block: 4
158- name: xnn_f32_gemminc_ukernel_4x8__sse_dup
159 k-block: 4
160- name: xnn_f32_gemminc_ukernel_1x8s4__sse
161 k-block: 4
162- name: xnn_f32_gemminc_ukernel_4x8s4__sse
163 k-block: 4
Marat Dukhanfda12b82019-11-21 12:27:59 -0800164- name: xnn_f32_gemminc_ukernel_1x8__avx_broadcast
165 k-block: 1
166- name: xnn_f32_gemminc_ukernel_4x8__avx_broadcast
167 k-block: 1
168- name: xnn_f32_gemminc_ukernel_5x8__avx_broadcast
169 k-block: 1
170- name: xnn_f32_gemminc_ukernel_6x8__avx_broadcast
171 k-block: 1
172- name: xnn_f32_gemminc_ukernel_7x8__avx_broadcast
173 k-block: 1
Marat Dukhan27121322019-12-09 14:57:40 -0800174- name: xnn_f32_gemminc_ukernel_1x16__avx_broadcast
175 k-block: 1
176- name: xnn_f32_gemminc_ukernel_3x16__avx_broadcast
177 k-block: 1
178- name: xnn_f32_gemminc_ukernel_4x16__avx_broadcast
179 k-block: 1
180- name: xnn_f32_gemminc_ukernel_5x16__avx_broadcast
181 k-block: 1
Marat Dukhanfda12b82019-11-21 12:27:59 -0800182- name: xnn_f32_gemminc_ukernel_1x8__fma3_broadcast
183 k-block: 1
184- name: xnn_f32_gemminc_ukernel_4x8__fma3_broadcast
185 k-block: 1
186- name: xnn_f32_gemminc_ukernel_5x8__fma3_broadcast
187 k-block: 1
188- name: xnn_f32_gemminc_ukernel_6x8__fma3_broadcast
189 k-block: 1
190- name: xnn_f32_gemminc_ukernel_7x8__fma3_broadcast
191 k-block: 1
192- name: xnn_f32_gemminc_ukernel_8x8__fma3_broadcast
193 k-block: 1
Marat Dukhan27121322019-12-09 14:57:40 -0800194- name: xnn_f32_gemminc_ukernel_1x16__fma3_broadcast
195 k-block: 1
196- name: xnn_f32_gemminc_ukernel_3x16__fma3_broadcast
197 k-block: 1
198- name: xnn_f32_gemminc_ukernel_4x16__fma3_broadcast
199 k-block: 1
200- name: xnn_f32_gemminc_ukernel_5x16__fma3_broadcast
201 k-block: 1
202- name: xnn_f32_gemminc_ukernel_1x16s4__fma3_broadcast
203 k-block: 4
204- name: xnn_f32_gemminc_ukernel_3x16s4__fma3_broadcast
205 k-block: 4
206- name: xnn_f32_gemminc_ukernel_4x16s4__fma3_broadcast
207 k-block: 4
208- name: xnn_f32_gemminc_ukernel_5x16s4__fma3_broadcast
209 k-block: 4
Marat Dukhan0f349c42019-11-27 11:58:54 -0800210- name: xnn_f32_gemminc_ukernel_1x16__avx512f_broadcast
211 k-block: 1
212- name: xnn_f32_gemminc_ukernel_4x16__avx512f_broadcast
213 k-block: 1
214- name: xnn_f32_gemminc_ukernel_5x16__avx512f_broadcast
215 k-block: 1
216- name: xnn_f32_gemminc_ukernel_6x16__avx512f_broadcast
217 k-block: 1
218- name: xnn_f32_gemminc_ukernel_7x16__avx512f_broadcast
219 k-block: 1
220- name: xnn_f32_gemminc_ukernel_8x16__avx512f_broadcast
221 k-block: 1
XNNPACK Teamb455b122019-09-27 18:10:33 -0700222- name: xnn_f32_gemminc_ukernel_1x8__psimd_loadsplat
223 k-block: 1
224- name: xnn_f32_gemminc_ukernel_4x8__psimd_loadsplat
225 k-block: 1
226- name: xnn_f32_gemminc_ukernel_6x8__psimd_loadsplat
227 k-block: 1
228- name: xnn_f32_gemminc_ukernel_1x8__psimd_splat
229 k-block: 4
230- name: xnn_f32_gemminc_ukernel_4x8__psimd_splat
231 k-block: 4
232- name: xnn_f32_gemminc_ukernel_6x8__psimd_splat
233 k-block: 4
234- name: xnn_f32_gemminc_ukernel_1x8s4__psimd
235 k-block: 4
236- name: xnn_f32_gemminc_ukernel_4x8s4__psimd
237 k-block: 4
238- name: xnn_f32_gemminc_ukernel_6x8s4__psimd
239 k-block: 4
Marat Dukhan436ebe62019-12-04 15:10:12 -0800240- name: xnn_f32_gemminc_ukernel_1x4__wasm
241 k-block: 1
242- name: xnn_f32_gemminc_ukernel_2x4__wasm
243 k-block: 1
244- name: xnn_f32_gemminc_ukernel_4x4__wasm
245 k-block: 1
XNNPACK Teamb455b122019-09-27 18:10:33 -0700246- name: xnn_f32_gemminc_ukernel_1x4__scalar
247 k-block: 1
248- name: xnn_f32_gemminc_ukernel_2x4__scalar
249 k-block: 1
250- name: xnn_f32_gemminc_ukernel_4x4__scalar
251 k-block: 1