# blob: 43dae10667cc5e6ead7085012fc6ed3b18757549
# Copyright 2021 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
# NEON "mlal_lane" entries. The __neon_ and __neonv8_ variants each reference
# their own params initializer; all four entries use k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x16__neon_mlal_lane
  init: xnn_init_qu8_conv_minmax_fp32_neon_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x16__neon_mlal_lane
  init: xnn_init_qu8_conv_minmax_fp32_neon_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x16__neonv8_mlal_lane
  init: xnn_init_qu8_conv_minmax_fp32_neonv8_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x16__neonv8_mlal_lane
  init: xnn_init_qu8_conv_minmax_fp32_neonv8_params
  k-block: 8
# x86 "4c2 ... ld64" entries for the sse2, sse41, avx and xop variants
# (1x through 4x). Every entry in this group, including the sse41/avx/xop
# ones, references the sse2 params initializer and uses k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
# x86 "4c2 ... ld128" entries for the sse2, sse41, avx and xop variants
# (1x through 4x). Every entry in this group, including the sse41/avx/xop
# ones, references the sse2 params initializer and uses k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
# x86 "4c8 ... ld64" entries for the sse2, sse41, avx and xop variants
# (1x through 3x). Every entry in this group, including the sse41/avx/xop
# ones, references the sse2 params initializer and uses k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__sse2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__sse41_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__avx_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__xop_ld64
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
# x86 "4c8 ... ld128" entries for the sse2, sse41, avx and xop variants
# (1x through 3x). Every entry in this group, including the sse41/avx/xop
# ones, references the sse2 params initializer and uses k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__sse2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__sse41_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__avx_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__xop_ld128
  init: xnn_init_qu8_conv_minmax_fp32_sse2_params
  k-block: 8
# AVX2 ("8c8", 1x through 3x) and AVX512SKX ("16c8", 1x through 4x) entries.
# Each family references its own params initializer (avx2 / avx512); all
# entries use k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x8c8__avx2
  init: xnn_init_qu8_conv_minmax_fp32_avx2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x8c8__avx2
  init: xnn_init_qu8_conv_minmax_fp32_avx2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x8c8__avx2
  init: xnn_init_qu8_conv_minmax_fp32_avx2_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x16c8__avx512skx
  init: xnn_init_qu8_conv_minmax_fp32_avx512_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x16c8__avx512skx
  init: xnn_init_qu8_conv_minmax_fp32_avx512_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x16c8__avx512skx
  init: xnn_init_qu8_conv_minmax_fp32_avx512_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x16c8__avx512skx
  init: xnn_init_qu8_conv_minmax_fp32_avx512_params
  k-block: 8
# WAsm SIMD "dot16x2" entries with the "4c2" layout, ld64 then ld128
# (1x through 4x each). All reference the wasmsimd params initializer and
# use k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c2__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c2__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c2__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c2__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
# WAsm SIMD "dot16x2" entries with the "4c8" layout, ld64 then ld128
# (1x through 4x each). All reference the wasmsimd params initializer and
# use k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c8__wasmsimd_dot16x2_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4c8__wasmsimd_dot16x2_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
# WAsm SIMD "mul32" entries with the "4c8" layout, ld64 then ld128
# (1x through 3x each). All reference the wasmsimd params initializer and
# use k-block 8.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__wasmsimd_mul32_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__wasmsimd_mul32_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__wasmsimd_mul32_ld64
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4c8__wasmsimd_mul32_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4c8__wasmsimd_mul32_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4c8__wasmsimd_mul32_ld128
  init: xnn_init_qu8_conv_minmax_fp32_wasmsimd_params
  k-block: 8
# Scalar "lrint" entries: the "x2" names (1x through 4x) followed by the
# "x4" names (1x through 4x). All reference the scalar_lrint params
# initializer and, unlike the SIMD groups in this file, use k-block 1.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x2__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x2__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x2__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x2__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4__scalar_lrint
  init: xnn_init_qu8_conv_minmax_fp32_scalar_lrint_params
  k-block: 1
# Scalar "magic" entries: the "x2" names (1x through 4x) followed by the
# "x4" names (1x through 4x). All reference the scalar_magic params
# initializer and, unlike the SIMD groups in this file, use k-block 1.
# `init` and `k-block` are nested under the `- name` item they belong to.
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x2__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x2__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x2__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x2__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_1x4__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_2x4__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_3x4__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1
- name: xnn_qu8_igemm_minmax_fp32_ukernel_4x4__scalar_magic
  init: xnn_init_qu8_conv_minmax_fp32_scalar_magic_params
  k-block: 1