Add LD1R and LD2R variants of the c2 microkernel
- Instead of 1 LD1 and 4 DUP instructions, use 4 LD1R or 2 LD2R instructions
PiperOrigin-RevId: 410613731
diff --git a/test/qs8-igemm-minmax-fp32.yaml b/test/qs8-igemm-minmax-fp32.yaml
index 174e5a0..7051d5d 100644
--- a/test/qs8-igemm-minmax-fp32.yaml
+++ b/test/qs8-igemm-minmax-fp32.yaml
@@ -3,6 +3,30 @@
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2__neon_mlal_ld1r
+ init: xnn_init_qs8_conv_minmax_fp32_neon_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2__neon_mlal_ld1r
+ init: xnn_init_qs8_conv_minmax_fp32_neon_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2__neonv8_mlal_ld1r
+ init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2__neonv8_mlal_ld1r
+ init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2__neon_mlal_ld2r
+ init: xnn_init_qs8_conv_minmax_fp32_neon_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2__neon_mlal_ld2r
+ init: xnn_init_qs8_conv_minmax_fp32_neon_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2__neonv8_mlal_ld2r
+ init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
+ k-block: 16
+- name: xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2__neonv8_mlal_ld2r
+ init: xnn_init_qs8_conv_minmax_fp32_neonv8_params
+ k-block: 16
- name: xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2__neon_mlal_ld4r
init: xnn_init_qs8_conv_minmax_fp32_neon_params
k-block: 16