NEON implementations of QC8 DWCONV microkernels

PiperOrigin-RevId: 382205004
diff --git a/CMakeLists.txt b/CMakeLists.txt
index e0cec34..2d48053 100755
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -999,6 +999,14 @@
   src/math/sqrt-neon-nr1rsqrts.c
   src/math/sqrt-neon-nr2rsqrts.c
   src/math/sqrt-neon-nr3rsqrts.c
+  src/qc8-dwconv/gen/up8x9-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up8x25-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up24x9-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up24x25-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up32x9-minmax-fp32-neon-mul16.c
+  src/qc8-dwconv/gen/up32x25-minmax-fp32-neon-mul16.c
   src/qc8-gemm/gen/1x8c8-minmax-fp32-neon-mlal-padal.c
   src/qc8-gemm/gen/1x16-minmax-fp32-neon-mlal-lane.c
   src/qc8-gemm/gen/2x8c8-minmax-fp32-neon-mlal-padal.c
@@ -1431,6 +1439,14 @@
   src/math/roundne-neonv8.c
   src/math/roundu-neonv8.c
   src/math/roundz-neonv8.c
+  src/qc8-dwconv/gen/up8x9-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up8x25-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up24x9-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up24x25-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up32x9-minmax-fp32-neonv8-mul16.c
+  src/qc8-dwconv/gen/up32x25-minmax-fp32-neonv8-mul16.c
   src/qc8-gemm/gen/1x8c8-minmax-fp32-neonv8-mlal-padal.c
   src/qc8-gemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c
   src/qc8-gemm/gen/2x8c8-minmax-fp32-neonv8-mlal-padal.c