Add dwconv kernels with a channel tile of 16 for float (f32) and 32 for half float (f16).

- Includes a fix for the test generator so that primary_tile is passed to the test.

PiperOrigin-RevId: 404035415
diff --git a/CMakeLists.txt b/CMakeLists.txt
index 7c7c3ee..cb61805 100755
--- a/CMakeLists.txt
+++ b/CMakeLists.txt
@@ -1806,6 +1806,18 @@
   src/f32-dwconv/gen/up8x9-minmax-neonfma.c
   src/f32-dwconv/gen/up8x25-minmax-neonfma-acc2.c
   src/f32-dwconv/gen/up8x25-minmax-neonfma.c
+  src/f32-dwconv/gen/up16x4-minmax-neon-acc2.c
+  src/f32-dwconv/gen/up16x4-minmax-neon.c
+  src/f32-dwconv/gen/up16x4-minmax-neonfma-acc2.c
+  src/f32-dwconv/gen/up16x4-minmax-neonfma.c
+  src/f32-dwconv/gen/up16x9-minmax-neon-acc2.c
+  src/f32-dwconv/gen/up16x9-minmax-neon.c
+  src/f32-dwconv/gen/up16x9-minmax-neonfma-acc2.c
+  src/f32-dwconv/gen/up16x9-minmax-neonfma.c
+  src/f32-dwconv/gen/up16x25-minmax-neon-acc2.c
+  src/f32-dwconv/gen/up16x25-minmax-neon.c
+  src/f32-dwconv/gen/up16x25-minmax-neonfma-acc2.c
+  src/f32-dwconv/gen/up16x25-minmax-neonfma.c
   src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-dup-ld64.c
   src/f32-gemm/gen-inc/1x8s4inc-minmax-neonfma.c
   src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld64.c
@@ -2278,6 +2290,12 @@
   src/f16-dwconv/gen/up16x9-minmax-neonfp16arith.c
   src/f16-dwconv/gen/up16x25-minmax-neonfp16arith-acc2.c
   src/f16-dwconv/gen/up16x25-minmax-neonfp16arith.c
+  src/f16-dwconv/gen/up32x4-minmax-neonfp16arith-acc2.c
+  src/f16-dwconv/gen/up32x4-minmax-neonfp16arith.c
+  src/f16-dwconv/gen/up32x9-minmax-neonfp16arith-acc2.c
+  src/f16-dwconv/gen/up32x9-minmax-neonfp16arith.c
+  src/f16-dwconv/gen/up32x25-minmax-neonfp16arith-acc2.c
+  src/f16-dwconv/gen/up32x25-minmax-neonfp16arith.c
   src/f16-gavgpool/7p7x-minmax-neonfp16arith-c8.c
   src/f16-gavgpool/7x-minmax-neonfp16arith-c8.c
   src/f16-gemm/gen-inc/1x8inc-minmax-neonfp16arith-ld64.c