4x8 QU8 Neon Dotproduct microkernel rename from ld64 to ld128

- rename ld64 to ld128 for filenames and functions

PiperOrigin-RevId: 394751366
diff --git a/bench/qu8-gemm-e2e.cc b/bench/qu8-gemm-e2e.cc
index a4e8a1a..0c833f9 100644
--- a/bench/qu8-gemm-e2e.cc
+++ b/bench/qu8-gemm-e2e.cc
@@ -98,10 +98,10 @@
       4 /* mr */, 16  /* nr */, 2 /* log2_kr */, 0 /* log2_sr */,
       benchmark::utils::CheckNEONDOT);
   }
-  static void qu8_gemm_4x8c4__aarch64_neondot_ld64(benchmark::State& state, models::ExecutionPlanFactory model) {
+  static void qu8_gemm_4x8c4__aarch64_neondot_ld128(benchmark::State& state, models::ExecutionPlanFactory model) {
     GEMMEnd2EndBenchmark(state, model,
-      xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__aarch64_neondot_ld64,
-      xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__aarch64_neondot_ld64,
+      xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__aarch64_neondot_ld128,
+      xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__aarch64_neondot_ld128,
       xnn_qu8_gemm_minmax_rndnu_ukernel_1x8c4__neondot,
       xnn_qu8_igemm_minmax_rndnu_ukernel_1x8c4__neondot,
       xnn_init_qu8_conv_minmax_rndnu_neon_params,
@@ -118,10 +118,10 @@
       4 /* mr */, 8  /* nr */, 2 /* log2_kr */, 0 /* log2_sr */,
       benchmark::utils::CheckNEONDOT);
   }
-  BENCHMARK_QU8_END2END(qu8_gemm_4x16c4__aarch64_neondot_ld128);
-  BENCHMARK_QU8_END2END(qu8_gemm_4x16c4__aarch64_neondot_cortex_a55);
-  BENCHMARK_QU8_END2END(qu8_gemm_4x8c4__aarch64_neondot_ld64);
   BENCHMARK_QU8_END2END(qu8_gemm_4x8c4__aarch64_neondot_cortex_a55);
+  BENCHMARK_QU8_END2END(qu8_gemm_4x16c4__aarch64_neondot_cortex_a55);
+  BENCHMARK_QU8_END2END(qu8_gemm_4x8c4__aarch64_neondot_ld128);
+  BENCHMARK_QU8_END2END(qu8_gemm_4x16c4__aarch64_neondot_ld128);
 #endif  // XNN_ARCH_ARM64 && XNN_ENABLE_ASSEMBLY
 
 #if XNN_ARCH_ARM || XNN_ARCH_ARM64