AVX and AVX512F versions of the PReLU micro-kernel

Up to 2X faster PReLU operator on AVX512F-enabled CPUs

PiperOrigin-RevId: 300268958
diff --git a/BUILD.bazel b/BUILD.bazel
index a69a5e5..de80a64 100644
--- a/BUILD.bazel
+++ b/BUILD.bazel
@@ -1073,6 +1073,8 @@
     "src/f32-igemm/gen/3x16-avx-broadcast.c",
     "src/f32-igemm/gen/4x16-avx-broadcast.c",
     "src/f32-igemm/gen/5x16-avx-broadcast.c",
+    "src/f32-prelu/gen/avx-2x8.c",
+    "src/f32-prelu/gen/avx-2x16.c",
     "src/f32-rmax/avx.c",
     "src/f32-vbinary/gen/vadd-avx-x8.c",
     "src/f32-vbinary/gen/vadd-avx-x16.c",
@@ -1303,6 +1305,8 @@
     "src/f32-igemm/gen/6x16-avx512f-broadcast.c",
     "src/f32-igemm/gen/7x16-avx512f-broadcast.c",
     "src/f32-igemm/gen/8x16-avx512f-broadcast.c",
+    "src/f32-prelu/gen/avx512f-2x16.c",
+    "src/f32-prelu/gen/avx512f-2x32.c",
     "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128.c",
     "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c",
     "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c",