Elementwise minimum and maximum micro-kernels
PiperOrigin-RevId: 284032447
diff --git a/test/f32-vmax.cc b/test/f32-vmax.cc
new file mode 100644
index 0000000..51e37d1
--- /dev/null
+++ b/test/f32-vmax.cc
@@ -0,0 +1,979 @@
+// Copyright 2019 Google LLC
+//
+// This source code is licensed under the BSD-style license found in the
+// LICENSE file in the root directory of this source tree.
+//
+// Auto-generated file. Do not edit!
+// Specification: test/f32-vmax.yaml
+// Generator: tools/generate-vbinary-test.py
+
+
+#include <gtest/gtest.h>
+
+#include <xnnpack/common.h>
+#include <xnnpack/isa-checks.h>
+
+#include <xnnpack/vbinary.h>
+#include "vbinary-microkernel-tester.h"
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64  // tests for xnn_f32_vmax_ukernel__neon_x4
+  TEST(F32_VMAX__NEON_X4, batch_eq_4) {  // batch size 4 only
+    TEST_REQUIRES_ARM_NEON;
+    VBinOpMicrokernelTester()
+      .batch_size(4)
+      .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+  }
+
+  TEST(F32_VMAX__NEON_X4, batch_div_4) {  // batch sizes 8, 12, ..., 36
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, batch_lt_4) {  // batch sizes 1..3
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, batch_gt_4) {  // batch sizes 5..7
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, inplace_a) {  // inplace_a(true); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, inplace_b) {  // inplace_b(true); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, qmin) {  // qmin(128); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X4, qmax) {  // qmax(128); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64  // tests for xnn_f32_vmax_ukernel__neon_x8
+  TEST(F32_VMAX__NEON_X8, batch_eq_8) {  // batch size 8 only
+    TEST_REQUIRES_ARM_NEON;
+    VBinOpMicrokernelTester()
+      .batch_size(8)
+      .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+  }
+
+  TEST(F32_VMAX__NEON_X8, batch_div_8) {  // batch sizes 16, 24, ..., 72
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, batch_lt_8) {  // batch sizes 1..7
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, batch_gt_8) {  // batch sizes 9..15
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, inplace_a) {  // inplace_a(true); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, inplace_b) {  // inplace_b(true); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, qmin) {  // qmin(128); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__NEON_X8, qmax) {  // qmax(128); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64  // tests for xnn_f32_vmax_ukernel__sse_x4
+  TEST(F32_VMAX__SSE_X4, batch_eq_4) {  // batch size 4 only
+    TEST_REQUIRES_X86_SSE;
+    VBinOpMicrokernelTester()
+      .batch_size(4)
+      .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+  }
+
+  TEST(F32_VMAX__SSE_X4, batch_div_4) {  // batch sizes 8, 12, ..., 36
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, batch_lt_4) {  // batch sizes 1..3
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, batch_gt_4) {  // batch sizes 5..7
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, inplace_a) {  // inplace_a(true); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, inplace_b) {  // inplace_b(true); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, qmin) {  // qmin(128); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X4, qmax) {  // qmax(128); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64  // tests for xnn_f32_vmax_ukernel__sse_x8
+  TEST(F32_VMAX__SSE_X8, batch_eq_8) {  // batch size 8 only
+    TEST_REQUIRES_X86_SSE;
+    VBinOpMicrokernelTester()
+      .batch_size(8)
+      .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+  }
+
+  TEST(F32_VMAX__SSE_X8, batch_div_8) {  // batch sizes 16, 24, ..., 72
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, batch_lt_8) {  // batch sizes 1..7
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, batch_gt_8) {  // batch sizes 9..15
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, inplace_a) {  // inplace_a(true); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, inplace_b) {  // inplace_b(true); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, qmin) {  // qmin(128); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+
+  TEST(F32_VMAX__SSE_X8, qmax) {  // qmax(128); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Max);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM  // tests for xnn_f32_vmax_ukernel__psimd_x4
+  TEST(F32_VMAX__PSIMD_X4, batch_eq_4) {  // batch size 4 only
+    TEST_REQUIRES_PSIMD;
+    VBinOpMicrokernelTester()
+      .batch_size(4)
+      .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, batch_div_4) {  // batch sizes 8, 12, ..., 36
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, batch_lt_4) {  // batch sizes 1..3
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, batch_gt_4) {  // batch sizes 5..7
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, inplace_a) {  // inplace_a(true); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, inplace_b) {  // inplace_b(true); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, qmin) {  // qmin(128); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X4, qmax) {  // qmax(128); batch sizes 1, 4, ..., 19
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM  // tests for xnn_f32_vmax_ukernel__psimd_x8
+  TEST(F32_VMAX__PSIMD_X8, batch_eq_8) {  // batch size 8 only
+    TEST_REQUIRES_PSIMD;
+    VBinOpMicrokernelTester()
+      .batch_size(8)
+      .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, batch_div_8) {  // batch sizes 16, 24, ..., 72
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, batch_lt_8) {  // batch sizes 1..7
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, batch_gt_8) {  // batch sizes 9..15
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, inplace_a) {  // inplace_a(true); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, inplace_b) {  // inplace_b(true); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, qmin) {  // qmin(128); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__PSIMD_X8, qmax) {  // qmax(128); batch sizes 1, 8, ..., 36
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM  // tests for xnn_f32_vmax_ukernel__wasm_x1
+  TEST(F32_VMAX__WASM_X1, batch_eq_1) {  // batch size 1 only
+    VBinOpMicrokernelTester()
+      .batch_size(1)
+      .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAX__WASM_X1, batch_gt_1) {  // batch sizes 2..9
+    for (size_t n = 2; n < 10; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X1, inplace_a) {  // inplace_a(true); batch sizes 1..5
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X1, inplace_b) {  // inplace_b(true); batch sizes 1..5
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X1, inplace_a_and_b) {  // both in-place flags; batch sizes 1..5
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X1, qmin) {  // qmin(128); batch sizes 1..5
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X1, qmax) {  // qmax(128); batch sizes 1..5
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM  // tests for xnn_f32_vmax_ukernel__wasm_x2
+  TEST(F32_VMAX__WASM_X2, batch_eq_2) {  // batch size 2 only
+    VBinOpMicrokernelTester()
+      .batch_size(2)
+      .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAX__WASM_X2, batch_div_2) {  // batch sizes 4, 6, ..., 18
+    for (size_t n = 4; n < 20; n += 2) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, batch_lt_2) {  // loop runs once, with batch size 1
+    for (size_t n = 1; n < 2; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, batch_gt_2) {  // loop runs once, with batch size 3
+    for (size_t n = 3; n < 4; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, inplace_a) {  // inplace_a(true); batch sizes 1..10
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, inplace_b) {  // inplace_b(true); batch sizes 1..10
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, inplace_a_and_b) {  // both in-place flags; batch sizes 1..10
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, qmin) {  // qmin(128); batch sizes 1..10
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X2, qmax) {  // qmax(128); batch sizes 1..10
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM  // tests for xnn_f32_vmax_ukernel__wasm_x4
+  TEST(F32_VMAX__WASM_X4, batch_eq_4) {  // batch size 4 only
+    VBinOpMicrokernelTester()
+      .batch_size(4)
+      .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAX__WASM_X4, batch_div_4) {  // batch sizes 8, 12, ..., 36
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, batch_lt_4) {  // batch sizes 1..3
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, batch_gt_4) {  // batch sizes 5..7
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, inplace_a) {  // inplace_a(true); batch sizes 1, 4, ..., 19
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, inplace_b) {  // inplace_b(true); batch sizes 1, 4, ..., 19
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 4, ..., 19
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, qmin) {  // qmin(128); batch sizes 1, 4, ..., 19
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAX__WASM_X4, qmax) {  // qmax(128); batch sizes 1, 4, ..., 19
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester()
+        .batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmax_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+TEST(F32_VMAX__SCALAR_X1, batch_eq_1) {  // batch size 1 only
+  VBinOpMicrokernelTester()
+    .batch_size(1)
+    .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+}
+
+TEST(F32_VMAX__SCALAR_X1, batch_gt_1) {  // batch sizes 2..9
+  for (size_t n = 2; n < 10; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X1, inplace_a) {  // inplace_a(true); batch sizes 1..5
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_a(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X1, inplace_b) {  // inplace_b(true); batch sizes 1..5
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_b(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X1, inplace_a_and_b) {  // both in-place flags; batch sizes 1..5
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_a(true)
+      .inplace_b(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X1, qmin) {  // qmin(128); batch sizes 1..5
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X1, qmax) {  // qmax(128); batch sizes 1..5
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmax_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, batch_eq_2) {  // batch size 2 only
+  VBinOpMicrokernelTester()
+    .batch_size(2)
+    .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+}
+
+TEST(F32_VMAX__SCALAR_X2, batch_div_2) {  // batch sizes 4, 6, ..., 18
+  for (size_t n = 4; n < 20; n += 2) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, batch_lt_2) {  // loop runs once, with batch size 1
+  for (size_t n = 1; n < 2; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, batch_gt_2) {  // loop runs once, with batch size 3
+  for (size_t n = 3; n < 4; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, inplace_a) {  // inplace_a(true); batch sizes 1..10
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_a(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, inplace_b) {  // inplace_b(true); batch sizes 1..10
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_b(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, inplace_a_and_b) {  // both in-place flags; batch sizes 1..10
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_a(true)
+      .inplace_b(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, qmin) {  // qmin(128); batch sizes 1..10
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X2, qmax) {  // qmax(128); batch sizes 1..10
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmax_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, batch_eq_4) {  // batch size 4 only
+  VBinOpMicrokernelTester()
+    .batch_size(4)
+    .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+}
+
+TEST(F32_VMAX__SCALAR_X4, batch_div_4) {  // batch sizes 8, 12, ..., 36
+  for (size_t n = 8; n < 40; n += 4) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, batch_lt_4) {  // batch sizes 1..3
+  for (size_t n = 1; n < 4; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, batch_gt_4) {  // batch sizes 5..7
+  for (size_t n = 5; n < 8; ++n) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, inplace_a) {  // inplace_a(true); batch sizes 1, 4, ..., 19
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_a(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, inplace_b) {  // inplace_b(true); batch sizes 1, 4, ..., 19
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_b(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, inplace_a_and_b) {  // both in-place flags; batch sizes 1, 4, ..., 19
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .inplace_a(true)
+      .inplace_b(true)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, qmin) {  // qmin(128); batch sizes 1, 4, ..., 19
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAX__SCALAR_X4, qmax) {  // qmax(128); batch sizes 1, 4, ..., 19
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester()
+      .batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmax_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Max, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
\ No newline at end of file
diff --git a/test/f32-vmax.yaml b/test/f32-vmax.yaml
new file mode 100644
index 0000000..001aa5a
--- /dev/null
+++ b/test/f32-vmax.yaml
@@ -0,0 +1,16 @@
+# Copyright 2019 Google LLC
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+- name: xnn_f32_vmax_ukernel__neon_x4  # each entry names one micro-kernel; test/f32-vmax.cc is generated from this list
+- name: xnn_f32_vmax_ukernel__neon_x8
+- name: xnn_f32_vmax_ukernel__sse_x4
+- name: xnn_f32_vmax_ukernel__sse_x8
+- name: xnn_f32_vmax_ukernel__psimd_x4
+- name: xnn_f32_vmax_ukernel__psimd_x8
+- name: xnn_f32_vmax_ukernel__wasm_x1
+- name: xnn_f32_vmax_ukernel__wasm_x2
+- name: xnn_f32_vmax_ukernel__wasm_x4
+- name: xnn_f32_vmax_ukernel__scalar_x1
+- name: xnn_f32_vmax_ukernel__scalar_x2
+- name: xnn_f32_vmax_ukernel__scalar_x4
diff --git a/test/f32-vmaxc.cc b/test/f32-vmaxc.cc
new file mode 100644
index 0000000..f20478f
--- /dev/null
+++ b/test/f32-vmaxc.cc
@@ -0,0 +1,739 @@
+// Copyright 2019 Google LLC
+//
+// This source code is licensed under the BSD-style license found in the
+// LICENSE file in the root directory of this source tree.
+//
+// Auto-generated file. Do not edit!
+// Specification: test/f32-vmaxc.yaml
+// Generator: tools/generate-vbinary-test.py
+
+
+#include <gtest/gtest.h>
+
+#include <xnnpack/common.h>
+#include <xnnpack/isa-checks.h>
+
+#include <xnnpack/vbinary.h>
+#include "vbinaryc-microkernel-tester.h"
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64
+  TEST(F32_VMAXC__NEON_X4, batch_eq_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // One run at a batch size of exactly 4.
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+  }
+
+  TEST(F32_VMAXC__NEON_X4, batch_div_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X4, batch_lt_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 2 and 3.
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X4, batch_gt_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 5, 6 and 7.
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X4, inplace) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X4, qmin) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X4, qmax) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64
+  TEST(F32_VMAXC__NEON_X8, batch_eq_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // One run at a batch size of exactly 8.
+    VBinOpCMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+  }
+
+  TEST(F32_VMAXC__NEON_X8, batch_div_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // Multiples of 8 above 8 itself: 16, 24, ..., 72.
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X8, batch_lt_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1 through 7.
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X8, batch_gt_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 9 through 15.
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X8, inplace) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X8, qmin) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__NEON_X8, qmax) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64
+  TEST(F32_VMAXC__SSE_X4, batch_eq_4) {
+    TEST_REQUIRES_X86_SSE;
+    // One run at a batch size of exactly 4.
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+  }
+
+  TEST(F32_VMAXC__SSE_X4, batch_div_4) {
+    TEST_REQUIRES_X86_SSE;
+    // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X4, batch_lt_4) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 2 and 3.
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X4, batch_gt_4) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 5, 6 and 7.
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X4, inplace) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X4, qmin) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X4, qmax) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64
+  TEST(F32_VMAXC__SSE_X8, batch_eq_8) {
+    TEST_REQUIRES_X86_SSE;
+    // One run at a batch size of exactly 8.
+    VBinOpCMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+  }
+
+  TEST(F32_VMAXC__SSE_X8, batch_div_8) {
+    TEST_REQUIRES_X86_SSE;
+    // Multiples of 8 above 8 itself: 16, 24, ..., 72.
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X8, batch_lt_8) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1 through 7.
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X8, batch_gt_8) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 9 through 15.
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X8, inplace) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 8, ..., 36 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X8, qmin) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 8, ..., 36 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+
+  TEST(F32_VMAXC__SSE_X8, qmax) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 8, ..., 36 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MaxC);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+  TEST(F32_VMAXC__PSIMD_X4, batch_eq_4) {
+    TEST_REQUIRES_PSIMD;
+    // One run at a batch size of exactly 4.
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAXC__PSIMD_X4, batch_div_4) {
+    TEST_REQUIRES_PSIMD;
+    // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X4, batch_lt_4) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 2 and 3.
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X4, batch_gt_4) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 5, 6 and 7.
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X4, inplace) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 4, ..., 19 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X4, qmin) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X4, qmax) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+  TEST(F32_VMAXC__PSIMD_X8, batch_eq_8) {
+    TEST_REQUIRES_PSIMD;
+    // One run at a batch size of exactly 8.
+    VBinOpCMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAXC__PSIMD_X8, batch_div_8) {
+    TEST_REQUIRES_PSIMD;
+    // Multiples of 8 above 8 itself: 16, 24, ..., 72.
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X8, batch_lt_8) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1 through 7.
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X8, batch_gt_8) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 9 through 15.
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X8, inplace) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 8, ..., 36 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X8, qmin) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 8, ..., 36 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__PSIMD_X8, qmax) {
+    TEST_REQUIRES_PSIMD;
+    // Batch sizes 1, 8, ..., 36 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  TEST(F32_VMAXC__WASM_X1, batch_eq_1) {
+    // One run at a batch size of exactly 1.
+    VBinOpCMicrokernelTester().batch_size(1)
+      .Test(xnn_f32_vmaxc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAXC__WASM_X1, batch_gt_1) {
+    // Batch sizes 2 through 9.
+    for (size_t n = 2; n < 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X1, inplace) {
+    // Batch sizes 1 through 5 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X1, qmin) {
+    // Batch sizes 1 through 5 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X1, qmax) {
+    // Batch sizes 1 through 5 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  TEST(F32_VMAXC__WASM_X2, batch_eq_2) {
+    // One run at a batch size of exactly 2.
+    VBinOpCMicrokernelTester().batch_size(2)
+      .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAXC__WASM_X2, batch_div_2) {
+    // Multiples of 2 above 2 itself: 4, 6, ..., 18.
+    for (size_t n = 4; n < 20; n += 2) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X2, batch_lt_2) {
+    // The loop body runs once, for a batch size of 1.
+    for (size_t n = 1; n < 2; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X2, batch_gt_2) {
+    // The loop body runs once, for a batch size of 3.
+    for (size_t n = 3; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X2, inplace) {
+    // Batch sizes 1 through 10 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X2, qmin) {
+    // Batch sizes 1 through 10 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X2, qmax) {
+    // Batch sizes 1 through 10 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  TEST(F32_VMAXC__WASM_X4, batch_eq_4) {
+    // One run at a batch size of exactly 4.
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  TEST(F32_VMAXC__WASM_X4, batch_div_4) {
+    // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X4, batch_lt_4) {
+    // Batch sizes 1, 2 and 3.
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X4, batch_gt_4) {
+    // Batch sizes 5, 6 and 7.
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X4, inplace) {
+    // Batch sizes 1, 4, ..., 19 with inplace(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X4, qmin) {
+    // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  TEST(F32_VMAXC__WASM_X4, qmax) {
+    // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmaxc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+TEST(F32_VMAXC__SCALAR_X1, batch_eq_1) {
+  // One run at a batch size of exactly 1.
+  VBinOpCMicrokernelTester().batch_size(1)
+    .Test(xnn_f32_vmaxc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+}
+
+TEST(F32_VMAXC__SCALAR_X1, batch_gt_1) {
+  // Batch sizes 2 through 9.
+  for (size_t n = 2; n < 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X1, inplace) {
+  // Batch sizes 1 through 5 with inplace(true) set on the tester.
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .inplace(true)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X1, qmin) {
+  // Batch sizes 1 through 5 with qmin(128) set on the tester.
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X1, qmax) {
+  // Batch sizes 1 through 5 with qmax(128) set on the tester.
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X2, batch_eq_2) {
+  // One run at a batch size of exactly 2.
+  VBinOpCMicrokernelTester().batch_size(2)
+    .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+}
+
+TEST(F32_VMAXC__SCALAR_X2, batch_div_2) {
+  // Multiples of 2 above 2 itself: 4, 6, ..., 18.
+  for (size_t n = 4; n < 20; n += 2) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X2, batch_lt_2) {
+  // The loop body runs once, for a batch size of 1.
+  for (size_t n = 1; n < 2; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X2, batch_gt_2) {
+  // The loop body runs once, for a batch size of 3.
+  for (size_t n = 3; n < 4; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X2, inplace) {
+  // Batch sizes 1 through 10 with inplace(true) set on the tester.
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .inplace(true)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X2, qmin) {
+  // Batch sizes 1 through 10 with qmin(128) set on the tester.
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X2, qmax) {
+  // Batch sizes 1 through 10 with qmax(128) set on the tester.
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X4, batch_eq_4) {
+  // One run at a batch size of exactly 4.
+  VBinOpCMicrokernelTester().batch_size(4)
+    .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+}
+
+TEST(F32_VMAXC__SCALAR_X4, batch_div_4) {
+  // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+  for (size_t n = 8; n < 40; n += 4) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X4, batch_lt_4) {
+  // Batch sizes 1, 2 and 3.
+  for (size_t n = 1; n < 4; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X4, batch_gt_4) {
+  // Batch sizes 5, 6 and 7.
+  for (size_t n = 5; n < 8; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X4, inplace) {
+  // Batch sizes 1, 4, ..., 19 with inplace(true) set on the tester.
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .inplace(true)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X4, qmin) {
+  // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+TEST(F32_VMAXC__SCALAR_X4, qmax) {
+  // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmaxc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MaxC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
\ No newline at end of file
diff --git a/test/f32-vmaxc.yaml b/test/f32-vmaxc.yaml
new file mode 100644
index 0000000..d0e4079
--- /dev/null
+++ b/test/f32-vmaxc.yaml
@@ -0,0 +1,16 @@
+# Copyright 2019 Google LLC
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+- name: xnn_f32_vmaxc_ukernel__neon_x4  # each entry names one micro-kernel; test/f32-vmaxc.cc is generated from this list
+- name: xnn_f32_vmaxc_ukernel__neon_x8
+- name: xnn_f32_vmaxc_ukernel__sse_x4
+- name: xnn_f32_vmaxc_ukernel__sse_x8
+- name: xnn_f32_vmaxc_ukernel__psimd_x4
+- name: xnn_f32_vmaxc_ukernel__psimd_x8
+- name: xnn_f32_vmaxc_ukernel__wasm_x1
+- name: xnn_f32_vmaxc_ukernel__wasm_x2
+- name: xnn_f32_vmaxc_ukernel__wasm_x4
+- name: xnn_f32_vmaxc_ukernel__scalar_x1
+- name: xnn_f32_vmaxc_ukernel__scalar_x2
+- name: xnn_f32_vmaxc_ukernel__scalar_x4
diff --git a/test/f32-vmin.cc b/test/f32-vmin.cc
new file mode 100644
index 0000000..6a5e7e7
--- /dev/null
+++ b/test/f32-vmin.cc
@@ -0,0 +1,979 @@
+// Copyright 2019 Google LLC
+//
+// This source code is licensed under the BSD-style license found in the
+// LICENSE file in the root directory of this source tree.
+//
+// Auto-generated file. Do not edit!
+// Specification: test/f32-vmin.yaml
+// Generator: tools/generate-vbinary-test.py
+
+
+#include <gtest/gtest.h>
+
+#include <xnnpack/common.h>
+#include <xnnpack/isa-checks.h>
+
+#include <xnnpack/vbinary.h>
+#include "vbinary-microkernel-tester.h"
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64
+  TEST(F32_VMIN__NEON_X4, batch_eq_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // One run at a batch size of exactly 4.
+    VBinOpMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+  }
+
+  TEST(F32_VMIN__NEON_X4, batch_div_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, batch_lt_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 2 and 3.
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, batch_gt_4) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 5, 6 and 7.
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, inplace_a) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with inplace_a(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, inplace_b) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with inplace_b(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, inplace_a_and_b) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with both inplace_a(true) and inplace_b(true).
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, qmin) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X4, qmax) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__neon_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64
+  TEST(F32_VMIN__NEON_X8, batch_eq_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // One run at a batch size of exactly 8.
+    VBinOpMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+  }
+
+  TEST(F32_VMIN__NEON_X8, batch_div_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // Multiples of 8 above 8 itself: 16, 24, ..., 72.
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, batch_lt_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1 through 7.
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, batch_gt_8) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 9 through 15.
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, inplace_a) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with inplace_a(true) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, inplace_b) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with inplace_b(true) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, inplace_a_and_b) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with both inplace_a(true) and inplace_b(true).
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, qmin) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__NEON_X8, qmax) {
+    TEST_REQUIRES_ARM_NEON;
+    // Batch sizes 1, 8, ..., 36 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__neon_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64
+  TEST(F32_VMIN__SSE_X4, batch_eq_4) {
+    TEST_REQUIRES_X86_SSE;
+    // One run at a batch size of exactly 4.
+    VBinOpMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+  }
+
+  TEST(F32_VMIN__SSE_X4, batch_div_4) {
+    TEST_REQUIRES_X86_SSE;
+    // Multiples of 4 above 4 itself: 8, 12, ..., 36.
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, batch_lt_4) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 2 and 3.
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, batch_gt_4) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 5, 6 and 7.
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, inplace_a) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with inplace_a(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, inplace_b) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with inplace_b(true) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, inplace_a_and_b) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with both inplace_a(true) and inplace_b(true).
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, qmin) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with qmin(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  TEST(F32_VMIN__SSE_X4, qmax) {
+    TEST_REQUIRES_X86_SSE;
+    // Batch sizes 1, 4, ..., 19 with qmax(128) set on the tester.
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__sse_x4, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64
+  // batch_size == 8.
+  TEST(F32_VMIN__SSE_X8, batch_eq_8) {
+    TEST_REQUIRES_X86_SSE;
+    VBinOpMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+  }
+
+  // batch_size = 16, 24, ..., 72.
+  TEST(F32_VMIN__SSE_X8, batch_div_8) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // batch_size = 1, 2, ..., 7.
+  TEST(F32_VMIN__SSE_X8, batch_lt_8) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // batch_size = 9, 10, ..., 15.
+  TEST(F32_VMIN__SSE_X8, batch_gt_8) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // inplace_a(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__SSE_X8, inplace_a) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // inplace_b(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__SSE_X8, inplace_b) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // inplace_a(true) and inplace_b(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__SSE_X8, inplace_a_and_b) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__SSE_X8, qmin) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__SSE_X8, qmax) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__sse_x8, VBinOpMicrokernelTester::OpType::Min);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+  // batch_size == 4.
+  TEST(F32_VMIN__PSIMD_X4, batch_eq_4) {
+    TEST_REQUIRES_PSIMD;
+    VBinOpMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  // batch_size = 8, 12, ..., 36.
+  TEST(F32_VMIN__PSIMD_X4, batch_div_4) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // batch_size = 1, 2, 3.
+  TEST(F32_VMIN__PSIMD_X4, batch_lt_4) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // batch_size = 5, 6, 7.
+  TEST(F32_VMIN__PSIMD_X4, batch_gt_4) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__PSIMD_X4, inplace_a) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_b(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__PSIMD_X4, inplace_b) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true) and inplace_b(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__PSIMD_X4, inplace_a_and_b) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__PSIMD_X4, qmin) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__PSIMD_X4, qmax) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__psimd_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+  // batch_size == 8.
+  TEST(F32_VMIN__PSIMD_X8, batch_eq_8) {
+    TEST_REQUIRES_PSIMD;
+    VBinOpMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  // batch_size = 16, 24, ..., 72.
+  TEST(F32_VMIN__PSIMD_X8, batch_div_8) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // batch_size = 1, 2, ..., 7.
+  TEST(F32_VMIN__PSIMD_X8, batch_lt_8) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // batch_size = 9, 10, ..., 15.
+  TEST(F32_VMIN__PSIMD_X8, batch_gt_8) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__PSIMD_X8, inplace_a) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_b(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__PSIMD_X8, inplace_b) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true) and inplace_b(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__PSIMD_X8, inplace_a_and_b) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__PSIMD_X8, qmin) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMIN__PSIMD_X8, qmax) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__psimd_x8, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  // batch_size == 1.
+  TEST(F32_VMIN__WASM_X1, batch_eq_1) {
+    VBinOpMicrokernelTester().batch_size(1)
+      .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  // batch_size = 2, 3, ..., 9.
+  TEST(F32_VMIN__WASM_X1, batch_gt_1) {
+    for (size_t n = 2; n < 10; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true); batch_size = 1, 2, ..., 5.
+  TEST(F32_VMIN__WASM_X1, inplace_a) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_b(true); batch_size = 1, 2, ..., 5.
+  TEST(F32_VMIN__WASM_X1, inplace_b) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true) and inplace_b(true); batch_size = 1, 2, ..., 5.
+  TEST(F32_VMIN__WASM_X1, inplace_a_and_b) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 2, ..., 5.
+  TEST(F32_VMIN__WASM_X1, qmin) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 2, ..., 5.
+  TEST(F32_VMIN__WASM_X1, qmax) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__wasm_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  // batch_size == 2.
+  TEST(F32_VMIN__WASM_X2, batch_eq_2) {
+    VBinOpMicrokernelTester().batch_size(2)
+      .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  // batch_size = 4, 6, ..., 18.
+  TEST(F32_VMIN__WASM_X2, batch_div_2) {
+    for (size_t n = 4; n < 20; n += 2) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // The loop runs once, with batch_size = 1.
+  TEST(F32_VMIN__WASM_X2, batch_lt_2) {
+    for (size_t n = 1; n < 2; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // The loop runs once, with batch_size = 3.
+  TEST(F32_VMIN__WASM_X2, batch_gt_2) {
+    for (size_t n = 3; n < 4; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true); batch_size = 1, 2, ..., 10.
+  TEST(F32_VMIN__WASM_X2, inplace_a) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_b(true); batch_size = 1, 2, ..., 10.
+  TEST(F32_VMIN__WASM_X2, inplace_b) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true) and inplace_b(true); batch_size = 1, 2, ..., 10.
+  TEST(F32_VMIN__WASM_X2, inplace_a_and_b) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 2, ..., 10.
+  TEST(F32_VMIN__WASM_X2, qmin) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 2, ..., 10.
+  TEST(F32_VMIN__WASM_X2, qmax) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__wasm_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  // batch_size == 4.
+  TEST(F32_VMIN__WASM_X4, batch_eq_4) {
+    VBinOpMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+
+  // batch_size = 8, 12, ..., 36.
+  TEST(F32_VMIN__WASM_X4, batch_div_4) {
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // batch_size = 1, 2, 3.
+  TEST(F32_VMIN__WASM_X4, batch_lt_4) {
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // batch_size = 5, 6, 7.
+  TEST(F32_VMIN__WASM_X4, batch_gt_4) {
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__WASM_X4, inplace_a) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_b(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__WASM_X4, inplace_b) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace_a(true) and inplace_b(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__WASM_X4, inplace_a_and_b) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .inplace_a(true)
+        .inplace_b(true)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__WASM_X4, qmin) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMIN__WASM_X4, qmax) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vmin_ukernel__wasm_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+// batch_size == 1.
+TEST(F32_VMIN__SCALAR_X1, batch_eq_1) {
+  VBinOpMicrokernelTester().batch_size(1)
+    .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+}
+
+// batch_size = 2, 3, ..., 9.
+TEST(F32_VMIN__SCALAR_X1, batch_gt_1) {
+  for (size_t n = 2; n < 10; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_a(true); batch_size = 1, 2, ..., 5.
+TEST(F32_VMIN__SCALAR_X1, inplace_a) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_a(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_b(true); batch_size = 1, 2, ..., 5.
+TEST(F32_VMIN__SCALAR_X1, inplace_b) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_b(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_a(true) and inplace_b(true); batch_size = 1, 2, ..., 5.
+TEST(F32_VMIN__SCALAR_X1, inplace_a_and_b) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_a(true)
+      .inplace_b(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmin(128); batch_size = 1, 2, ..., 5.
+TEST(F32_VMIN__SCALAR_X1, qmin) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmax(128); batch_size = 1, 2, ..., 5.
+TEST(F32_VMIN__SCALAR_X1, qmax) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmin_ukernel__scalar_x1, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// batch_size == 2.
+TEST(F32_VMIN__SCALAR_X2, batch_eq_2) {
+  VBinOpMicrokernelTester().batch_size(2)
+    .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+}
+
+// batch_size = 4, 6, ..., 18.
+TEST(F32_VMIN__SCALAR_X2, batch_div_2) {
+  for (size_t n = 4; n < 20; n += 2) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// The loop runs once, with batch_size = 1.
+TEST(F32_VMIN__SCALAR_X2, batch_lt_2) {
+  for (size_t n = 1; n < 2; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// The loop runs once, with batch_size = 3.
+TEST(F32_VMIN__SCALAR_X2, batch_gt_2) {
+  for (size_t n = 3; n < 4; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_a(true); batch_size = 1, 2, ..., 10.
+TEST(F32_VMIN__SCALAR_X2, inplace_a) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_a(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_b(true); batch_size = 1, 2, ..., 10.
+TEST(F32_VMIN__SCALAR_X2, inplace_b) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_b(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_a(true) and inplace_b(true); batch_size = 1, 2, ..., 10.
+TEST(F32_VMIN__SCALAR_X2, inplace_a_and_b) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_a(true)
+      .inplace_b(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmin(128); batch_size = 1, 2, ..., 10.
+TEST(F32_VMIN__SCALAR_X2, qmin) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmax(128); batch_size = 1, 2, ..., 10.
+TEST(F32_VMIN__SCALAR_X2, qmax) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmin_ukernel__scalar_x2, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// batch_size == 4.
+TEST(F32_VMIN__SCALAR_X4, batch_eq_4) {
+  VBinOpMicrokernelTester().batch_size(4)
+    .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+}
+
+// batch_size = 8, 12, ..., 36.
+TEST(F32_VMIN__SCALAR_X4, batch_div_4) {
+  for (size_t n = 8; n < 40; n += 4) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// batch_size = 1, 2, 3.
+TEST(F32_VMIN__SCALAR_X4, batch_lt_4) {
+  for (size_t n = 1; n < 4; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// batch_size = 5, 6, 7.
+TEST(F32_VMIN__SCALAR_X4, batch_gt_4) {
+  for (size_t n = 5; n < 8; ++n) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_a(true); batch_size = 1, 4, 7, ..., 19.
+TEST(F32_VMIN__SCALAR_X4, inplace_a) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_a(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_b(true); batch_size = 1, 4, 7, ..., 19.
+TEST(F32_VMIN__SCALAR_X4, inplace_b) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_b(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace_a(true) and inplace_b(true); batch_size = 1, 4, 7, ..., 19.
+TEST(F32_VMIN__SCALAR_X4, inplace_a_and_b) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .inplace_a(true)
+      .inplace_b(true)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmin(128); batch_size = 1, 4, 7, ..., 19.
+TEST(F32_VMIN__SCALAR_X4, qmin) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmax(128); batch_size = 1, 4, 7, ..., 19.
+TEST(F32_VMIN__SCALAR_X4, qmax) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vmin_ukernel__scalar_x4, VBinOpMicrokernelTester::OpType::Min, VBinOpMicrokernelTester::Variant::Scalar);
+  }
+}
\ No newline at end of file
diff --git a/test/f32-vmin.yaml b/test/f32-vmin.yaml
new file mode 100644
index 0000000..13227a3
--- /dev/null
+++ b/test/f32-vmin.yaml
@@ -0,0 +1,16 @@
+# Copyright 2019 Google LLC
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+- name: xnn_f32_vmin_ukernel__neon_x4  # NEON kernels; the NEON suites in test/f32-vmin.cc appear to be guarded by XNN_ARCH_ARM || XNN_ARCH_ARM64
+- name: xnn_f32_vmin_ukernel__neon_x8
+- name: xnn_f32_vmin_ukernel__sse_x4  # SSE kernels; suites guarded by XNN_ARCH_X86 || XNN_ARCH_X86_64
+- name: xnn_f32_vmin_ukernel__sse_x8
+- name: xnn_f32_vmin_ukernel__psimd_x4  # PSIMD kernels; suites guarded by !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+- name: xnn_f32_vmin_ukernel__psimd_x8
+- name: xnn_f32_vmin_ukernel__wasm_x1  # WASM kernels; suites guarded by XNN_ARCH_WASM
+- name: xnn_f32_vmin_ukernel__wasm_x2
+- name: xnn_f32_vmin_ukernel__wasm_x4
+- name: xnn_f32_vmin_ukernel__scalar_x1  # scalar kernels; suites have no architecture guard
+- name: xnn_f32_vmin_ukernel__scalar_x2
+- name: xnn_f32_vmin_ukernel__scalar_x4
diff --git a/test/f32-vminc.cc b/test/f32-vminc.cc
new file mode 100644
index 0000000..49fced9
--- /dev/null
+++ b/test/f32-vminc.cc
@@ -0,0 +1,739 @@
+// Copyright 2019 Google LLC
+//
+// This source code is licensed under the BSD-style license found in the
+// LICENSE file in the root directory of this source tree.
+//
+// Auto-generated file. Do not edit!
+// Specification: test/f32-vminc.yaml
+// Generator: tools/generate-vbinary-test.py
+
+
+#include <gtest/gtest.h>
+
+#include <xnnpack/common.h>
+#include <xnnpack/isa-checks.h>
+
+#include <xnnpack/vbinary.h>
+#include "vbinaryc-microkernel-tester.h"
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64
+  // batch_size == 4.
+  TEST(F32_VMINC__NEON_X4, batch_eq_4) {
+    TEST_REQUIRES_ARM_NEON;
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+  }
+
+  // batch_size = 8, 12, ..., 36.
+  TEST(F32_VMINC__NEON_X4, batch_div_4) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // batch_size = 1, 2, 3.
+  TEST(F32_VMINC__NEON_X4, batch_lt_4) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // batch_size = 5, 6, 7.
+  TEST(F32_VMINC__NEON_X4, batch_gt_4) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // inplace(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__NEON_X4, inplace) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__NEON_X4, qmin) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__NEON_X4, qmax) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__neon_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_ARM || XNN_ARCH_ARM64
+  // batch_size == 8.
+  TEST(F32_VMINC__NEON_X8, batch_eq_8) {
+    TEST_REQUIRES_ARM_NEON;
+    VBinOpCMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+  }
+
+  // batch_size = 16, 24, ..., 72.
+  TEST(F32_VMINC__NEON_X8, batch_div_8) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 16; n < 80; n += 8) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // batch_size = 1, 2, ..., 7.
+  TEST(F32_VMINC__NEON_X8, batch_lt_8) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // batch_size = 9, 10, ..., 15.
+  TEST(F32_VMINC__NEON_X8, batch_gt_8) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 9; n < 16; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // inplace(true); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMINC__NEON_X8, inplace) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMINC__NEON_X8, qmin) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 8, 15, ..., 36.
+  TEST(F32_VMINC__NEON_X8, qmax) {
+    TEST_REQUIRES_ARM_NEON;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__neon_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+#endif  // XNN_ARCH_ARM || XNN_ARCH_ARM64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64
+  // batch_size == 4.
+  TEST(F32_VMINC__SSE_X4, batch_eq_4) {
+    TEST_REQUIRES_X86_SSE;
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+  }
+
+  // batch_size = 8, 12, ..., 36.
+  TEST(F32_VMINC__SSE_X4, batch_div_4) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 8; n < 40; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // batch_size = 1, 2, 3.
+  TEST(F32_VMINC__SSE_X4, batch_lt_4) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n < 4; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // batch_size = 5, 6, 7.
+  TEST(F32_VMINC__SSE_X4, batch_gt_4) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 5; n < 8; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // inplace(true); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__SSE_X4, inplace) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmin(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__SSE_X4, qmin) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmax(128); batch_size = 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__SSE_X4, qmax) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__sse_x4, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if XNN_ARCH_X86 || XNN_ARCH_X86_64
+  // Batch size exactly 8, single invocation.
+  TEST(F32_VMINC__SSE_X8, batch_eq_8) {
+    TEST_REQUIRES_X86_SSE;
+    VBinOpCMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+  }
+
+  // Batch sizes 16, 24, ..., 72: multiples of 8 greater than 8.
+  TEST(F32_VMINC__SSE_X8, batch_div_8) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 16; n <= 72; n += 8) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // Batch sizes 1 through 7, i.e. below 8.
+  TEST(F32_VMINC__SSE_X8, batch_lt_8) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 7; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // Batch sizes 9 through 15, i.e. strictly between 8 and 16.
+  TEST(F32_VMINC__SSE_X8, batch_gt_8) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 9; n <= 15; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // inplace(true) with batch sizes 1, 8, 15, 22, 29, 36.
+  TEST(F32_VMINC__SSE_X8, inplace) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmin(128) with batch sizes 1, 8, 15, 22, 29, 36.
+  TEST(F32_VMINC__SSE_X8, qmin) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+
+  // qmax(128) with batch sizes 1, 8, 15, 22, 29, 36.
+  TEST(F32_VMINC__SSE_X8, qmax) {
+    TEST_REQUIRES_X86_SSE;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__sse_x8, VBinOpCMicrokernelTester::OpType::MinC);
+    }
+  }
+#endif  // XNN_ARCH_X86 || XNN_ARCH_X86_64
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+  // Batch size exactly 4, single invocation.
+  TEST(F32_VMINC__PSIMD_X4, batch_eq_4) {
+    TEST_REQUIRES_PSIMD;
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  // Batch sizes 8, 12, ..., 36: multiples of 4 greater than 4.
+  TEST(F32_VMINC__PSIMD_X4, batch_div_4) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 8; n <= 36; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // Batch sizes 1 through 3, i.e. below 4.
+  TEST(F32_VMINC__PSIMD_X4, batch_lt_4) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 3; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // Batch sizes 5 through 7, i.e. strictly between 4 and 8.
+  TEST(F32_VMINC__PSIMD_X4, batch_gt_4) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 5; n <= 7; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace(true) with batch sizes 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__PSIMD_X4, inplace) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128) with batch sizes 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__PSIMD_X4, qmin) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128) with batch sizes 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__PSIMD_X4, qmax) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__psimd_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+  // Batch size exactly 8, single invocation.
+  TEST(F32_VMINC__PSIMD_X8, batch_eq_8) {
+    TEST_REQUIRES_PSIMD;
+    VBinOpCMicrokernelTester().batch_size(8)
+      .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  // Batch sizes 16, 24, ..., 72: multiples of 8 greater than 8.
+  TEST(F32_VMINC__PSIMD_X8, batch_div_8) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 16; n <= 72; n += 8) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // Batch sizes 1 through 7, i.e. below 8.
+  TEST(F32_VMINC__PSIMD_X8, batch_lt_8) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 7; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // Batch sizes 9 through 15, i.e. strictly between 8 and 16.
+  TEST(F32_VMINC__PSIMD_X8, batch_gt_8) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 9; n <= 15; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace(true) with batch sizes 1, 8, 15, 22, 29, 36.
+  TEST(F32_VMINC__PSIMD_X8, inplace) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128) with batch sizes 1, 8, 15, 22, 29, 36.
+  TEST(F32_VMINC__PSIMD_X8, qmin) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128) with batch sizes 1, 8, 15, 22, 29, 36.
+  TEST(F32_VMINC__PSIMD_X8, qmax) {
+    TEST_REQUIRES_PSIMD;
+    for (size_t n = 1; n <= 40; n += 7) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__psimd_x8, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // !XNN_ARCH_ASMJS && !XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  // Batch size exactly 1, single invocation.
+  TEST(F32_VMINC__WASM_X1, batch_eq_1) {
+    VBinOpCMicrokernelTester().batch_size(1)
+      .Test(xnn_f32_vminc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  // Batch sizes 2 through 9.
+  TEST(F32_VMINC__WASM_X1, batch_gt_1) {
+    for (size_t n = 2; n <= 9; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace(true) with batch sizes 1 through 5.
+  TEST(F32_VMINC__WASM_X1, inplace) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128) with batch sizes 1 through 5.
+  TEST(F32_VMINC__WASM_X1, qmin) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128) with batch sizes 1 through 5.
+  TEST(F32_VMINC__WASM_X1, qmax) {
+    for (size_t n = 1; n <= 5; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__wasm_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  // Batch size exactly 2, single invocation.
+  TEST(F32_VMINC__WASM_X2, batch_eq_2) {
+    VBinOpCMicrokernelTester().batch_size(2)
+      .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  // Batch sizes 4, 6, ..., 18: multiples of 2 greater than 2.
+  TEST(F32_VMINC__WASM_X2, batch_div_2) {
+    for (size_t n = 4; n <= 18; n += 2) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // The only batch size below 2: the loop runs once with 1.
+  TEST(F32_VMINC__WASM_X2, batch_lt_2) {
+    for (size_t n = 1; n <= 1; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // The only batch size strictly between 2 and 4: the loop runs once with 3.
+  TEST(F32_VMINC__WASM_X2, batch_gt_2) {
+    for (size_t n = 3; n <= 3; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace(true) with batch sizes 1 through 10.
+  TEST(F32_VMINC__WASM_X2, inplace) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128) with batch sizes 1 through 10.
+  TEST(F32_VMINC__WASM_X2, qmin) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128) with batch sizes 1 through 10.
+  TEST(F32_VMINC__WASM_X2, qmax) {
+    for (size_t n = 1; n <= 10; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__wasm_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+#if XNN_ARCH_WASM
+  // Batch size exactly 4, single invocation.
+  TEST(F32_VMINC__WASM_X4, batch_eq_4) {
+    VBinOpCMicrokernelTester().batch_size(4)
+      .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+
+  // Batch sizes 8, 12, ..., 36: multiples of 4 greater than 4.
+  TEST(F32_VMINC__WASM_X4, batch_div_4) {
+    for (size_t n = 8; n <= 36; n += 4) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // Batch sizes 1 through 3, i.e. below 4.
+  TEST(F32_VMINC__WASM_X4, batch_lt_4) {
+    for (size_t n = 1; n <= 3; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // Batch sizes 5 through 7, i.e. strictly between 4 and 8.
+  TEST(F32_VMINC__WASM_X4, batch_gt_4) {
+    for (size_t n = 5; n <= 7; ++n) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // inplace(true) with batch sizes 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__WASM_X4, inplace) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .inplace(true)
+        .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmin(128) with batch sizes 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__WASM_X4, qmin) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmin(128)
+        .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+
+  // qmax(128) with batch sizes 1, 4, 7, ..., 19.
+  TEST(F32_VMINC__WASM_X4, qmax) {
+    for (size_t n = 1; n <= 20; n += 3) {
+      VBinOpCMicrokernelTester().batch_size(n)
+        .qmax(128)
+        .Test(xnn_f32_vminc_ukernel__wasm_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+    }
+  }
+#endif  // XNN_ARCH_WASM
+
+
+// Batch size exactly 1, single invocation.
+TEST(F32_VMINC__SCALAR_X1, batch_eq_1) {
+  VBinOpCMicrokernelTester().batch_size(1)
+    .Test(xnn_f32_vminc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+}
+
+// Batch sizes 2 through 9.
+TEST(F32_VMINC__SCALAR_X1, batch_gt_1) {
+  for (size_t n = 2; n <= 9; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace(true) with batch sizes 1 through 5.
+TEST(F32_VMINC__SCALAR_X1, inplace) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .inplace(true)
+      .Test(xnn_f32_vminc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmin(128) with batch sizes 1 through 5.
+TEST(F32_VMINC__SCALAR_X1, qmin) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vminc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmax(128) with batch sizes 1 through 5.
+TEST(F32_VMINC__SCALAR_X1, qmax) {
+  for (size_t n = 1; n <= 5; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vminc_ukernel__scalar_x1, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// Batch size exactly 2, single invocation.
+TEST(F32_VMINC__SCALAR_X2, batch_eq_2) {
+  VBinOpCMicrokernelTester().batch_size(2)
+    .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+}
+
+// Batch sizes 4, 6, ..., 18: multiples of 2 greater than 2.
+TEST(F32_VMINC__SCALAR_X2, batch_div_2) {
+  for (size_t n = 4; n <= 18; n += 2) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// The only batch size below 2: the loop runs once with 1.
+TEST(F32_VMINC__SCALAR_X2, batch_lt_2) {
+  for (size_t n = 1; n <= 1; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// The only batch size strictly between 2 and 4: the loop runs once with 3.
+TEST(F32_VMINC__SCALAR_X2, batch_gt_2) {
+  for (size_t n = 3; n <= 3; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace(true) with batch sizes 1 through 10.
+TEST(F32_VMINC__SCALAR_X2, inplace) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .inplace(true)
+      .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmin(128) with batch sizes 1 through 10.
+TEST(F32_VMINC__SCALAR_X2, qmin) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmax(128) with batch sizes 1 through 10.
+TEST(F32_VMINC__SCALAR_X2, qmax) {
+  for (size_t n = 1; n <= 10; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vminc_ukernel__scalar_x2, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// Batch size exactly 4, single invocation.
+TEST(F32_VMINC__SCALAR_X4, batch_eq_4) {
+  VBinOpCMicrokernelTester().batch_size(4)
+    .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+}
+
+// Batch sizes 8, 12, ..., 36: multiples of 4 greater than 4.
+TEST(F32_VMINC__SCALAR_X4, batch_div_4) {
+  for (size_t n = 8; n <= 36; n += 4) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// Batch sizes 1 through 3, i.e. below 4.
+TEST(F32_VMINC__SCALAR_X4, batch_lt_4) {
+  for (size_t n = 1; n <= 3; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// Batch sizes 5 through 7, i.e. strictly between 4 and 8.
+TEST(F32_VMINC__SCALAR_X4, batch_gt_4) {
+  for (size_t n = 5; n <= 7; ++n) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// inplace(true) with batch sizes 1, 4, 7, ..., 19.
+TEST(F32_VMINC__SCALAR_X4, inplace) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .inplace(true)
+      .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmin(128) with batch sizes 1, 4, 7, ..., 19.
+TEST(F32_VMINC__SCALAR_X4, qmin) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmin(128)
+      .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
+
+// qmax(128) with batch sizes 1, 4, 7, ..., 19.
+TEST(F32_VMINC__SCALAR_X4, qmax) {
+  for (size_t n = 1; n <= 20; n += 3) {
+    VBinOpCMicrokernelTester().batch_size(n)
+      .qmax(128)
+      .Test(xnn_f32_vminc_ukernel__scalar_x4, VBinOpCMicrokernelTester::OpType::MinC, VBinOpCMicrokernelTester::Variant::Scalar);
+  }
+}
\ No newline at end of file
diff --git a/test/f32-vminc.yaml b/test/f32-vminc.yaml
new file mode 100644
index 0000000..bb73ae3
--- /dev/null
+++ b/test/f32-vminc.yaml
@@ -0,0 +1,16 @@
+# Copyright 2019 Google LLC
+#
+# This source code is licensed under the BSD-style license found in the
+# LICENSE file in the root directory of this source tree.
+- name: xnn_f32_vminc_ukernel__neon_x4
+- name: xnn_f32_vminc_ukernel__neon_x8
+- name: xnn_f32_vminc_ukernel__sse_x4
+- name: xnn_f32_vminc_ukernel__sse_x8
+- name: xnn_f32_vminc_ukernel__psimd_x4
+- name: xnn_f32_vminc_ukernel__psimd_x8
+- name: xnn_f32_vminc_ukernel__wasm_x1
+- name: xnn_f32_vminc_ukernel__wasm_x2
+- name: xnn_f32_vminc_ukernel__wasm_x4
+- name: xnn_f32_vminc_ukernel__scalar_x1
+- name: xnn_f32_vminc_ukernel__scalar_x2
+- name: xnn_f32_vminc_ukernel__scalar_x4
diff --git a/test/vbinary-microkernel-tester.h b/test/vbinary-microkernel-tester.h
index 0189883..3eadc77 100644
--- a/test/vbinary-microkernel-tester.h
+++ b/test/vbinary-microkernel-tester.h
@@ -24,6 +24,8 @@
public:
enum class OpType {
Add,
+ Max,
+ Min,
Mul,
Sub,
};
@@ -114,6 +116,12 @@
case OpType::Add:
y_ref[i] = a_data[i] + b_data[i];
break;
+ case OpType::Max:
+ y_ref[i] = std::max<float>(a_data[i], b_data[i]);
+ break;
+ case OpType::Min:
+ y_ref[i] = std::min<float>(a_data[i], b_data[i]);
+ break;
case OpType::Mul:
y_ref[i] = a_data[i] * b_data[i];
break;
diff --git a/test/vbinaryc-microkernel-tester.h b/test/vbinaryc-microkernel-tester.h
index eec19d0..75091e8 100644
--- a/test/vbinaryc-microkernel-tester.h
+++ b/test/vbinaryc-microkernel-tester.h
@@ -24,6 +24,8 @@
public:
enum class OpType {
AddC,
+ MaxC,
+ MinC,
MulC,
SubC,
RSubC,
@@ -104,6 +106,12 @@
case OpType::AddC:
y_ref[i] = a_data[i] + b;
break;
+ case OpType::MaxC:
+ y_ref[i] = std::max<float>(a_data[i], b);
+ break;
+ case OpType::MinC:
+ y_ref[i] = std::min<float>(a_data[i], b);
+ break;
case OpType::MulC:
y_ref[i] = a_data[i] * b;
break;