Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 1 | // Copyright 2019 Google LLC |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 2 | // |
| 3 | // This source code is licensed under the BSD-style license found in the |
| 4 | // LICENSE file in the root directory of this source tree. |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 5 | // |
| 6 | // Auto-generated file. Do not edit! |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 7 | // Specification: test/u8-vclamp.yaml |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 8 | // Generator: tools/generate-vunary-test.py |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 9 | |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 10 | |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 11 | #include <gtest/gtest.h> |
| 12 | |
Marat Dukhan | 1dadbf7 | 2019-10-01 10:46:20 -0700 | [diff] [blame] | 13 | #include <xnnpack/common.h> |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 14 | #include <xnnpack/isa-checks.h> |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 15 | |
Marat Dukhan | 60d3f24 | 2021-05-13 11:59:02 -0700 | [diff] [blame] | 16 | #include <xnnpack/vunary.h> |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 17 | #include "vunary-microkernel-tester.h" |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 18 | |
| 19 | |
Marat Dukhan | 1dadbf7 | 2019-10-01 10:46:20 -0700 | [diff] [blame] | 20 | #if XNN_ARCH_ARM || XNN_ARCH_ARM64 |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 21 | TEST(U8_VCLAMP__NEON_X64, batch_eq_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 22 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 23 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 24 | .batch_size(64) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 25 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 26 | } |
| 27 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 28 | TEST(U8_VCLAMP__NEON_X64, batch_div_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 29 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 30 | for (size_t batch_size = 128; batch_size < 640; batch_size += 64) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 31 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 32 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 33 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 34 | } |
| 35 | } |
| 36 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 37 | TEST(U8_VCLAMP__NEON_X64, batch_lt_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 38 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 39 | for (size_t batch_size = 1; batch_size < 64; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 40 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 41 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 42 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 43 | } |
| 44 | } |
| 45 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 46 | TEST(U8_VCLAMP__NEON_X64, batch_gt_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 47 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 48 | for (size_t batch_size = 65; batch_size < 128; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 49 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 50 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 51 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 52 | } |
| 53 | } |
| 54 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 55 | TEST(U8_VCLAMP__NEON_X64, inplace) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 56 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 57 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 58 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 59 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 60 | .inplace(true) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 61 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 62 | } |
| 63 | } |
| 64 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 65 | TEST(U8_VCLAMP__NEON_X64, qmin) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 66 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 67 | for (uint8_t qmin = 1; qmin < 255; qmin++) { |
| 68 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 69 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 70 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 71 | .qmin(qmin) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 72 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 73 | } |
| 74 | } |
| 75 | } |
| 76 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 77 | TEST(U8_VCLAMP__NEON_X64, qmax) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 78 | TEST_REQUIRES_ARM_NEON; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 79 | for (uint8_t qmax = 1; qmax < 255; qmax++) { |
| 80 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 81 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 82 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 83 | .qmax(qmax) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 84 | .Test(xnn_u8_vclamp_ukernel__neon_x64, xnn_init_u8_minmax_neon_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 85 | } |
| 86 | } |
| 87 | } |
Marat Dukhan | 1dadbf7 | 2019-10-01 10:46:20 -0700 | [diff] [blame] | 88 | #endif // XNN_ARCH_ARM || XNN_ARCH_ARM64 |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 89 | |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 90 | |
Marat Dukhan | 1dadbf7 | 2019-10-01 10:46:20 -0700 | [diff] [blame] | 91 | #if XNN_ARCH_X86 || XNN_ARCH_X86_64 |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 92 | TEST(U8_VCLAMP__SSE2_X64, batch_eq_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 93 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 94 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 95 | .batch_size(64) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 96 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 97 | } |
| 98 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 99 | TEST(U8_VCLAMP__SSE2_X64, batch_div_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 100 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 101 | for (size_t batch_size = 128; batch_size < 640; batch_size += 64) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 102 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 103 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 104 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 105 | } |
| 106 | } |
| 107 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 108 | TEST(U8_VCLAMP__SSE2_X64, batch_lt_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 109 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 110 | for (size_t batch_size = 1; batch_size < 64; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 111 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 112 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 113 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 114 | } |
| 115 | } |
| 116 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 117 | TEST(U8_VCLAMP__SSE2_X64, batch_gt_64) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 118 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 119 | for (size_t batch_size = 65; batch_size < 128; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 120 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 121 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 122 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 123 | } |
| 124 | } |
| 125 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 126 | TEST(U8_VCLAMP__SSE2_X64, inplace) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 127 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 128 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 129 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 130 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 131 | .inplace(true) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 132 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 133 | } |
| 134 | } |
| 135 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 136 | TEST(U8_VCLAMP__SSE2_X64, qmin) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 137 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 138 | for (uint8_t qmin = 1; qmin < 255; qmin++) { |
| 139 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 140 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 141 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 142 | .qmin(qmin) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 143 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 144 | } |
| 145 | } |
| 146 | } |
| 147 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 148 | TEST(U8_VCLAMP__SSE2_X64, qmax) { |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 149 | TEST_REQUIRES_X86_SSE2; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 150 | for (uint8_t qmax = 1; qmax < 255; qmax++) { |
| 151 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 152 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 153 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 154 | .qmax(qmax) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 155 | .Test(xnn_u8_vclamp_ukernel__sse2_x64, xnn_init_u8_minmax_sse2_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 156 | } |
| 157 | } |
| 158 | } |
Marat Dukhan | 1dadbf7 | 2019-10-01 10:46:20 -0700 | [diff] [blame] | 159 | #endif // XNN_ARCH_X86 || XNN_ARCH_X86_64 |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 160 | |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 161 | |
Marat Dukhan | 4c61779 | 2021-12-21 15:47:58 -0800 | [diff] [blame] | 162 | #if XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 163 | TEST(U8_VCLAMP__WASMSIMD_X64, batch_eq_64) { |
| 164 | VUnaryMicrokernelTester() |
| 165 | .batch_size(64) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 166 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 167 | } |
| 168 | |
| 169 | TEST(U8_VCLAMP__WASMSIMD_X64, batch_div_64) { |
| 170 | for (size_t batch_size = 128; batch_size < 640; batch_size += 64) { |
| 171 | VUnaryMicrokernelTester() |
| 172 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 173 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 174 | } |
| 175 | } |
| 176 | |
| 177 | TEST(U8_VCLAMP__WASMSIMD_X64, batch_lt_64) { |
| 178 | for (size_t batch_size = 1; batch_size < 64; batch_size++) { |
| 179 | VUnaryMicrokernelTester() |
| 180 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 181 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 182 | } |
| 183 | } |
| 184 | |
| 185 | TEST(U8_VCLAMP__WASMSIMD_X64, batch_gt_64) { |
| 186 | for (size_t batch_size = 65; batch_size < 128; batch_size++) { |
| 187 | VUnaryMicrokernelTester() |
| 188 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 189 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 190 | } |
| 191 | } |
| 192 | |
| 193 | TEST(U8_VCLAMP__WASMSIMD_X64, inplace) { |
| 194 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 195 | VUnaryMicrokernelTester() |
| 196 | .batch_size(batch_size) |
| 197 | .inplace(true) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 198 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 199 | } |
| 200 | } |
| 201 | |
| 202 | TEST(U8_VCLAMP__WASMSIMD_X64, qmin) { |
| 203 | for (uint8_t qmin = 1; qmin < 255; qmin++) { |
| 204 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 205 | VUnaryMicrokernelTester() |
| 206 | .batch_size(batch_size) |
| 207 | .qmin(qmin) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 208 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 209 | } |
| 210 | } |
| 211 | } |
| 212 | |
| 213 | TEST(U8_VCLAMP__WASMSIMD_X64, qmax) { |
| 214 | for (uint8_t qmax = 1; qmax < 255; qmax++) { |
| 215 | for (size_t batch_size = 1; batch_size <= 320; batch_size += 63) { |
| 216 | VUnaryMicrokernelTester() |
| 217 | .batch_size(batch_size) |
| 218 | .qmax(qmax) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 219 | .Test(xnn_u8_vclamp_ukernel__wasmsimd_x64, xnn_init_u8_minmax_wasmsimd_params); |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 220 | } |
| 221 | } |
| 222 | } |
Marat Dukhan | 4c61779 | 2021-12-21 15:47:58 -0800 | [diff] [blame] | 223 | #endif // XNN_ARCH_WASMSIMD || XNN_ARCH_WASMRELAXEDSIMD |
Marat Dukhan | 1f5b108 | 2021-08-16 17:01:44 -0700 | [diff] [blame] | 224 | |
| 225 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 226 | TEST(U8_VCLAMP__SCALAR_X4, batch_eq_4) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 227 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 228 | .batch_size(4) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 229 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 230 | } |
| 231 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 232 | TEST(U8_VCLAMP__SCALAR_X4, batch_div_4) { |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 233 | for (size_t batch_size = 8; batch_size < 40; batch_size += 4) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 234 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 235 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 236 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 237 | } |
| 238 | } |
| 239 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 240 | TEST(U8_VCLAMP__SCALAR_X4, batch_lt_4) { |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 241 | for (size_t batch_size = 1; batch_size < 4; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 242 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 243 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 244 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 245 | } |
| 246 | } |
| 247 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 248 | TEST(U8_VCLAMP__SCALAR_X4, batch_gt_4) { |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 249 | for (size_t batch_size = 5; batch_size < 8; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 250 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 251 | .batch_size(batch_size) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 252 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 253 | } |
| 254 | } |
| 255 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 256 | TEST(U8_VCLAMP__SCALAR_X4, inplace) { |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 257 | for (size_t batch_size = 1; batch_size <= 20; batch_size += 3) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 258 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 259 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 260 | .inplace(true) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 261 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 262 | } |
| 263 | } |
| 264 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 265 | TEST(U8_VCLAMP__SCALAR_X4, qmin) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 266 | for (uint8_t qmin = 1; qmin < 255; qmin++) { |
| 267 | for (size_t batch_size = 1; batch_size <= 20; batch_size += 3) { |
| 268 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 269 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 270 | .qmin(qmin) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 271 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 272 | } |
| 273 | } |
| 274 | } |
| 275 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 276 | TEST(U8_VCLAMP__SCALAR_X4, qmax) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 277 | for (uint8_t qmax = 1; qmax < 255; qmax++) { |
| 278 | for (size_t batch_size = 1; batch_size <= 20; batch_size += 3) { |
| 279 | VUnaryMicrokernelTester() |
Marat Dukhan | 5c5fa96 | 2020-03-10 18:38:33 -0700 | [diff] [blame] | 280 | .batch_size(batch_size) |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 281 | .qmax(qmax) |
Marat Dukhan | 0d10cc7 | 2021-12-23 19:49:19 -0800 | [diff] [blame^] | 282 | .Test(xnn_u8_vclamp_ukernel__scalar_x4, xnn_init_u8_minmax_scalar_params); |
XNNPACK Team | b455b12 | 2019-09-27 18:10:33 -0700 | [diff] [blame] | 283 | } |
| 284 | } |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 285 | } |