Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 1 | // Copyright 2019 Google LLC |
| 2 | // |
| 3 | // This source code is licensed under the BSD-style license found in the |
| 4 | // LICENSE file in the root directory of this source tree. |
| 5 | // |
| 6 | // Auto-generated file. Do not edit! |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 7 | // Specification: test/f16-vhswish.yaml |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 8 | // Generator: tools/generate-vunary-test.py |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 9 | |
| 10 | |
| 11 | #include <gtest/gtest.h> |
| 12 | |
| 13 | #include <xnnpack/common.h> |
| 14 | #include <xnnpack/isa-checks.h> |
| 15 | |
Marat Dukhan | a91559a | 2021-05-05 23:58:21 -0700 | [diff] [blame] | 16 | #include <xnnpack/vunary.h> |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 17 | #include "vunary-microkernel-tester.h" |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 18 | |
| 19 | |
| 20 | #if XNN_ARCH_ARM64 |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 21 | TEST(F16_VHSWISH__NEONFP16ARITH_X8, batch_eq_8) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 22 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 23 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 24 | .batch_size(8) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 25 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x8, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 26 | } |
| 27 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 28 | TEST(F16_VHSWISH__NEONFP16ARITH_X8, batch_div_8) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 29 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 30 | for (size_t batch_size = 16; batch_size < 80; batch_size += 8) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 31 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 32 | .batch_size(batch_size) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 33 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x8, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 34 | } |
| 35 | } |
| 36 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 37 | TEST(F16_VHSWISH__NEONFP16ARITH_X8, batch_lt_8) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 38 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 39 | for (size_t batch_size = 1; batch_size < 8; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 40 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 41 | .batch_size(batch_size) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 42 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x8, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 43 | } |
| 44 | } |
| 45 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 46 | TEST(F16_VHSWISH__NEONFP16ARITH_X8, batch_gt_8) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 47 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 48 | for (size_t batch_size = 9; batch_size < 16; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 49 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 50 | .batch_size(batch_size) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 51 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x8, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 52 | } |
| 53 | } |
| 54 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 55 | TEST(F16_VHSWISH__NEONFP16ARITH_X8, inplace) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 56 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 57 | for (size_t batch_size = 1; batch_size <= 40; batch_size += 7) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 58 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 59 | .batch_size(batch_size) |
| 60 | .inplace(true) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 61 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x8, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 62 | } |
| 63 | } |
| 64 | #endif // XNN_ARCH_ARM64 |
| 65 | |
| 66 | |
| 67 | #if XNN_ARCH_ARM64 |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 68 | TEST(F16_VHSWISH__NEONFP16ARITH_X16, batch_eq_16) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 69 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 70 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 71 | .batch_size(16) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 72 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x16, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 73 | } |
| 74 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 75 | TEST(F16_VHSWISH__NEONFP16ARITH_X16, batch_div_16) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 76 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 77 | for (size_t batch_size = 32; batch_size < 160; batch_size += 16) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 78 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 79 | .batch_size(batch_size) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 80 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x16, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 81 | } |
| 82 | } |
| 83 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 84 | TEST(F16_VHSWISH__NEONFP16ARITH_X16, batch_lt_16) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 85 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 86 | for (size_t batch_size = 1; batch_size < 16; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 87 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 88 | .batch_size(batch_size) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 89 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x16, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 90 | } |
| 91 | } |
| 92 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 93 | TEST(F16_VHSWISH__NEONFP16ARITH_X16, batch_gt_16) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 94 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 95 | for (size_t batch_size = 17; batch_size < 32; batch_size++) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 96 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 97 | .batch_size(batch_size) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 98 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x16, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 99 | } |
| 100 | } |
| 101 | |
Marat Dukhan | 6674d69 | 2021-05-05 22:27:00 -0700 | [diff] [blame] | 102 | TEST(F16_VHSWISH__NEONFP16ARITH_X16, inplace) { |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 103 | TEST_REQUIRES_ARM_NEON_FP16_ARITH; |
| 104 | for (size_t batch_size = 1; batch_size <= 80; batch_size += 15) { |
Marat Dukhan | a6c0516 | 2021-05-13 16:52:02 -0700 | [diff] [blame] | 105 | VUnaryMicrokernelTester() |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 106 | .batch_size(batch_size) |
| 107 | .inplace(true) |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 108 | .Test(xnn_f16_vhswish_ukernel__neonfp16arith_x16, xnn_init_f16_hswish_neon_params); |
Frank Barchard | b196659 | 2020-05-12 13:47:06 -0700 | [diff] [blame] | 109 | } |
| 110 | } |
| 111 | #endif // XNN_ARCH_ARM64 |
Marat Dukhan | 751f622 | 2022-01-09 23:10:04 -0800 | [diff] [blame] | 112 | |
| 113 | |
| 114 | #if XNN_ARCH_X86 || XNN_ARCH_X86_64 |
| 115 | TEST(F16_VHSWISH__F16C_X8, batch_eq_8) { |
| 116 | TEST_REQUIRES_X86_F16C; |
| 117 | VUnaryMicrokernelTester() |
| 118 | .batch_size(8) |
| 119 | .Test(xnn_f16_vhswish_ukernel__f16c_x8, xnn_init_f16_hswish_avx_params); |
| 120 | } |
| 121 | |
| 122 | TEST(F16_VHSWISH__F16C_X8, batch_div_8) { |
| 123 | TEST_REQUIRES_X86_F16C; |
| 124 | for (size_t batch_size = 16; batch_size < 80; batch_size += 8) { |
| 125 | VUnaryMicrokernelTester() |
| 126 | .batch_size(batch_size) |
| 127 | .Test(xnn_f16_vhswish_ukernel__f16c_x8, xnn_init_f16_hswish_avx_params); |
| 128 | } |
| 129 | } |
| 130 | |
| 131 | TEST(F16_VHSWISH__F16C_X8, batch_lt_8) { |
| 132 | TEST_REQUIRES_X86_F16C; |
| 133 | for (size_t batch_size = 1; batch_size < 8; batch_size++) { |
| 134 | VUnaryMicrokernelTester() |
| 135 | .batch_size(batch_size) |
| 136 | .Test(xnn_f16_vhswish_ukernel__f16c_x8, xnn_init_f16_hswish_avx_params); |
| 137 | } |
| 138 | } |
| 139 | |
| 140 | TEST(F16_VHSWISH__F16C_X8, batch_gt_8) { |
| 141 | TEST_REQUIRES_X86_F16C; |
| 142 | for (size_t batch_size = 9; batch_size < 16; batch_size++) { |
| 143 | VUnaryMicrokernelTester() |
| 144 | .batch_size(batch_size) |
| 145 | .Test(xnn_f16_vhswish_ukernel__f16c_x8, xnn_init_f16_hswish_avx_params); |
| 146 | } |
| 147 | } |
| 148 | |
| 149 | TEST(F16_VHSWISH__F16C_X8, inplace) { |
| 150 | TEST_REQUIRES_X86_F16C; |
| 151 | for (size_t batch_size = 1; batch_size <= 40; batch_size += 7) { |
| 152 | VUnaryMicrokernelTester() |
| 153 | .batch_size(batch_size) |
| 154 | .inplace(true) |
| 155 | .Test(xnn_f16_vhswish_ukernel__f16c_x8, xnn_init_f16_hswish_avx_params); |
| 156 | } |
| 157 | } |
| 158 | #endif // XNN_ARCH_X86 || XNN_ARCH_X86_64 |
| 159 | |
| 160 | |
| 161 | #if XNN_ARCH_X86 || XNN_ARCH_X86_64 |
| 162 | TEST(F16_VHSWISH__F16C_X16, batch_eq_16) { |
| 163 | TEST_REQUIRES_X86_F16C; |
| 164 | VUnaryMicrokernelTester() |
| 165 | .batch_size(16) |
| 166 | .Test(xnn_f16_vhswish_ukernel__f16c_x16, xnn_init_f16_hswish_avx_params); |
| 167 | } |
| 168 | |
| 169 | TEST(F16_VHSWISH__F16C_X16, batch_div_16) { |
| 170 | TEST_REQUIRES_X86_F16C; |
| 171 | for (size_t batch_size = 32; batch_size < 160; batch_size += 16) { |
| 172 | VUnaryMicrokernelTester() |
| 173 | .batch_size(batch_size) |
| 174 | .Test(xnn_f16_vhswish_ukernel__f16c_x16, xnn_init_f16_hswish_avx_params); |
| 175 | } |
| 176 | } |
| 177 | |
| 178 | TEST(F16_VHSWISH__F16C_X16, batch_lt_16) { |
| 179 | TEST_REQUIRES_X86_F16C; |
| 180 | for (size_t batch_size = 1; batch_size < 16; batch_size++) { |
| 181 | VUnaryMicrokernelTester() |
| 182 | .batch_size(batch_size) |
| 183 | .Test(xnn_f16_vhswish_ukernel__f16c_x16, xnn_init_f16_hswish_avx_params); |
| 184 | } |
| 185 | } |
| 186 | |
| 187 | TEST(F16_VHSWISH__F16C_X16, batch_gt_16) { |
| 188 | TEST_REQUIRES_X86_F16C; |
| 189 | for (size_t batch_size = 17; batch_size < 32; batch_size++) { |
| 190 | VUnaryMicrokernelTester() |
| 191 | .batch_size(batch_size) |
| 192 | .Test(xnn_f16_vhswish_ukernel__f16c_x16, xnn_init_f16_hswish_avx_params); |
| 193 | } |
| 194 | } |
| 195 | |
| 196 | TEST(F16_VHSWISH__F16C_X16, inplace) { |
| 197 | TEST_REQUIRES_X86_F16C; |
| 198 | for (size_t batch_size = 1; batch_size <= 80; batch_size += 15) { |
| 199 | VUnaryMicrokernelTester() |
| 200 | .batch_size(batch_size) |
| 201 | .inplace(true) |
| 202 | .Test(xnn_f16_vhswish_ukernel__f16c_x16, xnn_init_f16_hswish_avx_params); |
| 203 | } |
| 204 | } |
| 205 | #endif // XNN_ARCH_X86 || XNN_ARCH_X86_64 |