blob: eb4e63032d719143f5355d81b0b5be5f1b6b9d8b [file] [log] [blame]
# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.

# CMake 3.5 is the oldest release this build script accepts.
CMAKE_MINIMUM_REQUIRED(VERSION 3.5 FATAL_ERROR)

# ---[ Project and semantic versioning.
# The project enables the C, C++ and assembly languages.
PROJECT(XNNPACK LANGUAGES C CXX ASM)

# ---[ Options.
# Library flavour; the STRINGS property lists the values offered by cache
# editors such as cmake-gui / ccmake.
SET(XNNPACK_LIBRARY_TYPE "default"
  CACHE STRING "Type of library (shared, static, or default) to build")
SET_PROPERTY(CACHE XNNPACK_LIBRARY_TYPE
  PROPERTY STRINGS default static shared)

# Boolean feature switches.
OPTION(XNNPACK_ENABLE_ASSEMBLY
  "Build XNNPACK with assembly micro-kernels" ON)
OPTION(XNNPACK_BUILD_TESTS
  "Build XNNPACK unit tests" ON)
OPTION(XNNPACK_BUILD_BENCHMARKS
  "Build XNNPACK benchmarks" ON)
OPTION(XNNPACK_USE_SYSTEM_LIBS
  "Use system-provided dependency libraries" OFF)

# ---[ CMake options
# Provides the CMAKE_INSTALL_<dir> install-location variables.
INCLUDE(GNUInstallDirs)

# Turn on CTest support only when the unit tests are going to be built.
IF(XNNPACK_BUILD_TESTS)
  ENABLE_TESTING()
ENDIF()

# Expose the XNNPACK_ENABLE_ASSEMBLY option to the sources as the
# XNN_ENABLE_ASSEMBLY preprocessor macro (always defined, to 0 or 1).
IF(NOT XNNPACK_ENABLE_ASSEMBLY)
  ADD_DEFINITIONS(-DXNN_ENABLE_ASSEMBLY=0)
ELSE()
  ADD_DEFINITIONS(-DXNN_ENABLE_ASSEMBLY=1)
ENDIF()

IF(MSVC)
  # C4146: "unary minus operator applied to unsigned type, result still
  # unsigned" -- suppressed for every target in this directory.
  ADD_COMPILE_OPTIONS(/wd4146)
ENDIF()

# ---[ Build flags
# Validate the target architecture up front.  Three cases:
#   1. CMAKE_SYSTEM_PROCESSOR is set: it must name a recognized x86 or ARM
#      processor.
#   2. It is not set and this is not an iOS build: nothing to go on, abort.
#   3. It is not set on iOS: IOS_ARCH must hold at most one entry, and that
#      entry must be a recognized architecture.
IF(CMAKE_SYSTEM_PROCESSOR)
  IF(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86|x86_64|AMD64|armv[5-8].*|aarch64)$")
    MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
  ENDIF()
ELSEIF(NOT IOS)
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
ELSE()
  LIST(LENGTH IOS_ARCH IOS_ARCH_COUNT)
  IF(IOS_ARCH_COUNT GREATER 1)
    MESSAGE(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
      "Specify a single architecture in IOS_ARCH and re-configure. ")
  ENDIF()
  IF(NOT IOS_ARCH MATCHES "^(i386|x86_64|AMD64|armv7.*|arm64.*)$")
    MESSAGE(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
  ENDIF()
ENDIF()

# Validate the target operating system: it has to be set, and it has to be
# one of the platform names listed in the pattern below.
IF(CMAKE_SYSTEM_NAME)
  IF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android|Windows|CYGWIN|MSYS)$")
    MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
  ENDIF()
ELSE()
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
ENDIF()

# ---[ Download deps

# XNNPACK_DOWNLOAD_DEPENDENCY(<name> <dir-prefix> <source-dir-var> <template>)
#
# Fetches one third-party dependency at configure time, unless the caller
# already defined <source-dir-var> (in which case nothing happens).
#
#   XNN_DEP_NAME        Human-readable name, used in status/error messages and
#                       in the cache entry description (e.g. "Google Test").
#   XNN_DEP_DIR_PREFIX  Prefix of the two directories used under
#                       CMAKE_BINARY_DIR: "<prefix>-download" (the generated
#                       helper project) and "<prefix>-source" (the sources).
#   XNN_DEP_SOURCE_VAR  Name of the cache variable that receives the source
#                       directory (e.g. CLOG_SOURCE_DIR).
#   XNN_DEP_TEMPLATE    CMake template, configured into the helper project's
#                       CMakeLists.txt.
#
# The helper project is configured with the current generator and then built.
# A non-zero exit code of either step is reported as a warning.  If the source
# directory does not exist afterwards, configuration stops with a clear error
# and <source-dir-var> is NOT cached, so the next configure run retries the
# download instead of silently reusing a path that was never populated.
#
# Local variables carry the XNN_DEP_ prefix so they are unlikely to collide
# with variable references expanded by CONFIGURE_FILE inside the template.
FUNCTION(XNNPACK_DOWNLOAD_DEPENDENCY XNN_DEP_NAME XNN_DEP_DIR_PREFIX XNN_DEP_SOURCE_VAR XNN_DEP_TEMPLATE)
  IF(DEFINED ${XNN_DEP_SOURCE_VAR})
    RETURN()
  ENDIF()

  SET(XNN_DEP_DOWNLOAD_DIR "${CMAKE_BINARY_DIR}/${XNN_DEP_DIR_PREFIX}-download")
  SET(XNN_DEP_SOURCE_DIR "${CMAKE_BINARY_DIR}/${XNN_DEP_DIR_PREFIX}-source")

  MESSAGE(STATUS "Downloading ${XNN_DEP_NAME} to ${XNN_DEP_SOURCE_DIR} (define ${XNN_DEP_SOURCE_VAR} to avoid it)")
  CONFIGURE_FILE("${XNN_DEP_TEMPLATE}" "${XNN_DEP_DOWNLOAD_DIR}/CMakeLists.txt")

  # Step 1: generate the helper project with the same generator as this build.
  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE XNN_DEP_RESULT
    WORKING_DIRECTORY "${XNN_DEP_DOWNLOAD_DIR}")
  IF(NOT "${XNN_DEP_RESULT}" STREQUAL "0")
    MESSAGE(WARNING "Configuring the ${XNN_DEP_NAME} download project in ${XNN_DEP_DOWNLOAD_DIR} failed: ${XNN_DEP_RESULT}")
  ENDIF()

  # Step 2: build the helper project, which performs the actual download.
  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE XNN_DEP_RESULT
    WORKING_DIRECTORY "${XNN_DEP_DOWNLOAD_DIR}")
  IF(NOT "${XNN_DEP_RESULT}" STREQUAL "0")
    MESSAGE(WARNING "Building the ${XNN_DEP_NAME} download project in ${XNN_DEP_DOWNLOAD_DIR} failed: ${XNN_DEP_RESULT}")
  ENDIF()

  # Without the sources the rest of the build cannot use this dependency;
  # stop here, before the path is written to the cache.
  IF(NOT IS_DIRECTORY "${XNN_DEP_SOURCE_DIR}")
    MESSAGE(FATAL_ERROR "Downloading ${XNN_DEP_NAME} failed: ${XNN_DEP_SOURCE_DIR} does not exist "
      "(define ${XNN_DEP_SOURCE_VAR} to use an existing checkout)")
  ENDIF()

  SET(${XNN_DEP_SOURCE_VAR} "${XNN_DEP_SOURCE_DIR}" CACHE STRING "${XNN_DEP_NAME} source directory")
ENDFUNCTION()

IF(NOT XNNPACK_USE_SYSTEM_LIBS)
  # Dependencies that are fetched for every bundled-libraries build.
  XNNPACK_DOWNLOAD_DEPENDENCY("clog" clog CLOG_SOURCE_DIR cmake/DownloadCLog.cmake)
  XNNPACK_DOWNLOAD_DEPENDENCY("cpuinfo" cpuinfo CPUINFO_SOURCE_DIR cmake/DownloadCpuinfo.cmake)
  XNNPACK_DOWNLOAD_DEPENDENCY("FP16" FP16 FP16_SOURCE_DIR cmake/DownloadFP16.cmake)
  XNNPACK_DOWNLOAD_DEPENDENCY("FXdiv" FXdiv FXDIV_SOURCE_DIR cmake/DownloadFXdiv.cmake)
  XNNPACK_DOWNLOAD_DEPENDENCY("PSimd" psimd PSIMD_SOURCE_DIR cmake/DownloadPSimd.cmake)
  XNNPACK_DOWNLOAD_DEPENDENCY("pthreadpool" pthreadpool PTHREADPOOL_SOURCE_DIR cmake/DownloadPThreadPool.cmake)

  # Google Test is fetched only when unit tests are built.
  IF(XNNPACK_BUILD_TESTS)
    XNNPACK_DOWNLOAD_DEPENDENCY("Google Test" googletest GOOGLETEST_SOURCE_DIR cmake/DownloadGoogleTest.cmake)
  ENDIF()

  # Google Benchmark is fetched only when benchmarks are built.
  IF(XNNPACK_BUILD_BENCHMARKS)
    XNNPACK_DOWNLOAD_DEPENDENCY("Google Benchmark" googlebenchmark GOOGLEBENCHMARK_SOURCE_DIR cmake/DownloadGoogleBenchmark.cmake)
  ENDIF()
ENDIF()

# ---[ XNNPACK library
# Sources located under src/operators/.
SET(XNNPACK_OPERATOR_SRCS
  src/operators/add-nc.c
  src/operators/argmax-pooling-nhwc.c
  src/operators/average-pooling-nhwc.c
  src/operators/binary-elementwise-nd.c
  src/operators/channel-pad-nc.c
  src/operators/channel-shuffle-nc.c
  src/operators/clamp-nc.c
  src/operators/convolution-nchw.c
  src/operators/convolution-nhwc.c
  src/operators/deconvolution-nhwc.c
  src/operators/fully-connected-nc.c
  src/operators/global-average-pooling-ncw.c
  src/operators/global-average-pooling-nwc.c
  src/operators/hardswish-nc.c
  src/operators/leaky-relu-nc.c
  src/operators/max-pooling-nhwc.c
  src/operators/prelu-nc.c
  src/operators/resize-bilinear-nhwc.c
  src/operators/sigmoid-nc.c
  src/operators/softmax-nc.c
  src/operators/unpooling-nhwc.c
)

# "Cold" sources: every operator source followed by the sources listed here.
SET(XNNPACK_COLD_SRCS
  ${XNNPACK_OPERATOR_SRCS}
  src/init.c
  src/memory.c
  src/operator-delete.c
  src/runtime.c
  src/subgraph.c
  src/tensor.c
)

# "Hot" sources, kept in a list of their own.
SET(XNNPACK_HOT_SRCS
  src/indirection.c
  src/operator-run.c
)

# Sources located under src/tables/.
SET(XNNPACK_TABLE_SRCS
  src/tables/exp2-k-over-64.c
  src/tables/exp2-k-over-2048.c
)

# Scalar micro-kernel sources (entries keep their original order).
SET(XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-scalar-c1.c
  src/f32-argmaxpool/9p8x-scalar-c1.c
  src/f32-argmaxpool/9x-scalar-c1.c
  src/f32-avgpool/9p8x-minmax-scalar-c1.c
  src/f32-avgpool/9x-minmax-scalar-c1.c
  src/f32-clamp/gen/scalar-x1.c
  src/f32-clamp/gen/scalar-x2.c
  src/f32-clamp/gen/scalar-x4.c
  src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c
  src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-dwconv-spchw/5x5p2-scalar.c
  src/f32-dwconv-spchw/5x5s2p2-scalar.c
  src/f32-dwconv/gen/up1x4-scalar.c
  src/f32-dwconv/gen/up1x4-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-scalar.c
  src/f32-dwconv/gen/up1x9-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-scalar.c
  src/f32-dwconv/gen/up1x25-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-scalar.c
  src/f32-dwconv/gen/up2x4-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-scalar.c
  src/f32-dwconv/gen/up2x9-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-scalar.c
  src/f32-dwconv/gen/up2x25-scalar-acc2.c
  src/f32-dwconv/gen/up1x4-minmax-scalar.c
  src/f32-dwconv/gen/up1x4-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-minmax-scalar.c
  src/f32-dwconv/gen/up1x9-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-minmax-scalar.c
  src/f32-dwconv/gen/up1x25-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-minmax-scalar.c
  src/f32-dwconv/gen/up2x4-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-minmax-scalar.c
  src/f32-dwconv/gen/up2x9-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-minmax-scalar.c
  src/f32-dwconv/gen/up2x25-minmax-scalar-acc2.c
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/7p7x-minmax-scalar-c1.c
  src/f32-gavgpool/7x-minmax-scalar-c1.c
  src/f32-gemm/gen/1x4-scalar.c
  src/f32-gemm/gen/2x4-scalar.c
  src/f32-gemm/gen/4x2-scalar.c
  src/f32-gemm/gen/4x4-scalar.c
  src/f32-gemm/gen/1x4-minmax-scalar.c
  src/f32-gemm/gen/2x4-minmax-scalar.c
  src/f32-gemm/gen/4x2-minmax-scalar.c
  src/f32-gemm/gen/4x4-minmax-scalar.c
  src/f32-gemm/gen-inc/1x4inc-minmax-scalar.c
  src/f32-gemm/gen-inc/2x4inc-minmax-scalar.c
  src/f32-gemm/gen-inc/4x4inc-minmax-scalar.c
  src/f32-hswish/gen/scalar-x1.c
  src/f32-hswish/gen/scalar-x2.c
  src/f32-hswish/gen/scalar-x4.c
  src/f32-ibilinear/gen/scalar-c1.c
  src/f32-ibilinear/gen/scalar-c2.c
  src/f32-ibilinear/gen/scalar-c4.c
  src/f32-igemm/gen/1x4-scalar.c
  src/f32-igemm/gen/2x4-scalar.c
  src/f32-igemm/gen/4x2-scalar.c
  src/f32-igemm/gen/4x4-scalar.c
  src/f32-igemm/gen/1x4-minmax-scalar.c
  src/f32-igemm/gen/2x4-minmax-scalar.c
  src/f32-igemm/gen/4x2-minmax-scalar.c
  src/f32-igemm/gen/4x4-minmax-scalar.c
  src/f32-maxpool/9p8x-minmax-scalar-c1.c
  src/f32-pavgpool/9p8x-minmax-scalar-c1.c
  src/f32-pavgpool/9x-minmax-scalar-c1.c
  src/f32-ppmm/gen/2x4-minmax-scalar.c
  src/f32-ppmm/gen/3x3-minmax-scalar.c
  src/f32-ppmm/gen/4x2-minmax-scalar.c
  src/f32-ppmm/gen/4x4-minmax-scalar.c
  src/f32-prelu/gen/scalar-2x1.c
  src/f32-prelu/gen/scalar-2x4.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x1.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x2.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x2-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x4.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x4-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x4-acc4.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x1.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x2.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x2-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x4-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x4-acc4.c
  src/f32-rmax/scalar.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x1.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x2.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x4.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x1.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x2.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x4.c
  src/f32-sigmoid/gen/scalar-p5-div-x1.c
  src/f32-sigmoid/gen/scalar-p5-div-x2.c
  src/f32-sigmoid/gen/scalar-p5-div-x4.c
  src/f32-spmm/gen/1x1-minmax-scalar-pipelined.c
  src/f32-spmm/gen/1x1-minmax-scalar.c
  src/f32-spmm/gen/2x1-minmax-scalar-pipelined.c
  src/f32-spmm/gen/2x1-minmax-scalar.c
  src/f32-spmm/gen/4x1-minmax-scalar-pipelined.c
  src/f32-spmm/gen/4x1-minmax-scalar.c
  src/f32-spmm/gen/8x1-minmax-scalar-pipelined.c
  src/f32-spmm/gen/8x1-minmax-scalar.c
  src/f32-spmm/gen/8x2-minmax-scalar.c
  src/f32-spmm/gen/8x4-minmax-scalar.c
  src/f32-vbinary/gen/vadd-minmax-scalar-x1.c
  src/f32-vbinary/gen/vadd-minmax-scalar-x2.c
  src/f32-vbinary/gen/vadd-minmax-scalar-x4.c
  src/f32-vbinary/gen/vaddc-minmax-scalar-x1.c
  src/f32-vbinary/gen/vaddc-minmax-scalar-x2.c
  src/f32-vbinary/gen/vaddc-minmax-scalar-x4.c
  src/f32-vbinary/gen/vdiv-minmax-scalar-x1.c
  src/f32-vbinary/gen/vdiv-minmax-scalar-x2.c
  src/f32-vbinary/gen/vdiv-minmax-scalar-x4.c
  src/f32-vbinary/gen/vdivc-minmax-scalar-x1.c
  src/f32-vbinary/gen/vdivc-minmax-scalar-x2.c
  src/f32-vbinary/gen/vdivc-minmax-scalar-x4.c
  src/f32-vbinary/gen/vmax-scalar-x1.c
  src/f32-vbinary/gen/vmax-scalar-x2.c
  src/f32-vbinary/gen/vmax-scalar-x4.c
  src/f32-vbinary/gen/vmaxc-scalar-x1.c
  src/f32-vbinary/gen/vmaxc-scalar-x2.c
  src/f32-vbinary/gen/vmaxc-scalar-x4.c
  src/f32-vbinary/gen/vmin-scalar-x1.c
  src/f32-vbinary/gen/vmin-scalar-x2.c
  src/f32-vbinary/gen/vmin-scalar-x4.c
  src/f32-vbinary/gen/vminc-scalar-x1.c
  src/f32-vbinary/gen/vminc-scalar-x2.c
  src/f32-vbinary/gen/vminc-scalar-x4.c
  src/f32-vbinary/gen/vmul-minmax-scalar-x1.c
  src/f32-vbinary/gen/vmul-minmax-scalar-x2.c
  src/f32-vbinary/gen/vmul-minmax-scalar-x4.c
  src/f32-vbinary/gen/vmulc-minmax-scalar-x1.c
  src/f32-vbinary/gen/vmulc-minmax-scalar-x2.c
  src/f32-vbinary/gen/vmulc-minmax-scalar-x4.c
  src/f32-vbinary/gen/vrdivc-minmax-scalar-x1.c
  src/f32-vbinary/gen/vrdivc-minmax-scalar-x2.c
  src/f32-vbinary/gen/vrdivc-minmax-scalar-x4.c
  src/f32-vbinary/gen/vrsubc-minmax-scalar-x1.c
  src/f32-vbinary/gen/vrsubc-minmax-scalar-x2.c
  src/f32-vbinary/gen/vrsubc-minmax-scalar-x4.c
  src/f32-vbinary/gen/vsub-minmax-scalar-x1.c
  src/f32-vbinary/gen/vsub-minmax-scalar-x2.c
  src/f32-vbinary/gen/vsub-minmax-scalar-x4.c
  src/f32-vbinary/gen/vsubc-minmax-scalar-x1.c
  src/f32-vbinary/gen/vsubc-minmax-scalar-x2.c
  src/f32-vbinary/gen/vsubc-minmax-scalar-x4.c
  src/f32-vmulcaddc/gen/c1-minmax-scalar-2x.c
  src/f32-vmulcaddc/gen/c2-minmax-scalar-2x.c
  src/f32-vmulcaddc/gen/c4-minmax-scalar-2x.c
  src/math/expminus-scalar-lut2048-p1.c
  src/math/expminus-scalar-lut64-p2.c
  src/math/expminus-scalar-p5.c
  src/math/sigmoid-scalar-lut2048-p1-div.c
  src/math/sigmoid-scalar-lut64-p2-div.c
  src/math/sigmoid-scalar-p5-div.c
  src/q8-avgpool/9p8x-minmax-scalar-c1.c
  src/q8-avgpool/9x-minmax-scalar-c1.c
  src/q8-dwconv/up1x9-minmax-scalar.c
  src/q8-gavgpool/7p7x-minmax-scalar-c1.c
  src/q8-gavgpool/7x-minmax-scalar-c1.c
  src/q8-gemm/2x2-minmax-scalar.c
  src/q8-igemm/2x2-minmax-scalar.c
  src/q8-vadd/minmax-scalar.c
  src/u8-clamp/scalar-x4.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8x-minmax-scalar-c1.c
  src/u8-rmax/scalar.c
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c
  src/requantization/precise-scalar.c
  src/requantization/fp32-scalar.c
  src/requantization/q31-scalar.c
  src/requantization/gemmlowp-scalar.c
)

# PSIMD micro-kernel sources of the "fastmath" group (entries keep their
# original order).
SET(XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-psimd-c4.c
  src/f32-argmaxpool/9p8x-psimd-c4.c
  src/f32-argmaxpool/9x-psimd-c4.c
  src/f32-avgpool/9p8x-minmax-psimd-c4.c
  src/f32-avgpool/9x-minmax-psimd-c4.c
  src/f32-clamp/gen/psimd-x4.c
  src/f32-clamp/gen/psimd-x8.c
  src/f32-dwconv/gen/up4x25-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up4x25-minmax-psimd.c
  src/f32-dwconv/gen/up4x4-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up4x4-minmax-psimd.c
  src/f32-dwconv/gen/up4x9-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up4x9-minmax-psimd.c
  src/f32-dwconv/gen/up8x25-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-psimd.c
  src/f32-dwconv/gen/up8x4-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-psimd.c
  src/f32-dwconv/gen/up8x9-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-psimd.c
  src/f32-gavgpool/7p7x-minmax-psimd-c4.c
  src/f32-gavgpool/7x-minmax-psimd-c4.c
  src/f32-gemm/gen/1x8-minmax-psimd-loadsplat.c
  src/f32-gemm/gen/1x8-minmax-psimd-splat.c
  src/f32-gemm/gen/1x8s4-minmax-psimd.c
  src/f32-gemm/gen/4x2c4-minmax-psimd.c
  src/f32-gemm/gen/4x8-minmax-psimd-loadsplat.c
  src/f32-gemm/gen/4x8-minmax-psimd-splat.c
  src/f32-gemm/gen/4x8s4-minmax-psimd.c
  src/f32-gemm/gen/6x8-minmax-psimd-loadsplat.c
  src/f32-gemm/gen/6x8-minmax-psimd-splat.c
  src/f32-gemm/gen/6x8s4-minmax-psimd.c
  src/f32-gemm/gen-inc/1x8inc-minmax-psimd-loadsplat.c
  src/f32-gemm/gen-inc/1x8inc-minmax-psimd-splat.c
  src/f32-gemm/gen-inc/1x8s4inc-minmax-psimd.c
  src/f32-gemm/gen-inc/4x8inc-minmax-psimd-loadsplat.c
  src/f32-gemm/gen-inc/4x8inc-minmax-psimd-splat.c
  src/f32-gemm/gen-inc/4x8s4inc-minmax-psimd.c
  src/f32-gemm/gen-inc/6x8inc-minmax-psimd-loadsplat.c
  src/f32-gemm/gen-inc/6x8inc-minmax-psimd-splat.c
  src/f32-gemm/gen-inc/6x8s4inc-minmax-psimd.c
  src/f32-hswish/gen/psimd-x4.c
  src/f32-hswish/gen/psimd-x8.c
  src/f32-ibilinear/gen/psimd-c4.c
  src/f32-ibilinear/gen/psimd-c8.c
  src/f32-igemm/gen/1x8-minmax-psimd-loadsplat.c
  src/f32-igemm/gen/1x8-minmax-psimd-splat.c
  src/f32-igemm/gen/1x8s4-minmax-psimd.c
  src/f32-igemm/gen/4x2c4-minmax-psimd.c
  src/f32-igemm/gen/4x8-minmax-psimd-loadsplat.c
  src/f32-igemm/gen/4x8-minmax-psimd-splat.c
  src/f32-igemm/gen/4x8s4-minmax-psimd.c
  src/f32-igemm/gen/6x8-minmax-psimd-loadsplat.c
  src/f32-igemm/gen/6x8-minmax-psimd-splat.c
  src/f32-igemm/gen/6x8s4-minmax-psimd.c
  src/f32-maxpool/9p8x-minmax-psimd-c4.c
  src/f32-pavgpool/9p8x-minmax-psimd-c4.c
  src/f32-pavgpool/9x-minmax-psimd-c4.c
  src/f32-ppmm/gen/4x8-minmax-psimd.c
  src/f32-prelu/gen/psimd-2x4.c
  src/f32-prelu/gen/psimd-2x8.c
  src/f32-rmax/psimd.c
  src/f32-vbinary/gen/vadd-minmax-psimd-x4.c
  src/f32-vbinary/gen/vadd-minmax-psimd-x8.c
  src/f32-vbinary/gen/vaddc-minmax-psimd-x4.c
  src/f32-vbinary/gen/vaddc-minmax-psimd-x8.c
  src/f32-vbinary/gen/vdiv-minmax-psimd-x4.c
  src/f32-vbinary/gen/vdiv-minmax-psimd-x8.c
  src/f32-vbinary/gen/vdivc-minmax-psimd-x4.c
  src/f32-vbinary/gen/vdivc-minmax-psimd-x8.c
  src/f32-vbinary/gen/vmax-psimd-x4.c
  src/f32-vbinary/gen/vmax-psimd-x8.c
  src/f32-vbinary/gen/vmaxc-psimd-x4.c
  src/f32-vbinary/gen/vmaxc-psimd-x8.c
  src/f32-vbinary/gen/vmin-psimd-x4.c
  src/f32-vbinary/gen/vmin-psimd-x8.c
  src/f32-vbinary/gen/vminc-psimd-x4.c
  src/f32-vbinary/gen/vminc-psimd-x8.c
  src/f32-vbinary/gen/vmul-minmax-psimd-x4.c
  src/f32-vbinary/gen/vmul-minmax-psimd-x8.c
  src/f32-vbinary/gen/vmulc-minmax-psimd-x4.c
  src/f32-vbinary/gen/vmulc-minmax-psimd-x8.c
  src/f32-vbinary/gen/vrdivc-minmax-psimd-x4.c
  src/f32-vbinary/gen/vrdivc-minmax-psimd-x8.c
  src/f32-vbinary/gen/vrsubc-minmax-psimd-x4.c
  src/f32-vbinary/gen/vrsubc-minmax-psimd-x8.c
  src/f32-vbinary/gen/vsub-minmax-psimd-x4.c
  src/f32-vbinary/gen/vsub-minmax-psimd-x8.c
  src/f32-vbinary/gen/vsubc-minmax-psimd-x4.c
  src/f32-vbinary/gen/vsubc-minmax-psimd-x8.c
  src/f32-vmulcaddc/gen/c4-minmax-psimd-2x.c
  src/f32-vmulcaddc/gen/c8-minmax-psimd-2x.c
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c
  src/requantization/precise-psimd.c
  src/requantization/fp32-psimd.c
)

# PSIMD micro-kernel sources of the "accmath" group (entries keep their
# original order).
SET(XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x8.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x12.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x16.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x20.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x20-acc5.c
  src/f32-sigmoid/gen/psimd-p5-div-x4.c
  src/f32-sigmoid/gen/psimd-p5-div-x8.c
  src/f32-sigmoid/gen/psimd-p5-div-x12.c
  src/f32-sigmoid/gen/psimd-p5-div-x16.c
  src/f32-sigmoid/gen/psimd-p5-div-x20.c
  src/f32-sigmoid/gen/psimd-p5-div-x24.c
  src/math/sigmoid-psimd-p5-div.c
)

Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700502SET(XNNPACK_NEON_MICROKERNEL_SRCS
Marat Dukhan99936602020-04-11 16:47:01 -0700503 src/f32-avgpool/9p8x-minmax-neon-c4.c
504 src/f32-avgpool/9x-minmax-neon-c4.c
Marat Dukhan5c5fa962020-03-10 18:38:33 -0700505 src/f32-clamp/gen/neon-x4.c
506 src/f32-clamp/gen/neon-x8.c
Marat Dukhanf5425ea2020-04-24 01:46:00 -0700507 src/f32-dwconv/gen/up4x4-minmax-neon.c
508 src/f32-dwconv/gen/up4x4-minmax-neon-acc2.c
509 src/f32-dwconv/gen/up8x4-minmax-neon.c
510 src/f32-dwconv/gen/up8x4-minmax-neon-acc2.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700511 src/f32-dwconv/gen/up4x9-minmax-neon.c
512 src/f32-dwconv/gen/up4x9-minmax-neon-acc2.c
513 src/f32-dwconv/gen/up8x9-minmax-neon.c
514 src/f32-dwconv/gen/up8x9-minmax-neon-acc2.c
Marat Dukhanf5425ea2020-04-24 01:46:00 -0700515 src/f32-dwconv/gen/up4x25-minmax-neon.c
516 src/f32-dwconv/gen/up4x25-minmax-neon-acc2.c
517 src/f32-dwconv/gen/up8x25-minmax-neon.c
518 src/f32-dwconv/gen/up8x25-minmax-neon-acc2.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800519 src/f32-gavgpool-spchw/neon-x4.c
Marat Dukhanb9d07cf2020-04-11 20:25:31 -0700520 src/f32-gavgpool/7p7x-minmax-neon-c4.c
521 src/f32-gavgpool/7x-minmax-neon-c4.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700522 src/f32-gemm/gen/1x8-minmax-neon-lane-ld64.c
523 src/f32-gemm/gen/4x2-minmax-neon-lane-ld64.c
524 src/f32-gemm/gen/4x8-minmax-neon-lane-ld128.c
525 src/f32-gemm/gen/4x8-minmax-neon-lane-ld64.c
526 src/f32-gemm/gen/5x8-minmax-neon-lane-ld64.c
527 src/f32-gemm/gen/6x8-minmax-neon-lane-ld64.c
528 src/f32-gemm/gen/6x8-minmax-neon-lane-ld128.c
529 src/f32-gemm/gen/1x8-minmax-neon-dup-ld64.c
530 src/f32-gemm/gen/4x8-minmax-neon-dup-ld128.c
531 src/f32-gemm/gen/4x8-minmax-neon-dup-ld64.c
532 src/f32-gemm/gen/6x8-minmax-neon-dup-ld64.c
533 src/f32-gemm/gen/6x8-minmax-neon-dup-ld128.c
534 src/f32-gemm/gen/1x8s4-minmax-neon.c
535 src/f32-gemm/gen/4x8s4-minmax-neon.c
536 src/f32-gemm/gen/6x8s4-minmax-neon.c
537 src/f32-gemm/gen/8x8s4-minmax-neon.c
538 src/f32-gemm/gen-inc/1x8inc-minmax-neon-lane-ld64.c
539 src/f32-gemm/gen-inc/4x8inc-minmax-neon-lane-ld128.c
540 src/f32-gemm/gen-inc/4x8inc-minmax-neon-lane-ld64.c
541 src/f32-gemm/gen-inc/5x8inc-minmax-neon-lane-ld64.c
542 src/f32-gemm/gen-inc/6x8inc-minmax-neon-lane-ld64.c
543 src/f32-gemm/gen-inc/6x8inc-minmax-neon-lane-ld128.c
544 src/f32-gemm/gen-inc/1x8inc-minmax-neon-dup-ld64.c
545 src/f32-gemm/gen-inc/4x8inc-minmax-neon-dup-ld128.c
546 src/f32-gemm/gen-inc/4x8inc-minmax-neon-dup-ld64.c
547 src/f32-gemm/gen-inc/6x8inc-minmax-neon-dup-ld64.c
548 src/f32-gemm/gen-inc/6x8inc-minmax-neon-dup-ld128.c
549 src/f32-gemm/gen-inc/1x8s4inc-minmax-neon.c
550 src/f32-gemm/gen-inc/4x8s4inc-minmax-neon.c
551 src/f32-gemm/gen-inc/6x8s4inc-minmax-neon.c
552 src/f32-gemm/gen-inc/8x8s4inc-minmax-neon.c
Marat Dukhan662faa02019-12-09 22:48:16 -0800553 src/f32-hswish/gen/neon-x4.c
554 src/f32-hswish/gen/neon-x8.c
Marat Dukhan660fd192020-03-10 04:55:30 -0700555 src/f32-ibilinear/gen/neon-c4.c
556 src/f32-ibilinear/gen/neon-c8.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700557 src/f32-igemm/gen/1x8-minmax-neon-lane-ld64.c
558 src/f32-igemm/gen/4x2-minmax-neon-lane-ld64.c
559 src/f32-igemm/gen/4x4-minmax-neon-lane-ld64.c
560 src/f32-igemm/gen/4x8-minmax-neon-lane-ld128.c
561 src/f32-igemm/gen/4x8-minmax-neon-lane-ld64.c
562 src/f32-igemm/gen/6x8-minmax-neon-lane-ld64.c
563 src/f32-igemm/gen/6x8-minmax-neon-lane-ld128.c
564 src/f32-igemm/gen/1x8-minmax-neon-dup-ld64.c
565 src/f32-igemm/gen/4x8-minmax-neon-dup-ld128.c
566 src/f32-igemm/gen/4x8-minmax-neon-dup-ld64.c
567 src/f32-igemm/gen/6x8-minmax-neon-dup-ld64.c
568 src/f32-igemm/gen/6x8-minmax-neon-dup-ld128.c
569 src/f32-igemm/gen/1x8s4-minmax-neon.c
570 src/f32-igemm/gen/4x8s4-minmax-neon.c
571 src/f32-igemm/gen/6x8s4-minmax-neon.c
572 src/f32-igemm/gen/8x8s4-minmax-neon.c
Marat Dukhan99936602020-04-11 16:47:01 -0700573 src/f32-maxpool/9p8x-minmax-neon-c4.c
574 src/f32-pavgpool/9p8x-minmax-neon-c4.c
575 src/f32-pavgpool/9x-minmax-neon-c4.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700576 src/f32-ppmm/gen/4x8-minmax-neon.c
577 src/f32-ppmm/gen/8x8-minmax-neon.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800578 src/f32-prelu/gen/neon-2x4.c
579 src/f32-prelu/gen/neon-2x8.c
Marat Dukhan8137e4c2020-01-25 12:56:58 -0800580 src/f32-raddstoreexpminusmax/gen/neon-p5-x4.c
581 src/f32-raddstoreexpminusmax/gen/neon-p5-x8.c
582 src/f32-raddstoreexpminusmax/gen/neon-p5-x8-acc2.c
583 src/f32-raddstoreexpminusmax/gen/neon-p5-x12.c
584 src/f32-raddstoreexpminusmax/gen/neon-p5-x12-acc2.c
585 src/f32-raddstoreexpminusmax/gen/neon-p5-x12-acc3.c
586 src/f32-raddstoreexpminusmax/gen/neon-p5-x16.c
587 src/f32-raddstoreexpminusmax/gen/neon-p5-x16-acc2.c
588 src/f32-raddstoreexpminusmax/gen/neon-p5-x16-acc4.c
589 src/f32-raddstoreexpminusmax/gen/neon-p5-x20.c
590 src/f32-raddstoreexpminusmax/gen/neon-p5-x20-acc2.c
591 src/f32-raddstoreexpminusmax/gen/neon-p5-x20-acc5.c
592 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x4.c
593 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x8.c
594 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x8-acc2.c
595 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x12.c
596 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x12-acc2.c
597 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x12-acc3.c
598 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x16.c
599 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x16-acc2.c
600 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x16-acc4.c
601 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x20.c
602 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x20-acc2.c
603 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x20-acc5.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800604 src/f32-rmax/neon.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800605 src/f32-sigmoid/gen/neon-frac-p9-p10-nr1recps-x16.c
Marat Dukhan4a24a582020-01-06 13:30:00 -0800606 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x4.c
607 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x8.c
608 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x12.c
609 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x16.c
610 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x20.c
611 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x24.c
612 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x4.c
613 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x8.c
614 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x12.c
615 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x16.c
616 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x20.c
617 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x24.c
618 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x4.c
619 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x8.c
620 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x12.c
621 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x16.c
622 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x20.c
623 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x24.c
Marat Dukhan91cd2b72020-04-09 23:57:31 -0700624 src/f32-vbinary/gen/vadd-minmax-neon-x4.c
625 src/f32-vbinary/gen/vadd-minmax-neon-x8.c
626 src/f32-vbinary/gen/vaddc-minmax-neon-x4.c
627 src/f32-vbinary/gen/vaddc-minmax-neon-x8.c
Marat Dukhan403b7d42019-12-05 12:49:11 -0800628 src/f32-vbinary/gen/vmax-neon-x4.c
629 src/f32-vbinary/gen/vmax-neon-x8.c
630 src/f32-vbinary/gen/vmaxc-neon-x4.c
631 src/f32-vbinary/gen/vmaxc-neon-x8.c
632 src/f32-vbinary/gen/vmin-neon-x4.c
633 src/f32-vbinary/gen/vmin-neon-x8.c
634 src/f32-vbinary/gen/vminc-neon-x4.c
635 src/f32-vbinary/gen/vminc-neon-x8.c
Marat Dukhan91cd2b72020-04-09 23:57:31 -0700636 src/f32-vbinary/gen/vmul-minmax-neon-x4.c
637 src/f32-vbinary/gen/vmul-minmax-neon-x8.c
638 src/f32-vbinary/gen/vmulc-minmax-neon-x4.c
639 src/f32-vbinary/gen/vmulc-minmax-neon-x8.c
640 src/f32-vbinary/gen/vrsubc-minmax-neon-x4.c
641 src/f32-vbinary/gen/vrsubc-minmax-neon-x8.c
642 src/f32-vbinary/gen/vsub-minmax-neon-x4.c
643 src/f32-vbinary/gen/vsub-minmax-neon-x8.c
644 src/f32-vbinary/gen/vsubc-minmax-neon-x4.c
645 src/f32-vbinary/gen/vsubc-minmax-neon-x8.c
Marat Dukhan99936602020-04-11 16:47:01 -0700646 src/f32-vmulcaddc/gen/c4-minmax-neon-2x.c
647 src/f32-vmulcaddc/gen/c8-minmax-neon-2x.c
648 src/q8-avgpool/9p8x-minmax-neon-c8.c
649 src/q8-avgpool/9x-minmax-neon-c8.c
Marat Dukhande06f492020-04-09 00:19:31 -0700650 src/q8-dwconv/up8x9-minmax-neon.c
Marat Dukhan99936602020-04-11 16:47:01 -0700651 src/q8-gavgpool/7p7x-minmax-neon-c8.c
652 src/q8-gavgpool/7x-minmax-neon-c8.c
Marat Dukhande06f492020-04-09 00:19:31 -0700653 src/q8-gemm/4x8-minmax-neon.c
654 src/q8-gemm/8x8-minmax-neon.c
655 src/q8-igemm/4x8-minmax-neon.c
656 src/q8-igemm/8x8-minmax-neon.c
Marat Dukhan99936602020-04-11 16:47:01 -0700657 src/q8-vadd/minmax-neon.c
Marat Dukhan5c5fa962020-03-10 18:38:33 -0700658 src/u8-clamp/neon-x64.c
Marat Dukhan99936602020-04-11 16:47:01 -0700659 src/u8-maxpool/9p8x-minmax-neon-c16.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800660 src/u8-rmax/neon.c
661 src/x32-packx/x4-neon-st4.c
662 src/x32-pad/x2-neon.c
Marat Dukhan57dccd82020-04-14 00:53:10 -0700663 src/x32-unpool/neon.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800664 src/x32-zip/x2-neon.c
665 src/x32-zip/x3-neon.c
666 src/x32-zip/x4-neon.c
667 src/x32-zip/xm-neon.c
668 src/x8-zip/x2-neon.c
669 src/x8-zip/x3-neon.c
670 src/x8-zip/x4-neon.c
Marat Dukhan8d3c07e2020-01-02 01:20:59 -0800671 src/x8-zip/xm-neon.c
Marat Dukhan68b3b452020-01-02 10:11:15 -0800672 src/math/sigmoid-neon-frac-p9-p10-nr1recps.c
Marat Dukhan77221d32020-01-06 10:04:39 -0800673 src/math/sigmoid-neon-rr1-lut2048-p1-nr2recps.c
674 src/math/sigmoid-neon-rr1-lut64-p2-nr2recps.c
675 src/math/sigmoid-neon-rr1-p5-nr2recps.c
676 src/math/sigmoid-neon-rr2-lut2048-p1-nr2recps.c
677 src/math/sigmoid-neon-rr2-lut64-p2-nr2recps.c
Marat Dukhanfe7acb62020-03-09 19:30:05 -0700678 src/math/sigmoid-neon-rr2-p5-nr2recps.c
679 src/requantization/precise-neon.c
680 src/requantization/fp32-neon.c
681 src/requantization/q31-neon.c
682 src/requantization/gemmlowp-neon.c)
# ---[ Micro-kernel sources whose file names carry the "neonfma" tag.
# Entries are paths relative to the directory of this listfile. Where this
# variable is consumed (targets, per-file compile flags) is not visible in this
# part of the file.
SET(XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-ibilinear/gen/neonfma-c4.c
  src/f32-ibilinear/gen/neonfma-c8.c
  src/f32-igemm/gen/1x8-minmax-neonfma-dup-ld64.c
  src/f32-igemm/gen/4x8-minmax-neonfma-dup-ld128.c
  src/f32-igemm/gen/4x8-minmax-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-dup-ld128.c
  src/f32-igemm/gen/1x8s4-minmax-neonfma.c
  src/f32-igemm/gen/4x8s4-minmax-neonfma.c
  src/f32-igemm/gen/6x8s4-minmax-neonfma.c
  src/f32-igemm/gen/8x8s4-minmax-neonfma.c
  src/f32-dwconv/gen/up4x4-minmax-neonfma.c
  src/f32-dwconv/gen/up4x4-minmax-neonfma-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-neonfma.c
  src/f32-dwconv/gen/up8x4-minmax-neonfma-acc2.c
  src/f32-dwconv/gen/up4x9-minmax-neonfma.c
  src/f32-dwconv/gen/up4x9-minmax-neonfma-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-neonfma.c
  src/f32-dwconv/gen/up8x9-minmax-neonfma-acc2.c
  src/f32-dwconv/gen/up4x25-minmax-neonfma.c
  src/f32-dwconv/gen/up4x25-minmax-neonfma-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-neonfma.c
  src/f32-dwconv/gen/up8x25-minmax-neonfma-acc2.c
  src/f32-gemm/gen/1x8-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen/4x8-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen/4x8-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen/1x8s4-minmax-neonfma.c
  src/f32-gemm/gen/4x8s4-minmax-neonfma.c
  src/f32-gemm/gen/6x8s4-minmax-neonfma.c
  src/f32-gemm/gen/8x8s4-minmax-neonfma.c
  src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4inc-minmax-neonfma.c
  src/f32-gemm/gen-inc/4x8s4inc-minmax-neonfma.c
  src/f32-gemm/gen-inc/6x8s4inc-minmax-neonfma.c
  src/f32-gemm/gen-inc/8x8s4inc-minmax-neonfma.c
  src/f32-hswish/gen/neonfma-x4.c
  src/f32-hswish/gen/neonfma-x8.c
  src/f32-ppmm/gen/4x8-minmax-neonfma.c
  src/f32-ppmm/gen/8x8-minmax-neonfma.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x8.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x12.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x16.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x20.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x20-acc5.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x8.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x12.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x16.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x20.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x20-acc5.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x24.c
  src/f32-vmulcaddc/gen/c4-minmax-neonfma-2x.c
  src/f32-vmulcaddc/gen/c8-minmax-neonfma-2x.c
  src/math/exp-neonfma-lut64-p2.c
  src/math/exp-neonfma-p5.c
  src/math/expminus-neonfma-lut2048-p1.c
  src/math/expminus-neonfma-lut64-p2.c
  src/math/expminus-neonfma-p5.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-nr2fma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-nr2recps.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-nr2fma.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-nr2recps.c
  src/math/sigmoid-neonfma-rr1-p5-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr1-p5-nr2fma.c
  src/math/sigmoid-neonfma-rr1-p5-nr2recps.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-nr2fma.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-nr2recps.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-nr2fma.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-nr2recps.c
  src/math/sigmoid-neonfma-rr2-p5-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr2-p5-nr2fma.c
  src/math/sigmoid-neonfma-rr2-p5-nr2recps.c)
# ---[ Micro-kernel sources collected under the AArch64 NEON-FMA variable.
# Entries are paths relative to the directory of this listfile.
# NOTE(review): the vdiv/vdivc/vrdivc files are tagged "-neon-" rather than
# "-neonfma-"; presumably they are listed here because they need
# AArch64-only instructions. Confirm against the kernel sources.
SET(XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS
  src/f32-vbinary/gen/vdiv-minmax-neon-x4.c
  src/f32-vbinary/gen/vdiv-minmax-neon-x8.c
  src/f32-vbinary/gen/vdivc-minmax-neon-x4.c
  src/f32-vbinary/gen/vdivc-minmax-neon-x8.c
  src/f32-vbinary/gen/vrdivc-minmax-neon-x4.c
  src/f32-vbinary/gen/vrdivc-minmax-neon-x8.c
  src/f32-gemm/gen/1x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x2-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x8-minmax-neonfma-lane-ld128.c
  src/f32-gemm/gen/4x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/5x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/5x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-lane-ld128.c
  src/f32-igemm/gen/1x8-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x2-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x4-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x8-minmax-neonfma-lane-ld128.c
  src/f32-igemm/gen/4x8-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld128.c
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x24.c
  src/f32-spmm/gen/12x1-minmax-neonfma.c
  src/f32-spmm/gen/12x2-minmax-neonfma.c
  src/f32-spmm/gen/12x4-minmax-neonfma.c
  src/f32-spmm/gen/16x1-minmax-neonfma-pipelined.c
  src/f32-spmm/gen/16x1-minmax-neonfma-unroll2.c
  src/f32-spmm/gen/16x1-minmax-neonfma.c
  src/f32-spmm/gen/16x2-minmax-neonfma.c
  src/f32-spmm/gen/16x4-minmax-neonfma.c
  src/f32-spmm/gen/4x1-minmax-neonfma-pipelined.c
  src/f32-spmm/gen/4x1-minmax-neonfma-unroll2.c
  src/f32-spmm/gen/4x1-minmax-neonfma.c
  src/f32-spmm/gen/4x2-minmax-neonfma.c
  src/f32-spmm/gen/4x4-minmax-neonfma.c
  src/f32-spmm/gen/8x1-minmax-neonfma-pipelined.c
  src/f32-spmm/gen/8x1-minmax-neonfma-unroll2.c
  src/f32-spmm/gen/8x1-minmax-neonfma.c
  src/f32-spmm/gen/8x2-minmax-neonfma.c
  src/f32-spmm/gen/8x4-minmax-neonfma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-div.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-div.c
  src/math/sigmoid-neonfma-rr1-p5-div.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-div.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-div.c
  src/math/sigmoid-neonfma-rr2-p5-div.c)
# ---[ Half-precision (f16-*) micro-kernel sources tagged "neonfp16arith".
# Entries are paths relative to the directory of this listfile.
SET(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/gen/1x8-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen/4x8-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen/6x8-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen/8x8-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen-inc/1x8inc-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen-inc/4x8inc-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen-inc/6x8inc-minmax-neonfp16arith-ld64.c
  src/f16-gemm/gen-inc/8x8inc-minmax-neonfp16arith-ld64.c
  src/f16-igemm/gen/1x8-minmax-neonfp16arith-ld64.c
  src/f16-igemm/gen/4x8-minmax-neonfp16arith-ld64.c
  src/f16-igemm/gen/6x8-minmax-neonfp16arith-ld64.c
  src/f16-igemm/gen/8x8-minmax-neonfp16arith-ld64.c
  src/f16-spmm/gen/8x1-minmax-neonfp16arith.c
  src/f16-spmm/gen/8x1-minmax-neonfp16arith-unroll2.c
  src/f16-spmm/gen/16x1-minmax-neonfp16arith.c
  src/f16-spmm/gen/16x1-minmax-neonfp16arith-unroll2.c
  src/f16-spmm/gen/24x1-minmax-neonfp16arith.c
  src/f16-spmm/gen/24x1-minmax-neonfp16arith-unroll2.c
  src/f16-spmm/gen/32x1-minmax-neonfp16arith.c
  src/f16-spmm/gen/32x1-minmax-neonfp16arith-unroll2.c)
# ---[ Micro-kernel sources whose file names carry the "sse" tag.
# Entries are paths relative to the directory of this listfile.
SET(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/9p8x-minmax-sse-c4.c
  src/f32-avgpool/9x-minmax-sse-c4.c
  src/f32-clamp/gen/sse-x4.c
  src/f32-clamp/gen/sse-x8.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-dwconv/gen/up4x25-minmax-sse-acc2.c
  src/f32-dwconv/gen/up4x25-minmax-sse.c
  src/f32-dwconv/gen/up4x4-minmax-sse-acc2.c
  src/f32-dwconv/gen/up4x4-minmax-sse.c
  src/f32-dwconv/gen/up4x9-minmax-sse-acc2.c
  src/f32-dwconv/gen/up4x9-minmax-sse.c
  src/f32-dwconv/gen/up8x25-minmax-sse-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-sse.c
  src/f32-dwconv/gen/up8x4-minmax-sse-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-sse.c
  src/f32-dwconv/gen/up8x9-minmax-sse-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-sse.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/7p7x-minmax-sse-c4.c
  src/f32-gavgpool/7x-minmax-sse-c4.c
  src/f32-gemm/gen/1x8-minmax-sse-dup.c
  src/f32-gemm/gen/1x8-minmax-sse-load1.c
  src/f32-gemm/gen/1x8s4-minmax-sse.c
  src/f32-gemm/gen/4x2c4-minmax-sse.c
  src/f32-gemm/gen/4x8-minmax-sse-dup.c
  src/f32-gemm/gen/4x8-minmax-sse-load1.c
  src/f32-gemm/gen/4x8s4-minmax-sse.c
  src/f32-gemm/gen-inc/1x8inc-minmax-sse-dup.c
  src/f32-gemm/gen-inc/1x8inc-minmax-sse-load1.c
  src/f32-gemm/gen-inc/1x8s4inc-minmax-sse.c
  src/f32-gemm/gen-inc/4x8inc-minmax-sse-dup.c
  src/f32-gemm/gen-inc/4x8inc-minmax-sse-load1.c
  src/f32-gemm/gen-inc/4x8s4inc-minmax-sse.c
  src/f32-hswish/gen/sse-x4.c
  src/f32-hswish/gen/sse-x8.c
  src/f32-ibilinear/gen/sse-c4.c
  src/f32-ibilinear/gen/sse-c8.c
  src/f32-igemm/gen/1x8-minmax-sse-dup.c
  src/f32-igemm/gen/1x8-minmax-sse-load1.c
  src/f32-igemm/gen/1x8s4-minmax-sse.c
  src/f32-igemm/gen/4x2c4-minmax-sse.c
  src/f32-igemm/gen/4x8-minmax-sse-dup.c
  src/f32-igemm/gen/4x8-minmax-sse-load1.c
  src/f32-igemm/gen/4x8s4-minmax-sse.c
  src/f32-maxpool/9p8x-minmax-sse-c4.c
  src/f32-pavgpool/9p8x-minmax-sse-c4.c
  src/f32-pavgpool/9x-minmax-sse-c4.c
  src/f32-ppmm/gen/4x8-minmax-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/gen/4x1-minmax-sse.c
  src/f32-spmm/gen/8x1-minmax-sse.c
  src/f32-vbinary/gen/vadd-minmax-sse-x4.c
  src/f32-vbinary/gen/vadd-minmax-sse-x8.c
  src/f32-vbinary/gen/vaddc-minmax-sse-x4.c
  src/f32-vbinary/gen/vaddc-minmax-sse-x8.c
  src/f32-vbinary/gen/vdiv-minmax-sse-x4.c
  src/f32-vbinary/gen/vdiv-minmax-sse-x8.c
  src/f32-vbinary/gen/vdivc-minmax-sse-x4.c
  src/f32-vbinary/gen/vdivc-minmax-sse-x8.c
  src/f32-vbinary/gen/vmax-sse-x4.c
  src/f32-vbinary/gen/vmax-sse-x8.c
  src/f32-vbinary/gen/vmaxc-sse-x4.c
  src/f32-vbinary/gen/vmaxc-sse-x8.c
  src/f32-vbinary/gen/vmin-sse-x4.c
  src/f32-vbinary/gen/vmin-sse-x8.c
  src/f32-vbinary/gen/vminc-sse-x4.c
  src/f32-vbinary/gen/vminc-sse-x8.c
  src/f32-vbinary/gen/vmul-minmax-sse-x4.c
  src/f32-vbinary/gen/vmul-minmax-sse-x8.c
  src/f32-vbinary/gen/vmulc-minmax-sse-x4.c
  src/f32-vbinary/gen/vmulc-minmax-sse-x8.c
  src/f32-vbinary/gen/vrdivc-minmax-sse-x4.c
  src/f32-vbinary/gen/vrdivc-minmax-sse-x8.c
  src/f32-vbinary/gen/vrsubc-minmax-sse-x4.c
  src/f32-vbinary/gen/vrsubc-minmax-sse-x8.c
  src/f32-vbinary/gen/vsub-minmax-sse-x4.c
  src/f32-vbinary/gen/vsub-minmax-sse-x8.c
  src/f32-vbinary/gen/vsubc-minmax-sse-x4.c
  src/f32-vbinary/gen/vsubc-minmax-sse-x8.c
  src/f32-vmulcaddc/gen/c4-minmax-sse-2x.c
  src/f32-vmulcaddc/gen/c8-minmax-sse-2x.c
  src/x32-packx/x4-sse.c)
# ---[ Micro-kernel sources whose file names carry the "sse2" tag.
# Entries are paths relative to the directory of this listfile.
SET(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-sse2-c4.c
  src/f32-argmaxpool/9p8x-sse2-c4.c
  src/f32-argmaxpool/9x-sse2-c4.c
  src/f32-prelu/gen/sse2-2x4.c
  src/f32-prelu/gen/sse2-2x8.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x8.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x12.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x16.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x20.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x20-acc5.c
  src/f32-sigmoid/gen/sse2-p5-div-x4.c
  src/f32-sigmoid/gen/sse2-p5-div-x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x12.c
  src/f32-sigmoid/gen/sse2-p5-div-x16.c
  src/f32-sigmoid/gen/sse2-p5-div-x20.c
  src/f32-sigmoid/gen/sse2-p5-div-x24.c
  src/q8-avgpool/9p8x-minmax-sse2-c8.c
  src/q8-avgpool/9x-minmax-sse2-c8.c
  src/q8-igemm/4x4c2-minmax-sse2.c
  src/q8-dwconv/up8x9-minmax-sse2.c
  src/q8-gavgpool/7p7x-minmax-sse2-c8.c
  src/q8-gavgpool/7x-minmax-sse2-c8.c
  src/q8-gemm/2x4c8-minmax-sse2.c
  src/q8-gemm/4x4c2-minmax-sse2.c
  src/q8-vadd/minmax-sse2.c
  src/u8-clamp/sse2-x64.c
  src/u8-maxpool/9p8x-minmax-sse2-c16.c
  src/u8-rmax/sse2.c
  src/x32-pad/x2-sse2.c
  src/x32-unpool/sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c
  src/math/exp-sse2-p5.c
  src/math/expminus-sse2-p5.c
  src/math/sigmoid-sse2-p5-div.c
  src/requantization/precise-sse2.c
  src/requantization/fp32-sse2.c
  src/requantization/q31-sse2.c
  src/requantization/gemmlowp-sse2.c)
# ---[ Sources whose file names carry the "ssse3" tag (requantization only).
# Entries are paths relative to the directory of this listfile.
SET(XNNPACK_SSSE3_MICROKERNEL_SRCS
  src/requantization/precise-ssse3.c
  src/requantization/q31-ssse3.c
  src/requantization/gemmlowp-ssse3.c)
# ---[ Sources collected under the SSE4.1 variable.
# Entries are paths relative to the directory of this listfile. The
# requantization files are tagged "sse4" rather than "sse41" in their names.
SET(XNNPACK_SSE41_MICROKERNEL_SRCS
  src/f32-prelu/gen/sse41-2x4.c
  src/f32-prelu/gen/sse41-2x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x4.c
  src/f32-sigmoid/gen/sse41-p5-div-x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x12.c
  src/f32-sigmoid/gen/sse41-p5-div-x16.c
  src/f32-sigmoid/gen/sse41-p5-div-x20.c
  src/f32-sigmoid/gen/sse41-p5-div-x24.c
  src/requantization/precise-sse4.c
  src/requantization/q31-sse4.c
  src/requantization/gemmlowp-sse4.c)
# ---[ Micro-kernel sources whose file names carry the "avx" tag.
# Entries are paths relative to the directory of this listfile.
SET(XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-clamp/gen/avx-x8.c
  src/f32-clamp/gen/avx-x16.c
  src/f32-dwconv/gen/up16x4-minmax-avx-acc2.c
  src/f32-dwconv/gen/up16x4-minmax-avx.c
  src/f32-dwconv/gen/up8x4-minmax-avx-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-avx.c
  src/f32-dwconv/gen/up16x9-minmax-avx-acc2.c
  src/f32-dwconv/gen/up16x9-minmax-avx.c
  src/f32-dwconv/gen/up8x9-minmax-avx-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-avx.c
  src/f32-dwconv/gen/up16x25-minmax-avx-acc2.c
  src/f32-dwconv/gen/up16x25-minmax-avx.c
  src/f32-dwconv/gen/up8x25-minmax-avx-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-avx.c
  src/f32-gemm/gen/1x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/4x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/5x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/6x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/7x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/1x16-minmax-avx-broadcast.c
  src/f32-gemm/gen/3x16-minmax-avx-broadcast.c
  src/f32-gemm/gen/4x16-minmax-avx-broadcast.c
  src/f32-gemm/gen/5x16-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/1x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/4x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/5x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/6x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/7x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/1x16inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/3x16inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/4x16inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/5x16inc-minmax-avx-broadcast.c
  src/f32-hswish/gen/avx-x8.c
  src/f32-hswish/gen/avx-x16.c
  src/f32-igemm/gen/1x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/4x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/5x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/6x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/7x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/1x16-minmax-avx-broadcast.c
  src/f32-igemm/gen/3x16-minmax-avx-broadcast.c
  src/f32-igemm/gen/4x16-minmax-avx-broadcast.c
  src/f32-igemm/gen/5x16-minmax-avx-broadcast.c
  src/f32-prelu/gen/avx-2x8.c
  src/f32-prelu/gen/avx-2x16.c
  src/f32-rmax/avx.c
  src/f32-vbinary/gen/vadd-minmax-avx-x8.c
  src/f32-vbinary/gen/vadd-minmax-avx-x16.c
  src/f32-vbinary/gen/vaddc-minmax-avx-x8.c
  src/f32-vbinary/gen/vaddc-minmax-avx-x16.c
  src/f32-vbinary/gen/vdiv-minmax-avx-x8.c
  src/f32-vbinary/gen/vdiv-minmax-avx-x16.c
  src/f32-vbinary/gen/vdivc-minmax-avx-x8.c
  src/f32-vbinary/gen/vdivc-minmax-avx-x16.c
  src/f32-vbinary/gen/vmax-avx-x8.c
  src/f32-vbinary/gen/vmax-avx-x16.c
  src/f32-vbinary/gen/vmaxc-avx-x8.c
  src/f32-vbinary/gen/vmaxc-avx-x16.c
  src/f32-vbinary/gen/vmin-avx-x8.c
  src/f32-vbinary/gen/vmin-avx-x16.c
  src/f32-vbinary/gen/vminc-avx-x8.c
  src/f32-vbinary/gen/vminc-avx-x16.c
  src/f32-vbinary/gen/vmul-minmax-avx-x8.c
  src/f32-vbinary/gen/vmul-minmax-avx-x16.c
  src/f32-vbinary/gen/vmulc-minmax-avx-x8.c
  src/f32-vbinary/gen/vmulc-minmax-avx-x16.c
  src/f32-vbinary/gen/vrdivc-minmax-avx-x8.c
  src/f32-vbinary/gen/vrdivc-minmax-avx-x16.c
  src/f32-vbinary/gen/vrsubc-minmax-avx-x8.c
  src/f32-vbinary/gen/vrsubc-minmax-avx-x16.c
  src/f32-vbinary/gen/vsub-minmax-avx-x8.c
  src/f32-vbinary/gen/vsub-minmax-avx-x16.c
  src/f32-vbinary/gen/vsubc-minmax-avx-x8.c
  src/f32-vbinary/gen/vsubc-minmax-avx-x16.c
  src/f32-vscale/avx-unroll32.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001166
# Micro-kernel sources tagged "fma3" in their file names.
# The list is assembled one kernel directory at a time; element order is significant
# only in that it is kept stable.
SET(XNNPACK_FMA3_MICROKERNEL_SRCS
  # src/f32-dwconv/gen
  src/f32-dwconv/gen/up16x4-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up16x4-minmax-fma3.c
  src/f32-dwconv/gen/up8x4-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-fma3.c
  src/f32-dwconv/gen/up16x9-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up16x9-minmax-fma3.c
  src/f32-dwconv/gen/up8x9-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-fma3.c
  src/f32-dwconv/gen/up16x25-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up16x25-minmax-fma3.c
  src/f32-dwconv/gen/up8x25-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-fma3.c)
LIST(APPEND XNNPACK_FMA3_MICROKERNEL_SRCS
  # src/f32-gemm/gen
  src/f32-gemm/gen/1x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/4x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/5x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/6x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/7x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/8x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/1x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/3x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/4x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/5x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/1x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen/3x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen/4x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen/5x16s4-minmax-fma3-broadcast.c)
LIST(APPEND XNNPACK_FMA3_MICROKERNEL_SRCS
  # src/f32-gemm/gen-inc
  src/f32-gemm/gen-inc/1x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/6x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/7x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/8x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16s4inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16s4inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16s4inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16s4inc-minmax-fma3-broadcast.c)
LIST(APPEND XNNPACK_FMA3_MICROKERNEL_SRCS
  # src/f32-hswish/gen
  src/f32-hswish/gen/fma3-x8.c
  src/f32-hswish/gen/fma3-x16.c)
LIST(APPEND XNNPACK_FMA3_MICROKERNEL_SRCS
  # src/f32-igemm/gen
  src/f32-igemm/gen/1x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/4x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/5x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/6x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/7x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/8x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/1x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/3x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/4x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/5x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/1x16s4-minmax-fma3-broadcast.c
  src/f32-igemm/gen/3x16s4-minmax-fma3-broadcast.c
  src/f32-igemm/gen/4x16s4-minmax-fma3-broadcast.c
  src/f32-igemm/gen/5x16s4-minmax-fma3-broadcast.c)
Marat Dukhanfda12b82019-11-21 12:27:59 -08001224
# Micro-kernel sources tagged "avx2" in their file names.
# The list is assembled one kernel directory at a time, preserving element order.
SET(XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-raddexpminusmax/gen
  src/f32-raddexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc6.c)
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-raddextexp/gen
  src/f32-raddextexp/gen/avx2-p5-x64.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc4.c
  src/f32-raddextexp/gen/avx2-p5-x72.c
  src/f32-raddextexp/gen/avx2-p5-x72-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x80.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc5.c
  src/f32-raddextexp/gen/avx2-p5-x96.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc6.c)
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-raddstoreexpminusmax/gen
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc6.c)
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-sigmoid/gen, "div" variants
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x80.c
  # src/f32-sigmoid/gen, "nr1fma" variants
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x80.c
  # src/f32-sigmoid/gen, "nr2fma" variants
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x80.c)
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-vscaleexpminusmax/gen
  src/f32-vscaleexpminusmax/gen/avx2-p5-x8.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x16.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x24.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x32.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x40.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x48.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x56.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x64.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x72.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x80.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x88.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x96.c)
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-vscaleextexp/gen
  src/f32-vscaleextexp/gen/avx2-p5-x8.c
  src/f32-vscaleextexp/gen/avx2-p5-x16.c
  src/f32-vscaleextexp/gen/avx2-p5-x24.c
  src/f32-vscaleextexp/gen/avx2-p5-x32.c
  src/f32-vscaleextexp/gen/avx2-p5-x40.c
  src/f32-vscaleextexp/gen/avx2-p5-x48.c
  src/f32-vscaleextexp/gen/avx2-p5-x56.c
  src/f32-vscaleextexp/gen/avx2-p5-x64.c
  src/f32-vscaleextexp/gen/avx2-p5-x72.c
  src/f32-vscaleextexp/gen/avx2-p5-x80.c
  src/f32-vscaleextexp/gen/avx2-p5-x88.c
  src/f32-vscaleextexp/gen/avx2-p5-x96.c)
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/math
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c
  src/math/extexp-avx2-p5.c
  src/math/sigmoid-avx2-rr2-p5-div.c
  src/math/sigmoid-avx2-rr1-p5-div.c
  src/math/sigmoid-avx2-rr2-p5-nr2fma.c
  src/math/sigmoid-avx2-rr1-p5-nr2fma.c
  src/math/sigmoid-avx2-rr2-p5-nr1fma.c
  src/math/sigmoid-avx2-rr1-p5-nr1fma.c)
Marat Dukhan6adff4e2019-10-14 18:32:07 -07001327
# Micro-kernel sources tagged "avx512f" in their file names.
# The list is assembled one kernel directory at a time, preserving element order.
SET(XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-clamp/gen
  src/f32-clamp/gen/avx512f-x16.c
  src/f32-clamp/gen/avx512f-x32.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-dwconv/gen
  src/f32-dwconv/gen/up32x4-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up32x4-minmax-avx512f.c
  src/f32-dwconv/gen/up16x4-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up16x4-minmax-avx512f.c
  src/f32-dwconv/gen/up32x9-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up32x9-minmax-avx512f.c
  src/f32-dwconv/gen/up16x9-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up16x9-minmax-avx512f.c
  src/f32-dwconv/gen/up32x25-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up32x25-minmax-avx512f.c
  src/f32-dwconv/gen/up16x25-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up16x25-minmax-avx512f.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-gemm/gen
  src/f32-gemm/gen/1x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/4x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/5x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/6x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/7x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/8x16-minmax-avx512f-broadcast.c
  # src/f32-gemm/gen-inc
  src/f32-gemm/gen-inc/1x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/4x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/5x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/6x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/7x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/8x16inc-minmax-avx512f-broadcast.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-hswish/gen
  src/f32-hswish/gen/avx512f-x16.c
  src/f32-hswish/gen/avx512f-x32.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-igemm/gen
  src/f32-igemm/gen/1x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/4x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/5x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/6x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/7x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/8x16-minmax-avx512f-broadcast.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-prelu/gen
  src/f32-prelu/gen/avx512f-2x16.c
  src/f32-prelu/gen/avx512f-2x32.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-raddexpminusmax/gen
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-raddextexp/gen
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc6.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-raddstoreexpminusmax/gen
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-rmax
  src/f32-rmax/avx512f.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-vbinary/gen
  src/f32-vbinary/gen/vadd-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vadd-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vaddc-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vaddc-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vdiv-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vdiv-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vdivc-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vdivc-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vmax-avx512f-x16.c
  src/f32-vbinary/gen/vmax-avx512f-x32.c
  src/f32-vbinary/gen/vmaxc-avx512f-x16.c
  src/f32-vbinary/gen/vmaxc-avx512f-x32.c
  src/f32-vbinary/gen/vmin-avx512f-x16.c
  src/f32-vbinary/gen/vmin-avx512f-x32.c
  src/f32-vbinary/gen/vminc-avx512f-x16.c
  src/f32-vbinary/gen/vminc-avx512f-x32.c
  src/f32-vbinary/gen/vmul-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vmul-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vmulc-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vmulc-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vrdivc-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vrdivc-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vrsubc-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vrsubc-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vsub-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vsub-minmax-avx512f-x32.c
  src/f32-vbinary/gen/vsubc-minmax-avx512f-x16.c
  src/f32-vbinary/gen/vsubc-minmax-avx512f-x32.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-vscale
  src/f32-vscale/avx512f-unroll64.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-vscaleexpminusmax/gen
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x192.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-vscaleextexp/gen
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x192.c)
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/math
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c
  src/math/extexp-avx512f-p5.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001460
# Assembly (.S) micro-kernel sources tagged "aarch32" in their file names.
SET(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  # src/q8-dwconv
  src/q8-dwconv/up8x9-minmax-aarch32-neon.S)
LIST(APPEND XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  # src/f32-gemm
  src/f32-gemm/4x8-minmax-aarch32-neon-cortex-a53.S
  src/f32-gemm/4x8-minmax-aarch32-neon-cortex-a55.S
  src/f32-gemm/gen/4x8-minmax-aarch32-neon-cortex-a75.S
  src/f32-gemm/gen/4x8-minmax-aarch32-neon-pld-cortex-a75.S
  src/f32-gemm/4x8-minmax-aarch32-neon-ld64.S)
LIST(APPEND XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  # src/f32-igemm
  src/f32-igemm/4x8-minmax-aarch32-neon-ld64.S
  src/f32-igemm/gen/4x8-minmax-aarch32-neon-cortex-a75.S
  src/f32-igemm/gen/4x8-minmax-aarch32-neon-pld-cortex-a75.S
  src/f32-igemm/4x8-minmax-aarch32-neon-cortex-a53.S
  src/f32-igemm/4x8-minmax-aarch32-neon-cortex-a55.S)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001473
# Assembly (.S) micro-kernel sources tagged "aarch64" in their file names.
# The list is assembled one kernel directory at a time, preserving element order.
SET(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  # src/f16-gemm, "ld32" variants
  src/f16-gemm/gen/1x16-minmax-aarch64-neonfp16arith-ld32.S
  src/f16-gemm/gen/4x16-minmax-aarch64-neonfp16arith-ld32.S
  src/f16-gemm/gen/6x16-minmax-aarch64-neonfp16arith-ld32.S
  src/f16-gemm/gen-inc/1x16inc-minmax-aarch64-neonfp16arith-ld32.S
  src/f16-gemm/gen-inc/4x16inc-minmax-aarch64-neonfp16arith-ld32.S
  src/f16-gemm/gen-inc/6x16inc-minmax-aarch64-neonfp16arith-ld32.S
  # src/f16-gemm, "ld64" variants
  src/f16-gemm/gen/1x8-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen/4x8-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen/6x8-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen/8x8-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen-inc/1x8inc-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen-inc/4x8inc-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen-inc/6x8inc-minmax-aarch64-neonfp16arith-ld64.S
  src/f16-gemm/gen-inc/8x8inc-minmax-aarch64-neonfp16arith-ld64.S)
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  # src/f32-dwconv
  src/f32-dwconv/up4x9-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-minmax-aarch64-neonfma.S)
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  # src/f32-gemm/gen
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-ld64.S
  src/f32-gemm/gen/1x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-ld64.S
  src/f32-gemm/gen/5x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/5x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ios.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ld64.S)
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  # src/f32-gemm/gen-inc
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/1x12inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x12inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/5x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/5x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ios.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ld64.S)
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  # src/f32-igemm (a mix of top-level and gen/ files)
  src/f32-igemm/1x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-igemm/4x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/gen/5x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/5x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-ios.S)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001552
# Assemble the micro-kernel source list for the target platform.
# The scalar kernels are always part of the list.
SET(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})

# PSIMD kernels are left out for Emscripten, MSVC, and the Intel C compiler.
IF(NOT (EMSCRIPTEN OR MSVC OR CMAKE_C_COMPILER_ID STREQUAL "Intel"))
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
    ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS})
ENDIF()

# 32-bit ARM (armv5-armv8 processors, or armv7 iOS architectures):
# NEON, NEON-FMA and AArch32 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
ENDIF()

# 64-bit ARM (aarch64 processors, or arm64* iOS architectures):
# NEON, NEON-FMA, AArch64-only C kernels and AArch64 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
ENDIF()
# x86 / x86-64: append every x86 ISA-extension kernel list (SSE through AVX512F).
# "x86" is accepted as a processor name so that this condition agrees with the one
# guarding the per-ISA compile flags further down in this file, which already
# matches "x86" and explicitly tests CMAKE_SYSTEM_PROCESSOR STREQUAL "x86".
# Without it, a build reporting "x86" would have flags set on these lists but
# would never add the lists themselves to the library.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86|x86_64|AMD64)$" OR IOS_ARCH MATCHES "^(i386|x86_64|AMD64)$")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_SSSE3_MICROKERNEL_SRCS}
    ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
ENDIF()
1580
# Create the XNNPACK library target from the cold, hot, table and micro-kernel sources.
# XNNPACK_LIBRARY_TYPE picks an explicit STATIC or SHARED library; "default" passes
# no type to ADD_LIBRARY. Any other value aborts configuration.
IF(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  ADD_LIBRARY(XNNPACK STATIC
    ${XNNPACK_COLD_SRCS}
    ${XNNPACK_HOT_SRCS}
    ${XNNPACK_TABLE_SRCS}
    ${XNNPACK_MICROKERNEL_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  ADD_LIBRARY(XNNPACK SHARED
    ${XNNPACK_COLD_SRCS}
    ${XNNPACK_HOT_SRCS}
    ${XNNPACK_TABLE_SRCS}
    ${XNNPACK_MICROKERNEL_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  ADD_LIBRARY(XNNPACK
    ${XNNPACK_COLD_SRCS}
    ${XNNPACK_HOT_SRCS}
    ${XNNPACK_TABLE_SRCS}
    ${XNNPACK_MICROKERNEL_SRCS})
ELSE()
  MESSAGE(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
ENDIF()

# Build the C sources as C99 with compiler extensions enabled.
SET_PROPERTY(TARGET XNNPACK PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET XNNPACK PROPERTY C_EXTENSIONS YES)
# Per-source compile flags for 32-bit ARM builds.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  # Every micro-kernel source gets -marm.
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  # PSIMD and NEON kernels share the same FPU setting.
  SET_PROPERTY(
    SOURCE
      ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
      ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS}
      ${XNNPACK_NEON_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  IF(IOS)
    # On iOS the assembly sources are additionally given the target architecture.
    SET_PROPERTY(
      SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# Per-source compile flags for 64-bit ARM builds.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  # Both the FP16-arithmetic C kernels and the assembly kernels are built
  # with -march=armv8.2-a+fp16.
  SET_PROPERTY(
    SOURCE
      ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
      ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  IF(IOS)
    # On iOS the assembly sources are additionally given the target architecture.
    SET_PROPERTY(
      SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# Per-source ISA flags for x86 / x86-64 builds: each kernel list is compiled with
# the instruction-set option that corresponds to it.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86|x86_64|AMD64)$" OR IOS_ARCH MATCHES "^(i386|x86_64|AMD64)$")
  IF(NOT MSVC)
    # GCC-style -m<isa> options.
    SET_PROPERTY(
      SOURCE
        ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS}
        ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_SSSE3_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -mssse3 ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_SSE41_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -msse4.1 ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_FMA3_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
    IF(MINGW OR CMAKE_SYSTEM_NAME MATCHES "^(CYGWIN|MSYS)$")
      # Work-around for https://gcc.gnu.org/bugzilla/show_bug.cgi?id=65782
      SET_PROPERTY(
        SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
        APPEND_STRING PROPERTY COMPILE_FLAGS " -fno-asynchronous-unwind-tables ")
    ENDIF()
  ELSE()
    # MSVC /arch options. The SSE-family options are only set for 32-bit targets.
    IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "x86" OR CMAKE_SIZEOF_VOID_P EQUAL 4)
      SET_PROPERTY(
        SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
        APPEND_STRING PROPERTY COMPILE_FLAGS " /arch:SSE ")
      # SSE2, SSSE3 and SSE4.1 kernels all use /arch:SSE2.
      SET_PROPERTY(
        SOURCE
          ${XNNPACK_SSE2_MICROKERNEL_SRCS}
          ${XNNPACK_SSSE3_MICROKERNEL_SRCS}
          ${XNNPACK_SSE41_MICROKERNEL_SRCS}
        APPEND_STRING PROPERTY COMPILE_FLAGS " /arch:SSE2 ")
    ENDIF()
    # AVX and FMA3 kernels both use /arch:AVX.
    SET_PROPERTY(
      SOURCE
        ${XNNPACK_AVX_MICROKERNEL_SRCS}
        ${XNNPACK_FMA3_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " /arch:AVX ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " /arch:AVX2 ")
    SET_PROPERTY(
      SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " /arch:AVX512 ")
  ENDIF()
ENDIF()
# XNN_LOG_LEVEL is 5 in Debug configurations and 0 in all others.
TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE "XNN_LOG_LEVEL=$<IF:$<CONFIG:Debug>,5,0>")

# Optimisation level per source group in non-Debug configurations:
# micro-kernels and hot sources get O2; cold sources get Os (O1 on MSVC).
IF(NOT MSVC)
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS} ${XNNPACK_HOT_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS "$<$<NOT:$<CONFIG:Debug>>: -O2 >")
  SET_PROPERTY(
    SOURCE ${XNNPACK_COLD_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS "$<$<NOT:$<CONFIG:Debug>>: -Os >")
ELSE()
  # Even though MSVC has __restrict, it can't be used in all the same contexts as the C99 restrict keyword
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE "restrict=")
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS} ${XNNPACK_HOT_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS "$<$<NOT:$<CONFIG:Debug>>: /O2 >")
  SET_PROPERTY(
    SOURCE ${XNNPACK_COLD_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS "$<$<NOT:$<CONFIG:Debug>>: /O1 >")
ENDIF()
# Outside Emscripten, PSIMD kernels get -O3 in non-Debug configurations;
# the "fastmath" list additionally gets -ffast-math.
IF(NOT EMSCRIPTEN)
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS "$<$<NOT:$<CONFIG:Debug>>: -O3 -ffast-math >")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS "$<$<NOT:$<CONFIG:Debug>>: -O3 >")
ENDIF()
1654
# include/ is visible to XNNPACK and to its consumers (PUBLIC);
# src/ is only visible while building XNNPACK itself (PRIVATE).
TARGET_INCLUDE_DIRECTORIES(XNNPACK
  PUBLIC include
  PRIVATE src)
IF(WIN32)
  # Target Windows 7+ API
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE _WIN32_WINNT=0x0601)
ENDIF()
# Header that INSTALL(... PUBLIC_HEADER ...) copies alongside the library
SET_PROPERTY(TARGET XNNPACK PROPERTY PUBLIC_HEADER include/xnnpack.h)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001662
# ---[ Find libm
# Link the math library only when one is found; nothing is linked otherwise.
FIND_LIBRARY(LIBM NAMES m)
IF(LIBM)
  TARGET_LINK_LIBRARIES(XNNPACK PRIVATE "${LIBM}")
ENDIF()
1668
# ---[ Configure clog
# Reuse an existing clog target if a parent project already defined one.
IF(NOT TARGET clog)
  IF(XNNPACK_USE_SYSTEM_LIBS)
    # Wrap the system-provided clog library in an imported target
    FIND_LIBRARY(CLOG_LIBRARY clog)
    IF(NOT CLOG_LIBRARY)
      MESSAGE(FATAL_ERROR "Cannot find clog")
    ENDIF()
    ADD_LIBRARY(clog STATIC IMPORTED)
    SET_TARGET_PROPERTIES(clog PROPERTIES IMPORTED_LOCATION "${CLOG_LIBRARY}")
  ELSE()
    # Build clog from source, without its tests
    SET(CLOG_BUILD_TESTS OFF CACHE BOOL "")
    SET(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
    ADD_SUBDIRECTORY("${CLOG_SOURCE_DIR}/deps/clog" "${CMAKE_BINARY_DIR}/clog")
    # We build static version of clog but a dynamic library may indirectly depend on it
    SET_TARGET_PROPERTIES(clog PROPERTIES POSITION_INDEPENDENT_CODE ON)
  ENDIF()
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE clog)
1689
# ---[ Configure cpuinfo
# Reuse an existing cpuinfo target if a parent project already defined one.
IF(NOT TARGET cpuinfo)
  IF(XNNPACK_USE_SYSTEM_LIBS)
    # Wrap the system-provided cpuinfo library in an imported target
    FIND_LIBRARY(CPUINFO_LIBRARY cpuinfo)
    IF(NOT CPUINFO_LIBRARY)
      MESSAGE(FATAL_ERROR "Cannot find cpuinfo")
    ENDIF()
    ADD_LIBRARY(cpuinfo SHARED IMPORTED)
    SET_TARGET_PROPERTIES(cpuinfo PROPERTIES IMPORTED_LOCATION "${CPUINFO_LIBRARY}")
  ELSE()
    # Build cpuinfo from source with its tools, tests and benchmarks switched off
    SET(CPUINFO_BUILD_TOOLS OFF CACHE BOOL "")
    SET(CPUINFO_BUILD_UNIT_TESTS OFF CACHE BOOL "")
    SET(CPUINFO_BUILD_MOCK_TESTS OFF CACHE BOOL "")
    SET(CPUINFO_BUILD_BENCHMARKS OFF CACHE BOOL "")
    ADD_SUBDIRECTORY("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
  ENDIF()
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE cpuinfo)
1710
# ---[ Configure pthreadpool
# Reuse an existing pthreadpool target if a parent project already defined one.
IF(NOT TARGET pthreadpool)
  IF(XNNPACK_USE_SYSTEM_LIBS)
    # Wrap the system-provided pthreadpool library in an imported target
    FIND_LIBRARY(PTHREADPOOL_LIBRARY pthreadpool)
    IF(NOT PTHREADPOOL_LIBRARY)
      MESSAGE(FATAL_ERROR "Cannot find pthreadpool")
    ENDIF()
    ADD_LIBRARY(pthreadpool SHARED IMPORTED)
    SET_TARGET_PROPERTIES(pthreadpool PROPERTIES IMPORTED_LOCATION "${PTHREADPOOL_LIBRARY}")
  ELSE()
    # Build pthreadpool from source with tests, benchmarks and the deprecated API switched off
    SET(PTHREADPOOL_BUILD_TESTS OFF CACHE BOOL "")
    SET(PTHREADPOOL_BUILD_BENCHMARKS OFF CACHE BOOL "")
    SET(PTHREADPOOL_ALLOW_DEPRECATED_API OFF CACHE BOOL "")
    ADD_SUBDIRECTORY("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
  ENDIF()
ENDIF()
# PUBLIC: consumers of XNNPACK link pthreadpool as well
TARGET_LINK_LIBRARIES(XNNPACK PUBLIC pthreadpool)
1730
# ---[ Configure FXdiv
# Reuse an existing fxdiv target if a parent project already defined one.
IF(NOT TARGET fxdiv)
  IF(XNNPACK_USE_SYSTEM_LIBS)
    # Locate the system-provided header and wrap it in a placeholder library target
    FIND_FILE(FXDIV_HDR fxdiv.h PATH_SUFFIXES include)
    IF(NOT FXDIV_HDR)
      MESSAGE(FATAL_ERROR "Cannot find fxdiv")
    ENDIF()
    ADD_LIBRARY(fxdiv STATIC "${FXDIV_HDR}")
    # The target has no compiled sources, so the linker language must be stated explicitly
    SET_TARGET_PROPERTIES(fxdiv PROPERTIES LINKER_LANGUAGE C)
  ELSE()
    # Build FXdiv from source with tests and benchmarks switched off
    SET(FXDIV_BUILD_TESTS OFF CACHE BOOL "")
    SET(FXDIV_BUILD_BENCHMARKS OFF CACHE BOOL "")
    ADD_SUBDIRECTORY("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
  ENDIF()
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fxdiv)
1749
# ---[ Configure psimd
# Reuse an existing psimd target if a parent project already defined one.
IF(NOT TARGET psimd)
  IF(XNNPACK_USE_SYSTEM_LIBS)
    # Locate the system-provided header and wrap it in a placeholder library target
    FIND_FILE(PSIMD_HDR psimd.h PATH_SUFFIXES include)
    IF(NOT PSIMD_HDR)
      MESSAGE(FATAL_ERROR "Cannot find psimd")
    ENDIF()
    ADD_LIBRARY(psimd STATIC "${PSIMD_HDR}")
    # The target has no compiled sources, so the linker language must be stated explicitly
    SET_TARGET_PROPERTIES(psimd PROPERTIES LINKER_LANGUAGE C)
  ELSE()
    # Build psimd from source
    ADD_SUBDIRECTORY("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
  ENDIF()
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE psimd)
1766
# ---[ Configure FP16
# Reuse an existing fp16 target if a parent project already defined one.
IF(NOT TARGET fp16)
  IF(XNNPACK_USE_SYSTEM_LIBS)
    # Locate the system-provided header and wrap it in a placeholder library target
    FIND_FILE(FP16_HDR fp16.h PATH_SUFFIXES include)
    IF(NOT FP16_HDR)
      MESSAGE(FATAL_ERROR "Cannot find fp16")
    ENDIF()
    ADD_LIBRARY(fp16 STATIC "${FP16_HDR}")
    # The target has no compiled sources, so the linker language must be stated explicitly
    SET_TARGET_PROPERTIES(fp16 PROPERTIES LINKER_LANGUAGE C)
  ELSE()
    # Build FP16 from source with tests and benchmarks switched off
    SET(FP16_BUILD_TESTS OFF CACHE BOOL "")
    SET(FP16_BUILD_BENCHMARKS OFF CACHE BOOL "")
    ADD_SUBDIRECTORY("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
  ENDIF()
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fp16)
1785
# Install the XNNPACK library and its public header into the GNUInstallDirs locations.
# RUNTIME covers the DLL part of a shared build on DLL platforms; without an explicit
# RUNTIME DESTINATION, CMake versions older than 3.14 reject installing a shared library
# target there. The rule has no effect on static builds.
INSTALL(TARGETS XNNPACK
  RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
1790
1791# ---[ XNNPACK unit tests
1792IF(XNNPACK_BUILD_TESTS)
# ---[ Build google test
# Skipped when a parent project already provides a gtest target.
IF(NOT TARGET gtest)
  # Force-set googletest's gtest_force_shared_crt cache option to ON before adding it
  SET(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
  ADD_SUBDIRECTORY("${GOOGLETEST_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/googletest")
ENDIF()
1800
# ---[ Build size tests
# Each size test is a strict-C99 executable linked against XNNPACK.
# These executables are built but not registered with ADD_TEST.
FOREACH(XNNPACK_SIZE_TEST
    operator-size
    subgraph-size)
  ADD_EXECUTABLE(${XNNPACK_SIZE_TEST}-test test/${XNNPACK_SIZE_TEST}.c)
  SET_TARGET_PROPERTIES(${XNNPACK_SIZE_TEST}-test PROPERTIES
    C_STANDARD 99
    C_EXTENSIONS NO)
  TARGET_LINK_LIBRARIES(${XNNPACK_SIZE_TEST}-test PRIVATE XNNPACK)
ENDFOREACH()
1814
# ---[ Build operator-level unit tests
# Every operator test <name> is built from test/<name>.cc into the executable <name>-test,
# compiled as strict C++11 (no compiler extensions), linked against XNNPACK and googletest,
# and registered with CTest under the executable's name. The list order is the order in
# which the targets and tests are created.
FOREACH(XNNPACK_OPERATOR_TEST
    add-nc
    add-nd
    argmax-pooling-nhwc
    average-pooling-nhwc
    channel-pad-nc
    channel-shuffle-nc
    clamp-nc
    convolution-nhwc
    convolution-nchw
    deconvolution-nhwc
    divide-nd
    fully-connected-nc
    global-average-pooling-nwc
    global-average-pooling-ncw
    hardswish-nc
    leaky-relu-nc
    max-pooling-nhwc)
  ADD_EXECUTABLE(${XNNPACK_OPERATOR_TEST}-test test/${XNNPACK_OPERATOR_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_OPERATOR_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE XNNPACK gtest gtest_main)
  ADD_TEST(${XNNPACK_OPERATOR_TEST}-test ${XNNPACK_OPERATOR_TEST}-test)
ENDFOREACH()
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001968
# Operator-level unit test for the N-dimensional maximum operator.
# Built from its own source file: compiling test/multiply-nd.cc here would only
# re-run the multiply tests under a different name.
ADD_EXECUTABLE(maximum-nd-test test/maximum-nd.cc)
SET_TARGET_PROPERTIES(maximum-nd-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
TARGET_INCLUDE_DIRECTORIES(maximum-nd-test PRIVATE src test)
TARGET_LINK_LIBRARIES(maximum-nd-test PRIVATE XNNPACK gtest gtest_main)
ADD_TEST(maximum-nd-test maximum-nd-test)

# Operator-level unit test for the N-dimensional minimum operator.
# Built from its own source file for the same reason as maximum-nd-test.
ADD_EXECUTABLE(minimum-nd-test test/minimum-nd.cc)
SET_TARGET_PROPERTIES(minimum-nd-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
TARGET_INCLUDE_DIRECTORIES(minimum-nd-test PRIVATE src test)
TARGET_LINK_LIBRARIES(minimum-nd-test PRIVATE XNNPACK gtest gtest_main)
ADD_TEST(minimum-nd-test minimum-nd-test)
1986
# Remaining operator-level unit tests: each <name> is built from test/<name>.cc into
# <name>-test as strict C++11 (no compiler extensions), linked against XNNPACK and
# googletest, and registered with CTest. The list order is the creation order.
FOREACH(XNNPACK_OPERATOR_TEST
    multiply-nd
    prelu-nc
    resize-bilinear-nhwc
    sigmoid-nc
    softmax-nc
    subtract-nd
    unpooling-nhwc)
  ADD_EXECUTABLE(${XNNPACK_OPERATOR_TEST}-test test/${XNNPACK_OPERATOR_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_OPERATOR_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE XNNPACK gtest gtest_main)
  ADD_TEST(${XNNPACK_OPERATOR_TEST}-test ${XNNPACK_OPERATOR_TEST}-test)
ENDFOREACH()
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002049
# ---[ Build microkernel-level unit tests
# Every microkernel test <name> is built from test/<name>.cc into the executable <name>-test,
# compiled as C++11 with compiler extensions enabled, linked against XNNPACK, cpuinfo, fp16
# and googletest, and registered with CTest under the executable's name. The list order is
# the order in which the targets and tests are created.
FOREACH(XNNPACK_MICROKERNEL_TEST
    f16-gemm-minmax
    f16-spmm-minmax
    f32-argmaxpool
    f32-avgpool-minmax
    f32-clamp
    f32-conv-hwc
    f32-conv-hwc2spchw
    f32-dwconv-spchw
    f32-dwconv
    f32-dwconv-minmax
    f32-gavgpool-spchw
    f32-gavgpool-minmax
    f32-gemm
    f32-gemm-minmax
    f32-gemminc-minmax
    f32-hswish
    f32-ibilinear
    f32-igemm)
  ADD_EXECUTABLE(${XNNPACK_MICROKERNEL_TEST}-test test/${XNNPACK_MICROKERNEL_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_MICROKERNEL_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_MICROKERNEL_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_MICROKERNEL_TEST}-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_MICROKERNEL_TEST}-test ${XNNPACK_MICROKERNEL_TEST}-test)
ENDFOREACH()
2212
# Microkernel-level unit test for f32-igemm-minmax: C++11 with compiler extensions,
# linked against XNNPACK, cpuinfo, fp16 and googletest, registered with CTest.
ADD_EXECUTABLE(f32-igemm-minmax-test test/f32-igemm-minmax.cc)
SET_PROPERTY(TARGET f32-igemm-minmax-test PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-igemm-minmax-test PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-igemm-minmax-test PROPERTY CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(f32-igemm-minmax-test PRIVATE src test)
TARGET_LINK_LIBRARIES(f32-igemm-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
IF(MINGW)
  # Work-around for "too many sections" error
  # Applied in every configuration that is neither Release nor MinSizeRel
  TARGET_COMPILE_OPTIONS(f32-igemm-minmax-test PRIVATE
    "$<$<AND:$<NOT:$<CONFIG:Release>>,$<NOT:$<CONFIG:MinSizeRel>>>:-Wa,-mbig-obj>")
ENDIF()
ADD_TEST(f32-igemm-minmax-test f32-igemm-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002225
# Further microkernel-level unit tests: each <name> is built from test/<name>.cc into
# <name>-test as C++11 with compiler extensions enabled, linked against XNNPACK, cpuinfo,
# fp16 and googletest, and registered with CTest. The list order is the creation order.
FOREACH(XNNPACK_MICROKERNEL_TEST
    f16-igemm-minmax
    f32-maxpool-minmax
    f32-pavgpool-minmax
    f32-ppmm-minmax
    f32-prelu)
  ADD_EXECUTABLE(${XNNPACK_MICROKERNEL_TEST}-test test/${XNNPACK_MICROKERNEL_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_MICROKERNEL_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_MICROKERNEL_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_MICROKERNEL_TEST}-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_MICROKERNEL_TEST}-test ${XNNPACK_MICROKERNEL_TEST}-test)
ENDFOREACH()
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002270
Marat Dukhan97579532019-10-18 16:40:39 -07002271 ADD_EXECUTABLE(f32-raddexpminusmax-test test/f32-raddexpminusmax.cc)
2272 SET_TARGET_PROPERTIES(f32-raddexpminusmax-test PROPERTIES
2273 CXX_STANDARD 11
2274 CXX_STANDARD_REQUIRED YES
2275 CXX_EXTENSIONS YES)
2276 TARGET_INCLUDE_DIRECTORIES(f32-raddexpminusmax-test PRIVATE src test)
2277 TARGET_LINK_LIBRARIES(f32-raddexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2278 ADD_TEST(f32-raddexpminusmax-test f32-raddexpminusmax-test)
2279
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002280 ADD_EXECUTABLE(f32-raddextexp-test test/f32-raddextexp.cc)
2281 SET_TARGET_PROPERTIES(f32-raddextexp-test PROPERTIES
2282 CXX_STANDARD 11
2283 CXX_STANDARD_REQUIRED YES
2284 CXX_EXTENSIONS YES)
2285 TARGET_INCLUDE_DIRECTORIES(f32-raddextexp-test PRIVATE src test)
Marat Dukhana5977df2019-10-30 22:02:15 -07002286 TARGET_LINK_LIBRARIES(f32-raddextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002287 ADD_TEST(f32-raddextexp-test f32-raddextexp-test)
2288
Marat Dukhan97579532019-10-18 16:40:39 -07002289 ADD_EXECUTABLE(f32-raddstoreexpminusmax-test test/f32-raddstoreexpminusmax.cc)
2290 SET_TARGET_PROPERTIES(f32-raddstoreexpminusmax-test PROPERTIES
2291 CXX_STANDARD 11
2292 CXX_STANDARD_REQUIRED YES
2293 CXX_EXTENSIONS YES)
2294 TARGET_INCLUDE_DIRECTORIES(f32-raddstoreexpminusmax-test PRIVATE src test)
2295 TARGET_LINK_LIBRARIES(f32-raddstoreexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2296 ADD_TEST(f32-raddstoreexpminusmax-test f32-raddstoreexpminusmax-test)
2297
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002298 ADD_EXECUTABLE(f32-rmax-test test/f32-rmax.cc)
2299 SET_TARGET_PROPERTIES(f32-rmax-test PROPERTIES
2300 CXX_STANDARD 11
2301 CXX_STANDARD_REQUIRED YES
2302 CXX_EXTENSIONS YES)
2303 TARGET_INCLUDE_DIRECTORIES(f32-rmax-test PRIVATE src test)
2304 TARGET_LINK_LIBRARIES(f32-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2305 ADD_TEST(f32-rmax-test f32-rmax-test)
2306
Marat Dukhan581c1ac2019-11-18 14:57:54 -08002307 ADD_EXECUTABLE(f32-sigmoid-test test/f32-sigmoid.cc)
2308 SET_TARGET_PROPERTIES(f32-sigmoid-test PROPERTIES
2309 CXX_STANDARD 11
2310 CXX_STANDARD_REQUIRED YES
2311 CXX_EXTENSIONS YES)
2312 TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-test PRIVATE src test)
2313 TARGET_LINK_LIBRARIES(f32-sigmoid-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2314 ADD_TEST(f32-sigmoid-test f32-sigmoid-test)
2315
Marat Dukhan355ab432020-04-09 19:01:52 -07002316 ADD_EXECUTABLE(f32-spmm-minmax-test test/f32-spmm-minmax.cc)
2317 SET_TARGET_PROPERTIES(f32-spmm-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002318 CXX_STANDARD 11
2319 CXX_STANDARD_REQUIRED YES
2320 CXX_EXTENSIONS YES)
Marat Dukhan355ab432020-04-09 19:01:52 -07002321 TARGET_INCLUDE_DIRECTORIES(f32-spmm-minmax-test PRIVATE src test)
2322 TARGET_LINK_LIBRARIES(f32-spmm-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2323 ADD_TEST(f32-spmm-minmax-test f32-spmm-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002324
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002325 ADD_EXECUTABLE(f32-vadd-minmax-test test/f32-vadd-minmax.cc)
2326 SET_TARGET_PROPERTIES(f32-vadd-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002327 CXX_STANDARD 11
2328 CXX_STANDARD_REQUIRED YES
2329 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002330 TARGET_INCLUDE_DIRECTORIES(f32-vadd-minmax-test PRIVATE src test)
2331 TARGET_LINK_LIBRARIES(f32-vadd-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2332 ADD_TEST(f32-vadd-minmax-test f32-vadd-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002333
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002334 ADD_EXECUTABLE(f32-vaddc-minmax-test test/f32-vaddc-minmax.cc)
2335 SET_TARGET_PROPERTIES(f32-vaddc-minmax-test PROPERTIES
Marat Dukhanc76065f2019-11-14 18:13:33 -08002336 CXX_STANDARD 11
2337 CXX_STANDARD_REQUIRED YES
2338 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002339 TARGET_INCLUDE_DIRECTORIES(f32-vaddc-minmax-test PRIVATE src test)
2340 TARGET_LINK_LIBRARIES(f32-vaddc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2341 ADD_TEST(f32-vaddc-minmax-test f32-vaddc-minmax-test)
Marat Dukhanc76065f2019-11-14 18:13:33 -08002342
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002343 ADD_EXECUTABLE(f32-vdiv-minmax-test test/f32-vdiv-minmax.cc)
2344 SET_TARGET_PROPERTIES(f32-vdiv-minmax-test PROPERTIES
Marat Dukhan77ca6302019-12-06 12:48:15 -08002345 CXX_STANDARD 11
2346 CXX_STANDARD_REQUIRED YES
2347 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002348 TARGET_INCLUDE_DIRECTORIES(f32-vdiv-minmax-test PRIVATE src test)
2349 TARGET_LINK_LIBRARIES(f32-vdiv-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2350 ADD_TEST(f32-vdiv-minmax-test f32-vdiv-minmax-test)
Marat Dukhan77ca6302019-12-06 12:48:15 -08002351
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002352 ADD_EXECUTABLE(f32-vdivc-minmax-test test/f32-vdivc-minmax.cc)
2353 SET_TARGET_PROPERTIES(f32-vdivc-minmax-test PROPERTIES
Marat Dukhan77ca6302019-12-06 12:48:15 -08002354 CXX_STANDARD 11
2355 CXX_STANDARD_REQUIRED YES
2356 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002357 TARGET_INCLUDE_DIRECTORIES(f32-vdivc-minmax-test PRIVATE src test)
2358 TARGET_LINK_LIBRARIES(f32-vdivc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2359 ADD_TEST(f32-vdivc-minmax-test f32-vdivc-minmax-test)
Marat Dukhan77ca6302019-12-06 12:48:15 -08002360
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002361 ADD_EXECUTABLE(f32-vrdivc-minmax-test test/f32-vrdivc-minmax.cc)
2362 SET_TARGET_PROPERTIES(f32-vrdivc-minmax-test PROPERTIES
Marat Dukhan77ca6302019-12-06 12:48:15 -08002363 CXX_STANDARD 11
2364 CXX_STANDARD_REQUIRED YES
2365 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002366 TARGET_INCLUDE_DIRECTORIES(f32-vrdivc-minmax-test PRIVATE src test)
2367 TARGET_LINK_LIBRARIES(f32-vrdivc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2368 ADD_TEST(f32-vrdivc-minmax-test f32-vrdivc-minmax-test)
Marat Dukhan77ca6302019-12-06 12:48:15 -08002369
Marat Dukhan403b7d42019-12-05 12:49:11 -08002370 ADD_EXECUTABLE(f32-vmax-test test/f32-vmax.cc)
2371 SET_TARGET_PROPERTIES(f32-vmax-test PROPERTIES
2372 CXX_STANDARD 11
2373 CXX_STANDARD_REQUIRED YES
2374 CXX_EXTENSIONS YES)
2375 TARGET_INCLUDE_DIRECTORIES(f32-vmax-test PRIVATE src test)
2376 TARGET_LINK_LIBRARIES(f32-vmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2377 ADD_TEST(f32-vmax-test f32-vmax-test)
2378
2379 ADD_EXECUTABLE(f32-vmaxc-test test/f32-vmaxc.cc)
2380 SET_TARGET_PROPERTIES(f32-vmaxc-test PROPERTIES
2381 CXX_STANDARD 11
2382 CXX_STANDARD_REQUIRED YES
2383 CXX_EXTENSIONS YES)
2384 TARGET_INCLUDE_DIRECTORIES(f32-vmaxc-test PRIVATE src test)
2385 TARGET_LINK_LIBRARIES(f32-vmaxc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2386 ADD_TEST(f32-vmaxc-test f32-vmaxc-test)
2387
2388 ADD_EXECUTABLE(f32-vmin-test test/f32-vmin.cc)
2389 SET_TARGET_PROPERTIES(f32-vmin-test PROPERTIES
2390 CXX_STANDARD 11
2391 CXX_STANDARD_REQUIRED YES
2392 CXX_EXTENSIONS YES)
2393 TARGET_INCLUDE_DIRECTORIES(f32-vmin-test PRIVATE src test)
2394 TARGET_LINK_LIBRARIES(f32-vmin-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2395 ADD_TEST(f32-vmin-test f32-vmin-test)
2396
2397 ADD_EXECUTABLE(f32-vminc-test test/f32-vminc.cc)
2398 SET_TARGET_PROPERTIES(f32-vminc-test PROPERTIES
2399 CXX_STANDARD 11
2400 CXX_STANDARD_REQUIRED YES
2401 CXX_EXTENSIONS YES)
2402 TARGET_INCLUDE_DIRECTORIES(f32-vminc-test PRIVATE src test)
2403 TARGET_LINK_LIBRARIES(f32-vminc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2404 ADD_TEST(f32-vminc-test f32-vminc-test)
2405
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002406 ADD_EXECUTABLE(f32-vmul-minmax-test test/f32-vmul-minmax.cc)
2407 SET_TARGET_PROPERTIES(f32-vmul-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002408 CXX_STANDARD 11
2409 CXX_STANDARD_REQUIRED YES
2410 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002411 TARGET_INCLUDE_DIRECTORIES(f32-vmul-minmax-test PRIVATE src test)
2412 TARGET_LINK_LIBRARIES(f32-vmul-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2413 ADD_TEST(f32-vmul-minmax-test f32-vmul-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002414
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002415 ADD_EXECUTABLE(f32-vmulc-minmax-test test/f32-vmulc-minmax.cc)
2416 SET_TARGET_PROPERTIES(f32-vmulc-minmax-test PROPERTIES
Marat Dukhanc76065f2019-11-14 18:13:33 -08002417 CXX_STANDARD 11
2418 CXX_STANDARD_REQUIRED YES
2419 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002420 TARGET_INCLUDE_DIRECTORIES(f32-vmulc-minmax-test PRIVATE src test)
2421 TARGET_LINK_LIBRARIES(f32-vmulc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2422 ADD_TEST(f32-vmulc-minmax-test f32-vmulc-minmax-test)
Marat Dukhanc76065f2019-11-14 18:13:33 -08002423
Marat Dukhanb9d07cf2020-04-11 20:25:31 -07002424 ADD_EXECUTABLE(f32-vmulcaddc-minmax-test test/f32-vmulcaddc-minmax.cc)
2425 SET_TARGET_PROPERTIES(f32-vmulcaddc-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002426 CXX_STANDARD 11
2427 CXX_STANDARD_REQUIRED YES
2428 CXX_EXTENSIONS YES)
Marat Dukhanb9d07cf2020-04-11 20:25:31 -07002429 TARGET_INCLUDE_DIRECTORIES(f32-vmulcaddc-minmax-test PRIVATE src test)
2430 TARGET_LINK_LIBRARIES(f32-vmulcaddc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2431 ADD_TEST(f32-vmulcaddc-minmax-test f32-vmulcaddc-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002432
Marat Dukhan97579532019-10-18 16:40:39 -07002433 ADD_EXECUTABLE(f32-vscaleexpminusmax-test test/f32-vscaleexpminusmax.cc)
2434 SET_TARGET_PROPERTIES(f32-vscaleexpminusmax-test PROPERTIES
2435 CXX_STANDARD 11
2436 CXX_STANDARD_REQUIRED YES
2437 CXX_EXTENSIONS YES)
2438 TARGET_INCLUDE_DIRECTORIES(f32-vscaleexpminusmax-test PRIVATE src test)
2439 TARGET_LINK_LIBRARIES(f32-vscaleexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2440 ADD_TEST(f32-vscaleexpminusmax-test f32-vscaleexpminusmax-test)
2441
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002442 ADD_EXECUTABLE(f32-vscaleextexp-test test/f32-vscaleextexp.cc)
Marat Dukhan9f240d12020-04-13 10:42:30 -07002443 SET_TARGET_PROPERTIES(f32-vscaleextexp-test PROPERTIES
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002444 CXX_STANDARD 11
2445 CXX_STANDARD_REQUIRED YES
2446 CXX_EXTENSIONS YES)
2447 TARGET_INCLUDE_DIRECTORIES(f32-vscaleextexp-test PRIVATE src test)
Marat Dukhana5977df2019-10-30 22:02:15 -07002448 TARGET_LINK_LIBRARIES(f32-vscaleextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002449 ADD_TEST(f32-vscaleextexp-test f32-vscaleextexp-test)
2450
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002451 ADD_EXECUTABLE(f32-vsub-minmax-test test/f32-vsub-minmax.cc)
2452 SET_TARGET_PROPERTIES(f32-vsub-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002453 CXX_STANDARD 11
2454 CXX_STANDARD_REQUIRED YES
2455 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002456 TARGET_INCLUDE_DIRECTORIES(f32-vsub-minmax-test PRIVATE src test)
2457 TARGET_LINK_LIBRARIES(f32-vsub-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2458 ADD_TEST(f32-vsub-minmax-test f32-vsub-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002459
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002460 ADD_EXECUTABLE(f32-vsubc-minmax-test test/f32-vsubc-minmax.cc)
2461 SET_TARGET_PROPERTIES(f32-vsubc-minmax-test PROPERTIES
Marat Dukhanc76065f2019-11-14 18:13:33 -08002462 CXX_STANDARD 11
2463 CXX_STANDARD_REQUIRED YES
2464 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002465 TARGET_INCLUDE_DIRECTORIES(f32-vsubc-minmax-test PRIVATE src test)
2466 TARGET_LINK_LIBRARIES(f32-vsubc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2467 ADD_TEST(f32-vsubc-minmax-test f32-vsubc-minmax-test)
Marat Dukhanc76065f2019-11-14 18:13:33 -08002468
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002469 ADD_EXECUTABLE(f32-vrsubc-minmax-test test/f32-vrsubc-minmax.cc)
2470 SET_TARGET_PROPERTIES(f32-vrsubc-minmax-test PROPERTIES
Marat Dukhanc76065f2019-11-14 18:13:33 -08002471 CXX_STANDARD 11
2472 CXX_STANDARD_REQUIRED YES
2473 CXX_EXTENSIONS YES)
Marat Dukhan91cd2b72020-04-09 23:57:31 -07002474 TARGET_INCLUDE_DIRECTORIES(f32-vrsubc-minmax-test PRIVATE src test)
2475 TARGET_LINK_LIBRARIES(f32-vrsubc-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2476 ADD_TEST(f32-vrsubc-minmax-test f32-vrsubc-minmax-test)
Marat Dukhanc76065f2019-11-14 18:13:33 -08002477
Marat Dukhan99936602020-04-11 16:47:01 -07002478 ADD_EXECUTABLE(q8-avgpool-minmax-test test/q8-avgpool-minmax.cc)
2479 SET_TARGET_PROPERTIES(q8-avgpool-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002480 CXX_STANDARD 11
2481 CXX_STANDARD_REQUIRED YES
2482 CXX_EXTENSIONS YES)
Marat Dukhan99936602020-04-11 16:47:01 -07002483 TARGET_INCLUDE_DIRECTORIES(q8-avgpool-minmax-test PRIVATE src test)
2484 TARGET_LINK_LIBRARIES(q8-avgpool-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2485 ADD_TEST(q8-avgpool-minmax-test q8-avgpool-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002486
Marat Dukhande06f492020-04-09 00:19:31 -07002487 ADD_EXECUTABLE(q8-dwconv-minmax-test test/q8-dwconv-minmax.cc)
2488 SET_TARGET_PROPERTIES(q8-dwconv-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002489 CXX_STANDARD 11
2490 CXX_STANDARD_REQUIRED YES
2491 CXX_EXTENSIONS YES)
Marat Dukhande06f492020-04-09 00:19:31 -07002492 TARGET_INCLUDE_DIRECTORIES(q8-dwconv-minmax-test PRIVATE src test)
2493 TARGET_LINK_LIBRARIES(q8-dwconv-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2494 ADD_TEST(q8-dwconv-minmax-test q8-dwconv-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002495
Marat Dukhan99936602020-04-11 16:47:01 -07002496 ADD_EXECUTABLE(q8-gavgpool-minmax-test test/q8-gavgpool-minmax.cc)
2497 SET_TARGET_PROPERTIES(q8-gavgpool-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002498 CXX_STANDARD 11
2499 CXX_STANDARD_REQUIRED YES
2500 CXX_EXTENSIONS YES)
Marat Dukhan99936602020-04-11 16:47:01 -07002501 TARGET_INCLUDE_DIRECTORIES(q8-gavgpool-minmax-test PRIVATE src test)
2502 TARGET_LINK_LIBRARIES(q8-gavgpool-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2503 ADD_TEST(q8-gavgpool-test q8-gavgpool-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002504
Marat Dukhande06f492020-04-09 00:19:31 -07002505 ADD_EXECUTABLE(q8-gemm-minmax-test test/q8-gemm-minmax.cc)
2506 SET_TARGET_PROPERTIES(q8-gemm-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002507 CXX_STANDARD 11
2508 CXX_STANDARD_REQUIRED YES
2509 CXX_EXTENSIONS YES)
Marat Dukhande06f492020-04-09 00:19:31 -07002510 TARGET_INCLUDE_DIRECTORIES(q8-gemm-minmax-test PRIVATE src test)
2511 TARGET_LINK_LIBRARIES(q8-gemm-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2512 ADD_TEST(q8-gemm-minmax-test q8-gemm-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002513
Marat Dukhande06f492020-04-09 00:19:31 -07002514 ADD_EXECUTABLE(q8-igemm-minmax-test test/q8-igemm-minmax.cc)
2515 SET_TARGET_PROPERTIES(q8-igemm-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002516 CXX_STANDARD 11
2517 CXX_STANDARD_REQUIRED YES
2518 CXX_EXTENSIONS YES)
Marat Dukhande06f492020-04-09 00:19:31 -07002519 TARGET_INCLUDE_DIRECTORIES(q8-igemm-minmax-test PRIVATE src test)
2520 TARGET_LINK_LIBRARIES(q8-igemm-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2521 ADD_TEST(q8-igemm-minmax-test q8-igemm-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002522
Marat Dukhan99936602020-04-11 16:47:01 -07002523 ADD_EXECUTABLE(q8-vadd-minmax-test test/q8-vadd-minmax.cc)
2524 SET_TARGET_PROPERTIES(q8-vadd-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002525 CXX_STANDARD 11
2526 CXX_STANDARD_REQUIRED YES
2527 CXX_EXTENSIONS YES)
Marat Dukhan99936602020-04-11 16:47:01 -07002528 TARGET_INCLUDE_DIRECTORIES(q8-vadd-minmax-test PRIVATE src test)
2529 TARGET_LINK_LIBRARIES(q8-vadd-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2530 ADD_TEST(q8-vadd-minmax-test q8-vadd-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002531
Marat Dukhan53873d02019-12-06 17:21:30 -08002532 ADD_EXECUTABLE(u8-clamp-test test/u8-clamp.cc)
2533 SET_TARGET_PROPERTIES(u8-clamp-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002534 CXX_STANDARD 11
2535 CXX_STANDARD_REQUIRED YES
2536 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08002537 TARGET_INCLUDE_DIRECTORIES(u8-clamp-test PRIVATE src test)
2538 TARGET_LINK_LIBRARIES(u8-clamp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2539 ADD_TEST(u8-clamp-test u8-clamp-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002540
2541 ADD_EXECUTABLE(u8-lut32norm-test test/u8-lut32norm.cc)
2542 SET_TARGET_PROPERTIES(u8-lut32norm-test PROPERTIES
2543 CXX_STANDARD 11
2544 CXX_STANDARD_REQUIRED YES
2545 CXX_EXTENSIONS YES)
2546 TARGET_INCLUDE_DIRECTORIES(u8-lut32norm-test PRIVATE src test)
2547 TARGET_LINK_LIBRARIES(u8-lut32norm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2548 ADD_TEST(u8-lut32norm-test u8-lut32norm-test)
2549
Marat Dukhan99936602020-04-11 16:47:01 -07002550 ADD_EXECUTABLE(u8-maxpool-minmax-test test/u8-maxpool-minmax.cc)
2551 SET_TARGET_PROPERTIES(u8-maxpool-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002552 CXX_STANDARD 11
2553 CXX_STANDARD_REQUIRED YES
2554 CXX_EXTENSIONS YES)
Marat Dukhan99936602020-04-11 16:47:01 -07002555 TARGET_INCLUDE_DIRECTORIES(u8-maxpool-minmax-test PRIVATE src test)
2556 TARGET_LINK_LIBRARIES(u8-maxpool-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2557 ADD_TEST(u8-maxpool-minmax-test u8-maxpool-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002558
2559 ADD_EXECUTABLE(u8-rmax-test test/u8-rmax.cc)
2560 SET_TARGET_PROPERTIES(u8-rmax-test PROPERTIES
2561 CXX_STANDARD 11
2562 CXX_STANDARD_REQUIRED YES
2563 CXX_EXTENSIONS YES)
2564 TARGET_INCLUDE_DIRECTORIES(u8-rmax-test PRIVATE src test)
2565 TARGET_LINK_LIBRARIES(u8-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2566 ADD_TEST(u8-rmax-test u8-rmax-test)
2567
2568 ADD_EXECUTABLE(x32-packx-test test/x32-packx.cc)
2569 SET_TARGET_PROPERTIES(x32-packx-test PROPERTIES
2570 CXX_STANDARD 11
2571 CXX_STANDARD_REQUIRED YES
2572 CXX_EXTENSIONS YES)
2573 TARGET_INCLUDE_DIRECTORIES(x32-packx-test PRIVATE src test)
2574 TARGET_LINK_LIBRARIES(x32-packx-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2575 ADD_TEST(x32-packx-test x32-packx-test)
2576
2577 ADD_EXECUTABLE(x32-pad-test test/x32-pad.cc)
2578 SET_TARGET_PROPERTIES(x32-pad-test PROPERTIES
2579 CXX_STANDARD 11
2580 CXX_STANDARD_REQUIRED YES
2581 CXX_EXTENSIONS YES)
2582 TARGET_INCLUDE_DIRECTORIES(x32-pad-test PRIVATE src test)
2583 TARGET_LINK_LIBRARIES(x32-pad-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2584 ADD_TEST(x32-pad-test x32-pad-test)
2585
2586 ADD_EXECUTABLE(x32-unpool-test test/x32-unpool.cc)
2587 SET_TARGET_PROPERTIES(x32-unpool-test PROPERTIES
2588 CXX_STANDARD 11
2589 CXX_STANDARD_REQUIRED YES
2590 CXX_EXTENSIONS YES)
2591 TARGET_INCLUDE_DIRECTORIES(x32-unpool-test PRIVATE src test)
2592 TARGET_LINK_LIBRARIES(x32-unpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2593 ADD_TEST(x32-unpool-test x32-unpool-test)
2594
2595 ADD_EXECUTABLE(x32-zip-test test/x32-zip.cc)
2596 SET_TARGET_PROPERTIES(x32-zip-test PROPERTIES
2597 CXX_STANDARD 11
2598 CXX_STANDARD_REQUIRED YES
2599 CXX_EXTENSIONS YES)
2600 TARGET_INCLUDE_DIRECTORIES(x32-zip-test PRIVATE src test)
2601 TARGET_LINK_LIBRARIES(x32-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2602 ADD_TEST(x32-zip-test x32-zip-test)
2603
2604 ADD_EXECUTABLE(x8-lut-test test/x8-lut.cc)
2605 SET_TARGET_PROPERTIES(x8-lut-test PROPERTIES
2606 CXX_STANDARD 11
2607 CXX_STANDARD_REQUIRED YES
2608 CXX_EXTENSIONS YES)
2609 TARGET_INCLUDE_DIRECTORIES(x8-lut-test PRIVATE src test)
2610 TARGET_LINK_LIBRARIES(x8-lut-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2611 ADD_TEST(x8-lut-test x8-lut-test)
2612
2613 ADD_EXECUTABLE(x8-zip-test test/x8-zip.cc)
2614 SET_TARGET_PROPERTIES(x8-zip-test PROPERTIES
2615 CXX_STANDARD 11
2616 CXX_STANDARD_REQUIRED YES
2617 CXX_EXTENSIONS YES)
2618 TARGET_INCLUDE_DIRECTORIES(x8-zip-test PRIVATE src test)
2619 TARGET_LINK_LIBRARIES(x8-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2620 ADD_TEST(x8-zip-test x8-zip-test)
Marat Dukhanfe7acb62020-03-09 19:30:05 -07002621
2622 ADD_EXECUTABLE(requantization-test test/requantization.cc)
2623 SET_TARGET_PROPERTIES(requantization-test PROPERTIES
2624 CXX_STANDARD 11
2625 CXX_STANDARD_REQUIRED YES
2626 CXX_EXTENSIONS YES)
2627 TARGET_INCLUDE_DIRECTORIES(requantization-test PRIVATE src test)
2628 TARGET_LINK_LIBRARIES(requantization-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2629 ADD_TEST(requantization-test requantization-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002630ENDIF()
2631
2632# ---[ XNNPACK microbenchmarks
2633IF(XNNPACK_BUILD_BENCHMARKS)
2634 # ---[ Build google benchmark
2635 IF(NOT TARGET benchmark)
2636 SET(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
2637 ADD_SUBDIRECTORY(
2638 "${GOOGLEBENCHMARK_SOURCE_DIR}"
2639 "${CONFU_DEPENDENCIES_BINARY_DIR}/googlebenchmark")
2640 ENDIF()
2641
2642 ADD_LIBRARY(bench-utils bench/utils.cc)
2643 SET_TARGET_PROPERTIES(bench-utils PROPERTIES
2644 CXX_STANDARD 11
2645 CXX_STANDARD_REQUIRED YES
2646 CXX_EXTENSIONS NO)
2647 TARGET_INCLUDE_DIRECTORIES(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
Marat Dukhanbad48fe2019-11-04 10:35:22 -08002648 TARGET_LINK_LIBRARIES(bench-utils PRIVATE benchmark cpuinfo)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002649
Marat Dukhancb10f262019-11-16 15:52:37 -08002650 # ---[ Build accuracy microbenchmarks
2651 ADD_EXECUTABLE(f32-exp-eval eval/f32-exp.cc)
2652 SET_TARGET_PROPERTIES(f32-exp-eval PROPERTIES
2653 CXX_STANDARD 11
2654 CXX_STANDARD_REQUIRED YES
2655 CXX_EXTENSIONS NO)
2656 TARGET_INCLUDE_DIRECTORIES(f32-exp-eval PRIVATE src)
2657 TARGET_LINK_LIBRARIES(f32-exp-eval PRIVATE XNNPACK benchmark fp16)
2658
2659 ADD_EXECUTABLE(f32-expminus-eval eval/f32-expminus.cc)
2660 SET_TARGET_PROPERTIES(f32-expminus-eval PROPERTIES
2661 CXX_STANDARD 11
2662 CXX_STANDARD_REQUIRED YES
2663 CXX_EXTENSIONS NO)
2664 TARGET_INCLUDE_DIRECTORIES(f32-expminus-eval PRIVATE src)
2665 TARGET_LINK_LIBRARIES(f32-expminus-eval PRIVATE XNNPACK benchmark fp16)
2666
2667 ADD_EXECUTABLE(f32-extexp-eval eval/f32-extexp.cc)
2668 SET_TARGET_PROPERTIES(f32-extexp-eval PROPERTIES
2669 CXX_STANDARD 11
2670 CXX_STANDARD_REQUIRED YES
2671 CXX_EXTENSIONS YES)
2672 TARGET_INCLUDE_DIRECTORIES(f32-extexp-eval PRIVATE src)
2673 TARGET_LINK_LIBRARIES(f32-extexp-eval PRIVATE XNNPACK benchmark fp16)
2674
2675 ADD_EXECUTABLE(f32-sigmoid-eval eval/f32-sigmoid.cc)
2676 SET_TARGET_PROPERTIES(f32-sigmoid-eval PROPERTIES
2677 CXX_STANDARD 11
2678 CXX_STANDARD_REQUIRED YES
2679 CXX_EXTENSIONS NO)
2680 TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-eval PRIVATE src)
2681 TARGET_LINK_LIBRARIES(f32-sigmoid-eval PRIVATE XNNPACK benchmark fp16)
2682
Marat Dukhan5f18d262019-10-31 10:24:14 -07002683 # ---[ Build end-to-end microbenchmarks
Marat Dukhan17e16282019-12-10 12:09:35 -08002684 ADD_LIBRARY(bench-models STATIC
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002685 models/mobilenet-v1.cc
2686 models/mobilenet-v2.cc
2687 models/mobilenet-v3-large.cc
2688 models/mobilenet-v3-small.cc)
2689 SET_TARGET_PROPERTIES(bench-models PROPERTIES
2690 CXX_STANDARD 11
2691 CXX_STANDARD_REQUIRED YES
2692 CXX_EXTENSIONS YES)
2693 TARGET_INCLUDE_DIRECTORIES(bench-models PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2694 TARGET_LINK_LIBRARIES(bench-models PRIVATE XNNPACK benchmark bench-utils)
2695
2696 ADD_EXECUTABLE(end2end-bench bench/end2end.cc)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002697 SET_TARGET_PROPERTIES(end2end-bench PROPERTIES
2698 CXX_STANDARD 11
2699 CXX_STANDARD_REQUIRED YES
2700 CXX_EXTENSIONS NO)
2701 TARGET_INCLUDE_DIRECTORIES(end2end-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002702 TARGET_LINK_LIBRARIES(end2end-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002703
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002704 ADD_EXECUTABLE(f32-dwconv-e2e-bench bench/f32-dwconv-e2e.cc)
Marat Dukhanef4416e2019-10-31 13:44:40 -07002705 SET_TARGET_PROPERTIES(f32-dwconv-e2e-bench PROPERTIES
2706 CXX_STANDARD 11
2707 CXX_STANDARD_REQUIRED YES
2708 CXX_EXTENSIONS NO)
Marat Dukhanc9d2f3f2019-10-31 14:02:07 -07002709 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002710 TARGET_LINK_LIBRARIES(f32-dwconv-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
Marat Dukhanef4416e2019-10-31 13:44:40 -07002711
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002712 ADD_EXECUTABLE(f32-gemm-e2e-bench bench/f32-gemm-e2e.cc)
Marat Dukhan0a5a53f2019-10-31 10:58:31 -07002713 SET_TARGET_PROPERTIES(f32-gemm-e2e-bench PROPERTIES
Marat Dukhan5f18d262019-10-31 10:24:14 -07002714 CXX_STANDARD 11
2715 CXX_STANDARD_REQUIRED YES
2716 CXX_EXTENSIONS NO)
Marat Dukhanc9d2f3f2019-10-31 14:02:07 -07002717 TARGET_INCLUDE_DIRECTORIES(f32-gemm-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002718 TARGET_LINK_LIBRARIES(f32-gemm-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
Marat Dukhan5f18d262019-10-31 10:24:14 -07002719
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002720 # ---[ Build operator-level microbenchmarks
2721 ADD_EXECUTABLE(add-bench bench/add.cc)
2722 SET_TARGET_PROPERTIES(add-bench PROPERTIES
2723 CXX_STANDARD 11
2724 CXX_STANDARD_REQUIRED YES
2725 CXX_EXTENSIONS NO)
2726 TARGET_INCLUDE_DIRECTORIES(add-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2727 TARGET_LINK_LIBRARIES(add-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2728
2729 ADD_EXECUTABLE(average-pooling-bench bench/average-pooling.cc)
2730 SET_TARGET_PROPERTIES(average-pooling-bench PROPERTIES
2731 CXX_STANDARD 11
2732 CXX_STANDARD_REQUIRED YES
2733 CXX_EXTENSIONS NO)
2734 TARGET_INCLUDE_DIRECTORIES(average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2735 TARGET_LINK_LIBRARIES(average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2736
2737 ADD_EXECUTABLE(channel-shuffle-bench bench/channel-shuffle.cc)
2738 SET_TARGET_PROPERTIES(channel-shuffle-bench PROPERTIES
2739 CXX_STANDARD 11
2740 CXX_STANDARD_REQUIRED YES
2741 CXX_EXTENSIONS NO)
2742 TARGET_INCLUDE_DIRECTORIES(channel-shuffle-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2743 TARGET_LINK_LIBRARIES(channel-shuffle-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2744
2745 ADD_EXECUTABLE(convolution-bench bench/convolution.cc)
2746 SET_TARGET_PROPERTIES(convolution-bench PROPERTIES
2747 CXX_STANDARD 11
2748 CXX_STANDARD_REQUIRED YES
2749 CXX_EXTENSIONS NO)
2750 TARGET_INCLUDE_DIRECTORIES(convolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2751 TARGET_LINK_LIBRARIES(convolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2752
2753 ADD_EXECUTABLE(deconvolution-bench bench/deconvolution.cc)
2754 SET_TARGET_PROPERTIES(deconvolution-bench PROPERTIES
2755 CXX_STANDARD 11
2756 CXX_STANDARD_REQUIRED YES
2757 CXX_EXTENSIONS NO)
2758 TARGET_INCLUDE_DIRECTORIES(deconvolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2759 TARGET_LINK_LIBRARIES(deconvolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2760
2761 ADD_EXECUTABLE(global-average-pooling-bench bench/global-average-pooling.cc)
2762 SET_TARGET_PROPERTIES(global-average-pooling-bench PROPERTIES
2763 CXX_STANDARD 11
2764 CXX_STANDARD_REQUIRED YES
2765 CXX_EXTENSIONS NO)
2766 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2767 TARGET_LINK_LIBRARIES(global-average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2768
2769 ADD_EXECUTABLE(max-pooling-bench bench/max-pooling.cc)
2770 SET_TARGET_PROPERTIES(max-pooling-bench PROPERTIES
2771 CXX_STANDARD 11
2772 CXX_STANDARD_REQUIRED YES
2773 CXX_EXTENSIONS NO)
2774 TARGET_INCLUDE_DIRECTORIES(max-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2775 TARGET_LINK_LIBRARIES(max-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2776
Marat Dukhan95b22432019-10-30 16:30:14 -07002777 ADD_EXECUTABLE(prelu-bench bench/prelu.cc)
2778 SET_TARGET_PROPERTIES(prelu-bench PROPERTIES
2779 CXX_STANDARD 11
2780 CXX_STANDARD_REQUIRED YES
2781 CXX_EXTENSIONS NO)
2782 TARGET_INCLUDE_DIRECTORIES(prelu-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2783 TARGET_LINK_LIBRARIES(prelu-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2784
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002785 ADD_EXECUTABLE(sigmoid-bench bench/sigmoid.cc)
2786 SET_TARGET_PROPERTIES(sigmoid-bench PROPERTIES
2787 CXX_STANDARD 11
2788 CXX_STANDARD_REQUIRED YES
2789 CXX_EXTENSIONS NO)
2790 TARGET_INCLUDE_DIRECTORIES(sigmoid-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2791 TARGET_LINK_LIBRARIES(sigmoid-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2792
Marat Dukhanfd8e6892020-01-27 15:25:25 -08002793 ADD_EXECUTABLE(softmax-bench bench/softmax.cc)
2794 SET_TARGET_PROPERTIES(softmax-bench PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002795 CXX_STANDARD 11
2796 CXX_STANDARD_REQUIRED YES
2797 CXX_EXTENSIONS NO)
Marat Dukhanfd8e6892020-01-27 15:25:25 -08002798 TARGET_INCLUDE_DIRECTORIES(softmax-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2799 TARGET_LINK_LIBRARIES(softmax-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002800
2801 # ---[ Build microkernel-level microbenchmarks
Frank Barchard40d20fe2020-05-05 00:37:45 -07002802 ADD_EXECUTABLE(f16-igemm-bench bench/f16-igemm.cc)
2803 SET_TARGET_PROPERTIES(f16-igemm-bench PROPERTIES
2804 CXX_STANDARD 11
2805 CXX_STANDARD_REQUIRED YES
2806 CXX_EXTENSIONS YES)
2807 TARGET_INCLUDE_DIRECTORIES(f16-igemm-bench PRIVATE src)
2808 TARGET_INCLUDE_DIRECTORIES(f16-igemm-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2809 TARGET_LINK_LIBRARIES(f16-igemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
2810
# f16-gemm-bench: benchmark executable built from bench/f16-gemm.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f16-gemm-bench
  bench/f16-gemm.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f16-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f16-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f16-gemm-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2819
# f32-conv-hwc-bench: benchmark executable built from bench/f32-conv-hwc.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-conv-hwc-bench
  bench/f32-conv-hwc.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-conv-hwc-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-conv-hwc-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2828
# f32-dwconv-spchw-bench: benchmark executable built from
# bench/f32-dwconv-spchw.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-dwconv-spchw-bench
  bench/f32-dwconv-spchw.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-dwconv-spchw-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-dwconv-spchw-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2837
# f32-dwconv-bench: benchmark executable built from bench/f32-dwconv.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-dwconv-bench
  bench/f32-dwconv.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-dwconv-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-dwconv-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2846
# f32-gemm-bench: benchmark executable built from bench/f32-gemm.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-gemm-bench
  bench/f32-gemm.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-gemm-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2855
# f32-igemm-bench: benchmark executable built from bench/f32-igemm.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-igemm-bench
  bench/f32-igemm.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-igemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-igemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-igemm-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2864
# f32-im2col-gemm-bench: benchmark executable built from the C++ driver
# bench/f32-im2col-gemm.cc together with the C source src/im2col.c.
# C sources: C99 (required), compiler extensions disabled.
# C++ sources: C++11 (required), compiler extensions enabled.
ADD_EXECUTABLE(f32-im2col-gemm-bench
  bench/f32-im2col-gemm.cc
  src/im2col.c)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-im2col-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-im2col-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-im2col-gemm-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES
  C_STANDARD 99
  C_STANDARD_REQUIRED YES
  C_EXTENSIONS NO)
2876
# f32-rmax-bench: benchmark executable built from bench/f32-rmax.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-rmax-bench
  bench/f32-rmax.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-rmax-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-rmax-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-rmax-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2885
# f32-sigmoid-bench: benchmark executable built from bench/f32-sigmoid.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-sigmoid-bench
  bench/f32-sigmoid.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
# NOTE(review): unlike most neighbouring benchmark targets, neither cpuinfo
# nor fp16 is linked directly here -- confirm this is intentional.
TARGET_LINK_LIBRARIES(f32-sigmoid-bench PRIVATE
  XNNPACK
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-sigmoid-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2894
# f32-spmm-bench: benchmark executable built from bench/f32-spmm.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-spmm-bench
  bench/f32-spmm.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-spmm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-spmm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-spmm-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
2903
# f32-softmax-bench: benchmark executable built from bench/f32-softmax.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(f32-softmax-bench
  bench/f32-softmax.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-softmax-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
# NOTE(review): cpuinfo is not linked directly here, unlike most neighbouring
# benchmark targets -- confirm this is intentional.
TARGET_LINK_LIBRARIES(f32-softmax-bench PRIVATE
  XNNPACK
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(f32-softmax-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07002912
# q8-gemm-bench: benchmark executable built from bench/q8-gemm.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(q8-gemm-bench
  bench/q8-gemm.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(q8-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(q8-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(q8-gemm-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
Marat Dukhanfe7acb62020-03-09 19:30:05 -07002921
# requantization-bench: benchmark executable built from
# bench/requantization.cc.
# Compiled as C++11 (required) with compiler extensions enabled.
ADD_EXECUTABLE(requantization-bench
  bench/requantization.cc)
# Include search order: src first, then the directory of this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(requantization-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(requantization-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
SET_TARGET_PROPERTIES(requantization-bench PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002930ENDIF()