blob: 5bd806061d87f37605252e515a8d3876d77a3078 [file] [log] [blame]
# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
8
cmake_minimum_required(VERSION 3.5 FATAL_ERROR)

# Pull in the standard GNU installation directory variables.
include(GNUInstallDirs)

# ---[ Project (enables the C, C++ and ASM languages).
project(XNNPACK C CXX ASM)
15
# ---[ Options.
# XNNPACK_LIBRARY_TYPE is a string cache entry; the STRINGS property lists the
# values offered by CMake GUIs (default, static, shared).
set(XNNPACK_LIBRARY_TYPE "default" CACHE STRING "Type of library (shared, static, or default) to build")
set_property(CACHE XNNPACK_LIBRARY_TYPE PROPERTY STRINGS default static shared)
option(XNNPACK_ENABLE_ASSEMBLY "Build XNNPACK with assembly micro-kernels" ON)
option(XNNPACK_BUILD_TESTS "Build XNNPACK unit tests" ON)
option(XNNPACK_BUILD_BENCHMARKS "Build XNNPACK benchmarks" ON)

# ---[ CMake options
# CTest support is only switched on when the unit tests are requested.
if(XNNPACK_BUILD_TESTS)
  enable_testing()
endif()

# Forward the assembly switch to the compiler as XNN_ENABLE_ASSEMBLY=0 or 1.
if(NOT XNNPACK_ENABLE_ASSEMBLY)
  add_definitions(-DXNN_ENABLE_ASSEMBLY=0)
else()
  add_definitions(-DXNN_ENABLE_ASSEMBLY=1)
endif()
33
# ---[ Build flags
# Validate the target architecture before anything else is configured.
#  * CMAKE_SYSTEM_PROCESSOR set: it must name a recognized x86 or ARM variant.
#  * CMAKE_SYSTEM_PROCESSOR unset on a non-iOS build: configuration stops.
#  * CMAKE_SYSTEM_PROCESSOR unset on iOS: IOS_ARCH is checked instead and must
#    hold exactly one recognized architecture.
if(CMAKE_SYSTEM_PROCESSOR)
  if(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|AMD64|armv[5-8].*|aarch64)$")
    message(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
  endif()
elseif(NOT IOS)
  message(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
else()
  # IOS_ARCH is treated as a list; more than one entry is rejected.
  list(LENGTH IOS_ARCH IOS_ARCH_COUNT)
  if(IOS_ARCH_COUNT GREATER 1)
    message(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
      "Specify a single architecture in IOS_ARCH and re-configure. ")
  endif()
  if(NOT IOS_ARCH MATCHES "^(i386|x86_64|AMD64|armv7.*|arm64.*)$")
    message(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
  endif()
endif()
51
# Only the operating systems enumerated in the pattern below are accepted;
# a missing or unknown CMAKE_SYSTEM_NAME aborts configuration.
if(CMAKE_SYSTEM_NAME)
  if(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android|Windows)$")
    message(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
  endif()
else()
  message(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
endif()
57
# ---[ Download deps
# Fetches one third-party dependency at configure time, unless the variable
# named by <source_dir_var> is already defined (e.g. passed with -D).
#
# Arguments:
#   display_name    - human-readable name used in messages and in the cache
#                     entry's help string
#   dir_prefix      - prefix of the "<prefix>-download" and "<prefix>-source"
#                     directories created under CMAKE_BINARY_DIR
#   source_dir_var  - name of the cache variable that receives the path of the
#                     downloaded sources
#   download_script - file name of the template under cmake/ that is configured
#                     into the download project's CMakeLists.txt
#
# The download project is configured and built with two child CMake processes.
# Either step failing aborts configuration with FATAL_ERROR *before* the cache
# variable is written, so a later re-configure retries the download instead of
# silently reusing a path to sources that were never fetched.
function(xnnpack_download_dependency display_name dir_prefix source_dir_var download_script)
  if(DEFINED ${source_dir_var})
    return()
  endif()

  set(dep_download_dir "${CMAKE_BINARY_DIR}/${dir_prefix}-download")
  set(dep_source_dir "${CMAKE_BINARY_DIR}/${dir_prefix}-source")

  message(STATUS "Downloading ${display_name} to ${dep_source_dir} (define ${source_dir_var} to avoid it)")
  configure_file("${CMAKE_CURRENT_SOURCE_DIR}/cmake/${download_script}" "${dep_download_dir}/CMakeLists.txt")

  # Step 1: generate the download project with the same generator as this build.
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    WORKING_DIRECTORY "${dep_download_dir}"
    RESULT_VARIABLE dep_configure_result)
  if(NOT "${dep_configure_result}" STREQUAL "0")
    message(FATAL_ERROR "Failed to configure the ${display_name} download project in ${dep_download_dir} (result: ${dep_configure_result})")
  endif()

  # Step 2: build it, which performs the actual download.
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    WORKING_DIRECTORY "${dep_download_dir}"
    RESULT_VARIABLE dep_build_result)
  if(NOT "${dep_build_result}" STREQUAL "0")
    message(FATAL_ERROR "Failed to download ${display_name} via ${dep_download_dir} (result: ${dep_build_result})")
  endif()

  # Cache entries are global, so the path stays visible after the function returns.
  set(${source_dir_var} "${dep_source_dir}" CACHE STRING "${display_name} source directory")
endfunction()

# Dependencies that are always required.
xnnpack_download_dependency("clog" clog CLOG_SOURCE_DIR DownloadCLog.cmake)
xnnpack_download_dependency("cpuinfo" cpuinfo CPUINFO_SOURCE_DIR DownloadCpuinfo.cmake)
xnnpack_download_dependency("FP16" FP16 FP16_SOURCE_DIR DownloadFP16.cmake)
xnnpack_download_dependency("FXdiv" FXdiv FXDIV_SOURCE_DIR DownloadFXdiv.cmake)
xnnpack_download_dependency("PSimd" psimd PSIMD_SOURCE_DIR DownloadPSimd.cmake)
xnnpack_download_dependency("pthreadpool" pthreadpool PTHREADPOOL_SOURCE_DIR DownloadPThreadPool.cmake)

# Google Test is fetched only when the unit tests are built.
if(XNNPACK_BUILD_TESTS)
  xnnpack_download_dependency("Google Test" googletest GOOGLETEST_SOURCE_DIR DownloadGoogleTest.cmake)
endif()

# Google Benchmark is fetched only when the benchmarks are built.
if(XNNPACK_BUILD_BENCHMARKS)
  xnnpack_download_dependency("Google Benchmark" googlebenchmark GOOGLEBENCHMARK_SOURCE_DIR DownloadGoogleBenchmark.cmake)
endif()
138
# ---[ XNNPACK library
# One source file per operator implementation.
set(XNNPACK_OPERATOR_SRCS
  src/add-nc.c
  src/argmax-pooling-nhwc.c
  src/average-pooling-nhwc.c
  src/binary-elementwise-nd.c
  src/channel-pad-nc.c
  src/channel-shuffle-nc.c
  src/clamp-nc.c
  src/convolution-nchw.c
  src/convolution-nhwc.c
  src/deconvolution-nhwc.c
  src/fully-connected-nc.c
  src/global-average-pooling-ncw.c
  src/global-average-pooling-nwc.c
  src/hardswish-nc.c
  src/leaky-relu-nc.c
  src/max-pooling-nhwc.c
  src/prelu-nc.c
  src/resize-bilinear-nhwc.c
  src/sigmoid-nc.c
  src/softmax-nc.c
  src/unpooling-nhwc.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700162
# "Cold" sources: every operator source followed by the files listed here.
set(XNNPACK_COLD_SRCS
  ${XNNPACK_OPERATOR_SRCS}
  src/init.c
  src/memory.c
  src/operator-delete.c
  src/runtime.c
  src/subgraph.c
  src/tensor.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700171
# "Hot" sources, kept in a list separate from XNNPACK_COLD_SRCS.
set(XNNPACK_HOT_SRCS
  src/indirection.c
  src/operator-run.c
)
175
# Sources under src/tables/ (exp2 lookup tables, going by the file names).
set(XNNPACK_TABLE_SRCS
  src/tables/exp2-k-over-64.c
  src/tables/exp2-k-over-2048.c
)
179
# Scalar micro-kernel sources. The order of entries is preserved as-is.
set(XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-scalar-c1.c
  src/f32-argmaxpool/9p8x-scalar-c1.c
  src/f32-argmaxpool/9x-scalar-c1.c
  src/f32-avgpool/9p8x-scalar-c1.c
  src/f32-avgpool/9x-scalar-c1.c
  src/f32-clamp/gen/scalar-x1.c
  src/f32-clamp/gen/scalar-x2.c
  src/f32-clamp/gen/scalar-x4.c
  src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c
  src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-dwconv-spchw/5x5p2-scalar.c
  src/f32-dwconv-spchw/5x5s2p2-scalar.c
  src/f32-dwconv/gen/up1x4-scalar.c
  src/f32-dwconv/gen/up1x4-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-scalar.c
  src/f32-dwconv/gen/up1x9-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-scalar.c
  src/f32-dwconv/gen/up1x25-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-scalar.c
  src/f32-dwconv/gen/up2x4-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-scalar.c
  src/f32-dwconv/gen/up2x9-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-scalar.c
  src/f32-dwconv/gen/up2x25-scalar-acc2.c
  src/f32-dwconv/gen/up1x4-minmax-scalar.c
  src/f32-dwconv/gen/up1x4-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-minmax-scalar.c
  src/f32-dwconv/gen/up1x9-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-minmax-scalar.c
  src/f32-dwconv/gen/up1x25-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-minmax-scalar.c
  src/f32-dwconv/gen/up2x4-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-minmax-scalar.c
  src/f32-dwconv/gen/up2x9-minmax-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-minmax-scalar.c
  src/f32-dwconv/gen/up2x25-minmax-scalar-acc2.c
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/7p7x-scalar-c1.c
  src/f32-gavgpool/7x-scalar-c1.c
  src/f32-gemm/gen/1x4-scalar.c
  src/f32-gemm/gen/2x4-scalar.c
  src/f32-gemm/gen/4x2-scalar.c
  src/f32-gemm/gen/4x4-scalar.c
  src/f32-gemm/gen/1x4-minmax-scalar.c
  src/f32-gemm/gen/2x4-minmax-scalar.c
  src/f32-gemm/gen/4x2-minmax-scalar.c
  src/f32-gemm/gen/4x4-minmax-scalar.c
  src/f32-gemm/gen-inc/1x4inc-minmax-scalar.c
  src/f32-gemm/gen-inc/2x4inc-minmax-scalar.c
  src/f32-gemm/gen-inc/4x4inc-minmax-scalar.c
  src/f32-hswish/gen/scalar-x1.c
  src/f32-hswish/gen/scalar-x2.c
  src/f32-hswish/gen/scalar-x4.c
  src/f32-ibilinear/gen/scalar-c1.c
  src/f32-ibilinear/gen/scalar-c2.c
  src/f32-ibilinear/gen/scalar-c4.c
  src/f32-igemm/gen/1x4-scalar.c
  src/f32-igemm/gen/2x4-scalar.c
  src/f32-igemm/gen/4x2-scalar.c
  src/f32-igemm/gen/4x4-scalar.c
  src/f32-igemm/gen/1x4-minmax-scalar.c
  src/f32-igemm/gen/2x4-minmax-scalar.c
  src/f32-igemm/gen/4x2-minmax-scalar.c
  src/f32-igemm/gen/4x4-minmax-scalar.c
  src/f32-maxpool/9p8x-scalar-c1.c
  src/f32-pavgpool/9p8x-scalar-c1.c
  src/f32-pavgpool/9x-scalar-c1.c
  src/f32-ppmm/gen/2x4-minmax-scalar.c
  src/f32-ppmm/gen/3x3-minmax-scalar.c
  src/f32-ppmm/gen/4x2-minmax-scalar.c
  src/f32-ppmm/gen/4x4-minmax-scalar.c
  src/f32-prelu/gen/scalar-2x1.c
  src/f32-prelu/gen/scalar-2x4.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x1.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x2.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x2-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x4.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x4-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-lut64-p2-x4-acc4.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x1.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x2.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x2-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x4-acc2.c
  src/f32-raddstoreexpminusmax/gen/scalar-p5-x4-acc4.c
  src/f32-rmax/scalar.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x1.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x2.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x4.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x1.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x2.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x4.c
  src/f32-sigmoid/gen/scalar-p5-div-x1.c
  src/f32-sigmoid/gen/scalar-p5-div-x2.c
  src/f32-sigmoid/gen/scalar-p5-div-x4.c
  src/f32-spmm/gen/1x1-scalar-pipelined.c
  src/f32-spmm/gen/1x1-scalar.c
  src/f32-spmm/gen/2x1-scalar-pipelined.c
  src/f32-spmm/gen/2x1-scalar.c
  src/f32-spmm/gen/4x1-scalar-pipelined.c
  src/f32-spmm/gen/4x1-scalar.c
  src/f32-spmm/gen/8x1-scalar-pipelined.c
  src/f32-spmm/gen/8x1-scalar.c
  src/f32-spmm/gen/8x2-scalar.c
  src/f32-spmm/gen/8x4-scalar.c
  src/f32-vbinary/gen/vadd-scalar-x1.c
  src/f32-vbinary/gen/vadd-scalar-x2.c
  src/f32-vbinary/gen/vadd-scalar-x4.c
  src/f32-vbinary/gen/vaddc-scalar-x1.c
  src/f32-vbinary/gen/vaddc-scalar-x2.c
  src/f32-vbinary/gen/vaddc-scalar-x4.c
  src/f32-vbinary/gen/vdiv-scalar-x1.c
  src/f32-vbinary/gen/vdiv-scalar-x2.c
  src/f32-vbinary/gen/vdiv-scalar-x4.c
  src/f32-vbinary/gen/vdivc-scalar-x1.c
  src/f32-vbinary/gen/vdivc-scalar-x2.c
  src/f32-vbinary/gen/vdivc-scalar-x4.c
  src/f32-vbinary/gen/vmax-scalar-x1.c
  src/f32-vbinary/gen/vmax-scalar-x2.c
  src/f32-vbinary/gen/vmax-scalar-x4.c
  src/f32-vbinary/gen/vmaxc-scalar-x1.c
  src/f32-vbinary/gen/vmaxc-scalar-x2.c
  src/f32-vbinary/gen/vmaxc-scalar-x4.c
  src/f32-vbinary/gen/vmin-scalar-x1.c
  src/f32-vbinary/gen/vmin-scalar-x2.c
  src/f32-vbinary/gen/vmin-scalar-x4.c
  src/f32-vbinary/gen/vminc-scalar-x1.c
  src/f32-vbinary/gen/vminc-scalar-x2.c
  src/f32-vbinary/gen/vminc-scalar-x4.c
  src/f32-vbinary/gen/vmul-scalar-x1.c
  src/f32-vbinary/gen/vmul-scalar-x2.c
  src/f32-vbinary/gen/vmul-scalar-x4.c
  src/f32-vbinary/gen/vmulc-scalar-x1.c
  src/f32-vbinary/gen/vmulc-scalar-x2.c
  src/f32-vbinary/gen/vmulc-scalar-x4.c
  src/f32-vbinary/gen/vrdivc-scalar-x1.c
  src/f32-vbinary/gen/vrdivc-scalar-x2.c
  src/f32-vbinary/gen/vrdivc-scalar-x4.c
  src/f32-vbinary/gen/vrsubc-scalar-x1.c
  src/f32-vbinary/gen/vrsubc-scalar-x2.c
  src/f32-vbinary/gen/vrsubc-scalar-x4.c
  src/f32-vbinary/gen/vsub-scalar-x1.c
  src/f32-vbinary/gen/vsub-scalar-x2.c
  src/f32-vbinary/gen/vsub-scalar-x4.c
  src/f32-vbinary/gen/vsubc-scalar-x1.c
  src/f32-vbinary/gen/vsubc-scalar-x2.c
  src/f32-vbinary/gen/vsubc-scalar-x4.c
  src/f32-vmulcaddc/gen/c1-scalar-2x.c
  src/f32-vmulcaddc/gen/c2-scalar-2x.c
  src/f32-vmulcaddc/gen/c4-scalar-2x.c
  src/math/expminus-scalar-lut2048-p1.c
  src/math/expminus-scalar-lut64-p2.c
  src/math/expminus-scalar-p5.c
  src/math/sigmoid-scalar-lut2048-p1-div.c
  src/math/sigmoid-scalar-lut64-p2-div.c
  src/math/sigmoid-scalar-p5-div.c
  src/q8-avgpool/9p8x-scalar-c1.c
  src/q8-avgpool/9x-scalar-c1.c
  src/q8-dwconv/up1x9-minmax-scalar.c
  src/q8-gavgpool/7p7x-scalar-c1.c
  src/q8-gavgpool/7x-scalar-c1.c
  src/q8-gemm/2x2-minmax-scalar.c
  src/q8-igemm/2x2-minmax-scalar.c
  src/q8-vadd/scalar.c
  src/u8-clamp/scalar-x4.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8x-scalar-c1.c
  src/u8-rmax/scalar.c
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c
  src/requantization/precise-scalar.c
  src/requantization/fp32-scalar.c
  src/requantization/q31-scalar.c
  src/requantization/gemmlowp-scalar.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700370
# PSIMD micro-kernel sources in the "FASTMATH" group.
# NOTE(review): presumably these tolerate relaxed floating-point compiler
# flags, unlike the "ACCMATH" group - confirm where the list is consumed.
set(XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-psimd-c4.c
  src/f32-argmaxpool/9p8x-psimd-c4.c
  src/f32-argmaxpool/9x-psimd-c4.c
  src/f32-avgpool/9p8x-psimd-c4.c
  src/f32-avgpool/9x-psimd-c4.c
  src/f32-clamp/gen/psimd-x4.c
  src/f32-clamp/gen/psimd-x8.c
  src/f32-dwconv/gen/up4x25-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up4x25-minmax-psimd.c
  src/f32-dwconv/gen/up4x4-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up4x4-minmax-psimd.c
  src/f32-dwconv/gen/up4x9-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up4x9-minmax-psimd.c
  src/f32-dwconv/gen/up8x25-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-psimd.c
  src/f32-dwconv/gen/up8x4-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-psimd.c
  src/f32-dwconv/gen/up8x9-minmax-psimd-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-psimd.c
  src/f32-gavgpool/7p7x-psimd-c4.c
  src/f32-gavgpool/7x-psimd-c4.c
  src/f32-gemm/gen/1x8-minmax-psimd-loadsplat.c
  src/f32-gemm/gen/1x8-minmax-psimd-splat.c
  src/f32-gemm/gen/1x8s4-minmax-psimd.c
  src/f32-gemm/gen/4x2c4-minmax-psimd.c
  src/f32-gemm/gen/4x8-minmax-psimd-loadsplat.c
  src/f32-gemm/gen/4x8-minmax-psimd-splat.c
  src/f32-gemm/gen/4x8s4-minmax-psimd.c
  src/f32-gemm/gen/6x8-minmax-psimd-loadsplat.c
  src/f32-gemm/gen/6x8-minmax-psimd-splat.c
  src/f32-gemm/gen/6x8s4-minmax-psimd.c
  src/f32-gemm/gen-inc/1x8inc-minmax-psimd-loadsplat.c
  src/f32-gemm/gen-inc/1x8inc-minmax-psimd-splat.c
  src/f32-gemm/gen-inc/1x8s4inc-minmax-psimd.c
  src/f32-gemm/gen-inc/4x8inc-minmax-psimd-loadsplat.c
  src/f32-gemm/gen-inc/4x8inc-minmax-psimd-splat.c
  src/f32-gemm/gen-inc/4x8s4inc-minmax-psimd.c
  src/f32-gemm/gen-inc/6x8inc-minmax-psimd-loadsplat.c
  src/f32-gemm/gen-inc/6x8inc-minmax-psimd-splat.c
  src/f32-gemm/gen-inc/6x8s4inc-minmax-psimd.c
  src/f32-hswish/gen/psimd-x4.c
  src/f32-hswish/gen/psimd-x8.c
  src/f32-ibilinear/gen/psimd-c4.c
  src/f32-ibilinear/gen/psimd-c8.c
  src/f32-igemm/gen/1x8-minmax-psimd-loadsplat.c
  src/f32-igemm/gen/1x8-minmax-psimd-splat.c
  src/f32-igemm/gen/1x8s4-minmax-psimd.c
  src/f32-igemm/gen/4x2c4-minmax-psimd.c
  src/f32-igemm/gen/4x8-minmax-psimd-loadsplat.c
  src/f32-igemm/gen/4x8-minmax-psimd-splat.c
  src/f32-igemm/gen/4x8s4-minmax-psimd.c
  src/f32-igemm/gen/6x8-minmax-psimd-loadsplat.c
  src/f32-igemm/gen/6x8-minmax-psimd-splat.c
  src/f32-igemm/gen/6x8s4-minmax-psimd.c
  src/f32-maxpool/9p8x-psimd-c4.c
  src/f32-pavgpool/9p8x-psimd-c4.c
  src/f32-pavgpool/9x-psimd-c4.c
  src/f32-ppmm/gen/4x8-minmax-psimd.c
  src/f32-prelu/gen/psimd-2x4.c
  src/f32-prelu/gen/psimd-2x8.c
  src/f32-rmax/psimd.c
  src/f32-vbinary/gen/vadd-psimd-x4.c
  src/f32-vbinary/gen/vadd-psimd-x8.c
  src/f32-vbinary/gen/vaddc-psimd-x4.c
  src/f32-vbinary/gen/vaddc-psimd-x8.c
  src/f32-vbinary/gen/vdiv-psimd-x4.c
  src/f32-vbinary/gen/vdiv-psimd-x8.c
  src/f32-vbinary/gen/vdivc-psimd-x4.c
  src/f32-vbinary/gen/vdivc-psimd-x8.c
  src/f32-vbinary/gen/vmax-psimd-x4.c
  src/f32-vbinary/gen/vmax-psimd-x8.c
  src/f32-vbinary/gen/vmaxc-psimd-x4.c
  src/f32-vbinary/gen/vmaxc-psimd-x8.c
  src/f32-vbinary/gen/vmin-psimd-x4.c
  src/f32-vbinary/gen/vmin-psimd-x8.c
  src/f32-vbinary/gen/vminc-psimd-x4.c
  src/f32-vbinary/gen/vminc-psimd-x8.c
  src/f32-vbinary/gen/vmul-psimd-x4.c
  src/f32-vbinary/gen/vmul-psimd-x8.c
  src/f32-vbinary/gen/vmulc-psimd-x4.c
  src/f32-vbinary/gen/vmulc-psimd-x8.c
  src/f32-vbinary/gen/vrdivc-psimd-x4.c
  src/f32-vbinary/gen/vrdivc-psimd-x8.c
  src/f32-vbinary/gen/vrsubc-psimd-x4.c
  src/f32-vbinary/gen/vrsubc-psimd-x8.c
  src/f32-vbinary/gen/vsub-psimd-x4.c
  src/f32-vbinary/gen/vsub-psimd-x8.c
  src/f32-vbinary/gen/vsubc-psimd-x4.c
  src/f32-vbinary/gen/vsubc-psimd-x8.c
  src/f32-vmulcaddc/gen/c4-psimd-2x.c
  src/f32-vmulcaddc/gen/c8-psimd-2x.c
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c
  src/requantization/precise-psimd.c
  src/requantization/fp32-psimd.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700472
# PSIMD micro-kernel sources in the "ACCMATH" group.
# NOTE(review): presumably these need accurate (non-fast-math) floating-point
# compilation - confirm where the list is consumed.
set(XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x8.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x12.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x16.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x20.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/psimd-p5-x20-acc5.c
  src/f32-sigmoid/gen/psimd-p5-div-x4.c
  src/f32-sigmoid/gen/psimd-p5-div-x8.c
  src/f32-sigmoid/gen/psimd-p5-div-x12.c
  src/f32-sigmoid/gen/psimd-p5-div-x16.c
  src/f32-sigmoid/gen/psimd-p5-div-x20.c
  src/f32-sigmoid/gen/psimd-p5-div-x24.c
  src/math/sigmoid-psimd-p5-div.c
)
493
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700494SET(XNNPACK_NEON_MICROKERNEL_SRCS
Marat Dukhan6ee435a2020-02-26 22:33:38 -0800495 src/f32-avgpool/9p8x-neon-c4.c
496 src/f32-avgpool/9x-neon-c4.c
Marat Dukhan5c5fa962020-03-10 18:38:33 -0700497 src/f32-clamp/gen/neon-x4.c
498 src/f32-clamp/gen/neon-x8.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700499 src/f32-dwconv/gen/up4x9-minmax-neon.c
500 src/f32-dwconv/gen/up4x9-minmax-neon-acc2.c
501 src/f32-dwconv/gen/up8x9-minmax-neon.c
502 src/f32-dwconv/gen/up8x9-minmax-neon-acc2.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800503 src/f32-gavgpool-spchw/neon-x4.c
Marat Dukhana63a6fc2020-03-10 06:12:48 -0700504 src/f32-gavgpool/7p7x-neon-c4.c
505 src/f32-gavgpool/7x-neon-c4.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700506 src/f32-gemm/gen/1x8-minmax-neon-lane-ld64.c
507 src/f32-gemm/gen/4x2-minmax-neon-lane-ld64.c
508 src/f32-gemm/gen/4x8-minmax-neon-lane-ld128.c
509 src/f32-gemm/gen/4x8-minmax-neon-lane-ld64.c
510 src/f32-gemm/gen/5x8-minmax-neon-lane-ld64.c
511 src/f32-gemm/gen/6x8-minmax-neon-lane-ld64.c
512 src/f32-gemm/gen/6x8-minmax-neon-lane-ld128.c
513 src/f32-gemm/gen/1x8-minmax-neon-dup-ld64.c
514 src/f32-gemm/gen/4x8-minmax-neon-dup-ld128.c
515 src/f32-gemm/gen/4x8-minmax-neon-dup-ld64.c
516 src/f32-gemm/gen/6x8-minmax-neon-dup-ld64.c
517 src/f32-gemm/gen/6x8-minmax-neon-dup-ld128.c
518 src/f32-gemm/gen/1x8s4-minmax-neon.c
519 src/f32-gemm/gen/4x8s4-minmax-neon.c
520 src/f32-gemm/gen/6x8s4-minmax-neon.c
521 src/f32-gemm/gen/8x8s4-minmax-neon.c
522 src/f32-gemm/gen-inc/1x8inc-minmax-neon-lane-ld64.c
523 src/f32-gemm/gen-inc/4x8inc-minmax-neon-lane-ld128.c
524 src/f32-gemm/gen-inc/4x8inc-minmax-neon-lane-ld64.c
525 src/f32-gemm/gen-inc/5x8inc-minmax-neon-lane-ld64.c
526 src/f32-gemm/gen-inc/6x8inc-minmax-neon-lane-ld64.c
527 src/f32-gemm/gen-inc/6x8inc-minmax-neon-lane-ld128.c
528 src/f32-gemm/gen-inc/1x8inc-minmax-neon-dup-ld64.c
529 src/f32-gemm/gen-inc/4x8inc-minmax-neon-dup-ld128.c
530 src/f32-gemm/gen-inc/4x8inc-minmax-neon-dup-ld64.c
531 src/f32-gemm/gen-inc/6x8inc-minmax-neon-dup-ld64.c
532 src/f32-gemm/gen-inc/6x8inc-minmax-neon-dup-ld128.c
533 src/f32-gemm/gen-inc/1x8s4inc-minmax-neon.c
534 src/f32-gemm/gen-inc/4x8s4inc-minmax-neon.c
535 src/f32-gemm/gen-inc/6x8s4inc-minmax-neon.c
536 src/f32-gemm/gen-inc/8x8s4inc-minmax-neon.c
Marat Dukhan662faa02019-12-09 22:48:16 -0800537 src/f32-hswish/gen/neon-x4.c
538 src/f32-hswish/gen/neon-x8.c
Marat Dukhan660fd192020-03-10 04:55:30 -0700539 src/f32-ibilinear/gen/neon-c4.c
540 src/f32-ibilinear/gen/neon-c8.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700541 src/f32-igemm/gen/1x8-minmax-neon-lane-ld64.c
542 src/f32-igemm/gen/4x2-minmax-neon-lane-ld64.c
543 src/f32-igemm/gen/4x4-minmax-neon-lane-ld64.c
544 src/f32-igemm/gen/4x8-minmax-neon-lane-ld128.c
545 src/f32-igemm/gen/4x8-minmax-neon-lane-ld64.c
546 src/f32-igemm/gen/6x8-minmax-neon-lane-ld64.c
547 src/f32-igemm/gen/6x8-minmax-neon-lane-ld128.c
548 src/f32-igemm/gen/1x8-minmax-neon-dup-ld64.c
549 src/f32-igemm/gen/4x8-minmax-neon-dup-ld128.c
550 src/f32-igemm/gen/4x8-minmax-neon-dup-ld64.c
551 src/f32-igemm/gen/6x8-minmax-neon-dup-ld64.c
552 src/f32-igemm/gen/6x8-minmax-neon-dup-ld128.c
553 src/f32-igemm/gen/1x8s4-minmax-neon.c
554 src/f32-igemm/gen/4x8s4-minmax-neon.c
555 src/f32-igemm/gen/6x8s4-minmax-neon.c
556 src/f32-igemm/gen/8x8s4-minmax-neon.c
Frank Barchardf092a4a2020-03-03 14:22:46 -0800557 src/f32-maxpool/9p8x-neon-c4.c
Marat Dukhan6ee435a2020-02-26 22:33:38 -0800558 src/f32-pavgpool/9p8x-neon-c4.c
559 src/f32-pavgpool/9x-neon-c4.c
Marat Dukhan1c587112020-04-08 20:04:28 -0700560 src/f32-ppmm/gen/4x8-minmax-neon.c
561 src/f32-ppmm/gen/8x8-minmax-neon.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800562 src/f32-prelu/gen/neon-2x4.c
563 src/f32-prelu/gen/neon-2x8.c
Marat Dukhan8137e4c2020-01-25 12:56:58 -0800564 src/f32-raddstoreexpminusmax/gen/neon-p5-x4.c
565 src/f32-raddstoreexpminusmax/gen/neon-p5-x8.c
566 src/f32-raddstoreexpminusmax/gen/neon-p5-x8-acc2.c
567 src/f32-raddstoreexpminusmax/gen/neon-p5-x12.c
568 src/f32-raddstoreexpminusmax/gen/neon-p5-x12-acc2.c
569 src/f32-raddstoreexpminusmax/gen/neon-p5-x12-acc3.c
570 src/f32-raddstoreexpminusmax/gen/neon-p5-x16.c
571 src/f32-raddstoreexpminusmax/gen/neon-p5-x16-acc2.c
572 src/f32-raddstoreexpminusmax/gen/neon-p5-x16-acc4.c
573 src/f32-raddstoreexpminusmax/gen/neon-p5-x20.c
574 src/f32-raddstoreexpminusmax/gen/neon-p5-x20-acc2.c
575 src/f32-raddstoreexpminusmax/gen/neon-p5-x20-acc5.c
576 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x4.c
577 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x8.c
578 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x8-acc2.c
579 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x12.c
580 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x12-acc2.c
581 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x12-acc3.c
582 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x16.c
583 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x16-acc2.c
584 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x16-acc4.c
585 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x20.c
586 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x20-acc2.c
587 src/f32-raddstoreexpminusmax/gen/neon-lut64-p2-x20-acc5.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800588 src/f32-rmax/neon.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800589 src/f32-sigmoid/gen/neon-frac-p9-p10-nr1recps-x16.c
Marat Dukhan4a24a582020-01-06 13:30:00 -0800590 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x4.c
591 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x8.c
592 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x12.c
593 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x16.c
594 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x20.c
595 src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x24.c
596 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x4.c
597 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x8.c
598 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x12.c
599 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x16.c
600 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x20.c
601 src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x24.c
602 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x4.c
603 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x8.c
604 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x12.c
605 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x16.c
606 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x20.c
607 src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x24.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800608 src/f32-vbinary/gen/vadd-neon-x4.c
609 src/f32-vbinary/gen/vadd-neon-x8.c
610 src/f32-vbinary/gen/vaddc-neon-x4.c
611 src/f32-vbinary/gen/vaddc-neon-x8.c
Marat Dukhan403b7d42019-12-05 12:49:11 -0800612 src/f32-vbinary/gen/vmax-neon-x4.c
613 src/f32-vbinary/gen/vmax-neon-x8.c
614 src/f32-vbinary/gen/vmaxc-neon-x4.c
615 src/f32-vbinary/gen/vmaxc-neon-x8.c
616 src/f32-vbinary/gen/vmin-neon-x4.c
617 src/f32-vbinary/gen/vmin-neon-x8.c
618 src/f32-vbinary/gen/vminc-neon-x4.c
619 src/f32-vbinary/gen/vminc-neon-x8.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800620 src/f32-vbinary/gen/vmul-neon-x4.c
621 src/f32-vbinary/gen/vmul-neon-x8.c
622 src/f32-vbinary/gen/vmulc-neon-x4.c
623 src/f32-vbinary/gen/vmulc-neon-x8.c
624 src/f32-vbinary/gen/vrsubc-neon-x4.c
625 src/f32-vbinary/gen/vrsubc-neon-x8.c
626 src/f32-vbinary/gen/vsub-neon-x4.c
627 src/f32-vbinary/gen/vsub-neon-x8.c
628 src/f32-vbinary/gen/vsubc-neon-x4.c
629 src/f32-vbinary/gen/vsubc-neon-x8.c
630 src/f32-vmulcaddc/gen/c4-neon-2x.c
631 src/f32-vmulcaddc/gen/c8-neon-2x.c
Marat Dukhan6ee435a2020-02-26 22:33:38 -0800632 src/q8-avgpool/9p8x-neon-c8.c
633 src/q8-avgpool/9x-neon-c8.c
Marat Dukhande06f492020-04-09 00:19:31 -0700634 src/q8-dwconv/up8x9-minmax-neon.c
Marat Dukhana63a6fc2020-03-10 06:12:48 -0700635 src/q8-gavgpool/7p7x-neon-c8.c
636 src/q8-gavgpool/7x-neon-c8.c
Marat Dukhande06f492020-04-09 00:19:31 -0700637 src/q8-gemm/4x8-minmax-neon.c
638 src/q8-gemm/8x8-minmax-neon.c
639 src/q8-igemm/4x8-minmax-neon.c
640 src/q8-igemm/8x8-minmax-neon.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800641 src/q8-vadd/neon.c
Marat Dukhan5c5fa962020-03-10 18:38:33 -0700642 src/u8-clamp/neon-x64.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800643 src/u8-maxpool/9p8x-neon-c16.c
644 src/u8-rmax/neon.c
645 src/x32-packx/x4-neon-st4.c
646 src/x32-pad/x2-neon.c
647 src/x32-zip/x2-neon.c
648 src/x32-zip/x3-neon.c
649 src/x32-zip/x4-neon.c
650 src/x32-zip/xm-neon.c
651 src/x8-zip/x2-neon.c
652 src/x8-zip/x3-neon.c
653 src/x8-zip/x4-neon.c
Marat Dukhan8d3c07e2020-01-02 01:20:59 -0800654 src/x8-zip/xm-neon.c
Marat Dukhan68b3b452020-01-02 10:11:15 -0800655 src/math/sigmoid-neon-frac-p9-p10-nr1recps.c
Marat Dukhan77221d32020-01-06 10:04:39 -0800656 src/math/sigmoid-neon-rr1-lut2048-p1-nr2recps.c
657 src/math/sigmoid-neon-rr1-lut64-p2-nr2recps.c
658 src/math/sigmoid-neon-rr1-p5-nr2recps.c
659 src/math/sigmoid-neon-rr2-lut2048-p1-nr2recps.c
660 src/math/sigmoid-neon-rr2-lut64-p2-nr2recps.c
Marat Dukhanfe7acb62020-03-09 19:30:05 -0700661 src/math/sigmoid-neon-rr2-p5-nr2recps.c
662 src/requantization/precise-neon.c
663 src/requantization/fp32-neon.c
664 src/requantization/q31-neon.c
665 src/requantization/gemmlowp-neon.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700666
# ---[ Micro-kernel sources whose file names carry the "neonfma" tag:
# f32 ibilinear, igemm, dwconv, gemm (plain and "inc" variants), hswish, ppmm,
# raddstoreexpminusmax, sigmoid and vmulcaddc kernels, plus the exp/expminus/
# sigmoid reference implementations under src/math.
# This only defines the list; the target that consumes it (and the compiler
# flags applied to these files) is outside this section.
SET(XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-ibilinear/gen/neonfma-c4.c
  src/f32-ibilinear/gen/neonfma-c8.c
  src/f32-igemm/gen/1x8-minmax-neonfma-dup-ld64.c
  src/f32-igemm/gen/4x8-minmax-neonfma-dup-ld128.c
  src/f32-igemm/gen/4x8-minmax-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-dup-ld128.c
  src/f32-igemm/gen/1x8s4-minmax-neonfma.c
  src/f32-igemm/gen/4x8s4-minmax-neonfma.c
  src/f32-igemm/gen/6x8s4-minmax-neonfma.c
  src/f32-igemm/gen/8x8s4-minmax-neonfma.c
  src/f32-dwconv/gen/up4x9-minmax-neonfma.c
  src/f32-dwconv/gen/up4x9-minmax-neonfma-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-neonfma.c
  src/f32-dwconv/gen/up8x9-minmax-neonfma-acc2.c
  src/f32-gemm/gen/1x8-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen/4x8-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen/4x8-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen/1x8s4-minmax-neonfma.c
  src/f32-gemm/gen/4x8s4-minmax-neonfma.c
  src/f32-gemm/gen/6x8s4-minmax-neonfma.c
  src/f32-gemm/gen/8x8s4-minmax-neonfma.c
  src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4inc-minmax-neonfma.c
  src/f32-gemm/gen-inc/4x8s4inc-minmax-neonfma.c
  src/f32-gemm/gen-inc/6x8s4inc-minmax-neonfma.c
  src/f32-gemm/gen-inc/8x8s4inc-minmax-neonfma.c
  src/f32-hswish/gen/neonfma-x4.c
  src/f32-hswish/gen/neonfma-x8.c
  src/f32-ppmm/gen/4x8-minmax-neonfma.c
  src/f32-ppmm/gen/8x8-minmax-neonfma.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x8.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x12.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x16.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x20.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-p5-x20-acc5.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x8.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x12.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x16.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x20.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/neonfma-lut64-p2-x20-acc5.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x24.c
  src/f32-vmulcaddc/gen/c4-neonfma-2x.c
  src/f32-vmulcaddc/gen/c8-neonfma-2x.c
  src/math/exp-neonfma-lut64-p2.c
  src/math/exp-neonfma-p5.c
  src/math/expminus-neonfma-lut2048-p1.c
  src/math/expminus-neonfma-lut64-p2.c
  src/math/expminus-neonfma-p5.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-nr2fma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-nr2recps.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-nr2fma.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-nr2recps.c
  src/math/sigmoid-neonfma-rr1-p5-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr1-p5-nr2fma.c
  src/math/sigmoid-neonfma-rr1-p5-nr2recps.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-nr2fma.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-nr2recps.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-nr2fma.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-nr2recps.c
  src/math/sigmoid-neonfma-rr2-p5-nr1recps1fma.c
  src/math/sigmoid-neonfma-rr2-p5-nr2fma.c
  src/math/sigmoid-neonfma-rr2-p5-nr2recps.c)

# ---[ Micro-kernel sources grouped under the AArch64 + NEON FMA variable:
# "lane" GEMM/IGEMM kernels, conv-hwc / dwconv-spchw kernels, the division-based
# sigmoid kernels, SpMM kernels and the matching src/math sigmoid references.
# The list also carries the f32-vbinary vdiv/vdivc/vrdivc kernels even though
# their file names say "neon" rather than "neonfma" (presumably because vector
# division is only available on AArch64 -- confirm against the kernel sources).
# This only defines the list; its consumer is outside this section.
SET(XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS
  src/f32-vbinary/gen/vdiv-neon-x4.c
  src/f32-vbinary/gen/vdiv-neon-x8.c
  src/f32-vbinary/gen/vdivc-neon-x4.c
  src/f32-vbinary/gen/vdivc-neon-x8.c
  src/f32-vbinary/gen/vrdivc-neon-x4.c
  src/f32-vbinary/gen/vrdivc-neon-x8.c
  src/f32-gemm/gen/1x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x2-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x8-minmax-neonfma-lane-ld128.c
  src/f32-gemm/gen/4x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/5x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/5x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-lane-ld128.c
  src/f32-igemm/gen/1x8-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x2-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x4-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x8-minmax-neonfma-lane-ld128.c
  src/f32-igemm/gen/4x8-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld128.c
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x24.c
  src/f32-spmm/gen/12x1-neonfma.c
  src/f32-spmm/gen/12x2-neonfma.c
  src/f32-spmm/gen/12x4-neonfma.c
  src/f32-spmm/gen/16x1-neonfma-pipelined.c
  src/f32-spmm/gen/16x1-neonfma-unroll2.c
  src/f32-spmm/gen/16x1-neonfma.c
  src/f32-spmm/gen/16x2-neonfma.c
  src/f32-spmm/gen/16x4-neonfma.c
  src/f32-spmm/gen/4x1-neonfma-pipelined.c
  src/f32-spmm/gen/4x1-neonfma-unroll2.c
  src/f32-spmm/gen/4x1-neonfma.c
  src/f32-spmm/gen/4x2-neonfma.c
  src/f32-spmm/gen/4x4-neonfma.c
  src/f32-spmm/gen/8x1-neonfma-pipelined.c
  src/f32-spmm/gen/8x1-neonfma-unroll2.c
  src/f32-spmm/gen/8x1-neonfma.c
  src/f32-spmm/gen/8x2-neonfma.c
  src/f32-spmm/gen/8x4-neonfma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-div.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-div.c
  src/math/sigmoid-neonfma-rr1-p5-div.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-div.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-div.c
  src/math/sigmoid-neonfma-rr2-p5-div.c)

# ---[ Micro-kernel sources tagged "neonfp16arith": the three f16 GEMM kernels
# (4x8, 6x8 and 8x8 tiles, ld64 variant). This only defines the list; its
# consumer is outside this section.
SET(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/gen/4x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/6x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/8x8-neonfp16arith-ld64.c)

# ---[ Micro-kernel sources whose file names carry the "sse" tag: f32 pooling,
# clamp, depthwise convolution, GEMM/IGEMM, hswish, ibilinear, ppmm, rmax, SpMM,
# element-wise binary ops and vmulcaddc kernels, plus the x32 packx kernel.
# This only defines the list; its consumer is outside this section.
SET(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/9p8x-sse-c4.c
  src/f32-avgpool/9x-sse-c4.c
  src/f32-clamp/gen/sse-x4.c
  src/f32-clamp/gen/sse-x8.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-dwconv/gen/up4x25-minmax-sse-acc2.c
  src/f32-dwconv/gen/up4x25-minmax-sse.c
  src/f32-dwconv/gen/up4x4-minmax-sse-acc2.c
  src/f32-dwconv/gen/up4x4-minmax-sse.c
  src/f32-dwconv/gen/up4x9-minmax-sse-acc2.c
  src/f32-dwconv/gen/up4x9-minmax-sse.c
  src/f32-dwconv/gen/up8x25-minmax-sse-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-sse.c
  src/f32-dwconv/gen/up8x4-minmax-sse-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-sse.c
  src/f32-dwconv/gen/up8x9-minmax-sse-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-sse.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/7p7x-sse-c4.c
  src/f32-gavgpool/7x-sse-c4.c
  src/f32-gemm/gen/1x8-minmax-sse-dup.c
  src/f32-gemm/gen/1x8-minmax-sse-load1.c
  src/f32-gemm/gen/1x8s4-minmax-sse.c
  src/f32-gemm/gen/4x2c4-minmax-sse.c
  src/f32-gemm/gen/4x8-minmax-sse-dup.c
  src/f32-gemm/gen/4x8-minmax-sse-load1.c
  src/f32-gemm/gen/4x8s4-minmax-sse.c
  src/f32-gemm/gen-inc/1x8inc-minmax-sse-dup.c
  src/f32-gemm/gen-inc/1x8inc-minmax-sse-load1.c
  src/f32-gemm/gen-inc/1x8s4inc-minmax-sse.c
  src/f32-gemm/gen-inc/4x8inc-minmax-sse-dup.c
  src/f32-gemm/gen-inc/4x8inc-minmax-sse-load1.c
  src/f32-gemm/gen-inc/4x8s4inc-minmax-sse.c
  src/f32-hswish/gen/sse-x4.c
  src/f32-hswish/gen/sse-x8.c
  src/f32-ibilinear/gen/sse-c4.c
  src/f32-ibilinear/gen/sse-c8.c
  src/f32-igemm/gen/1x8-minmax-sse-dup.c
  src/f32-igemm/gen/1x8-minmax-sse-load1.c
  src/f32-igemm/gen/1x8s4-minmax-sse.c
  src/f32-igemm/gen/4x2c4-minmax-sse.c
  src/f32-igemm/gen/4x8-minmax-sse-dup.c
  src/f32-igemm/gen/4x8-minmax-sse-load1.c
  src/f32-igemm/gen/4x8s4-minmax-sse.c
  src/f32-maxpool/9p8x-sse-c4.c
  src/f32-pavgpool/9p8x-sse-c4.c
  src/f32-pavgpool/9x-sse-c4.c
  src/f32-ppmm/gen/4x8-minmax-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/gen/4x1-sse.c
  src/f32-spmm/gen/8x1-sse.c
  src/f32-vbinary/gen/vadd-sse-x4.c
  src/f32-vbinary/gen/vadd-sse-x8.c
  src/f32-vbinary/gen/vaddc-sse-x4.c
  src/f32-vbinary/gen/vaddc-sse-x8.c
  src/f32-vbinary/gen/vdiv-sse-x4.c
  src/f32-vbinary/gen/vdiv-sse-x8.c
  src/f32-vbinary/gen/vdivc-sse-x4.c
  src/f32-vbinary/gen/vdivc-sse-x8.c
  src/f32-vbinary/gen/vmax-sse-x4.c
  src/f32-vbinary/gen/vmax-sse-x8.c
  src/f32-vbinary/gen/vmaxc-sse-x4.c
  src/f32-vbinary/gen/vmaxc-sse-x8.c
  src/f32-vbinary/gen/vmin-sse-x4.c
  src/f32-vbinary/gen/vmin-sse-x8.c
  src/f32-vbinary/gen/vminc-sse-x4.c
  src/f32-vbinary/gen/vminc-sse-x8.c
  src/f32-vbinary/gen/vmul-sse-x4.c
  src/f32-vbinary/gen/vmul-sse-x8.c
  src/f32-vbinary/gen/vmulc-sse-x4.c
  src/f32-vbinary/gen/vmulc-sse-x8.c
  src/f32-vbinary/gen/vrdivc-sse-x4.c
  src/f32-vbinary/gen/vrdivc-sse-x8.c
  src/f32-vbinary/gen/vrsubc-sse-x4.c
  src/f32-vbinary/gen/vrsubc-sse-x8.c
  src/f32-vbinary/gen/vsub-sse-x4.c
  src/f32-vbinary/gen/vsub-sse-x8.c
  src/f32-vbinary/gen/vsubc-sse-x4.c
  src/f32-vbinary/gen/vsubc-sse-x8.c
  src/f32-vmulcaddc/gen/c4-sse-2x.c
  src/f32-vmulcaddc/gen/c8-sse-2x.c
  src/x32-packx/x4-sse.c)

# ---[ Micro-kernel sources whose file names carry the "sse2" tag: f32
# argmaxpool, prelu, raddstoreexpminusmax and sigmoid kernels; q8 pooling,
# dwconv, GEMM/IGEMM and vadd kernels; u8 clamp/maxpool/rmax; x32/x8 pad and zip
# kernels; plus the src/math and src/requantization SSE2 implementations.
# This only defines the list; its consumer is outside this section.
SET(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-sse2-c4.c
  src/f32-argmaxpool/9p8x-sse2-c4.c
  src/f32-argmaxpool/9x-sse2-c4.c
  src/f32-prelu/gen/sse2-2x4.c
  src/f32-prelu/gen/sse2-2x8.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x4.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x8.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x8-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x12.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x12-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x12-acc3.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x16.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x16-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x16-acc4.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x20.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x20-acc2.c
  src/f32-raddstoreexpminusmax/gen/sse2-p5-x20-acc5.c
  src/f32-sigmoid/gen/sse2-p5-div-x4.c
  src/f32-sigmoid/gen/sse2-p5-div-x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x12.c
  src/f32-sigmoid/gen/sse2-p5-div-x16.c
  src/f32-sigmoid/gen/sse2-p5-div-x20.c
  src/f32-sigmoid/gen/sse2-p5-div-x24.c
  src/q8-avgpool/9p8x-sse2-c8.c
  src/q8-avgpool/9x-sse2-c8.c
  src/q8-igemm/4x4c2-minmax-sse2.c
  src/q8-dwconv/up8x9-minmax-sse2.c
  src/q8-gavgpool/7p7x-sse2-c8.c
  src/q8-gavgpool/7x-sse2-c8.c
  src/q8-gemm/2x4c8-minmax-sse2.c
  src/q8-gemm/4x4c2-minmax-sse2.c
  src/q8-vadd/sse2.c
  src/u8-clamp/sse2-x64.c
  src/u8-maxpool/9p8x-sse2-c16.c
  src/u8-rmax/sse2.c
  src/x32-pad/x2-sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c
  src/math/exp-sse2-p5.c
  src/math/expminus-sse2-p5.c
  src/math/sigmoid-sse2-p5-div.c
  src/requantization/precise-sse2.c
  src/requantization/fp32-sse2.c
  src/requantization/q31-sse2.c
  src/requantization/gemmlowp-sse2.c)

# ---[ Sources whose file names carry the "ssse3" tag: the precise, q31 and
# gemmlowp requantization implementations. This only defines the list; its
# consumer is outside this section.
SET(XNNPACK_SSSE3_MICROKERNEL_SRCS
  src/requantization/precise-ssse3.c
  src/requantization/q31-ssse3.c
  src/requantization/gemmlowp-ssse3.c)

# ---[ Sources grouped under the SSE4.1 variable: f32 prelu and sigmoid kernels
# (file names tagged "sse41") and the precise, q31 and gemmlowp requantization
# implementations (file names tagged "sse4"). This only defines the list; its
# consumer is outside this section.
SET(XNNPACK_SSE41_MICROKERNEL_SRCS
  src/f32-prelu/gen/sse41-2x4.c
  src/f32-prelu/gen/sse41-2x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x4.c
  src/f32-sigmoid/gen/sse41-p5-div-x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x12.c
  src/f32-sigmoid/gen/sse41-p5-div-x16.c
  src/f32-sigmoid/gen/sse41-p5-div-x20.c
  src/f32-sigmoid/gen/sse41-p5-div-x24.c
  src/requantization/precise-sse4.c
  src/requantization/q31-sse4.c
  src/requantization/gemmlowp-sse4.c)

# ---[ Micro-kernel sources whose file names carry the "avx" tag: f32 clamp,
# depthwise convolution, GEMM/IGEMM ("broadcast" variants, plain and "inc"),
# hswish, prelu, rmax, element-wise binary ops and vscale kernels.
# This only defines the list; its consumer is outside this section.
SET(XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-clamp/gen/avx-x8.c
  src/f32-clamp/gen/avx-x16.c
  src/f32-dwconv/gen/up16x4-minmax-avx-acc2.c
  src/f32-dwconv/gen/up16x4-minmax-avx.c
  src/f32-dwconv/gen/up8x4-minmax-avx-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-avx.c
  src/f32-dwconv/gen/up16x9-minmax-avx-acc2.c
  src/f32-dwconv/gen/up16x9-minmax-avx.c
  src/f32-dwconv/gen/up8x9-minmax-avx-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-avx.c
  src/f32-dwconv/gen/up16x25-minmax-avx-acc2.c
  src/f32-dwconv/gen/up16x25-minmax-avx.c
  src/f32-dwconv/gen/up8x25-minmax-avx-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-avx.c
  src/f32-gemm/gen/1x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/4x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/5x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/6x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/7x8-minmax-avx-broadcast.c
  src/f32-gemm/gen/1x16-minmax-avx-broadcast.c
  src/f32-gemm/gen/3x16-minmax-avx-broadcast.c
  src/f32-gemm/gen/4x16-minmax-avx-broadcast.c
  src/f32-gemm/gen/5x16-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/1x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/4x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/5x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/6x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/7x8inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/1x16inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/3x16inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/4x16inc-minmax-avx-broadcast.c
  src/f32-gemm/gen-inc/5x16inc-minmax-avx-broadcast.c
  src/f32-hswish/gen/avx-x8.c
  src/f32-hswish/gen/avx-x16.c
  src/f32-igemm/gen/1x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/4x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/5x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/6x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/7x8-minmax-avx-broadcast.c
  src/f32-igemm/gen/1x16-minmax-avx-broadcast.c
  src/f32-igemm/gen/3x16-minmax-avx-broadcast.c
  src/f32-igemm/gen/4x16-minmax-avx-broadcast.c
  src/f32-igemm/gen/5x16-minmax-avx-broadcast.c
  src/f32-prelu/gen/avx-2x8.c
  src/f32-prelu/gen/avx-2x16.c
  src/f32-rmax/avx.c
  src/f32-vbinary/gen/vadd-avx-x8.c
  src/f32-vbinary/gen/vadd-avx-x16.c
  src/f32-vbinary/gen/vaddc-avx-x8.c
  src/f32-vbinary/gen/vaddc-avx-x16.c
  src/f32-vbinary/gen/vdiv-avx-x8.c
  src/f32-vbinary/gen/vdiv-avx-x16.c
  src/f32-vbinary/gen/vdivc-avx-x8.c
  src/f32-vbinary/gen/vdivc-avx-x16.c
  src/f32-vbinary/gen/vmax-avx-x8.c
  src/f32-vbinary/gen/vmax-avx-x16.c
  src/f32-vbinary/gen/vmaxc-avx-x8.c
  src/f32-vbinary/gen/vmaxc-avx-x16.c
  src/f32-vbinary/gen/vmin-avx-x8.c
  src/f32-vbinary/gen/vmin-avx-x16.c
  src/f32-vbinary/gen/vminc-avx-x8.c
  src/f32-vbinary/gen/vminc-avx-x16.c
  src/f32-vbinary/gen/vmul-avx-x8.c
  src/f32-vbinary/gen/vmul-avx-x16.c
  src/f32-vbinary/gen/vmulc-avx-x8.c
  src/f32-vbinary/gen/vmulc-avx-x16.c
  src/f32-vbinary/gen/vrdivc-avx-x8.c
  src/f32-vbinary/gen/vrdivc-avx-x16.c
  src/f32-vbinary/gen/vrsubc-avx-x8.c
  src/f32-vbinary/gen/vrsubc-avx-x16.c
  src/f32-vbinary/gen/vsub-avx-x8.c
  src/f32-vbinary/gen/vsub-avx-x16.c
  src/f32-vbinary/gen/vsubc-avx-x8.c
  src/f32-vbinary/gen/vsubc-avx-x16.c
  src/f32-vscale/avx-unroll32.c)

# ---[ Micro-kernel sources whose file names carry the "fma3" tag: f32
# depthwise convolution, GEMM/IGEMM ("broadcast" variants, including the
# "s4" and "inc" flavours) and hswish kernels.
# This only defines the list; its consumer is outside this section.
SET(XNNPACK_FMA3_MICROKERNEL_SRCS
  src/f32-dwconv/gen/up16x4-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up16x4-minmax-fma3.c
  src/f32-dwconv/gen/up8x4-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up8x4-minmax-fma3.c
  src/f32-dwconv/gen/up16x9-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up16x9-minmax-fma3.c
  src/f32-dwconv/gen/up8x9-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up8x9-minmax-fma3.c
  src/f32-dwconv/gen/up16x25-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up16x25-minmax-fma3.c
  src/f32-dwconv/gen/up8x25-minmax-fma3-acc2.c
  src/f32-dwconv/gen/up8x25-minmax-fma3.c
  src/f32-gemm/gen/1x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/4x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/5x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/6x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/7x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/8x8-minmax-fma3-broadcast.c
  src/f32-gemm/gen/1x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/3x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/4x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/5x16-minmax-fma3-broadcast.c
  src/f32-gemm/gen/1x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen/3x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen/4x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen/5x16s4-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/6x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/7x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/8x8inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16s4inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16s4inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16s4inc-minmax-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16s4inc-minmax-fma3-broadcast.c
  src/f32-hswish/gen/fma3-x8.c
  src/f32-hswish/gen/fma3-x16.c
  src/f32-igemm/gen/1x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/4x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/5x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/6x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/7x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/8x8-minmax-fma3-broadcast.c
  src/f32-igemm/gen/1x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/3x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/4x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/5x16-minmax-fma3-broadcast.c
  src/f32-igemm/gen/1x16s4-minmax-fma3-broadcast.c
  src/f32-igemm/gen/3x16s4-minmax-fma3-broadcast.c
  src/f32-igemm/gen/4x16s4-minmax-fma3-broadcast.c
  src/f32-igemm/gen/5x16s4-minmax-fma3-broadcast.c)

# Micro-kernel and math sources of the AVX2 group. On x86 targets this list is
# appended to XNNPACK_MICROKERNEL_SRCS and compiled with " -mfma -mavx2 ".
SET(XNNPACK_AVX2_MICROKERNEL_SRCS
  # src/f32-raddexpminusmax
  src/f32-raddexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc6.c
  # src/f32-raddextexp
  src/f32-raddextexp/gen/avx2-p5-x64.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc4.c
  src/f32-raddextexp/gen/avx2-p5-x72.c
  src/f32-raddextexp/gen/avx2-p5-x72-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x80.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc5.c
  src/f32-raddextexp/gen/avx2-p5-x96.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc6.c
  # src/f32-raddstoreexpminusmax
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc6.c
  # src/f32-sigmoid ("div" variants)
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x80.c
  # src/f32-sigmoid ("nr1fma" variants)
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x80.c
  # src/f32-sigmoid ("nr2fma" variants)
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x80.c
  # src/f32-vscaleexpminusmax
  src/f32-vscaleexpminusmax/gen/avx2-p5-x8.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x16.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x24.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x32.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x40.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x48.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x56.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x64.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x72.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x80.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x88.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x96.c
  # src/f32-vscaleextexp
  src/f32-vscaleextexp/gen/avx2-p5-x8.c
  src/f32-vscaleextexp/gen/avx2-p5-x16.c
  src/f32-vscaleextexp/gen/avx2-p5-x24.c
  src/f32-vscaleextexp/gen/avx2-p5-x32.c
  src/f32-vscaleextexp/gen/avx2-p5-x40.c
  src/f32-vscaleextexp/gen/avx2-p5-x48.c
  src/f32-vscaleextexp/gen/avx2-p5-x56.c
  src/f32-vscaleextexp/gen/avx2-p5-x64.c
  src/f32-vscaleextexp/gen/avx2-p5-x72.c
  src/f32-vscaleextexp/gen/avx2-p5-x80.c
  src/f32-vscaleextexp/gen/avx2-p5-x88.c
  src/f32-vscaleextexp/gen/avx2-p5-x96.c
  # src/math
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c
  src/math/extexp-avx2-p5.c
  src/math/sigmoid-avx2-rr2-p5-div.c
  src/math/sigmoid-avx2-rr1-p5-div.c
  src/math/sigmoid-avx2-rr2-p5-nr2fma.c
  src/math/sigmoid-avx2-rr1-p5-nr2fma.c
  src/math/sigmoid-avx2-rr2-p5-nr1fma.c
  src/math/sigmoid-avx2-rr1-p5-nr1fma.c)
Marat Dukhan6adff4e2019-10-14 18:32:07 -07001284
# Micro-kernel and math sources of the AVX512F group. On x86 targets this list
# is appended to XNNPACK_MICROKERNEL_SRCS and compiled with " -mavx512f ".
SET(XNNPACK_AVX512F_MICROKERNEL_SRCS
  # src/f32-clamp
  src/f32-clamp/gen/avx512f-x16.c
  src/f32-clamp/gen/avx512f-x32.c
  # src/f32-dwconv
  src/f32-dwconv/gen/up32x4-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up32x4-minmax-avx512f.c
  src/f32-dwconv/gen/up16x4-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up16x4-minmax-avx512f.c
  src/f32-dwconv/gen/up32x9-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up32x9-minmax-avx512f.c
  src/f32-dwconv/gen/up16x9-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up16x9-minmax-avx512f.c
  src/f32-dwconv/gen/up32x25-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up32x25-minmax-avx512f.c
  src/f32-dwconv/gen/up16x25-minmax-avx512f-acc2.c
  src/f32-dwconv/gen/up16x25-minmax-avx512f.c
  # src/f32-gemm (gen)
  src/f32-gemm/gen/1x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/4x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/5x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/6x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/7x16-minmax-avx512f-broadcast.c
  src/f32-gemm/gen/8x16-minmax-avx512f-broadcast.c
  # src/f32-gemm (gen-inc)
  src/f32-gemm/gen-inc/1x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/4x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/5x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/6x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/7x16inc-minmax-avx512f-broadcast.c
  src/f32-gemm/gen-inc/8x16inc-minmax-avx512f-broadcast.c
  # src/f32-hswish
  src/f32-hswish/gen/avx512f-x16.c
  src/f32-hswish/gen/avx512f-x32.c
  # src/f32-igemm
  src/f32-igemm/gen/1x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/4x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/5x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/6x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/7x16-minmax-avx512f-broadcast.c
  src/f32-igemm/gen/8x16-minmax-avx512f-broadcast.c
  # src/f32-prelu
  src/f32-prelu/gen/avx512f-2x16.c
  src/f32-prelu/gen/avx512f-2x32.c
  # src/f32-raddexpminusmax
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c
  # src/f32-raddextexp
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc6.c
  # src/f32-raddstoreexpminusmax
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c
  # src/f32-rmax
  src/f32-rmax/avx512f.c
  # src/f32-vbinary
  src/f32-vbinary/gen/vadd-avx512f-x16.c
  src/f32-vbinary/gen/vadd-avx512f-x32.c
  src/f32-vbinary/gen/vaddc-avx512f-x16.c
  src/f32-vbinary/gen/vaddc-avx512f-x32.c
  src/f32-vbinary/gen/vdiv-avx512f-x16.c
  src/f32-vbinary/gen/vdiv-avx512f-x32.c
  src/f32-vbinary/gen/vdivc-avx512f-x16.c
  src/f32-vbinary/gen/vdivc-avx512f-x32.c
  src/f32-vbinary/gen/vmax-avx512f-x16.c
  src/f32-vbinary/gen/vmax-avx512f-x32.c
  src/f32-vbinary/gen/vmaxc-avx512f-x16.c
  src/f32-vbinary/gen/vmaxc-avx512f-x32.c
  src/f32-vbinary/gen/vmin-avx512f-x16.c
  src/f32-vbinary/gen/vmin-avx512f-x32.c
  src/f32-vbinary/gen/vminc-avx512f-x16.c
  src/f32-vbinary/gen/vminc-avx512f-x32.c
  src/f32-vbinary/gen/vmul-avx512f-x16.c
  src/f32-vbinary/gen/vmul-avx512f-x32.c
  src/f32-vbinary/gen/vmulc-avx512f-x16.c
  src/f32-vbinary/gen/vmulc-avx512f-x32.c
  src/f32-vbinary/gen/vrdivc-avx512f-x16.c
  src/f32-vbinary/gen/vrdivc-avx512f-x32.c
  src/f32-vbinary/gen/vrsubc-avx512f-x16.c
  src/f32-vbinary/gen/vrsubc-avx512f-x32.c
  src/f32-vbinary/gen/vsub-avx512f-x16.c
  src/f32-vbinary/gen/vsub-avx512f-x32.c
  src/f32-vbinary/gen/vsubc-avx512f-x16.c
  src/f32-vbinary/gen/vsubc-avx512f-x32.c
  # src/f32-vscale
  src/f32-vscale/avx512f-unroll64.c
  # src/f32-vscaleexpminusmax
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x192.c
  # src/f32-vscaleextexp
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x192.c
  # src/math
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c
  src/math/extexp-avx512f-p5.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001417
# Assembly (.S) micro-kernels for 32-bit ARM. The list is appended to
# XNNPACK_MICROKERNEL_SRCS when the target processor matches "^armv[5-8]" or
# IOS_ARCH matches "^armv7".
SET(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  # src/q8-dwconv
  src/q8-dwconv/up8x9-minmax-aarch32-neon.S
  # src/f32-gemm
  src/f32-gemm/4x8-minmax-aarch32-neon-cortex-a53.S
  src/f32-gemm/4x8-minmax-aarch32-neon-cortex-a55.S
  src/f32-gemm/gen/4x8-minmax-aarch32-neon-cortex-a75.S
  src/f32-gemm/gen/4x8-minmax-aarch32-neon-pld-cortex-a75.S
  src/f32-gemm/4x8-minmax-aarch32-neon-ld64.S
  # src/f32-igemm
  src/f32-igemm/4x8-minmax-aarch32-neon-ld64.S
  src/f32-igemm/gen/4x8-minmax-aarch32-neon-cortex-a75.S
  src/f32-igemm/gen/4x8-minmax-aarch32-neon-pld-cortex-a75.S
  src/f32-igemm/4x8-minmax-aarch32-neon-cortex-a53.S
  src/f32-igemm/4x8-minmax-aarch32-neon-cortex-a55.S)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001430
# Assembly (.S) micro-kernels for 64-bit ARM. The list is appended to
# XNNPACK_MICROKERNEL_SRCS when the target processor is "aarch64" or IOS_ARCH
# matches "^arm64.*".
SET(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  # src/f32-dwconv
  src/f32-dwconv/up4x9-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-minmax-aarch64-neonfma.S
  # src/f32-gemm (gen)
  src/f32-gemm/gen/1x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-ld64.S
  src/f32-gemm/gen/5x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/5x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ios.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ld64.S
  # src/f32-gemm (gen-inc)
  src/f32-gemm/gen-inc/1x12inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x12inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/5x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/5x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ios.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ld64.S
  # src/f32-igemm
  src/f32-igemm/1x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-igemm/4x12-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/gen/5x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/5x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a55.S
  src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-ios.S)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001493
# ---[ Select the micro-kernel sources for the target platform.
# The scalar kernels form the baseline; each branch below appends the groups
# that apply to the detected processor / IOS_ARCH, in a fixed order.
SET(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})

# PSIMD kernels are used everywhere except Emscripten.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
    ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS})
ENDIF()

# 32-bit ARM.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
ENDIF()

# 64-bit ARM.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
ENDIF()

# x86 and x86-64.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|AMD64)$" OR IOS_ARCH MATCHES "^(i386|x86_64|AMD64)$")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_SSSE3_MICROKERNEL_SRCS}
    ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
ENDIF()
1521
# ---[ Define the XNNPACK library target.
# XNNPACK_LIBRARY_TYPE selects the ADD_LIBRARY keyword: "shared" -> SHARED,
# "static" -> STATIC, "default" -> no keyword (CMake then decides based on
# BUILD_SHARED_LIBS). Any other value is a configuration error.
IF(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  SET(XNNPACK_LIBRARY_KEYWORD "")
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  SET(XNNPACK_LIBRARY_KEYWORD SHARED)
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  SET(XNNPACK_LIBRARY_KEYWORD STATIC)
ELSE()
  MESSAGE(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
ENDIF()
# An empty keyword expands to no argument at all, which gives the plain
# ADD_LIBRARY(XNNPACK <sources>) form.
ADD_LIBRARY(XNNPACK ${XNNPACK_LIBRARY_KEYWORD}
  ${XNNPACK_COLD_SRCS}
  ${XNNPACK_HOT_SRCS}
  ${XNNPACK_TABLE_SRCS}
  ${XNNPACK_MICROKERNEL_SRCS})
UNSET(XNNPACK_LIBRARY_KEYWORD)

# The library's C sources are built as C99 with compiler extensions enabled.
SET_TARGET_PROPERTIES(XNNPACK PROPERTIES C_STANDARD 99 C_EXTENSIONS YES)
# ---[ Per-source instruction-set flags.
# Each micro-kernel group gets the flag that enables its instruction set, so
# the rest of the library is not compiled with those extensions. Flags are
# appended to COMPILE_FLAGS (a single string), hence the padding spaces.

# 32-bit ARM.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS} ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_NEON_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  IF(IOS)
    # On iOS the assembly sources are given the architecture explicitly.
    SET_PROPERTY(
      SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()

# 64-bit ARM.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  IF(IOS)
    # On iOS the assembly sources are given the architecture explicitly.
    SET_PROPERTY(
      SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()

# x86 and x86-64.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|AMD64)$" OR IOS_ARCH MATCHES "^(i386|x86_64|AMD64)$")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSSE3_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mssse3 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse4.1 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
  IF(MINGW)
    # Work-around for https://gcc.gnu.org/bugzilla/show_bug.cgi?id=65782
    SET_PROPERTY(
      SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
      APPEND_STRING PROPERTY COMPILE_FLAGS " -fno-asynchronous-unwind-tables ")
  ENDIF()
ENDIF()
# ---[ Logging level and optimization flags.
# Debug builds get verbose logging (XNN_LOG_LEVEL=5) and no forced optimization
# level. Every other build type (including an empty CMAKE_BUILD_TYPE) disables
# logging and forces -O2 on micro-kernel and hot sources, -Os on cold sources.
# NOTE(review): CMAKE_BUILD_TYPE is only meaningful for single-config
# generators; with a multi-config generator this always takes the non-Debug
# path. Confirm whether multi-config builds need to be supported.
IF(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=0)
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_HOT_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_COLD_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -Os ")
ELSE()
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=5)
ENDIF()

# PSIMD kernels are appended -O3 in every build type. This runs after the -O2
# append above, so -O3 ends up later in the flag string. The fast-math group
# additionally gets -ffast-math.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 -ffast-math ")
ENDIF()
1575
# "include" is visible to XNNPACK and to targets that link it; "src" is only
# used while building XNNPACK itself.
TARGET_INCLUDE_DIRECTORIES(XNNPACK
  PUBLIC include
  PRIVATE src)
# Header installed through the PUBLIC_HEADER destination of INSTALL(TARGETS).
SET_PROPERTY(TARGET XNNPACK PROPERTY PUBLIC_HEADER include/xnnpack.h)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001579
# ---[ Find libm
# Link the math library when the platform provides one as a separate library;
# when FIND_LIBRARY finds nothing, no extra library is linked.
FIND_LIBRARY(LIBM NAMES m)
IF(LIBM)
  TARGET_LINK_LIBRARIES(XNNPACK PRIVATE ${LIBM})
ENDIF()
1585
# ---[ Configure clog
# Build clog from source unless the enclosing project already defines a "clog"
# target. CLOG_SOURCE_DIR and CPUINFO_RUNTIME_TYPE are not set in this part of
# the file; presumably they are provided earlier or by the parent project.
IF(NOT TARGET clog)
  SET(CLOG_BUILD_TESTS OFF CACHE BOOL "")
  SET(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
  ADD_SUBDIRECTORY("${CLOG_SOURCE_DIR}/deps/clog" "${CMAKE_BINARY_DIR}/clog")
  # We build static version of clog but a dynamic library may indirectly depend on it
  SET_PROPERTY(TARGET clog PROPERTY POSITION_INDEPENDENT_CODE ON)
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE clog)
1597
# ---[ Configure cpuinfo
# Build cpuinfo from CPUINFO_SOURCE_DIR unless a "cpuinfo" target already
# exists. Its tools, tests and benchmarks are switched off.
IF(NOT TARGET cpuinfo)
  SET(CPUINFO_BUILD_TOOLS       OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_UNIT_TESTS  OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_MOCK_TESTS  OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_BENCHMARKS  OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE cpuinfo)
1609
# ---[ Configure pthreadpool
# Build pthreadpool from PTHREADPOOL_SOURCE_DIR unless a "pthreadpool" target
# already exists. Tests, benchmarks and the deprecated API are switched off.
# pthreadpool is linked PUBLIC, so it propagates to targets that link XNNPACK.
IF(NOT TARGET pthreadpool)
  SET(PTHREADPOOL_BUILD_TESTS           OFF CACHE BOOL "")
  SET(PTHREADPOOL_BUILD_BENCHMARKS      OFF CACHE BOOL "")
  SET(PTHREADPOOL_ALLOW_DEPRECATED_API  OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PUBLIC pthreadpool)
1620
# ---[ Configure FXdiv
# Build FXdiv from FXDIV_SOURCE_DIR unless an "fxdiv" target already exists.
# Its tests and benchmarks are switched off.
IF(NOT TARGET fxdiv)
  SET(FXDIV_BUILD_TESTS       OFF CACHE BOOL "")
  SET(FXDIV_BUILD_BENCHMARKS  OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fxdiv)
1630
# ---[ Configure psimd
# Build psimd from PSIMD_SOURCE_DIR unless a "psimd" target already exists.
IF(NOT TARGET psimd)
  ADD_SUBDIRECTORY("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE psimd)
1638
# ---[ Configure FP16
# Build FP16 from FP16_SOURCE_DIR unless an "fp16" target already exists.
# Its tests and benchmarks are switched off.
IF(NOT TARGET fp16)
  SET(FP16_BUILD_TESTS       OFF CACHE BOOL "")
  SET(FP16_BUILD_BENCHMARKS  OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fp16)
1648
# ---[ Install the library and its public header.
# LIBRARY covers shared libraries on non-DLL platforms, ARCHIVE covers static
# libraries and DLL import libraries, and RUNTIME covers the DLL itself when
# XNNPACK is built as a shared library on a DLL platform (e.g. MinGW). The
# RUNTIME destination is given explicitly because CMake versions before 3.14
# provide no default destination for it.
INSTALL(TARGETS XNNPACK
    RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}
    LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
    ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
    PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
1653
1654# ---[ XNNPACK unit tests
1655IF(XNNPACK_BUILD_TESTS)
1656 # ---[ Build google test
1657 IF(NOT TARGET gtest)
1658 SET(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
1659 ADD_SUBDIRECTORY(
1660 "${GOOGLETEST_SOURCE_DIR}"
1661 "${CMAKE_BINARY_DIR}/googletest")
1662 ENDIF()
1663
Marat Dukhan20c3b922020-03-10 03:45:06 -07001664 # ---[ Build size tests
1665
Marat Dukhan43130882020-03-12 22:33:07 -07001666 ADD_EXECUTABLE(operator-size-test test/operator-size.c)
Marat Dukhan20c3b922020-03-10 03:45:06 -07001667 SET_TARGET_PROPERTIES(operator-size-test PROPERTIES
1668 C_STANDARD 99
1669 C_EXTENSIONS NO)
1670 TARGET_LINK_LIBRARIES(operator-size-test PRIVATE XNNPACK)
1671
Marat Dukhan43130882020-03-12 22:33:07 -07001672 ADD_EXECUTABLE(subgraph-size-test test/subgraph-size.c)
Marat Dukhan20c3b922020-03-10 03:45:06 -07001673 SET_TARGET_PROPERTIES(subgraph-size-test PROPERTIES
1674 C_STANDARD 99
1675 C_EXTENSIONS NO)
1676 TARGET_LINK_LIBRARIES(subgraph-size-test PRIVATE XNNPACK)
1677
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001678 # ---[ Build operator-level unit tests
Marat Dukhanefc47b82019-11-18 09:25:38 -08001679 ADD_EXECUTABLE(add-nc-test test/add-nc.cc)
1680 SET_TARGET_PROPERTIES(add-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001681 CXX_STANDARD 11
1682 CXX_STANDARD_REQUIRED YES
1683 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001684 TARGET_INCLUDE_DIRECTORIES(add-nc-test PRIVATE src test)
1685 TARGET_LINK_LIBRARIES(add-nc-test PRIVATE XNNPACK gtest gtest_main)
1686 ADD_TEST(add-nc-test add-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001687
Marat Dukhanb1a0fc32019-12-02 19:32:02 -08001688 ADD_EXECUTABLE(add-nd-test test/add-nd.cc)
1689 SET_TARGET_PROPERTIES(add-nd-test PROPERTIES
1690 CXX_STANDARD 11
1691 CXX_STANDARD_REQUIRED YES
1692 CXX_EXTENSIONS NO)
1693 TARGET_INCLUDE_DIRECTORIES(add-nd-test PRIVATE src test)
1694 TARGET_LINK_LIBRARIES(add-nd-test PRIVATE XNNPACK gtest gtest_main)
1695 ADD_TEST(add-nd-test add-nd-test)
1696
Marat Dukhanefc47b82019-11-18 09:25:38 -08001697 ADD_EXECUTABLE(argmax-pooling-nhwc-test test/argmax-pooling-nhwc.cc)
1698 SET_TARGET_PROPERTIES(argmax-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001699 CXX_STANDARD 11
1700 CXX_STANDARD_REQUIRED YES
1701 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001702 TARGET_INCLUDE_DIRECTORIES(argmax-pooling-nhwc-test PRIVATE src test)
1703 TARGET_LINK_LIBRARIES(argmax-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1704 ADD_TEST(argmax-pooling-nhwc-test argmax-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001705
Marat Dukhanefc47b82019-11-18 09:25:38 -08001706 ADD_EXECUTABLE(average-pooling-nhwc-test test/average-pooling-nhwc.cc)
1707 SET_TARGET_PROPERTIES(average-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001708 CXX_STANDARD 11
1709 CXX_STANDARD_REQUIRED YES
1710 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001711 TARGET_INCLUDE_DIRECTORIES(average-pooling-nhwc-test PRIVATE src test)
1712 TARGET_LINK_LIBRARIES(average-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1713 ADD_TEST(average-pooling-nhwc-test average-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001714
Marat Dukhanefc47b82019-11-18 09:25:38 -08001715 ADD_EXECUTABLE(channel-pad-nc-test test/channel-pad-nc.cc)
1716 SET_TARGET_PROPERTIES(channel-pad-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001717 CXX_STANDARD 11
1718 CXX_STANDARD_REQUIRED YES
1719 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001720 TARGET_INCLUDE_DIRECTORIES(channel-pad-nc-test PRIVATE src test)
1721 TARGET_LINK_LIBRARIES(channel-pad-nc-test PRIVATE XNNPACK gtest gtest_main)
1722 ADD_TEST(channel-pad-nc-test channel-pad-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001723
# Operator-level unit tests, channel-shuffle-nc through max-pooling-nhwc.
# For every listed name <op> this creates the executable <op>-test from
# test/<op>.cc, compiles it as C++11 with compiler extensions disabled, adds
# src/ and test/ to its private include path, links it against XNNPACK and
# GoogleTest, and registers it with CTest under the executable's own name.
FOREACH(XNNPACK_OPERATOR_TEST
    channel-shuffle-nc
    clamp-nc
    convolution-nhwc
    convolution-nchw
    deconvolution-nhwc
    divide-nd
    fully-connected-nc
    global-average-pooling-nwc
    global-average-pooling-ncw
    hardswish-nc
    leaky-relu-nc
    max-pooling-nhwc)
  ADD_EXECUTABLE(${XNNPACK_OPERATOR_TEST}-test test/${XNNPACK_OPERATOR_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_OPERATOR_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE XNNPACK gtest gtest_main)
  ADD_TEST(${XNNPACK_OPERATOR_TEST}-test ${XNNPACK_OPERATOR_TEST}-test)
ENDFOREACH()
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001831
# Operator-level unit test for the maximum-nd operator.
# The source file follows the test/<name>.cc convention used by every
# neighbouring stanza. It previously pointed at test/multiply-nd.cc, which
# made this target a second copy of multiply-nd-test.
# NOTE(review): assumes test/maximum-nd.cc is present in the tree - confirm.
ADD_EXECUTABLE(maximum-nd-test test/maximum-nd.cc)
SET_TARGET_PROPERTIES(maximum-nd-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
TARGET_INCLUDE_DIRECTORIES(maximum-nd-test PRIVATE src test)
TARGET_LINK_LIBRARIES(maximum-nd-test PRIVATE XNNPACK gtest gtest_main)
ADD_TEST(maximum-nd-test maximum-nd-test)
1840
# Operator-level unit test for the minimum-nd operator.
# The source file follows the test/<name>.cc convention used by every
# neighbouring stanza. It previously pointed at test/multiply-nd.cc, which
# made this target a second copy of multiply-nd-test.
# NOTE(review): assumes test/minimum-nd.cc is present in the tree - confirm.
ADD_EXECUTABLE(minimum-nd-test test/minimum-nd.cc)
SET_TARGET_PROPERTIES(minimum-nd-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
TARGET_INCLUDE_DIRECTORIES(minimum-nd-test PRIVATE src test)
TARGET_LINK_LIBRARIES(minimum-nd-test PRIVATE XNNPACK gtest gtest_main)
ADD_TEST(minimum-nd-test minimum-nd-test)
1849
# Operator-level unit tests, multiply-nd through unpooling-nhwc.
# For every listed name <op> this creates the executable <op>-test from
# test/<op>.cc, compiles it as C++11 with compiler extensions disabled, adds
# src/ and test/ to its private include path, links it against XNNPACK and
# GoogleTest, and registers it with CTest under the executable's own name.
FOREACH(XNNPACK_OPERATOR_TEST
    multiply-nd
    prelu-nc
    resize-bilinear-nhwc
    sigmoid-nc
    softmax-nc
    subtract-nd
    unpooling-nhwc)
  ADD_EXECUTABLE(${XNNPACK_OPERATOR_TEST}-test test/${XNNPACK_OPERATOR_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_OPERATOR_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_OPERATOR_TEST}-test PRIVATE XNNPACK gtest gtest_main)
  ADD_TEST(${XNNPACK_OPERATOR_TEST}-test ${XNNPACK_OPERATOR_TEST}-test)
ENDFOREACH()
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001912
1913 # ---[ Build microkernel-level unit tests
# Microkernel-level unit tests, f16-gemm-minmax through f32-vscaleexpminusmax.
# For every listed name <ukernel> this creates the executable <ukernel>-test
# from test/<ukernel>.cc, compiles it as C++11 with compiler extensions
# enabled, adds src/ and test/ to its private include path, links it against
# XNNPACK, cpuinfo, fp16 and GoogleTest, and registers it with CTest under the
# executable's own name.
FOREACH(XNNPACK_MICROKERNEL_TEST
    f16-gemm-minmax
    f32-argmaxpool
    f32-avgpool
    f32-clamp
    f32-conv-hwc
    f32-conv-hwc2spchw
    f32-dwconv-spchw
    f32-dwconv
    f32-dwconv-minmax
    f32-gavgpool-spchw
    f32-gavgpool
    f32-gemm
    f32-gemm-minmax
    f32-gemminc-minmax
    f32-hswish
    f32-ibilinear
    f32-igemm
    f32-igemm-minmax
    f32-maxpool
    f32-pavgpool
    f32-ppmm-minmax
    f32-prelu
    f32-raddexpminusmax
    f32-raddextexp
    f32-raddstoreexpminusmax
    f32-rmax
    f32-sigmoid
    f32-spmm
    f32-vadd
    f32-vaddc
    f32-vdiv
    f32-vdivc
    f32-vrdivc
    f32-vmax
    f32-vmaxc
    f32-vmin
    f32-vminc
    f32-vmul
    f32-vmulc
    f32-vmulcaddc
    f32-vscaleexpminusmax)
  ADD_EXECUTABLE(${XNNPACK_MICROKERNEL_TEST}-test test/${XNNPACK_MICROKERNEL_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_MICROKERNEL_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_MICROKERNEL_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_MICROKERNEL_TEST}-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_MICROKERNEL_TEST}-test ${XNNPACK_MICROKERNEL_TEST}-test)
ENDFOREACH()
2282
# Microkernel-level unit test for f32-vscaleextexp.
# The C++11 properties are set on this target itself. They were previously
# applied to f32-vscaleexpminusmax-test (a copy-paste slip), which left
# f32-vscaleextexp-test building with the compiler's default C++ standard.
ADD_EXECUTABLE(f32-vscaleextexp-test test/f32-vscaleextexp.cc)
SET_TARGET_PROPERTIES(f32-vscaleextexp-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(f32-vscaleextexp-test PRIVATE src test)
TARGET_LINK_LIBRARIES(f32-vscaleextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
ADD_TEST(f32-vscaleextexp-test f32-vscaleextexp-test)
2291
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002292 ADD_EXECUTABLE(f32-vsub-test test/f32-vsub.cc)
2293 SET_TARGET_PROPERTIES(f32-vsub-test PROPERTIES
2294 CXX_STANDARD 11
2295 CXX_STANDARD_REQUIRED YES
2296 CXX_EXTENSIONS YES)
2297 TARGET_INCLUDE_DIRECTORIES(f32-vsub-test PRIVATE src test)
2298 TARGET_LINK_LIBRARIES(f32-vsub-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2299 ADD_TEST(f32-vsub-test f32-vsub-test)
2300
Marat Dukhanc76065f2019-11-14 18:13:33 -08002301 ADD_EXECUTABLE(f32-vsubc-test test/f32-vsubc.cc)
2302 SET_TARGET_PROPERTIES(f32-vsubc-test PROPERTIES
2303 CXX_STANDARD 11
2304 CXX_STANDARD_REQUIRED YES
2305 CXX_EXTENSIONS YES)
2306 TARGET_INCLUDE_DIRECTORIES(f32-vsubc-test PRIVATE src test)
2307 TARGET_LINK_LIBRARIES(f32-vsubc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2308 ADD_TEST(f32-vsubc-test f32-vsubc-test)
2309
2310 ADD_EXECUTABLE(f32-vrsubc-test test/f32-vrsubc.cc)
2311 SET_TARGET_PROPERTIES(f32-vrsubc-test PROPERTIES
2312 CXX_STANDARD 11
2313 CXX_STANDARD_REQUIRED YES
2314 CXX_EXTENSIONS YES)
2315 TARGET_INCLUDE_DIRECTORIES(f32-vrsubc-test PRIVATE src test)
2316 TARGET_LINK_LIBRARIES(f32-vrsubc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2317 ADD_TEST(f32-vrsubc-test f32-vrsubc-test)
2318
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002319 ADD_EXECUTABLE(q8-avgpool-test test/q8-avgpool.cc)
2320 SET_TARGET_PROPERTIES(q8-avgpool-test PROPERTIES
2321 CXX_STANDARD 11
2322 CXX_STANDARD_REQUIRED YES
2323 CXX_EXTENSIONS YES)
2324 TARGET_INCLUDE_DIRECTORIES(q8-avgpool-test PRIVATE src test)
2325 TARGET_LINK_LIBRARIES(q8-avgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2326 ADD_TEST(q8-avgpool-test q8-avgpool-test)
2327
Marat Dukhande06f492020-04-09 00:19:31 -07002328 ADD_EXECUTABLE(q8-dwconv-minmax-test test/q8-dwconv-minmax.cc)
2329 SET_TARGET_PROPERTIES(q8-dwconv-minmax-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002330 CXX_STANDARD 11
2331 CXX_STANDARD_REQUIRED YES
2332 CXX_EXTENSIONS YES)
Marat Dukhande06f492020-04-09 00:19:31 -07002333 TARGET_INCLUDE_DIRECTORIES(q8-dwconv-minmax-test PRIVATE src test)
2334 TARGET_LINK_LIBRARIES(q8-dwconv-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2335 ADD_TEST(q8-dwconv-minmax-test q8-dwconv-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002336
# q8-gavgpool-test: gtest-based unit test compiled from test/q8-gavgpool.cc.
ADD_EXECUTABLE(q8-gavgpool-test test/q8-gavgpool.cc)
SET_TARGET_PROPERTIES(q8-gavgpool-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(q8-gavgpool-test PRIVATE src test)
TARGET_LINK_LIBRARIES(q8-gavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME q8-gavgpool-test COMMAND q8-gavgpool-test)
2345
# q8-gemm-minmax-test: gtest-based unit test compiled from
# test/q8-gemm-minmax.cc.
ADD_EXECUTABLE(q8-gemm-minmax-test test/q8-gemm-minmax.cc)
SET_TARGET_PROPERTIES(q8-gemm-minmax-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(q8-gemm-minmax-test PRIVATE src test)
TARGET_LINK_LIBRARIES(q8-gemm-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME q8-gemm-minmax-test COMMAND q8-gemm-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002354
# q8-igemm-minmax-test: gtest-based unit test compiled from
# test/q8-igemm-minmax.cc.
ADD_EXECUTABLE(q8-igemm-minmax-test test/q8-igemm-minmax.cc)
SET_TARGET_PROPERTIES(q8-igemm-minmax-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(q8-igemm-minmax-test PRIVATE src test)
TARGET_LINK_LIBRARIES(q8-igemm-minmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME q8-igemm-minmax-test COMMAND q8-igemm-minmax-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002363
# q8-vadd-test: gtest-based unit test compiled from test/q8-vadd.cc.
ADD_EXECUTABLE(q8-vadd-test test/q8-vadd.cc)
SET_TARGET_PROPERTIES(q8-vadd-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(q8-vadd-test PRIVATE src test)
TARGET_LINK_LIBRARIES(q8-vadd-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME q8-vadd-test COMMAND q8-vadd-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002372
# u8-clamp-test: gtest-based unit test compiled from test/u8-clamp.cc.
ADD_EXECUTABLE(u8-clamp-test test/u8-clamp.cc)
SET_TARGET_PROPERTIES(u8-clamp-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(u8-clamp-test PRIVATE src test)
TARGET_LINK_LIBRARIES(u8-clamp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME u8-clamp-test COMMAND u8-clamp-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002381
# u8-lut32norm-test: gtest-based unit test compiled from test/u8-lut32norm.cc.
ADD_EXECUTABLE(u8-lut32norm-test test/u8-lut32norm.cc)
SET_TARGET_PROPERTIES(u8-lut32norm-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(u8-lut32norm-test PRIVATE src test)
TARGET_LINK_LIBRARIES(u8-lut32norm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME u8-lut32norm-test COMMAND u8-lut32norm-test)
2390
# u8-maxpool-test: gtest-based unit test compiled from test/u8-maxpool.cc.
ADD_EXECUTABLE(u8-maxpool-test test/u8-maxpool.cc)
SET_TARGET_PROPERTIES(u8-maxpool-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(u8-maxpool-test PRIVATE src test)
TARGET_LINK_LIBRARIES(u8-maxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME u8-maxpool-test COMMAND u8-maxpool-test)
2399
# u8-rmax-test: gtest-based unit test compiled from test/u8-rmax.cc.
ADD_EXECUTABLE(u8-rmax-test test/u8-rmax.cc)
SET_TARGET_PROPERTIES(u8-rmax-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(u8-rmax-test PRIVATE src test)
TARGET_LINK_LIBRARIES(u8-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME u8-rmax-test COMMAND u8-rmax-test)
2408
# x32-packx-test: gtest-based unit test compiled from test/x32-packx.cc.
ADD_EXECUTABLE(x32-packx-test test/x32-packx.cc)
SET_TARGET_PROPERTIES(x32-packx-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(x32-packx-test PRIVATE src test)
TARGET_LINK_LIBRARIES(x32-packx-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME x32-packx-test COMMAND x32-packx-test)
2417
# x32-pad-test: gtest-based unit test compiled from test/x32-pad.cc.
ADD_EXECUTABLE(x32-pad-test test/x32-pad.cc)
SET_TARGET_PROPERTIES(x32-pad-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(x32-pad-test PRIVATE src test)
TARGET_LINK_LIBRARIES(x32-pad-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME x32-pad-test COMMAND x32-pad-test)
2426
# x32-unpool-test: gtest-based unit test compiled from test/x32-unpool.cc.
ADD_EXECUTABLE(x32-unpool-test test/x32-unpool.cc)
SET_TARGET_PROPERTIES(x32-unpool-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(x32-unpool-test PRIVATE src test)
TARGET_LINK_LIBRARIES(x32-unpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME x32-unpool-test COMMAND x32-unpool-test)
2435
# x32-zip-test: gtest-based unit test compiled from test/x32-zip.cc.
ADD_EXECUTABLE(x32-zip-test test/x32-zip.cc)
SET_TARGET_PROPERTIES(x32-zip-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(x32-zip-test PRIVATE src test)
TARGET_LINK_LIBRARIES(x32-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME x32-zip-test COMMAND x32-zip-test)
2444
# x8-lut-test: gtest-based unit test compiled from test/x8-lut.cc.
ADD_EXECUTABLE(x8-lut-test test/x8-lut.cc)
SET_TARGET_PROPERTIES(x8-lut-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(x8-lut-test PRIVATE src test)
TARGET_LINK_LIBRARIES(x8-lut-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME x8-lut-test COMMAND x8-lut-test)
2453
# x8-zip-test: gtest-based unit test compiled from test/x8-zip.cc.
ADD_EXECUTABLE(x8-zip-test test/x8-zip.cc)
SET_TARGET_PROPERTIES(x8-zip-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(x8-zip-test PRIVATE src test)
TARGET_LINK_LIBRARIES(x8-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME x8-zip-test COMMAND x8-zip-test)
Marat Dukhanfe7acb62020-03-09 19:30:05 -07002462
# requantization-test: gtest-based unit test compiled from
# test/requantization.cc.
ADD_EXECUTABLE(requantization-test test/requantization.cc)
SET_TARGET_PROPERTIES(requantization-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(requantization-test PRIVATE src test)
TARGET_LINK_LIBRARIES(requantization-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# NAME/COMMAND signature: CTest runs the built target by its real output path
# (and through a cross-compiling emulator, if one is configured) instead of
# searching for a bare command name.
ADD_TEST(NAME requantization-test COMMAND requantization-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002471ENDIF()
2472
2473# ---[ XNNPACK microbenchmarks
2474IF(XNNPACK_BUILD_BENCHMARKS)
2475 # ---[ Build google benchmark
# Add Google Benchmark as a subproject unless a `benchmark` target has already
# been defined (e.g. by an enclosing build).
IF(NOT TARGET benchmark)
  # Seed the cache before the subproject is configured; without FORCE this does
  # not override a value already present in the cache.
  # NOTE(review): presumably turns off Google Benchmark's own test suite.
  SET(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
  # Sources come from GOOGLEBENCHMARK_SOURCE_DIR; build output goes under the
  # shared dependencies binary directory.
  ADD_SUBDIRECTORY("${GOOGLEBENCHMARK_SOURCE_DIR}" "${CONFU_DEPENDENCIES_BINARY_DIR}/googlebenchmark")
ENDIF()
2482
# bench-utils: helper library compiled from bench/utils.cc that the benchmark
# executables link against.
# Declared STATIC explicitly (matching bench-models) so that configuring with
# BUILD_SHARED_LIBS=ON does not turn this internal helper into a shared library.
ADD_LIBRARY(bench-utils STATIC bench/utils.cc)
SET_TARGET_PROPERTIES(bench-utils PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(bench-utils PRIVATE benchmark cpuinfo)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002490
Marat Dukhancb10f262019-11-16 15:52:37 -08002491 # ---[ Build accuracy microbenchmarks
# f32-exp-eval: accuracy microbenchmark compiled from eval/f32-exp.cc.
ADD_EXECUTABLE(f32-exp-eval eval/f32-exp.cc)
TARGET_LINK_LIBRARIES(f32-exp-eval PRIVATE XNNPACK benchmark fp16)
TARGET_INCLUDE_DIRECTORIES(f32-exp-eval PRIVATE src)
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(f32-exp-eval PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2499
# f32-expminus-eval: accuracy microbenchmark compiled from eval/f32-expminus.cc.
ADD_EXECUTABLE(f32-expminus-eval eval/f32-expminus.cc)
TARGET_LINK_LIBRARIES(f32-expminus-eval PRIVATE XNNPACK benchmark fp16)
TARGET_INCLUDE_DIRECTORIES(f32-expminus-eval PRIVATE src)
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(f32-expminus-eval PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2507
# f32-extexp-eval: accuracy microbenchmark compiled from eval/f32-extexp.cc.
ADD_EXECUTABLE(f32-extexp-eval eval/f32-extexp.cc)
TARGET_LINK_LIBRARIES(f32-extexp-eval PRIVATE XNNPACK benchmark fp16)
TARGET_INCLUDE_DIRECTORIES(f32-extexp-eval PRIVATE src)
# C++11 is mandatory; compiler extensions are enabled for this target.
# NOTE(review): the other *-eval targets set CXX_EXTENSIONS NO - confirm that
# YES is intentional here.
SET_TARGET_PROPERTIES(f32-extexp-eval PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2515
# f32-sigmoid-eval: accuracy microbenchmark compiled from eval/f32-sigmoid.cc.
ADD_EXECUTABLE(f32-sigmoid-eval eval/f32-sigmoid.cc)
TARGET_LINK_LIBRARIES(f32-sigmoid-eval PRIVATE XNNPACK benchmark fp16)
TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-eval PRIVATE src)
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(f32-sigmoid-eval PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2523
Marat Dukhan5f18d262019-10-31 10:24:14 -07002524 # ---[ Build end-to-end microbenchmarks
# bench-models: static library built from the model sources under models/
# (mobilenet-v1, -v2, -v3-large, -v3-small); the end-to-end benchmarks link it.
ADD_LIBRARY(bench-models STATIC
  models/mobilenet-v1.cc
  models/mobilenet-v2.cc
  models/mobilenet-v3-large.cc
  models/mobilenet-v3-small.cc)
TARGET_LINK_LIBRARIES(bench-models PRIVATE XNNPACK benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(bench-models PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(bench-models PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2536
# end2end-bench: end-to-end microbenchmark compiled from bench/end2end.cc.
ADD_EXECUTABLE(end2end-bench bench/end2end.cc)
TARGET_LINK_LIBRARIES(end2end-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(end2end-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(end2end-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002544
# f32-dwconv-e2e-bench: end-to-end microbenchmark compiled from
# bench/f32-dwconv-e2e.cc.
ADD_EXECUTABLE(f32-dwconv-e2e-bench bench/f32-dwconv-e2e.cc)
TARGET_LINK_LIBRARIES(f32-dwconv-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
# Includes resolve against this CMakeLists.txt's directory first, then src.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-e2e-bench PRIVATE
  "${CMAKE_CURRENT_SOURCE_DIR}"
  src)
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(f32-dwconv-e2e-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhanef4416e2019-10-31 13:44:40 -07002552
# f32-gemm-e2e-bench: end-to-end microbenchmark compiled from
# bench/f32-gemm-e2e.cc.
ADD_EXECUTABLE(f32-gemm-e2e-bench bench/f32-gemm-e2e.cc)
TARGET_LINK_LIBRARIES(f32-gemm-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
# Includes resolve against this CMakeLists.txt's directory first, then src.
TARGET_INCLUDE_DIRECTORIES(f32-gemm-e2e-bench PRIVATE
  "${CMAKE_CURRENT_SOURCE_DIR}"
  src)
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(f32-gemm-e2e-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhan5f18d262019-10-31 10:24:14 -07002560
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002561 # ---[ Build operator-level microbenchmarks
# add-bench: operator-level microbenchmark compiled from bench/add.cc.
ADD_EXECUTABLE(add-bench bench/add.cc)
TARGET_LINK_LIBRARIES(add-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(add-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(add-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2569
# average-pooling-bench: operator-level microbenchmark compiled from
# bench/average-pooling.cc.
ADD_EXECUTABLE(average-pooling-bench bench/average-pooling.cc)
TARGET_LINK_LIBRARIES(average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(average-pooling-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2577
# channel-shuffle-bench: operator-level microbenchmark compiled from
# bench/channel-shuffle.cc.
ADD_EXECUTABLE(channel-shuffle-bench bench/channel-shuffle.cc)
TARGET_LINK_LIBRARIES(channel-shuffle-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(channel-shuffle-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(channel-shuffle-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2585
# convolution-bench: operator-level microbenchmark compiled from
# bench/convolution.cc.
ADD_EXECUTABLE(convolution-bench bench/convolution.cc)
TARGET_LINK_LIBRARIES(convolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(convolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(convolution-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2593
# deconvolution-bench: operator-level microbenchmark compiled from
# bench/deconvolution.cc.
ADD_EXECUTABLE(deconvolution-bench bench/deconvolution.cc)
TARGET_LINK_LIBRARIES(deconvolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(deconvolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(deconvolution-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2601
# global-average-pooling-bench: operator-level microbenchmark compiled from
# bench/global-average-pooling.cc.
ADD_EXECUTABLE(global-average-pooling-bench bench/global-average-pooling.cc)
TARGET_LINK_LIBRARIES(global-average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(global-average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(global-average-pooling-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2609
# max-pooling-bench: operator-level microbenchmark compiled from
# bench/max-pooling.cc.
ADD_EXECUTABLE(max-pooling-bench bench/max-pooling.cc)
TARGET_LINK_LIBRARIES(max-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(max-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(max-pooling-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2617
# prelu-bench: operator-level microbenchmark compiled from bench/prelu.cc.
ADD_EXECUTABLE(prelu-bench bench/prelu.cc)
TARGET_LINK_LIBRARIES(prelu-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(prelu-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(prelu-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2625
# sigmoid-bench: operator-level microbenchmark compiled from bench/sigmoid.cc.
ADD_EXECUTABLE(sigmoid-bench bench/sigmoid.cc)
TARGET_LINK_LIBRARIES(sigmoid-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(sigmoid-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(sigmoid-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
2633
# softmax-bench: operator-level microbenchmark compiled from bench/softmax.cc.
ADD_EXECUTABLE(softmax-bench bench/softmax.cc)
TARGET_LINK_LIBRARIES(softmax-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# Headers are resolved relative to this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(softmax-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory and compiler extensions are switched off.
SET_TARGET_PROPERTIES(softmax-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002641
2642 # ---[ Build microkernel-level microbenchmarks
# f16-gemm-bench: microkernel-level microbenchmark compiled from
# bench/f16-gemm.cc.
ADD_EXECUTABLE(f16-gemm-bench bench/f16-gemm.cc)
TARGET_LINK_LIBRARIES(f16-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f16-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f16-gemm-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2651
# f32-conv-hwc-bench: microkernel-level microbenchmark compiled from
# bench/f32-conv-hwc.cc.
ADD_EXECUTABLE(f32-conv-hwc-bench bench/f32-conv-hwc.cc)
TARGET_LINK_LIBRARIES(f32-conv-hwc-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-conv-hwc-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2660
# f32-dwconv-spchw-bench: microkernel-level microbenchmark compiled from
# bench/f32-dwconv-spchw.cc.
ADD_EXECUTABLE(f32-dwconv-spchw-bench bench/f32-dwconv-spchw.cc)
TARGET_LINK_LIBRARIES(f32-dwconv-spchw-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-dwconv-spchw-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2669
# f32-dwconv-bench: microkernel-level microbenchmark compiled from
# bench/f32-dwconv.cc.
ADD_EXECUTABLE(f32-dwconv-bench bench/f32-dwconv.cc)
TARGET_LINK_LIBRARIES(f32-dwconv-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-dwconv-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2678
# f32-gemm-bench: microkernel-level microbenchmark compiled from
# bench/f32-gemm.cc.
ADD_EXECUTABLE(f32-gemm-bench bench/f32-gemm.cc)
TARGET_LINK_LIBRARIES(f32-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-gemm-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2687
# f32-igemm-bench: microkernel-level microbenchmark compiled from
# bench/f32-igemm.cc.
ADD_EXECUTABLE(f32-igemm-bench bench/f32-igemm.cc)
TARGET_LINK_LIBRARIES(f32-igemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-igemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-igemm-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2696
# f32-im2col-gemm-bench: microkernel-level microbenchmark compiled from
# bench/f32-im2col-gemm.cc together with the C source src/im2col.c.
ADD_EXECUTABLE(f32-im2col-gemm-bench
  bench/f32-im2col-gemm.cc
  src/im2col.c)
TARGET_LINK_LIBRARIES(f32-im2col-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-im2col-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# The C source is built as C99 without extensions; the C++ source as C++11
# with extensions enabled. Both standards are mandatory.
SET_TARGET_PROPERTIES(f32-im2col-gemm-bench PROPERTIES
  C_STANDARD 99 C_STANDARD_REQUIRED YES C_EXTENSIONS NO
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2708
# f32-rmax-bench: microkernel-level microbenchmark compiled from
# bench/f32-rmax.cc.
ADD_EXECUTABLE(f32-rmax-bench bench/f32-rmax.cc)
TARGET_LINK_LIBRARIES(f32-rmax-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-rmax-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-rmax-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2717
# f32-sigmoid-bench: microkernel-level microbenchmark compiled from
# bench/f32-sigmoid.cc.
ADD_EXECUTABLE(f32-sigmoid-bench bench/f32-sigmoid.cc)
# NOTE(review): neighboring microkernel benchmarks also link cpuinfo and fp16;
# confirm this source needs neither.
TARGET_LINK_LIBRARIES(f32-sigmoid-bench PRIVATE XNNPACK benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-sigmoid-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2726
# f32-spmm-bench: microkernel-level microbenchmark compiled from
# bench/f32-spmm.cc.
ADD_EXECUTABLE(f32-spmm-bench bench/f32-spmm.cc)
TARGET_LINK_LIBRARIES(f32-spmm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-spmm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-spmm-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
2735
# f32-softmax-bench: microkernel-level microbenchmark compiled from
# bench/f32-softmax.cc.
ADD_EXECUTABLE(f32-softmax-bench bench/f32-softmax.cc)
# NOTE(review): neighboring microkernel benchmarks also link cpuinfo; confirm
# this source does not need it.
TARGET_LINK_LIBRARIES(f32-softmax-bench PRIVATE XNNPACK fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(f32-softmax-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(f32-softmax-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07002744
# q8-gemm-bench: microkernel-level microbenchmark compiled from
# bench/q8-gemm.cc.
ADD_EXECUTABLE(q8-gemm-bench bench/q8-gemm.cc)
TARGET_LINK_LIBRARIES(q8-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(q8-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(q8-gemm-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
Marat Dukhanfe7acb62020-03-09 19:30:05 -07002753
# requantization-bench: microkernel-level microbenchmark compiled from
# bench/requantization.cc.
ADD_EXECUTABLE(requantization-bench bench/requantization.cc)
TARGET_LINK_LIBRARIES(requantization-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# Includes resolve against src first, then this CMakeLists.txt's directory.
TARGET_INCLUDE_DIRECTORIES(requantization-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler extensions stay enabled.
SET_TARGET_PROPERTIES(requantization-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002762ENDIF()