# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.

CMAKE_MINIMUM_REQUIRED(VERSION 3.5 FATAL_ERROR)

# Standard install-directory variables (CMAKE_INSTALL_LIBDIR and friends).
INCLUDE(GNUInstallDirs)

# ---[ Project and semantic versioning.
# C, C++ and assembly are all enabled for this project.
PROJECT(XNNPACK C CXX ASM)

# ---[ Options.
# XNNPACK_LIBRARY_TYPE is a free-form cache string; the STRINGS property only
# offers the three choices in cmake-gui/ccmake, it does not validate the value.
SET(XNNPACK_LIBRARY_TYPE "default" CACHE STRING "Type of library (shared, static, or default) to build")
SET_PROPERTY(CACHE XNNPACK_LIBRARY_TYPE PROPERTY STRINGS default static shared)
OPTION(XNNPACK_BUILD_TESTS "Build XNNPACK unit tests" ON)
OPTION(XNNPACK_BUILD_BENCHMARKS "Build XNNPACK benchmarks" ON)

# ---[ CMake options
# CTest support is only switched on when the unit tests are being built.
IF(XNNPACK_BUILD_TESTS)
  ENABLE_TESTING()
ENDIF()

# ---[ Build flags
# Reject unsupported target processors at configure time.
# When CMAKE_SYSTEM_PROCESSOR is empty, the only accepted case is an iOS build
# (IOS set) with exactly one recognised architecture in IOS_ARCH.
IF(NOT CMAKE_SYSTEM_PROCESSOR)
  IF(IOS)
    LIST(LENGTH IOS_ARCH IOS_ARCH_COUNT)
    IF(IOS_ARCH_COUNT GREATER 1)
      MESSAGE(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
        "Specify a single architecture in IOS_ARCH and re-configure. ")
    ENDIF()
    IF(NOT IOS_ARCH MATCHES "^(i386|x86_64|armv7.*|arm64.*)$")
      MESSAGE(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
    ENDIF()
  ELSE()
    MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
  ENDIF()
ELSEIF(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|armv[5-8].*|aarch64)$")
  MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
ENDIF()

# Reject unsupported target operating systems: only Darwin, Linux and Android
# are accepted.
IF(NOT CMAKE_SYSTEM_NAME)
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
ELSEIF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android)$")
  MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
ENDIF()

# ---[ Download deps
# XNNPACK_DOWNLOAD_DEPENDENCY(<source-dir-var> <display-name> <dir-prefix> <script>)
#
# Fetches one third-party dependency at configure time, unless <source-dir-var>
# is already defined (as a normal or cache variable), in which case nothing
# happens.
#
#   <source-dir-var>  name of the variable that receives the source directory
#   <display-name>    human-readable name used in messages and the cache docstring
#   <dir-prefix>      the helper project lives in
#                     ${CMAKE_BINARY_DIR}/<dir-prefix>-download and
#                     <source-dir-var> is cached as
#                     ${CMAKE_BINARY_DIR}/<dir-prefix>-source
#   <script>          file under cmake/ that is configured into the helper
#                     project's CMakeLists.txt
#
# The helper project is generated with the current generator and then built.
# A non-zero exit status from either step is a fatal error, so a failed
# download is reported here and <source-dir-var> is not cached; the next
# configure run will retry.
# NOTE(review): the cmake/Download*.cmake scripts are not visible here; they
# are assumed to place the sources in <dir-prefix>-source -- confirm.
FUNCTION(XNNPACK_DOWNLOAD_DEPENDENCY XNNPACK_DEP_VAR XNNPACK_DEP_NAME XNNPACK_DEP_PREFIX XNNPACK_DEP_SCRIPT)
  IF(DEFINED ${XNNPACK_DEP_VAR})
    RETURN()
  ENDIF()

  SET(XNNPACK_DEP_DOWNLOAD_DIR "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-download")
  SET(XNNPACK_DEP_SOURCE_DIR "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-source")

  MESSAGE(STATUS "Downloading ${XNNPACK_DEP_NAME} to ${XNNPACK_DEP_SOURCE_DIR} (define ${XNNPACK_DEP_VAR} to avoid it)")
  CONFIGURE_FILE("cmake/${XNNPACK_DEP_SCRIPT}" "${XNNPACK_DEP_DOWNLOAD_DIR}/CMakeLists.txt")

  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE XNNPACK_DEP_RESULT
    WORKING_DIRECTORY "${XNNPACK_DEP_DOWNLOAD_DIR}")
  IF(NOT "${XNNPACK_DEP_RESULT}" STREQUAL "0")
    MESSAGE(FATAL_ERROR "Failed to configure the ${XNNPACK_DEP_NAME} download project in ${XNNPACK_DEP_DOWNLOAD_DIR}: ${XNNPACK_DEP_RESULT}")
  ENDIF()

  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE XNNPACK_DEP_RESULT
    WORKING_DIRECTORY "${XNNPACK_DEP_DOWNLOAD_DIR}")
  IF(NOT "${XNNPACK_DEP_RESULT}" STREQUAL "0")
    MESSAGE(FATAL_ERROR "Failed to download ${XNNPACK_DEP_NAME} via ${XNNPACK_DEP_DOWNLOAD_DIR}: ${XNNPACK_DEP_RESULT}")
  ENDIF()

  # Cached only after a successful download, so later configure runs skip it.
  SET(${XNNPACK_DEP_VAR} "${XNNPACK_DEP_SOURCE_DIR}" CACHE STRING "${XNNPACK_DEP_NAME} source directory")
ENDFUNCTION()

XNNPACK_DOWNLOAD_DEPENDENCY(CLOG_SOURCE_DIR "clog" clog DownloadCLog.cmake)
XNNPACK_DOWNLOAD_DEPENDENCY(CPUINFO_SOURCE_DIR "cpuinfo" cpuinfo DownloadCpuinfo.cmake)
XNNPACK_DOWNLOAD_DEPENDENCY(FP16_SOURCE_DIR "FP16" FP16 DownloadFP16.cmake)
XNNPACK_DOWNLOAD_DEPENDENCY(FXDIV_SOURCE_DIR "FXdiv" FXdiv DownloadFXdiv.cmake)
XNNPACK_DOWNLOAD_DEPENDENCY(PSIMD_SOURCE_DIR "PSimd" psimd DownloadPSimd.cmake)
XNNPACK_DOWNLOAD_DEPENDENCY(PTHREADPOOL_SOURCE_DIR "pthreadpool" pthreadpool DownloadPThreadPool.cmake)

# Google Test is only needed when the unit tests are built.
IF(XNNPACK_BUILD_TESTS)
  XNNPACK_DOWNLOAD_DEPENDENCY(GOOGLETEST_SOURCE_DIR "Google Test" googletest DownloadGoogleTest.cmake)
ENDIF()

# Google Benchmark is only needed when the benchmarks are built.
IF(XNNPACK_BUILD_BENCHMARKS)
  XNNPACK_DOWNLOAD_DEPENDENCY(GOOGLEBENCHMARK_SOURCE_DIR "Google Benchmark" googlebenchmark DownloadGoogleBenchmark.cmake)
ENDIF()

# ---[ XNNPACK library
# Operator implementation sources, one file per operator
# (paths are relative to this directory).
SET(XNNPACK_OPERATOR_SRCS
  src/add-nc.c
  src/argmax-pooling-nhwc.c
  src/average-pooling-nhwc.c
  src/binary-elementwise-nd.c
  src/channel-pad-nc.c
  src/channel-shuffle-nc.c
  src/clamp-nc.c
  src/convolution-nchw.c
  src/convolution-nhwc.c
  src/deconvolution-nhwc.c
  src/fully-connected-nc.c
  src/global-average-pooling-ncw.c
  src/global-average-pooling-nwc.c
  src/hardswish-nc.c
  src/leaky-relu-nc.c
  src/max-pooling-nhwc.c
  src/prelu-nc.c
  src/resize-bilinear-nhwc.c
  src/sigmoid-nc.c
  src/softargmax-nc.c
  src/unpooling-nhwc.c)

# "Cold" sources: every operator source plus initialization, memory and
# operator-deletion code.
SET(XNNPACK_COLD_SRCS ${XNNPACK_OPERATOR_SRCS})
LIST(APPEND XNNPACK_COLD_SRCS
  src/init.c
  src/memory.c
  src/operator-delete.c)

# "Hot" sources: indirection-buffer setup and operator execution.
SET(XNNPACK_HOT_SRCS
  src/indirection.c
  src/operator-run.c)

# Scalar micro-kernel sources (file names carry a "scalar" tag).
SET(XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-scalar-c1.c
  src/f32-argmaxpool/9p8x-scalar-c1.c
  src/f32-argmaxpool/9x-scalar-c1.c
  src/f32-avgpool/mp9p8q-scalar.c
  src/f32-avgpool/up9-scalar.c
  src/f32-bilinear/gen/scalar-c1.c
  src/f32-bilinear/gen/scalar-c2.c
  src/f32-bilinear/gen/scalar-c4.c
  src/f32-clamp/scalar.c
  src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c
  src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-dwconv-spchw/5x5p2-scalar.c
  src/f32-dwconv-spchw/5x5s2p2-scalar.c
  src/f32-dwconv/gen/up1x25-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-scalar.c
  src/f32-dwconv/gen/up1x4-scalar-acc2.c
  src/f32-dwconv/gen/up1x4-scalar.c
  src/f32-dwconv/gen/up1x9-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-scalar.c
  src/f32-dwconv/gen/up2x25-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-scalar.c
  src/f32-dwconv/gen/up2x4-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-scalar.c
  src/f32-dwconv/gen/up2x9-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-scalar.c
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/mp7p7q-scalar.c
  src/f32-gavgpool/up7-scalar.c
  src/f32-gemm/gen/1x4-scalar.c
  src/f32-gemm/gen/2x4-scalar.c
  src/f32-gemm/gen/4x2-scalar.c
  src/f32-gemm/gen/4x4-scalar.c
  src/f32-gemm/gen-inc/1x4-scalar.c
  src/f32-gemm/gen-inc/2x4-scalar.c
  src/f32-gemm/gen-inc/4x4-scalar.c
  src/f32-hswish/gen/scalar-x1.c
  src/f32-hswish/gen/scalar-x2.c
  src/f32-hswish/gen/scalar-x4.c
  src/f32-igemm/gen/1x4-scalar.c
  src/f32-igemm/gen/2x4-scalar.c
  src/f32-igemm/gen/4x2-scalar.c
  src/f32-igemm/gen/4x4-scalar.c
  src/f32-maxpool/9p8x-scalar-c1.c
  src/f32-pavgpool/mp9p8q-scalar.c
  src/f32-pavgpool/up9-scalar.c
  src/f32-ppmm/gen/2x4-scalar.c
  src/f32-ppmm/gen/3x3-scalar.c
  src/f32-ppmm/gen/4x2-scalar.c
  src/f32-ppmm/gen/4x4-scalar.c
  src/f32-prelu/gen/scalar-2x1.c
  src/f32-prelu/gen/scalar-2x4.c
  src/f32-rmax/scalar.c
  src/f32-spmm/gen/1x1-scalar-pipelined.c
  src/f32-spmm/gen/1x1-scalar.c
  src/f32-spmm/gen/2x1-scalar-pipelined.c
  src/f32-spmm/gen/2x1-scalar.c
  src/f32-spmm/gen/4x1-scalar-pipelined.c
  src/f32-spmm/gen/4x1-scalar.c
  src/f32-spmm/gen/8x1-scalar-pipelined.c
  src/f32-spmm/gen/8x1-scalar.c
  src/f32-spmm/gen/8x2-scalar.c
  src/f32-spmm/gen/8x4-scalar.c
  src/f32-vbinary/gen/vadd-scalar-x1.c
  src/f32-vbinary/gen/vadd-scalar-x2.c
  src/f32-vbinary/gen/vadd-scalar-x4.c
  src/f32-vbinary/gen/vaddc-scalar-x1.c
  src/f32-vbinary/gen/vaddc-scalar-x2.c
  src/f32-vbinary/gen/vaddc-scalar-x4.c
  src/f32-vbinary/gen/vdiv-scalar-x1.c
  src/f32-vbinary/gen/vdiv-scalar-x2.c
  src/f32-vbinary/gen/vdiv-scalar-x4.c
  src/f32-vbinary/gen/vdivc-scalar-x1.c
  src/f32-vbinary/gen/vdivc-scalar-x2.c
  src/f32-vbinary/gen/vdivc-scalar-x4.c
  src/f32-vbinary/gen/vmax-scalar-x1.c
  src/f32-vbinary/gen/vmax-scalar-x2.c
  src/f32-vbinary/gen/vmax-scalar-x4.c
  src/f32-vbinary/gen/vmaxc-scalar-x1.c
  src/f32-vbinary/gen/vmaxc-scalar-x2.c
  src/f32-vbinary/gen/vmaxc-scalar-x4.c
  src/f32-vbinary/gen/vmin-scalar-x1.c
  src/f32-vbinary/gen/vmin-scalar-x2.c
  src/f32-vbinary/gen/vmin-scalar-x4.c
  src/f32-vbinary/gen/vminc-scalar-x1.c
  src/f32-vbinary/gen/vminc-scalar-x2.c
  src/f32-vbinary/gen/vminc-scalar-x4.c
  src/f32-vbinary/gen/vmul-scalar-x1.c
  src/f32-vbinary/gen/vmul-scalar-x2.c
  src/f32-vbinary/gen/vmul-scalar-x4.c
  src/f32-vbinary/gen/vmulc-scalar-x1.c
  src/f32-vbinary/gen/vmulc-scalar-x2.c
  src/f32-vbinary/gen/vmulc-scalar-x4.c
  src/f32-vbinary/gen/vrdivc-scalar-x1.c
  src/f32-vbinary/gen/vrdivc-scalar-x2.c
  src/f32-vbinary/gen/vrdivc-scalar-x4.c
  src/f32-vbinary/gen/vrsubc-scalar-x1.c
  src/f32-vbinary/gen/vrsubc-scalar-x2.c
  src/f32-vbinary/gen/vrsubc-scalar-x4.c
  src/f32-vbinary/gen/vsub-scalar-x1.c
  src/f32-vbinary/gen/vsub-scalar-x2.c
  src/f32-vbinary/gen/vsub-scalar-x4.c
  src/f32-vbinary/gen/vsubc-scalar-x1.c
  src/f32-vbinary/gen/vsubc-scalar-x2.c
  src/f32-vbinary/gen/vsubc-scalar-x4.c
  src/f32-vmulcaddc/gen/c1-scalar-2x.c
  src/f32-vmulcaddc/gen/c2-scalar-2x.c
  src/f32-vmulcaddc/gen/c4-scalar-2x.c
  src/q8-avgpool/mp9p8q-scalar.c
  src/q8-avgpool/up9-scalar.c
  src/q8-dwconv/up1x9-scalar.c
  src/q8-gavgpool/mp7p7q-scalar.c
  src/q8-gavgpool/up7-scalar.c
  src/q8-gemm/2x2-scalar.c
  src/q8-igemm/2x2-scalar.c
  src/q8-vadd/scalar.c
  src/u8-clamp/scalar.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8x-scalar-c1.c
  src/u8-rmax/scalar.c
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c)

# PSIMD micro-kernel sources (file names carry a "psimd" tag).
SET(XNNPACK_PSIMD_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-psimd-c4.c
  src/f32-argmaxpool/9p8x-psimd-c4.c
  src/f32-argmaxpool/9x-psimd-c4.c
  src/f32-avgpool/mp9p8q-psimd.c
  src/f32-avgpool/up9-psimd.c
  src/f32-bilinear/gen/psimd-c4.c
  src/f32-bilinear/gen/psimd-c8.c
  src/f32-clamp/psimd.c
  src/f32-dwconv/gen/up4x25-psimd-acc2.c
  src/f32-dwconv/gen/up4x25-psimd.c
  src/f32-dwconv/gen/up4x4-psimd-acc2.c
  src/f32-dwconv/gen/up4x4-psimd.c
  src/f32-dwconv/gen/up4x9-psimd-acc2.c
  src/f32-dwconv/gen/up4x9-psimd.c
  src/f32-dwconv/gen/up8x25-psimd-acc2.c
  src/f32-dwconv/gen/up8x25-psimd.c
  src/f32-dwconv/gen/up8x4-psimd-acc2.c
  src/f32-dwconv/gen/up8x4-psimd.c
  src/f32-dwconv/gen/up8x9-psimd-acc2.c
  src/f32-dwconv/gen/up8x9-psimd.c
  src/f32-gavgpool/mp7p7q-psimd.c
  src/f32-gavgpool/up7-psimd.c
  src/f32-gemm/gen/1x8-psimd-loadsplat.c
  src/f32-gemm/gen/1x8-psimd-splat.c
  src/f32-gemm/gen/1x8s4-psimd.c
  src/f32-gemm/gen/4x8-psimd-loadsplat.c
  src/f32-gemm/gen/4x8-psimd-splat.c
  src/f32-gemm/gen/4x8s4-psimd.c
  src/f32-gemm/gen/6x8-psimd-loadsplat.c
  src/f32-gemm/gen/6x8-psimd-splat.c
  src/f32-gemm/gen/6x8s4-psimd.c
  src/f32-gemm/gen-inc/1x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/1x8-psimd-splat.c
  src/f32-gemm/gen-inc/1x8s4-psimd.c
  src/f32-gemm/gen-inc/4x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/4x8-psimd-splat.c
  src/f32-gemm/gen-inc/4x8s4-psimd.c
  src/f32-gemm/gen-inc/6x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/6x8-psimd-splat.c
  src/f32-gemm/gen-inc/6x8s4-psimd.c
  src/f32-hswish/gen/psimd-x4.c
  src/f32-hswish/gen/psimd-x8.c
  src/f32-igemm/gen/1x8-psimd-loadsplat.c
  src/f32-igemm/gen/1x8-psimd-splat.c
  src/f32-igemm/gen/1x8s4-psimd.c
  src/f32-igemm/gen/4x2c4-psimd.c
  src/f32-igemm/gen/4x8-psimd-loadsplat.c
  src/f32-igemm/gen/4x8-psimd-splat.c
  src/f32-igemm/gen/4x8s4-psimd.c
  src/f32-igemm/gen/6x8-psimd-loadsplat.c
  src/f32-igemm/gen/6x8-psimd-splat.c
  src/f32-igemm/gen/6x8s4-psimd.c
  src/f32-maxpool/9p8x-psimd-c4.c
  src/f32-pavgpool/mp9p8q-psimd.c
  src/f32-pavgpool/up9-psimd.c
  src/f32-ppmm/gen/4x8-psimd.c
  src/f32-prelu/gen/psimd-2x4.c
  src/f32-prelu/gen/psimd-2x8.c
  src/f32-vbinary/gen/vadd-psimd-x4.c
  src/f32-vbinary/gen/vadd-psimd-x8.c
  src/f32-vbinary/gen/vaddc-psimd-x4.c
  src/f32-vbinary/gen/vaddc-psimd-x8.c
  src/f32-vbinary/gen/vdiv-psimd-x4.c
  src/f32-vbinary/gen/vdiv-psimd-x8.c
  src/f32-vbinary/gen/vdivc-psimd-x4.c
  src/f32-vbinary/gen/vdivc-psimd-x8.c
  src/f32-vbinary/gen/vmax-psimd-x4.c
  src/f32-vbinary/gen/vmax-psimd-x8.c
  src/f32-vbinary/gen/vmaxc-psimd-x4.c
  src/f32-vbinary/gen/vmaxc-psimd-x8.c
  src/f32-vbinary/gen/vmin-psimd-x4.c
  src/f32-vbinary/gen/vmin-psimd-x8.c
  src/f32-vbinary/gen/vminc-psimd-x4.c
  src/f32-vbinary/gen/vminc-psimd-x8.c
  src/f32-vbinary/gen/vmul-psimd-x4.c
  src/f32-vbinary/gen/vmul-psimd-x8.c
  src/f32-vbinary/gen/vmulc-psimd-x4.c
  src/f32-vbinary/gen/vmulc-psimd-x8.c
  src/f32-vbinary/gen/vrdivc-psimd-x4.c
  src/f32-vbinary/gen/vrdivc-psimd-x8.c
  src/f32-vbinary/gen/vrsubc-psimd-x4.c
  src/f32-vbinary/gen/vrsubc-psimd-x8.c
  src/f32-vbinary/gen/vsub-psimd-x4.c
  src/f32-vbinary/gen/vsub-psimd-x8.c
  src/f32-vbinary/gen/vsubc-psimd-x4.c
  src/f32-vbinary/gen/vsubc-psimd-x8.c
  src/f32-vmulcaddc/gen/c4-psimd-2x.c
  src/f32-vmulcaddc/gen/c8-psimd-2x.c
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c)

# NEON micro-kernel sources (file names carry a "neon" tag).
SET(XNNPACK_NEON_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-neon.c
  src/f32-avgpool/up9-neon.c
  src/f32-bilinear/gen/neon-c4.c
  src/f32-bilinear/gen/neon-c8.c
  src/f32-clamp/neon.c
  src/f32-dwconv/gen/up4x9-neon.c
  src/f32-dwconv/gen/up4x9-neon-acc2.c
  src/f32-dwconv/gen/up8x9-neon.c
  src/f32-dwconv/gen/up8x9-neon-acc2.c
  src/f32-gavgpool-spchw/neon-x4.c
  src/f32-gavgpool/mp7p7q-neon.c
  src/f32-gavgpool/up7-neon.c
  src/f32-gemm/gen/1x8-neon-lane-ld64.c
  src/f32-gemm/gen/4x2-neon-lane-ld64.c
  src/f32-gemm/gen/4x8-neon-lane-ld128.c
  src/f32-gemm/gen/4x8-neon-lane-ld64.c
  src/f32-gemm/gen/5x8-neon-lane-ld64.c
  src/f32-gemm/gen/6x8-neon-lane-ld64.c
  src/f32-gemm/gen/6x8-neon-lane-ld128.c
  src/f32-gemm/gen/1x8-neon-dup-ld64.c
  src/f32-gemm/gen/4x8-neon-dup-ld128.c
  src/f32-gemm/gen/4x8-neon-dup-ld64.c
  src/f32-gemm/gen/6x8-neon-dup-ld64.c
  src/f32-gemm/gen/6x8-neon-dup-ld128.c
  src/f32-gemm/gen/1x8s4-neon.c
  src/f32-gemm/gen/4x8s4-neon.c
  src/f32-gemm/gen/6x8s4-neon.c
  src/f32-gemm/gen/8x8s4-neon.c
  src/f32-gemm/gen-inc/1x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/4x8-neon-lane-ld128.c
  src/f32-gemm/gen-inc/4x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/5x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-lane-ld128.c
  src/f32-gemm/gen-inc/1x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/4x8-neon-dup-ld128.c
  src/f32-gemm/gen-inc/4x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4-neon.c
  src/f32-gemm/gen-inc/4x8s4-neon.c
  src/f32-gemm/gen-inc/6x8s4-neon.c
  src/f32-gemm/gen-inc/8x8s4-neon.c
  src/f32-hswish/gen/neon-x4.c
  src/f32-hswish/gen/neon-x8.c
  src/f32-igemm/gen/1x8-neon-lane-ld64.c
  src/f32-igemm/gen/4x2-neon-lane-ld64.c
  src/f32-igemm/gen/4x4-neon-lane-ld64.c
  src/f32-igemm/gen/4x8-neon-lane-ld128.c
  src/f32-igemm/gen/4x8-neon-lane-ld64.c
  src/f32-igemm/gen/6x8-neon-lane-ld64.c
  src/f32-igemm/gen/6x8-neon-lane-ld128.c
  src/f32-igemm/gen/1x8-neon-dup-ld64.c
  src/f32-igemm/gen/4x8-neon-dup-ld128.c
  src/f32-igemm/gen/4x8-neon-dup-ld64.c
  src/f32-igemm/gen/6x8-neon-dup-ld64.c
  src/f32-igemm/gen/6x8-neon-dup-ld128.c
  src/f32-igemm/gen/1x8s4-neon.c
  src/f32-igemm/gen/4x8s4-neon.c
  src/f32-igemm/gen/6x8s4-neon.c
  src/f32-igemm/gen/8x8s4-neon.c
  src/f32-pavgpool/mp9p8q-neon.c
  src/f32-pavgpool/up9-neon.c
  src/f32-ppmm/gen/4x8-neon.c
  src/f32-ppmm/gen/8x8-neon.c
  src/f32-prelu/gen/neon-2x4.c
  src/f32-prelu/gen/neon-2x8.c
  src/f32-rmax/neon.c
  src/f32-sigmoid/gen/neon-frac-p9-p10-nr1recps-x16.c
  src/f32-vbinary/gen/vadd-neon-x4.c
  src/f32-vbinary/gen/vadd-neon-x8.c
  src/f32-vbinary/gen/vaddc-neon-x4.c
  src/f32-vbinary/gen/vaddc-neon-x8.c
  src/f32-vbinary/gen/vmax-neon-x4.c
  src/f32-vbinary/gen/vmax-neon-x8.c
  src/f32-vbinary/gen/vmaxc-neon-x4.c
  src/f32-vbinary/gen/vmaxc-neon-x8.c
  src/f32-vbinary/gen/vmin-neon-x4.c
  src/f32-vbinary/gen/vmin-neon-x8.c
  src/f32-vbinary/gen/vminc-neon-x4.c
  src/f32-vbinary/gen/vminc-neon-x8.c
  src/f32-vbinary/gen/vmul-neon-x4.c
  src/f32-vbinary/gen/vmul-neon-x8.c
  src/f32-vbinary/gen/vmulc-neon-x4.c
  src/f32-vbinary/gen/vmulc-neon-x8.c
  src/f32-vbinary/gen/vrsubc-neon-x4.c
  src/f32-vbinary/gen/vrsubc-neon-x8.c
  src/f32-vbinary/gen/vsub-neon-x4.c
  src/f32-vbinary/gen/vsub-neon-x8.c
  src/f32-vbinary/gen/vsubc-neon-x4.c
  src/f32-vbinary/gen/vsubc-neon-x8.c
  src/f32-vmulcaddc/gen/c4-neon-2x.c
  src/f32-vmulcaddc/gen/c8-neon-2x.c
  src/q8-avgpool/mp9p8q-neon.c
  src/q8-avgpool/up9-neon.c
  src/q8-dwconv/up8x9-neon.c
  src/q8-gavgpool/mp7p7q-neon.c
  src/q8-gavgpool/up7-neon.c
  src/q8-gemm/4x8-neon.c
  src/q8-gemm/8x8-neon.c
  src/q8-igemm/4x8-neon.c
  src/q8-igemm/8x8-neon.c
  src/q8-vadd/neon.c
  src/u8-clamp/neon.c
  src/u8-maxpool/9p8x-neon-c16.c
  src/u8-rmax/neon.c
  src/x32-packx/x4-neon-st4.c
  src/x32-pad/x2-neon.c
  src/x32-zip/x2-neon.c
  src/x32-zip/x3-neon.c
  src/x32-zip/x4-neon.c
  src/x32-zip/xm-neon.c
  src/x8-zip/x2-neon.c
  src/x8-zip/x3-neon.c
  src/x8-zip/x4-neon.c
  src/x8-zip/xm-neon.c)

# NEON+FMA micro-kernel sources (file names carry a "neonfma" tag), including
# the exp/expminus/sigmoid evaluation routines under src/math.
SET(XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-bilinear/gen/neonfma-c4.c
  src/f32-bilinear/gen/neonfma-c8.c
  src/f32-igemm/gen/1x8-neonfma-dup-ld64.c
  src/f32-igemm/gen/4x8-neonfma-dup-ld128.c
  src/f32-igemm/gen/4x8-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-neonfma-dup-ld128.c
  src/f32-igemm/gen/1x8s4-neonfma.c
  src/f32-igemm/gen/4x8s4-neonfma.c
  src/f32-igemm/gen/6x8s4-neonfma.c
  src/f32-igemm/gen/8x8s4-neonfma.c
  src/f32-dwconv/gen/up4x9-neonfma.c
  src/f32-dwconv/gen/up4x9-neonfma-acc2.c
  src/f32-dwconv/gen/up8x9-neonfma.c
  src/f32-dwconv/gen/up8x9-neonfma-acc2.c
  src/f32-gemm/gen/1x8-neonfma-dup-ld64.c
  src/f32-gemm/gen/4x8-neonfma-dup-ld128.c
  src/f32-gemm/gen/4x8-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-neonfma-dup-ld128.c
  src/f32-gemm/gen/1x8s4-neonfma.c
  src/f32-gemm/gen/4x8s4-neonfma.c
  src/f32-gemm/gen/6x8s4-neonfma.c
  src/f32-gemm/gen/8x8s4-neonfma.c
  src/f32-gemm/gen-inc/1x8-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/4x8-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/4x8-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4-neonfma.c
  src/f32-gemm/gen-inc/4x8s4-neonfma.c
  src/f32-gemm/gen-inc/6x8s4-neonfma.c
  src/f32-gemm/gen-inc/8x8s4-neonfma.c
  src/f32-hswish/gen/neonfma-x4.c
  src/f32-hswish/gen/neonfma-x8.c
  src/f32-ppmm/gen/4x8-neonfma.c
  src/f32-ppmm/gen/8x8-neonfma.c
  src/f32-sigmoid/gen/neonfma-p5-nr2fma-x16.c
  src/f32-vmulcaddc/gen/c4-neonfma-2x.c
  src/f32-vmulcaddc/gen/c8-neonfma-2x.c
  src/math/exp-neonfma-lut64-p2.c
  src/math/exp-neonfma-p5.c
  src/math/expminus-neonfma-lut2048-p1.c
  src/math/expminus-neonfma-lut64-p2.c
  src/math/expminus-neonfma-p5.c
  src/math/sigmoid-neonfma-lut2048-p1-nr1recps1fma.c
  src/math/sigmoid-neonfma-lut2048-p1-nr2fma.c
  src/math/sigmoid-neonfma-lut2048-p1-nr2recps.c
  src/math/sigmoid-neonfma-p5-nr1recps1fma.c
  src/math/sigmoid-neonfma-p5-nr2fma.c
  src/math/sigmoid-neonfma-p5-nr2recps.c)

# Micro-kernel sources grouped under the AArch64 NEON+FMA variable.
# Note that the vdiv/vdivc/vrdivc kernels listed here are the "-neon-" files.
SET(XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS
  src/f32-vbinary/gen/vdiv-neon-x4.c
  src/f32-vbinary/gen/vdiv-neon-x8.c
  src/f32-vbinary/gen/vdivc-neon-x4.c
  src/f32-vbinary/gen/vdivc-neon-x8.c
  src/f32-vbinary/gen/vrdivc-neon-x4.c
  src/f32-vbinary/gen/vrdivc-neon-x8.c
  src/f32-gemm/gen/1x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x2-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x8-neonfma-lane-ld128.c
  src/f32-gemm/gen/4x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/5x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/1x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/4x8-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/4x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/5x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-lane-ld128.c
  src/f32-igemm/gen/1x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x2-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x4-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x8-neonfma-lane-ld128.c
  src/f32-igemm/gen/4x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-neonfma-lane-ld128.c
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c
  src/f32-spmm/gen/12x1-neonfma.c
  src/f32-spmm/gen/12x2-neonfma.c
  src/f32-spmm/gen/12x4-neonfma.c
  src/f32-spmm/gen/16x1-neonfma-pipelined.c
  src/f32-spmm/gen/16x1-neonfma-unroll2.c
  src/f32-spmm/gen/16x1-neonfma.c
  src/f32-spmm/gen/16x2-neonfma.c
  src/f32-spmm/gen/16x4-neonfma.c
  src/f32-spmm/gen/4x1-neonfma-pipelined.c
  src/f32-spmm/gen/4x1-neonfma-unroll2.c
  src/f32-spmm/gen/4x1-neonfma.c
  src/f32-spmm/gen/4x2-neonfma.c
  src/f32-spmm/gen/4x4-neonfma.c
  src/f32-spmm/gen/8x1-neonfma-pipelined.c
  src/f32-spmm/gen/8x1-neonfma-unroll2.c
  src/f32-spmm/gen/8x1-neonfma.c
  src/f32-spmm/gen/8x2-neonfma.c
  src/f32-spmm/gen/8x4-neonfma.c
  src/math/sigmoid-neonfma-lut2048-p1-div.c
  src/math/sigmoid-neonfma-p5-div.c)

# f16 GEMM micro-kernel sources grouped under the AArch64 NEON FP16-arithmetic
# variable (file names carry a "neonfp16arith" tag).
SET(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/gen/4x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/6x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/8x8-neonfp16arith-ld64.c)

# SSE micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -msse.
SET(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-sse.c
  src/f32-avgpool/up9-sse.c
  src/f32-bilinear/gen/sse-c4.c
  src/f32-bilinear/gen/sse-c8.c
  src/f32-clamp/sse.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-dwconv/gen/up4x25-sse-acc2.c
  src/f32-dwconv/gen/up4x25-sse.c
  src/f32-dwconv/gen/up4x4-sse-acc2.c
  src/f32-dwconv/gen/up4x4-sse.c
  src/f32-dwconv/gen/up4x9-sse-acc2.c
  src/f32-dwconv/gen/up4x9-sse.c
  src/f32-dwconv/gen/up8x25-sse-acc2.c
  src/f32-dwconv/gen/up8x25-sse.c
  src/f32-dwconv/gen/up8x4-sse-acc2.c
  src/f32-dwconv/gen/up8x4-sse.c
  src/f32-dwconv/gen/up8x9-sse-acc2.c
  src/f32-dwconv/gen/up8x9-sse.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/mp7p7q-sse.c
  src/f32-gavgpool/up7-sse.c
  src/f32-gemm/gen/1x8-sse-dup.c
  src/f32-gemm/gen/1x8-sse-load1.c
  src/f32-gemm/gen/1x8s4-sse.c
  src/f32-gemm/gen/4x8-sse-dup.c
  src/f32-gemm/gen/4x8-sse-load1.c
  src/f32-gemm/gen/4x8s4-sse.c
  src/f32-gemm/gen-inc/1x8-sse-dup.c
  src/f32-gemm/gen-inc/1x8-sse-load1.c
  src/f32-gemm/gen-inc/1x8s4-sse.c
  src/f32-gemm/gen-inc/4x8-sse-dup.c
  src/f32-gemm/gen-inc/4x8-sse-load1.c
  src/f32-gemm/gen-inc/4x8s4-sse.c
  src/f32-hswish/gen/sse-x4.c
  src/f32-hswish/gen/sse-x8.c
  src/f32-igemm/gen/1x8-sse-dup.c
  src/f32-igemm/gen/1x8-sse-load1.c
  src/f32-igemm/gen/1x8s4-sse.c
  src/f32-igemm/gen/4x2c4-sse.c
  src/f32-igemm/gen/4x8-sse-dup.c
  src/f32-igemm/gen/4x8-sse-load1.c
  src/f32-igemm/gen/4x8s4-sse.c
  src/f32-maxpool/9p8x-sse-c4.c
  src/f32-pavgpool/mp9p8q-sse.c
  src/f32-pavgpool/up9-sse.c
  src/f32-ppmm/gen/4x8-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/gen/4x1-sse.c
  src/f32-spmm/gen/8x1-sse.c
  src/f32-vbinary/gen/vadd-sse-x4.c
  src/f32-vbinary/gen/vadd-sse-x8.c
  src/f32-vbinary/gen/vaddc-sse-x4.c
  src/f32-vbinary/gen/vaddc-sse-x8.c
  src/f32-vbinary/gen/vdiv-sse-x4.c
  src/f32-vbinary/gen/vdiv-sse-x8.c
  src/f32-vbinary/gen/vdivc-sse-x4.c
  src/f32-vbinary/gen/vdivc-sse-x8.c
  src/f32-vbinary/gen/vmax-sse-x4.c
  src/f32-vbinary/gen/vmax-sse-x8.c
  src/f32-vbinary/gen/vmaxc-sse-x4.c
  src/f32-vbinary/gen/vmaxc-sse-x8.c
  src/f32-vbinary/gen/vmin-sse-x4.c
  src/f32-vbinary/gen/vmin-sse-x8.c
  src/f32-vbinary/gen/vminc-sse-x4.c
  src/f32-vbinary/gen/vminc-sse-x8.c
  src/f32-vbinary/gen/vmul-sse-x4.c
  src/f32-vbinary/gen/vmul-sse-x8.c
  src/f32-vbinary/gen/vmulc-sse-x4.c
  src/f32-vbinary/gen/vmulc-sse-x8.c
  src/f32-vbinary/gen/vrdivc-sse-x4.c
  src/f32-vbinary/gen/vrdivc-sse-x8.c
  src/f32-vbinary/gen/vrsubc-sse-x4.c
  src/f32-vbinary/gen/vrsubc-sse-x8.c
  src/f32-vbinary/gen/vsub-sse-x4.c
  src/f32-vbinary/gen/vsub-sse-x8.c
  src/f32-vbinary/gen/vsubc-sse-x4.c
  src/f32-vbinary/gen/vsubc-sse-x8.c
  src/f32-vmulcaddc/gen/c4-sse-2x.c
  src/f32-vmulcaddc/gen/c8-sse-2x.c
  src/x32-packx/x4-sse.c
)
714
# SSE2 micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -msse2.
SET(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-sse2-c4.c
  src/f32-argmaxpool/9p8x-sse2-c4.c
  src/f32-argmaxpool/9x-sse2-c4.c
  src/f32-prelu/gen/sse2-2x4.c
  src/f32-prelu/gen/sse2-2x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x16.c
  src/q8-avgpool/mp9p8q-sse2.c
  src/q8-avgpool/up9-sse2.c
  src/q8-igemm/4x4c2-sse2.c
  src/q8-dwconv/up8x9-sse2.c
  src/q8-gavgpool/mp7p7q-sse2.c
  src/q8-gavgpool/up7-sse2.c
  src/q8-gemm/2x4c8-sse2.c
  src/q8-gemm/4x4c2-sse2.c
  src/q8-vadd/sse2.c
  src/u8-clamp/sse2.c
  src/u8-maxpool/9p8x-sse2-c16.c
  src/u8-rmax/sse2.c
  src/x32-pad/x2-sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c
  src/math/exp-sse2-p5.c
  src/math/expminus-sse2-p5.c
  src/math/sigmoid-sse2-p5-div.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700747
# SSE4.1 micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -msse4.1.
SET(XNNPACK_SSE41_MICROKERNEL_SRCS
  src/f32-prelu/gen/sse41-2x4.c
  src/f32-prelu/gen/sse41-2x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x16.c
)
Marat Dukhan69c3f2c2019-11-06 12:30:01 -0800753
# AVX micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -mavx.
SET(XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-clamp/avx.c
  src/f32-dwconv/gen/up16x4-avx-acc2.c
  src/f32-dwconv/gen/up16x4-avx.c
  src/f32-dwconv/gen/up8x4-avx-acc2.c
  src/f32-dwconv/gen/up8x4-avx.c
  src/f32-dwconv/gen/up16x9-avx-acc2.c
  src/f32-dwconv/gen/up16x9-avx.c
  src/f32-dwconv/gen/up8x9-avx-acc2.c
  src/f32-dwconv/gen/up8x9-avx.c
  src/f32-dwconv/gen/up16x25-avx-acc2.c
  src/f32-dwconv/gen/up16x25-avx.c
  src/f32-dwconv/gen/up8x25-avx-acc2.c
  src/f32-dwconv/gen/up8x25-avx.c
  src/f32-gemm/gen/1x8-avx-broadcast.c
  src/f32-gemm/gen/4x8-avx-broadcast.c
  src/f32-gemm/gen/5x8-avx-broadcast.c
  src/f32-gemm/gen/6x8-avx-broadcast.c
  src/f32-gemm/gen/7x8-avx-broadcast.c
  src/f32-gemm/gen/1x16-avx-broadcast.c
  src/f32-gemm/gen/3x16-avx-broadcast.c
  src/f32-gemm/gen/4x16-avx-broadcast.c
  src/f32-gemm/gen/5x16-avx-broadcast.c
  src/f32-gemm/gen-inc/1x8-avx-broadcast.c
  src/f32-gemm/gen-inc/4x8-avx-broadcast.c
  src/f32-gemm/gen-inc/5x8-avx-broadcast.c
  src/f32-gemm/gen-inc/6x8-avx-broadcast.c
  src/f32-gemm/gen-inc/7x8-avx-broadcast.c
  src/f32-gemm/gen-inc/1x16-avx-broadcast.c
  src/f32-gemm/gen-inc/3x16-avx-broadcast.c
  src/f32-gemm/gen-inc/4x16-avx-broadcast.c
  src/f32-gemm/gen-inc/5x16-avx-broadcast.c
  src/f32-hswish/gen/avx-x8.c
  src/f32-hswish/gen/avx-x16.c
  src/f32-igemm/gen/1x8-avx-broadcast.c
  src/f32-igemm/gen/4x8-avx-broadcast.c
  src/f32-igemm/gen/5x8-avx-broadcast.c
  src/f32-igemm/gen/6x8-avx-broadcast.c
  src/f32-igemm/gen/7x8-avx-broadcast.c
  src/f32-igemm/gen/1x16-avx-broadcast.c
  src/f32-igemm/gen/3x16-avx-broadcast.c
  src/f32-igemm/gen/4x16-avx-broadcast.c
  src/f32-igemm/gen/5x16-avx-broadcast.c
  src/f32-rmax/avx.c
  src/f32-vbinary/gen/vadd-avx-x8.c
  src/f32-vbinary/gen/vadd-avx-x16.c
  src/f32-vbinary/gen/vaddc-avx-x8.c
  src/f32-vbinary/gen/vaddc-avx-x16.c
  src/f32-vbinary/gen/vdiv-avx-x8.c
  src/f32-vbinary/gen/vdiv-avx-x16.c
  src/f32-vbinary/gen/vdivc-avx-x8.c
  src/f32-vbinary/gen/vdivc-avx-x16.c
  src/f32-vbinary/gen/vmax-avx-x8.c
  src/f32-vbinary/gen/vmax-avx-x16.c
  src/f32-vbinary/gen/vmaxc-avx-x8.c
  src/f32-vbinary/gen/vmaxc-avx-x16.c
  src/f32-vbinary/gen/vmin-avx-x8.c
  src/f32-vbinary/gen/vmin-avx-x16.c
  src/f32-vbinary/gen/vminc-avx-x8.c
  src/f32-vbinary/gen/vminc-avx-x16.c
  src/f32-vbinary/gen/vmul-avx-x8.c
  src/f32-vbinary/gen/vmul-avx-x16.c
  src/f32-vbinary/gen/vmulc-avx-x8.c
  src/f32-vbinary/gen/vmulc-avx-x16.c
  src/f32-vbinary/gen/vrdivc-avx-x8.c
  src/f32-vbinary/gen/vrdivc-avx-x16.c
  src/f32-vbinary/gen/vrsubc-avx-x8.c
  src/f32-vbinary/gen/vrsubc-avx-x16.c
  src/f32-vbinary/gen/vsub-avx-x8.c
  src/f32-vbinary/gen/vsub-avx-x16.c
  src/f32-vbinary/gen/vsubc-avx-x8.c
  src/f32-vbinary/gen/vsubc-avx-x16.c
  src/f32-vscale/avx-unroll32.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700827
# FMA3 micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -mfma.
SET(XNNPACK_FMA3_MICROKERNEL_SRCS
  src/f32-dwconv/gen/up16x4-fma3-acc2.c
  src/f32-dwconv/gen/up16x4-fma3.c
  src/f32-dwconv/gen/up8x4-fma3-acc2.c
  src/f32-dwconv/gen/up8x4-fma3.c
  src/f32-dwconv/gen/up16x9-fma3-acc2.c
  src/f32-dwconv/gen/up16x9-fma3.c
  src/f32-dwconv/gen/up8x9-fma3-acc2.c
  src/f32-dwconv/gen/up8x9-fma3.c
  src/f32-dwconv/gen/up16x25-fma3-acc2.c
  src/f32-dwconv/gen/up16x25-fma3.c
  src/f32-dwconv/gen/up8x25-fma3-acc2.c
  src/f32-dwconv/gen/up8x25-fma3.c
  src/f32-gemm/gen/1x8-fma3-broadcast.c
  src/f32-gemm/gen/4x8-fma3-broadcast.c
  src/f32-gemm/gen/5x8-fma3-broadcast.c
  src/f32-gemm/gen/6x8-fma3-broadcast.c
  src/f32-gemm/gen/7x8-fma3-broadcast.c
  src/f32-gemm/gen/8x8-fma3-broadcast.c
  src/f32-gemm/gen/1x16-fma3-broadcast.c
  src/f32-gemm/gen/3x16-fma3-broadcast.c
  src/f32-gemm/gen/4x16-fma3-broadcast.c
  src/f32-gemm/gen/5x16-fma3-broadcast.c
  src/f32-gemm/gen/1x16s4-fma3-broadcast.c
  src/f32-gemm/gen/3x16s4-fma3-broadcast.c
  src/f32-gemm/gen/4x16s4-fma3-broadcast.c
  src/f32-gemm/gen/5x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/6x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/7x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/8x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16s4-fma3-broadcast.c
  src/f32-hswish/gen/fma3-x8.c
  src/f32-hswish/gen/fma3-x16.c
  src/f32-igemm/gen/1x8-fma3-broadcast.c
  src/f32-igemm/gen/4x8-fma3-broadcast.c
  src/f32-igemm/gen/5x8-fma3-broadcast.c
  src/f32-igemm/gen/6x8-fma3-broadcast.c
  src/f32-igemm/gen/7x8-fma3-broadcast.c
  src/f32-igemm/gen/8x8-fma3-broadcast.c
  src/f32-igemm/gen/1x16-fma3-broadcast.c
  src/f32-igemm/gen/3x16-fma3-broadcast.c
  src/f32-igemm/gen/4x16-fma3-broadcast.c
  src/f32-igemm/gen/5x16-fma3-broadcast.c
  src/f32-igemm/gen/1x16s4-fma3-broadcast.c
  src/f32-igemm/gen/3x16s4-fma3-broadcast.c
  src/f32-igemm/gen/4x16s4-fma3-broadcast.c
  src/f32-igemm/gen/5x16s4-fma3-broadcast.c
)
Marat Dukhanfda12b82019-11-21 12:27:59 -0800885
# AVX2 micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -mfma -mavx2.
SET(XNNPACK_AVX2_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc6.c
  src/f32-raddextexp/gen/avx2-p5-x64.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc4.c
  src/f32-raddextexp/gen/avx2-p5-x72.c
  src/f32-raddextexp/gen/avx2-p5-x72-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x80.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc5.c
  src/f32-raddextexp/gen/avx2-p5-x96.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc6.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc6.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x8.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x16.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x24.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x32.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x40.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x48.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x56.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x64.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x72.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x80.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x88.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x96.c
  src/f32-vscaleextexp/gen/avx2-p5-x8.c
  src/f32-vscaleextexp/gen/avx2-p5-x16.c
  src/f32-vscaleextexp/gen/avx2-p5-x24.c
  src/f32-vscaleextexp/gen/avx2-p5-x32.c
  src/f32-vscaleextexp/gen/avx2-p5-x40.c
  src/f32-vscaleextexp/gen/avx2-p5-x48.c
  src/f32-vscaleextexp/gen/avx2-p5-x56.c
  src/f32-vscaleextexp/gen/avx2-p5-x64.c
  src/f32-vscaleextexp/gen/avx2-p5-x72.c
  src/f32-vscaleextexp/gen/avx2-p5-x80.c
  src/f32-vscaleextexp/gen/avx2-p5-x88.c
  src/f32-vscaleextexp/gen/avx2-p5-x96.c
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c
  src/math/extexp-avx2-p5.c
)
Marat Dukhan6adff4e2019-10-14 18:32:07 -0700952
# AVX512F micro-kernels. The list is only added to the build for x86 / x86-64
# targets, where every file in it is compiled with -mavx512f.
SET(XNNPACK_AVX512F_MICROKERNEL_SRCS
  src/f32-clamp/avx512f.c
  src/f32-dwconv/gen/up32x4-avx512f-acc2.c
  src/f32-dwconv/gen/up32x4-avx512f.c
  src/f32-dwconv/gen/up16x4-avx512f-acc2.c
  src/f32-dwconv/gen/up16x4-avx512f.c
  src/f32-dwconv/gen/up32x9-avx512f-acc2.c
  src/f32-dwconv/gen/up32x9-avx512f.c
  src/f32-dwconv/gen/up16x9-avx512f-acc2.c
  src/f32-dwconv/gen/up16x9-avx512f.c
  src/f32-dwconv/gen/up32x25-avx512f-acc2.c
  src/f32-dwconv/gen/up32x25-avx512f.c
  src/f32-dwconv/gen/up16x25-avx512f-acc2.c
  src/f32-dwconv/gen/up16x25-avx512f.c
  src/f32-gemm/gen/1x16-avx512f-broadcast.c
  src/f32-gemm/gen/4x16-avx512f-broadcast.c
  src/f32-gemm/gen/5x16-avx512f-broadcast.c
  src/f32-gemm/gen/6x16-avx512f-broadcast.c
  src/f32-gemm/gen/7x16-avx512f-broadcast.c
  src/f32-gemm/gen/8x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/1x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/4x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/5x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/6x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/7x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/8x16-avx512f-broadcast.c
  src/f32-hswish/gen/avx512f-x16.c
  src/f32-hswish/gen/avx512f-x32.c
  src/f32-igemm/gen/1x16-avx512f-broadcast.c
  src/f32-igemm/gen/4x16-avx512f-broadcast.c
  src/f32-igemm/gen/5x16-avx512f-broadcast.c
  src/f32-igemm/gen/6x16-avx512f-broadcast.c
  src/f32-igemm/gen/7x16-avx512f-broadcast.c
  src/f32-igemm/gen/8x16-avx512f-broadcast.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc6.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c
  src/f32-rmax/avx512f.c
  src/f32-vbinary/gen/vadd-avx512f-x16.c
  src/f32-vbinary/gen/vadd-avx512f-x32.c
  src/f32-vbinary/gen/vaddc-avx512f-x16.c
  src/f32-vbinary/gen/vaddc-avx512f-x32.c
  src/f32-vbinary/gen/vdiv-avx512f-x16.c
  src/f32-vbinary/gen/vdiv-avx512f-x32.c
  src/f32-vbinary/gen/vdivc-avx512f-x16.c
  src/f32-vbinary/gen/vdivc-avx512f-x32.c
  src/f32-vbinary/gen/vmax-avx512f-x16.c
  src/f32-vbinary/gen/vmax-avx512f-x32.c
  src/f32-vbinary/gen/vmaxc-avx512f-x16.c
  src/f32-vbinary/gen/vmaxc-avx512f-x32.c
  src/f32-vbinary/gen/vmin-avx512f-x16.c
  src/f32-vbinary/gen/vmin-avx512f-x32.c
  src/f32-vbinary/gen/vminc-avx512f-x16.c
  src/f32-vbinary/gen/vminc-avx512f-x32.c
  src/f32-vbinary/gen/vmul-avx512f-x16.c
  src/f32-vbinary/gen/vmul-avx512f-x32.c
  src/f32-vbinary/gen/vmulc-avx512f-x16.c
  src/f32-vbinary/gen/vmulc-avx512f-x32.c
  src/f32-vbinary/gen/vrdivc-avx512f-x16.c
  src/f32-vbinary/gen/vrdivc-avx512f-x32.c
  src/f32-vbinary/gen/vrsubc-avx512f-x16.c
  src/f32-vbinary/gen/vrsubc-avx512f-x32.c
  src/f32-vbinary/gen/vsub-avx512f-x16.c
  src/f32-vbinary/gen/vsub-avx512f-x32.c
  src/f32-vbinary/gen/vsubc-avx512f-x16.c
  src/f32-vbinary/gen/vsubc-avx512f-x32.c
  src/f32-vscale/avx512f-unroll64.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x192.c
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c
  src/math/extexp-avx512f-p5.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001082
# Hand-written assembly (.S) micro-kernels for 32-bit ARM. The list is only
# added to the build when the target processor matches armv5-armv8 or the
# iOS architecture is armv7.
SET(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  src/q8-dwconv/up8x9-aarch32-neon.S
  src/f32-gemm/4x8-aarch32-neon-cortex-a53.S
  src/f32-gemm/4x8-aarch32-neon-cortex-a75.S
  src/f32-gemm/4x8-aarch32-neon-ld64.S
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001088
# Hand-written assembly (.S) micro-kernels for 64-bit ARM. The list is only
# added to the build when the target processor is aarch64 or the iOS
# architecture is an arm64 variant.
SET(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-dwconv/up4x9-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-aarch64-neonfma.S
  src/f32-gemm/gen/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-ld64.S
  src/f32-igemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a75.S
)
1137
# ---[ Assemble the micro-kernel source list for the target architecture.
# The scalar list is the unconditional base; every other list is appended
# only when the matching system / processor test passes.
SET(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})

# PSIMD kernels: everywhere except Emscripten.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS ${XNNPACK_PSIMD_MICROKERNEL_SRCS})
ENDIF()

# 32-bit ARM: NEON and NEON-FMA C kernels plus the AArch32 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
ENDIF()

# 64-bit ARM: the NEON lists again, plus the AArch64-only C and assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
ENDIF()

# x86 / x86-64: every SSE..AVX512F list.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
ENDIF()
1163
# ---[ XNNPACK library target.
# XNNPACK_LIBRARY_TYPE selects an explicit STATIC or SHARED library, or
# ("default") leaves the library kind to CMake. Any other value is a
# configuration error.
IF(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  ADD_LIBRARY(XNNPACK STATIC ${XNNPACK_COLD_SRCS} ${XNNPACK_HOT_SRCS} ${XNNPACK_MICROKERNEL_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  ADD_LIBRARY(XNNPACK SHARED ${XNNPACK_COLD_SRCS} ${XNNPACK_HOT_SRCS} ${XNNPACK_MICROKERNEL_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  ADD_LIBRARY(XNNPACK ${XNNPACK_COLD_SRCS} ${XNNPACK_HOT_SRCS} ${XNNPACK_MICROKERNEL_SRCS})
ELSE()
  MESSAGE(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
ENDIF()

# Build the C sources as C99 with compiler extensions enabled.
SET_PROPERTY(TARGET XNNPACK PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET XNNPACK PROPERTY C_EXTENSIONS YES)
# ---[ Per-source compiler flags for 32-bit ARM targets.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  # Every micro-kernel source gets -marm; the PSIMD / NEON / NEON-FMA lists
  # additionally get the FPU selection they need.
  SET_PROPERTY(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  SET_PROPERTY(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEON_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  # On iOS the assembly kernels are passed the architecture explicitly.
  # The list variable is XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS; the previously
  # referenced XNNPACK_AARCH32_ASM_UKERNELS is never defined, so the flag was
  # applied to no files. Skip the flag when IOS_ARCH is empty so that a bare
  # "-arch" is never emitted.
  IF(IOS AND IOS_ARCH)
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# ---[ Per-source compiler flags for 64-bit ARM targets.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  # The FP16-arithmetic kernels need the ARMv8.2-A half-precision extension.
  SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  # On iOS the assembly kernels are passed the architecture explicitly.
  # The list variable is XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS; the previously
  # referenced XNNPACK_AARCH64_ASM_UKERNELS is never defined, so the flag was
  # applied to no files. Skip the flag when IOS_ARCH is empty so that a bare
  # "-arch" is never emitted.
  IF(IOS AND IOS_ARCH)
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# ---[ Per-source compiler flags for x86 / x86-64 targets.
# Each instruction-set list is compiled with the flag(s) that enable exactly
# that instruction set.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse4.1 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
ENDIF()
# ---[ Log level and optimization flags.
# Anything other than an exact "Debug" build type disables logging
# (XNN_LOG_LEVEL=0) and pins per-source optimization levels: -O2 for the
# micro-kernel and hot sources, -Os for the cold sources. Debug builds only
# set XNN_LOG_LEVEL=5.
# NOTE: CMAKE_BUILD_TYPE is empty under multi-config generators, so those
# always take the first branch.
IF(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=0)
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_HOT_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_COLD_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -Os ")
ELSE()
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=5)
ENDIF()

# PSIMD kernels are appended -O3 -ffast-math in every build type (the flags
# come after any -O2 added above), except when targeting Emscripten.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 -ffast-math ")
ENDIF()
1211
# include/ is on the include path of XNNPACK and of everything linking it;
# src/ is only on XNNPACK's own include path. xnnpack.h is registered as the
# target's public header so that INSTALL(... PUBLIC_HEADER ...) picks it up.
TARGET_INCLUDE_DIRECTORIES(XNNPACK
  PUBLIC include
  PRIVATE src)
SET_PROPERTY(TARGET XNNPACK PROPERTY PUBLIC_HEADER include/xnnpack.h)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001215
# ---[ Configure clog
# Only pull in the bundled clog when no `clog` target exists yet.
IF(NOT TARGET clog)
  SET(CLOG_BUILD_TESTS OFF CACHE BOOL "")
  SET(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
  ADD_SUBDIRECTORY("${CLOG_SOURCE_DIR}/deps/clog" "${CMAKE_BINARY_DIR}/clog")
  # clog is built as a static library, but a shared library may end up
  # depending on it indirectly, so it must be position-independent.
  SET_TARGET_PROPERTIES(clog PROPERTIES POSITION_INDEPENDENT_CODE ON)
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE clog)
1227
# ---[ Configure cpuinfo
# Only pull in cpuinfo when no `cpuinfo` target exists yet; its tools, tests
# and benchmarks are switched off by default.
IF(NOT TARGET cpuinfo)
  SET(CPUINFO_BUILD_TOOLS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_UNIT_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_MOCK_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE cpuinfo)
1239
# ---[ Configure pthreadpool
# Only pull in pthreadpool when no `pthreadpool` target exists yet. It is
# linked PUBLIC, so targets linking XNNPACK also link pthreadpool.
IF(NOT TARGET pthreadpool)
  SET(PTHREADPOOL_BUILD_TESTS OFF CACHE BOOL "")
  SET(PTHREADPOOL_BUILD_BENCHMARKS OFF CACHE BOOL "")
  SET(PTHREADPOOL_ALLOW_DEPRECATED_API OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PUBLIC pthreadpool)
1250
# ---[ Configure FXdiv
# Only pull in FXdiv when no `fxdiv` target exists yet; its tests and
# benchmarks are switched off by default.
IF(NOT TARGET fxdiv)
  SET(FXDIV_BUILD_TESTS OFF CACHE BOOL "")
  SET(FXDIV_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fxdiv)
1260
1261# ---[ Configure psimd
# Add psimd to the build unless a `psimd` target already exists, then link it
# privately into XNNPACK. No cache entries are set for this dependency.
IF(NOT TARGET psimd)
  ADD_SUBDIRECTORY("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE psimd)
1268
1269# ---[ Configure FP16
# Add FP16 to the build unless an `fp16` target already exists, then link it
# privately into XNNPACK.
IF(NOT TARGET fp16)
  # Cache defaults set before entering the FP16 subdirectory.
  SET(FP16_BUILD_TESTS OFF CACHE BOOL "")
  SET(FP16_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fp16)
1278
# Install rules for the XNNPACK target: static archives and shared libraries
# both go to the GNUInstallDirs library directory, the public header to the
# include directory.
INSTALL(
  TARGETS XNNPACK
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
1283
1284# ---[ XNNPACK unit tests
1285IF(XNNPACK_BUILD_TESTS)
1286 # ---[ Build google test
1287 IF(NOT TARGET gtest)
1288 SET(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
1289 ADD_SUBDIRECTORY(
1290 "${GOOGLETEST_SOURCE_DIR}"
1291 "${CMAKE_BINARY_DIR}/googletest")
1292 ENDIF()
1293
1294 # ---[ Build operator-level unit tests
Marat Dukhanefc47b82019-11-18 09:25:38 -08001295 ADD_EXECUTABLE(add-nc-test test/add-nc.cc)
1296 SET_TARGET_PROPERTIES(add-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001297 CXX_STANDARD 11
1298 CXX_STANDARD_REQUIRED YES
1299 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001300 TARGET_INCLUDE_DIRECTORIES(add-nc-test PRIVATE src test)
1301 TARGET_LINK_LIBRARIES(add-nc-test PRIVATE XNNPACK gtest gtest_main)
1302 ADD_TEST(add-nc-test add-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001303
Marat Dukhanb1a0fc32019-12-02 19:32:02 -08001304 ADD_EXECUTABLE(add-nd-test test/add-nd.cc)
1305 SET_TARGET_PROPERTIES(add-nd-test PROPERTIES
1306 CXX_STANDARD 11
1307 CXX_STANDARD_REQUIRED YES
1308 CXX_EXTENSIONS NO)
1309 TARGET_INCLUDE_DIRECTORIES(add-nd-test PRIVATE src test)
1310 TARGET_LINK_LIBRARIES(add-nd-test PRIVATE XNNPACK gtest gtest_main)
1311 ADD_TEST(add-nd-test add-nd-test)
1312
Marat Dukhanefc47b82019-11-18 09:25:38 -08001313 ADD_EXECUTABLE(argmax-pooling-nhwc-test test/argmax-pooling-nhwc.cc)
1314 SET_TARGET_PROPERTIES(argmax-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001315 CXX_STANDARD 11
1316 CXX_STANDARD_REQUIRED YES
1317 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001318 TARGET_INCLUDE_DIRECTORIES(argmax-pooling-nhwc-test PRIVATE src test)
1319 TARGET_LINK_LIBRARIES(argmax-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1320 ADD_TEST(argmax-pooling-nhwc-test argmax-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001321
Marat Dukhanefc47b82019-11-18 09:25:38 -08001322 ADD_EXECUTABLE(average-pooling-nhwc-test test/average-pooling-nhwc.cc)
1323 SET_TARGET_PROPERTIES(average-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001324 CXX_STANDARD 11
1325 CXX_STANDARD_REQUIRED YES
1326 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001327 TARGET_INCLUDE_DIRECTORIES(average-pooling-nhwc-test PRIVATE src test)
1328 TARGET_LINK_LIBRARIES(average-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1329 ADD_TEST(average-pooling-nhwc-test average-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001330
Marat Dukhanefc47b82019-11-18 09:25:38 -08001331 ADD_EXECUTABLE(channel-pad-nc-test test/channel-pad-nc.cc)
1332 SET_TARGET_PROPERTIES(channel-pad-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001333 CXX_STANDARD 11
1334 CXX_STANDARD_REQUIRED YES
1335 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001336 TARGET_INCLUDE_DIRECTORIES(channel-pad-nc-test PRIVATE src test)
1337 TARGET_LINK_LIBRARIES(channel-pad-nc-test PRIVATE XNNPACK gtest gtest_main)
1338 ADD_TEST(channel-pad-nc-test channel-pad-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001339
Marat Dukhanefc47b82019-11-18 09:25:38 -08001340 ADD_EXECUTABLE(channel-shuffle-nc-test test/channel-shuffle-nc.cc)
1341 SET_TARGET_PROPERTIES(channel-shuffle-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001342 CXX_STANDARD 11
1343 CXX_STANDARD_REQUIRED YES
1344 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001345 TARGET_INCLUDE_DIRECTORIES(channel-shuffle-nc-test PRIVATE src test)
1346 TARGET_LINK_LIBRARIES(channel-shuffle-nc-test PRIVATE XNNPACK gtest gtest_main)
1347 ADD_TEST(channel-shuffle-nc-test channel-shuffle-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001348
Marat Dukhanefc47b82019-11-18 09:25:38 -08001349 ADD_EXECUTABLE(clamp-nc-test test/clamp-nc.cc)
1350 SET_TARGET_PROPERTIES(clamp-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001351 CXX_STANDARD 11
1352 CXX_STANDARD_REQUIRED YES
1353 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001354 TARGET_INCLUDE_DIRECTORIES(clamp-nc-test PRIVATE src test)
1355 TARGET_LINK_LIBRARIES(clamp-nc-test PRIVATE XNNPACK gtest gtest_main)
1356 ADD_TEST(clamp-nc-test clamp-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001357
Marat Dukhanefc47b82019-11-18 09:25:38 -08001358 ADD_EXECUTABLE(convolution-nhwc-test test/convolution-nhwc.cc)
1359 SET_TARGET_PROPERTIES(convolution-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001360 CXX_STANDARD 11
1361 CXX_STANDARD_REQUIRED YES
1362 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001363 TARGET_INCLUDE_DIRECTORIES(convolution-nhwc-test PRIVATE src test)
1364 TARGET_LINK_LIBRARIES(convolution-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1365 ADD_TEST(convolution-nhwc-test convolution-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001366
Marat Dukhanefc47b82019-11-18 09:25:38 -08001367 ADD_EXECUTABLE(convolution-nchw-test test/convolution-nchw.cc)
1368 SET_TARGET_PROPERTIES(convolution-nchw-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001369 CXX_STANDARD 11
1370 CXX_STANDARD_REQUIRED YES
1371 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001372 TARGET_INCLUDE_DIRECTORIES(convolution-nchw-test PRIVATE src test)
1373 TARGET_LINK_LIBRARIES(convolution-nchw-test PRIVATE XNNPACK gtest gtest_main)
1374 ADD_TEST(convolution-nchw-test convolution-nchw-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001375
Marat Dukhanefc47b82019-11-18 09:25:38 -08001376 ADD_EXECUTABLE(deconvolution-nhwc-test test/deconvolution-nhwc.cc)
1377 SET_TARGET_PROPERTIES(deconvolution-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001378 CXX_STANDARD 11
1379 CXX_STANDARD_REQUIRED YES
1380 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001381 TARGET_INCLUDE_DIRECTORIES(deconvolution-nhwc-test PRIVATE src test)
1382 TARGET_LINK_LIBRARIES(deconvolution-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1383 ADD_TEST(deconvolution-nhwc-test deconvolution-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001384
Marat Dukhan69180502019-12-06 15:00:31 -08001385 ADD_EXECUTABLE(divide-nd-test test/divide-nd.cc)
1386 SET_TARGET_PROPERTIES(divide-nd-test PROPERTIES
1387 CXX_STANDARD 11
1388 CXX_STANDARD_REQUIRED YES
1389 CXX_EXTENSIONS NO)
1390 TARGET_INCLUDE_DIRECTORIES(divide-nd-test PRIVATE src test)
1391 TARGET_LINK_LIBRARIES(divide-nd-test PRIVATE XNNPACK gtest gtest_main)
1392 ADD_TEST(divide-nd-test divide-nd-test)
1393
Marat Dukhanefc47b82019-11-18 09:25:38 -08001394 ADD_EXECUTABLE(fully-connected-nc-test test/fully-connected-nc.cc)
1395 SET_TARGET_PROPERTIES(fully-connected-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001396 CXX_STANDARD 11
1397 CXX_STANDARD_REQUIRED YES
1398 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001399 TARGET_INCLUDE_DIRECTORIES(fully-connected-nc-test PRIVATE src test)
1400 TARGET_LINK_LIBRARIES(fully-connected-nc-test PRIVATE XNNPACK gtest gtest_main)
1401 ADD_TEST(fully-connected-nc-test fully-connected-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001402
Marat Dukhanefc47b82019-11-18 09:25:38 -08001403 ADD_EXECUTABLE(global-average-pooling-nwc-test test/global-average-pooling-nwc.cc)
1404 SET_TARGET_PROPERTIES(global-average-pooling-nwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001405 CXX_STANDARD 11
1406 CXX_STANDARD_REQUIRED YES
1407 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001408 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-nwc-test PRIVATE src test)
1409 TARGET_LINK_LIBRARIES(global-average-pooling-nwc-test PRIVATE XNNPACK gtest gtest_main)
1410 ADD_TEST(global-average-pooling-nwc-test global-average-pooling-nwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001411
Marat Dukhanefc47b82019-11-18 09:25:38 -08001412 ADD_EXECUTABLE(global-average-pooling-ncw-test test/global-average-pooling-ncw.cc)
1413 SET_TARGET_PROPERTIES(global-average-pooling-ncw-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001414 CXX_STANDARD 11
1415 CXX_STANDARD_REQUIRED YES
1416 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001417 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-ncw-test PRIVATE src test)
1418 TARGET_LINK_LIBRARIES(global-average-pooling-ncw-test PRIVATE XNNPACK gtest gtest_main)
1419 ADD_TEST(global-average-pooling-ncw-test global-average-pooling-ncw-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001420
Marat Dukhanefc47b82019-11-18 09:25:38 -08001421 ADD_EXECUTABLE(hardswish-nc-test test/hardswish-nc.cc)
1422 SET_TARGET_PROPERTIES(hardswish-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001423 CXX_STANDARD 11
1424 CXX_STANDARD_REQUIRED YES
1425 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001426 TARGET_INCLUDE_DIRECTORIES(hardswish-nc-test PRIVATE src test)
1427 TARGET_LINK_LIBRARIES(hardswish-nc-test PRIVATE XNNPACK gtest gtest_main)
1428 ADD_TEST(hardswish-nc-test hardswish-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001429
Marat Dukhanefc47b82019-11-18 09:25:38 -08001430 ADD_EXECUTABLE(leaky-relu-nc-test test/leaky-relu-nc.cc)
1431 SET_TARGET_PROPERTIES(leaky-relu-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001432 CXX_STANDARD 11
1433 CXX_STANDARD_REQUIRED YES
1434 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001435 TARGET_INCLUDE_DIRECTORIES(leaky-relu-nc-test PRIVATE src test)
1436 TARGET_LINK_LIBRARIES(leaky-relu-nc-test PRIVATE XNNPACK gtest gtest_main)
1437 ADD_TEST(leaky-relu-nc-test leaky-relu-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001438
Marat Dukhanefc47b82019-11-18 09:25:38 -08001439 ADD_EXECUTABLE(max-pooling-nhwc-test test/max-pooling-nhwc.cc)
1440 SET_TARGET_PROPERTIES(max-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001441 CXX_STANDARD 11
1442 CXX_STANDARD_REQUIRED YES
1443 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001444 TARGET_INCLUDE_DIRECTORIES(max-pooling-nhwc-test PRIVATE src test)
1445 TARGET_LINK_LIBRARIES(max-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1446 ADD_TEST(max-pooling-nhwc-test max-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001447
Marat Dukhan79e7f842019-12-05 14:35:50 -08001448 ADD_EXECUTABLE(maximum-nd-test test/multiply-nd.cc)
1449 SET_TARGET_PROPERTIES(maximum-nd-test PROPERTIES
1450 CXX_STANDARD 11
1451 CXX_STANDARD_REQUIRED YES
1452 CXX_EXTENSIONS NO)
1453 TARGET_INCLUDE_DIRECTORIES(maximum-nd-test PRIVATE src test)
1454 TARGET_LINK_LIBRARIES(maximum-nd-test PRIVATE XNNPACK gtest gtest_main)
1455 ADD_TEST(maximum-nd-test maximum-nd-test)
1456
1457 ADD_EXECUTABLE(minimum-nd-test test/multiply-nd.cc)
1458 SET_TARGET_PROPERTIES(minimum-nd-test PROPERTIES
1459 CXX_STANDARD 11
1460 CXX_STANDARD_REQUIRED YES
1461 CXX_EXTENSIONS NO)
1462 TARGET_INCLUDE_DIRECTORIES(minimum-nd-test PRIVATE src test)
1463 TARGET_LINK_LIBRARIES(minimum-nd-test PRIVATE XNNPACK gtest gtest_main)
1464 ADD_TEST(minimum-nd-test minimum-nd-test)
1465
Marat Dukhanefc47b82019-11-18 09:25:38 -08001466 ADD_EXECUTABLE(multiply-nd-test test/multiply-nd.cc)
1467 SET_TARGET_PROPERTIES(multiply-nd-test PROPERTIES
Marat Dukhan9d501d52019-11-16 02:30:50 -08001468 CXX_STANDARD 11
1469 CXX_STANDARD_REQUIRED YES
1470 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001471 TARGET_INCLUDE_DIRECTORIES(multiply-nd-test PRIVATE src test)
1472 TARGET_LINK_LIBRARIES(multiply-nd-test PRIVATE XNNPACK gtest gtest_main)
1473 ADD_TEST(multiply-nd-test multiply-nd-test)
Marat Dukhan9d501d52019-11-16 02:30:50 -08001474
Marat Dukhanefc47b82019-11-18 09:25:38 -08001475 ADD_EXECUTABLE(prelu-nc-test test/prelu-nc.cc)
1476 SET_TARGET_PROPERTIES(prelu-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001477 CXX_STANDARD 11
1478 CXX_STANDARD_REQUIRED YES
1479 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001480 TARGET_INCLUDE_DIRECTORIES(prelu-nc-test PRIVATE src test)
1481 TARGET_LINK_LIBRARIES(prelu-nc-test PRIVATE XNNPACK gtest gtest_main)
1482 ADD_TEST(prelu-nc-test prelu-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001483
Marat Dukhanefc47b82019-11-18 09:25:38 -08001484 ADD_EXECUTABLE(resize-bilinear-nhwc-test test/resize-bilinear-nhwc.cc)
1485 SET_TARGET_PROPERTIES(resize-bilinear-nhwc-test PROPERTIES
Marat Dukhan69722492019-11-11 19:55:50 -08001486 CXX_STANDARD 11
1487 CXX_STANDARD_REQUIRED YES
1488 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001489 TARGET_INCLUDE_DIRECTORIES(resize-bilinear-nhwc-test PRIVATE src test)
1490 TARGET_LINK_LIBRARIES(resize-bilinear-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1491 ADD_TEST(resize-bilinear-nhwc-test resize-bilinear-nhwc-test)
Marat Dukhan69722492019-11-11 19:55:50 -08001492
Marat Dukhanefc47b82019-11-18 09:25:38 -08001493 ADD_EXECUTABLE(sigmoid-nc-test test/sigmoid-nc.cc)
1494 SET_TARGET_PROPERTIES(sigmoid-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001495 CXX_STANDARD 11
1496 CXX_STANDARD_REQUIRED YES
1497 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001498 TARGET_INCLUDE_DIRECTORIES(sigmoid-nc-test PRIVATE src test)
1499 TARGET_LINK_LIBRARIES(sigmoid-nc-test PRIVATE XNNPACK gtest gtest_main)
1500 ADD_TEST(sigmoid-nc-test sigmoid-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001501
Marat Dukhanefc47b82019-11-18 09:25:38 -08001502 ADD_EXECUTABLE(softargmax-nc-test test/softargmax-nc.cc)
1503 SET_TARGET_PROPERTIES(softargmax-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001504 CXX_STANDARD 11
1505 CXX_STANDARD_REQUIRED YES
1506 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001507 TARGET_INCLUDE_DIRECTORIES(softargmax-nc-test PRIVATE src test)
1508 TARGET_LINK_LIBRARIES(softargmax-nc-test PRIVATE XNNPACK gtest gtest_main)
1509 ADD_TEST(softargmax-nc-test softargmax-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001510
Marat Dukhan05f3f6d2019-12-03 15:13:53 -08001511 ADD_EXECUTABLE(subtract-nd-test test/subtract-nd.cc)
1512 SET_TARGET_PROPERTIES(subtract-nd-test PROPERTIES
1513 CXX_STANDARD 11
1514 CXX_STANDARD_REQUIRED YES
1515 CXX_EXTENSIONS NO)
1516 TARGET_INCLUDE_DIRECTORIES(subtract-nd-test PRIVATE src test)
1517 TARGET_LINK_LIBRARIES(subtract-nd-test PRIVATE XNNPACK gtest gtest_main)
1518 ADD_TEST(subtract-nd-test subtract-nd-test)
1519
Marat Dukhanefc47b82019-11-18 09:25:38 -08001520 ADD_EXECUTABLE(unpooling-nhwc-test test/unpooling-nhwc.cc)
1521 SET_TARGET_PROPERTIES(unpooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001522 CXX_STANDARD 11
1523 CXX_STANDARD_REQUIRED YES
1524 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001525 TARGET_INCLUDE_DIRECTORIES(unpooling-nhwc-test PRIVATE src test)
1526 TARGET_LINK_LIBRARIES(unpooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1527 ADD_TEST(unpooling-nhwc-test unpooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001528
1529 # ---[ Build microkernel-level unit tests
1530 ADD_EXECUTABLE(f16-gemm-test test/f16-gemm.cc)
1531 SET_TARGET_PROPERTIES(f16-gemm-test PROPERTIES
1532 CXX_STANDARD 11
1533 CXX_STANDARD_REQUIRED YES
1534 CXX_EXTENSIONS YES)
1535 TARGET_INCLUDE_DIRECTORIES(f16-gemm-test PRIVATE src test)
1536 TARGET_LINK_LIBRARIES(f16-gemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1537 ADD_TEST(f16-gemm-test f16-gemm-test)
1538
1539 ADD_EXECUTABLE(f32-argmaxpool-test test/f32-argmaxpool.cc)
1540 SET_TARGET_PROPERTIES(f32-argmaxpool-test PROPERTIES
1541 CXX_STANDARD 11
1542 CXX_STANDARD_REQUIRED YES
1543 CXX_EXTENSIONS YES)
1544 TARGET_INCLUDE_DIRECTORIES(f32-argmaxpool-test PRIVATE src test)
1545 TARGET_LINK_LIBRARIES(f32-argmaxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1546 ADD_TEST(f32-argmaxpool-test f32-argmaxpool-test)
1547
1548 ADD_EXECUTABLE(f32-avgpool-test test/f32-avgpool.cc)
1549 SET_TARGET_PROPERTIES(f32-avgpool-test PROPERTIES
1550 CXX_STANDARD 11
1551 CXX_STANDARD_REQUIRED YES
1552 CXX_EXTENSIONS YES)
1553 TARGET_INCLUDE_DIRECTORIES(f32-avgpool-test PRIVATE src test)
1554 TARGET_LINK_LIBRARIES(f32-avgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1555 ADD_TEST(f32-avgpool-test f32-avgpool-test)
1556
Marat Dukhanc465fc22019-11-07 19:20:28 -08001557 ADD_EXECUTABLE(f32-bilinear-test test/f32-bilinear.cc)
1558 SET_TARGET_PROPERTIES(f32-bilinear-test PROPERTIES
1559 CXX_STANDARD 11
1560 CXX_STANDARD_REQUIRED YES
1561 CXX_EXTENSIONS YES)
1562 TARGET_INCLUDE_DIRECTORIES(f32-bilinear-test PRIVATE src test)
1563 TARGET_LINK_LIBRARIES(f32-bilinear-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1564 ADD_TEST(f32-bilinear-test f32-bilinear-test)
1565
Marat Dukhan53873d02019-12-06 17:21:30 -08001566 ADD_EXECUTABLE(f32-clamp-test test/f32-clamp.cc)
1567 SET_TARGET_PROPERTIES(f32-clamp-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001568 CXX_STANDARD 11
1569 CXX_STANDARD_REQUIRED YES
1570 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08001571 TARGET_INCLUDE_DIRECTORIES(f32-clamp-test PRIVATE src test)
1572 TARGET_LINK_LIBRARIES(f32-clamp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1573 ADD_TEST(f32-clamp-test f32-clamp-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001574
1575 ADD_EXECUTABLE(f32-conv-hwc-test test/f32-conv-hwc.cc)
1576 SET_TARGET_PROPERTIES(f32-conv-hwc-test PROPERTIES
1577 CXX_STANDARD 11
1578 CXX_STANDARD_REQUIRED YES
1579 CXX_EXTENSIONS YES)
1580 TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-test PRIVATE src test)
1581 TARGET_LINK_LIBRARIES(f32-conv-hwc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1582 ADD_TEST(f32-conv-hwc-test f32-conv-hwc-test)
1583
1584 ADD_EXECUTABLE(f32-conv-hwc2spchw-test test/f32-conv-hwc2spchw.cc)
1585 SET_TARGET_PROPERTIES(f32-conv-hwc2spchw-test PROPERTIES
1586 CXX_STANDARD 11
1587 CXX_STANDARD_REQUIRED YES
1588 CXX_EXTENSIONS YES)
1589 TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc2spchw-test PRIVATE src test)
1590 TARGET_LINK_LIBRARIES(f32-conv-hwc2spchw-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1591 ADD_TEST(f32-conv-hwc2spchw-test f32-conv-hwc2spchw-test)
1592
1593 ADD_EXECUTABLE(f32-dwconv-spchw-test test/f32-dwconv-spchw.cc)
1594 SET_TARGET_PROPERTIES(f32-dwconv-spchw-test PROPERTIES
1595 CXX_STANDARD 11
1596 CXX_STANDARD_REQUIRED YES
1597 CXX_EXTENSIONS YES)
1598 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-test PRIVATE src test)
1599 TARGET_LINK_LIBRARIES(f32-dwconv-spchw-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1600 ADD_TEST(f32-dwconv-spchw-test f32-dwconv-spchw-test)
1601
1602 ADD_EXECUTABLE(f32-dwconv-test test/f32-dwconv.cc)
1603 SET_TARGET_PROPERTIES(f32-dwconv-test PROPERTIES
1604 CXX_STANDARD 11
1605 CXX_STANDARD_REQUIRED YES
1606 CXX_EXTENSIONS YES)
1607 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-test PRIVATE src test)
1608 TARGET_LINK_LIBRARIES(f32-dwconv-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1609 ADD_TEST(f32-dwconv-test f32-dwconv-test)
1610
1611 ADD_EXECUTABLE(f32-gavgpool-spchw-test test/f32-gavgpool-spchw.cc)
1612 SET_TARGET_PROPERTIES(f32-gavgpool-spchw-test PROPERTIES
1613 CXX_STANDARD 11
1614 CXX_STANDARD_REQUIRED YES
1615 CXX_EXTENSIONS YES)
1616 TARGET_INCLUDE_DIRECTORIES(f32-gavgpool-spchw-test PRIVATE src test)
1617 TARGET_LINK_LIBRARIES(f32-gavgpool-spchw-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1618 ADD_TEST(f32-gavgpool-spchw-test f32-gavgpool-spchw-test)
1619
1620 ADD_EXECUTABLE(f32-gavgpool-test test/f32-gavgpool.cc)
1621 SET_TARGET_PROPERTIES(f32-gavgpool-test PROPERTIES
1622 CXX_STANDARD 11
1623 CXX_STANDARD_REQUIRED YES
1624 CXX_EXTENSIONS YES)
1625 TARGET_INCLUDE_DIRECTORIES(f32-gavgpool-test PRIVATE src test)
1626 TARGET_LINK_LIBRARIES(f32-gavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1627 ADD_TEST(f32-gavgpool-test f32-gavgpool-test)
1628
1629 ADD_EXECUTABLE(f32-gemm-test test/f32-gemm.cc)
1630 SET_TARGET_PROPERTIES(f32-gemm-test PROPERTIES
1631 CXX_STANDARD 11
1632 CXX_STANDARD_REQUIRED YES
1633 CXX_EXTENSIONS YES)
1634 TARGET_INCLUDE_DIRECTORIES(f32-gemm-test PRIVATE src test)
1635 TARGET_LINK_LIBRARIES(f32-gemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1636 ADD_TEST(f32-gemm-test f32-gemm-test)
1637
1638 ADD_EXECUTABLE(f32-gemminc-test test/f32-gemminc.cc)
1639 SET_TARGET_PROPERTIES(f32-gemminc-test PROPERTIES
1640 CXX_STANDARD 11
1641 CXX_STANDARD_REQUIRED YES
1642 CXX_EXTENSIONS YES)
1643 TARGET_INCLUDE_DIRECTORIES(f32-gemminc-test PRIVATE src test)
1644 TARGET_LINK_LIBRARIES(f32-gemminc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1645 ADD_TEST(f32-gemminc-test f32-gemminc-test)
1646
1647 ADD_EXECUTABLE(f32-hswish-test test/f32-hswish.cc)
1648 SET_TARGET_PROPERTIES(f32-hswish-test PROPERTIES
1649 CXX_STANDARD 11
1650 CXX_STANDARD_REQUIRED YES
1651 CXX_EXTENSIONS YES)
1652 TARGET_INCLUDE_DIRECTORIES(f32-hswish-test PRIVATE src test)
1653 TARGET_LINK_LIBRARIES(f32-hswish-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1654 ADD_TEST(f32-hswish-test f32-hswish-test)
1655
1656 ADD_EXECUTABLE(f32-igemm-test test/f32-igemm.cc)
1657 SET_TARGET_PROPERTIES(f32-igemm-test PROPERTIES
1658 CXX_STANDARD 11
1659 CXX_STANDARD_REQUIRED YES
1660 CXX_EXTENSIONS YES)
1661 TARGET_INCLUDE_DIRECTORIES(f32-igemm-test PRIVATE src test)
1662 TARGET_LINK_LIBRARIES(f32-igemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1663 ADD_TEST(f32-igemm-test f32-igemm-test)
1664
1665 ADD_EXECUTABLE(f32-maxpool-test test/f32-maxpool.cc)
1666 SET_TARGET_PROPERTIES(f32-maxpool-test PROPERTIES
1667 CXX_STANDARD 11
1668 CXX_STANDARD_REQUIRED YES
1669 CXX_EXTENSIONS YES)
1670 TARGET_INCLUDE_DIRECTORIES(f32-maxpool-test PRIVATE src test)
1671 TARGET_LINK_LIBRARIES(f32-maxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1672 ADD_TEST(f32-maxpool-test f32-maxpool-test)
1673
1674 ADD_EXECUTABLE(f32-pavgpool-test test/f32-pavgpool.cc)
1675 SET_TARGET_PROPERTIES(f32-pavgpool-test PROPERTIES
1676 CXX_STANDARD 11
1677 CXX_STANDARD_REQUIRED YES
1678 CXX_EXTENSIONS YES)
1679 TARGET_INCLUDE_DIRECTORIES(f32-pavgpool-test PRIVATE src test)
1680 TARGET_LINK_LIBRARIES(f32-pavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1681 ADD_TEST(f32-pavgpool-test f32-pavgpool-test)
1682
1683 ADD_EXECUTABLE(f32-ppmm-test test/f32-ppmm.cc)
1684 SET_TARGET_PROPERTIES(f32-ppmm-test PROPERTIES
1685 CXX_STANDARD 11
1686 CXX_STANDARD_REQUIRED YES
1687 CXX_EXTENSIONS YES)
1688 TARGET_INCLUDE_DIRECTORIES(f32-ppmm-test PRIVATE src test)
1689 TARGET_LINK_LIBRARIES(f32-ppmm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1690 ADD_TEST(f32-ppmm-test f32-ppmm-test)
1691
Marat Dukhan53873d02019-12-06 17:21:30 -08001692 ADD_EXECUTABLE(f32-prelu-test test/f32-prelu.cc)
1693 SET_TARGET_PROPERTIES(f32-prelu-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001694 CXX_STANDARD 11
1695 CXX_STANDARD_REQUIRED YES
1696 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08001697 TARGET_INCLUDE_DIRECTORIES(f32-prelu-test PRIVATE src test)
1698 TARGET_LINK_LIBRARIES(f32-prelu-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1699 ADD_TEST(f32-prelu-test f32-prelu-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001700
Marat Dukhan97579532019-10-18 16:40:39 -07001701 ADD_EXECUTABLE(f32-raddexpminusmax-test test/f32-raddexpminusmax.cc)
1702 SET_TARGET_PROPERTIES(f32-raddexpminusmax-test PROPERTIES
1703 CXX_STANDARD 11
1704 CXX_STANDARD_REQUIRED YES
1705 CXX_EXTENSIONS YES)
1706 TARGET_INCLUDE_DIRECTORIES(f32-raddexpminusmax-test PRIVATE src test)
1707 TARGET_LINK_LIBRARIES(f32-raddexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1708 ADD_TEST(f32-raddexpminusmax-test f32-raddexpminusmax-test)
1709
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07001710 ADD_EXECUTABLE(f32-raddextexp-test test/f32-raddextexp.cc)
1711 SET_TARGET_PROPERTIES(f32-raddextexp-test PROPERTIES
1712 CXX_STANDARD 11
1713 CXX_STANDARD_REQUIRED YES
1714 CXX_EXTENSIONS YES)
1715 TARGET_INCLUDE_DIRECTORIES(f32-raddextexp-test PRIVATE src test)
Marat Dukhana5977df2019-10-30 22:02:15 -07001716 TARGET_LINK_LIBRARIES(f32-raddextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07001717 ADD_TEST(f32-raddextexp-test f32-raddextexp-test)
1718
Marat Dukhan97579532019-10-18 16:40:39 -07001719 ADD_EXECUTABLE(f32-raddstoreexpminusmax-test test/f32-raddstoreexpminusmax.cc)
1720 SET_TARGET_PROPERTIES(f32-raddstoreexpminusmax-test PROPERTIES
1721 CXX_STANDARD 11
1722 CXX_STANDARD_REQUIRED YES
1723 CXX_EXTENSIONS YES)
1724 TARGET_INCLUDE_DIRECTORIES(f32-raddstoreexpminusmax-test PRIVATE src test)
1725 TARGET_LINK_LIBRARIES(f32-raddstoreexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1726 ADD_TEST(f32-raddstoreexpminusmax-test f32-raddstoreexpminusmax-test)
1727
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001728 ADD_EXECUTABLE(f32-rmax-test test/f32-rmax.cc)
1729 SET_TARGET_PROPERTIES(f32-rmax-test PROPERTIES
1730 CXX_STANDARD 11
1731 CXX_STANDARD_REQUIRED YES
1732 CXX_EXTENSIONS YES)
1733 TARGET_INCLUDE_DIRECTORIES(f32-rmax-test PRIVATE src test)
1734 TARGET_LINK_LIBRARIES(f32-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1735 ADD_TEST(f32-rmax-test f32-rmax-test)
1736
Marat Dukhan581c1ac2019-11-18 14:57:54 -08001737 ADD_EXECUTABLE(f32-sigmoid-test test/f32-sigmoid.cc)
1738 SET_TARGET_PROPERTIES(f32-sigmoid-test PROPERTIES
1739 CXX_STANDARD 11
1740 CXX_STANDARD_REQUIRED YES
1741 CXX_EXTENSIONS YES)
1742 TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-test PRIVATE src test)
1743 TARGET_LINK_LIBRARIES(f32-sigmoid-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1744 ADD_TEST(f32-sigmoid-test f32-sigmoid-test)
1745
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001746 ADD_EXECUTABLE(f32-spmm-test test/f32-spmm.cc)
1747 SET_TARGET_PROPERTIES(f32-spmm-test PROPERTIES
1748 CXX_STANDARD 11
1749 CXX_STANDARD_REQUIRED YES
1750 CXX_EXTENSIONS YES)
1751 TARGET_INCLUDE_DIRECTORIES(f32-spmm-test PRIVATE src test)
1752 TARGET_LINK_LIBRARIES(f32-spmm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1753 ADD_TEST(f32-spmm-test f32-spmm-test)
1754
Marat Dukhan53873d02019-12-06 17:21:30 -08001755 ADD_EXECUTABLE(f32-vadd-test test/f32-vadd.cc)
1756 SET_TARGET_PROPERTIES(f32-vadd-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001757 CXX_STANDARD 11
1758 CXX_STANDARD_REQUIRED YES
1759 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08001760 TARGET_INCLUDE_DIRECTORIES(f32-vadd-test PRIVATE src test)
1761 TARGET_LINK_LIBRARIES(f32-vadd-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1762 ADD_TEST(f32-vadd-test f32-vadd-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001763
Marat Dukhanc76065f2019-11-14 18:13:33 -08001764 ADD_EXECUTABLE(f32-vaddc-test test/f32-vaddc.cc)
1765 SET_TARGET_PROPERTIES(f32-vaddc-test PROPERTIES
1766 CXX_STANDARD 11
1767 CXX_STANDARD_REQUIRED YES
1768 CXX_EXTENSIONS YES)
1769 TARGET_INCLUDE_DIRECTORIES(f32-vaddc-test PRIVATE src test)
1770 TARGET_LINK_LIBRARIES(f32-vaddc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1771 ADD_TEST(f32-vaddc-test f32-vaddc-test)
1772
Marat Dukhan77ca6302019-12-06 12:48:15 -08001773 ADD_EXECUTABLE(f32-vdiv-test test/f32-vdiv.cc)
1774 SET_TARGET_PROPERTIES(f32-vdiv-test PROPERTIES
1775 CXX_STANDARD 11
1776 CXX_STANDARD_REQUIRED YES
1777 CXX_EXTENSIONS YES)
1778 TARGET_INCLUDE_DIRECTORIES(f32-vdiv-test PRIVATE src test)
1779 TARGET_LINK_LIBRARIES(f32-vdiv-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1780 ADD_TEST(f32-vdiv-test f32-vdiv-test)
1781
1782 ADD_EXECUTABLE(f32-vdivc-test test/f32-vdivc.cc)
1783 SET_TARGET_PROPERTIES(f32-vdivc-test PROPERTIES
1784 CXX_STANDARD 11
1785 CXX_STANDARD_REQUIRED YES
1786 CXX_EXTENSIONS YES)
1787 TARGET_INCLUDE_DIRECTORIES(f32-vdivc-test PRIVATE src test)
1788 TARGET_LINK_LIBRARIES(f32-vdivc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1789 ADD_TEST(f32-vdivc-test f32-vdivc-test)
1790
1791 ADD_EXECUTABLE(f32-vrdivc-test test/f32-vrdivc.cc)
1792 SET_TARGET_PROPERTIES(f32-vrdivc-test PROPERTIES
1793 CXX_STANDARD 11
1794 CXX_STANDARD_REQUIRED YES
1795 CXX_EXTENSIONS YES)
1796 TARGET_INCLUDE_DIRECTORIES(f32-vrdivc-test PRIVATE src test)
1797 TARGET_LINK_LIBRARIES(f32-vrdivc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1798 ADD_TEST(f32-vrdivc-test f32-vrdivc-test)
1799
Marat Dukhan403b7d42019-12-05 12:49:11 -08001800 ADD_EXECUTABLE(f32-vmax-test test/f32-vmax.cc)
1801 SET_TARGET_PROPERTIES(f32-vmax-test PROPERTIES
1802 CXX_STANDARD 11
1803 CXX_STANDARD_REQUIRED YES
1804 CXX_EXTENSIONS YES)
1805 TARGET_INCLUDE_DIRECTORIES(f32-vmax-test PRIVATE src test)
1806 TARGET_LINK_LIBRARIES(f32-vmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1807 ADD_TEST(f32-vmax-test f32-vmax-test)
1808
1809 ADD_EXECUTABLE(f32-vmaxc-test test/f32-vmaxc.cc)
1810 SET_TARGET_PROPERTIES(f32-vmaxc-test PROPERTIES
1811 CXX_STANDARD 11
1812 CXX_STANDARD_REQUIRED YES
1813 CXX_EXTENSIONS YES)
1814 TARGET_INCLUDE_DIRECTORIES(f32-vmaxc-test PRIVATE src test)
1815 TARGET_LINK_LIBRARIES(f32-vmaxc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1816 ADD_TEST(f32-vmaxc-test f32-vmaxc-test)
1817
1818 ADD_EXECUTABLE(f32-vmin-test test/f32-vmin.cc)
1819 SET_TARGET_PROPERTIES(f32-vmin-test PROPERTIES
1820 CXX_STANDARD 11
1821 CXX_STANDARD_REQUIRED YES
1822 CXX_EXTENSIONS YES)
1823 TARGET_INCLUDE_DIRECTORIES(f32-vmin-test PRIVATE src test)
1824 TARGET_LINK_LIBRARIES(f32-vmin-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1825 ADD_TEST(f32-vmin-test f32-vmin-test)
1826
1827 ADD_EXECUTABLE(f32-vminc-test test/f32-vminc.cc)
1828 SET_TARGET_PROPERTIES(f32-vminc-test PROPERTIES
1829 CXX_STANDARD 11
1830 CXX_STANDARD_REQUIRED YES
1831 CXX_EXTENSIONS YES)
1832 TARGET_INCLUDE_DIRECTORIES(f32-vminc-test PRIVATE src test)
1833 TARGET_LINK_LIBRARIES(f32-vminc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1834 ADD_TEST(f32-vminc-test f32-vminc-test)
1835
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001836 ADD_EXECUTABLE(f32-vmul-test test/f32-vmul.cc)
1837 SET_TARGET_PROPERTIES(f32-vmul-test PROPERTIES
1838 CXX_STANDARD 11
1839 CXX_STANDARD_REQUIRED YES
1840 CXX_EXTENSIONS YES)
1841 TARGET_INCLUDE_DIRECTORIES(f32-vmul-test PRIVATE src test)
1842 TARGET_LINK_LIBRARIES(f32-vmul-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1843 ADD_TEST(f32-vmul-test f32-vmul-test)
1844
Marat Dukhanc76065f2019-11-14 18:13:33 -08001845 ADD_EXECUTABLE(f32-vmulc-test test/f32-vmulc.cc)
1846 SET_TARGET_PROPERTIES(f32-vmulc-test PROPERTIES
1847 CXX_STANDARD 11
1848 CXX_STANDARD_REQUIRED YES
1849 CXX_EXTENSIONS YES)
1850 TARGET_INCLUDE_DIRECTORIES(f32-vmulc-test PRIVATE src test)
1851 TARGET_LINK_LIBRARIES(f32-vmulc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1852 ADD_TEST(f32-vmulc-test f32-vmulc-test)
1853
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001854 ADD_EXECUTABLE(f32-vmulcaddc-test test/f32-vmulcaddc.cc)
1855 SET_TARGET_PROPERTIES(f32-vmulcaddc-test PROPERTIES
1856 CXX_STANDARD 11
1857 CXX_STANDARD_REQUIRED YES
1858 CXX_EXTENSIONS YES)
1859 TARGET_INCLUDE_DIRECTORIES(f32-vmulcaddc-test PRIVATE src test)
1860 TARGET_LINK_LIBRARIES(f32-vmulcaddc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1861 ADD_TEST(f32-vmulcaddc-test f32-vmulcaddc-test)
1862
# f32-vscaleexpminusmax-test: test executable compiled from
# test/f32-vscaleexpminusmax.cc and registered with CTest under the same name.
add_executable(f32-vscaleexpminusmax-test test/f32-vscaleexpminusmax.cc)
target_link_libraries(f32-vscaleexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(f32-vscaleexpminusmax-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-vscaleexpminusmax-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(f32-vscaleexpminusmax-test f32-vscaleexpminusmax-test)
1871
# f32-vscaleextexp-test: test executable compiled from
# test/f32-vscaleextexp.cc and registered with CTest under the same name.
add_executable(f32-vscaleextexp-test test/f32-vscaleextexp.cc)
# The language-standard properties must name this very target
# (f32-vscaleextexp-test); naming a different target would leave this
# executable building with the compiler's default C++ standard.
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-vscaleextexp-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
target_include_directories(f32-vscaleextexp-test PRIVATE src test)
target_link_libraries(f32-vscaleextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
add_test(f32-vscaleextexp-test f32-vscaleextexp-test)
1880
# f32-vsub-test: test executable compiled from test/f32-vsub.cc and
# registered with CTest under the same name.
add_executable(f32-vsub-test test/f32-vsub.cc)
target_link_libraries(f32-vsub-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(f32-vsub-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-vsub-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(f32-vsub-test f32-vsub-test)
1889
# f32-vsubc-test: test executable compiled from test/f32-vsubc.cc and
# registered with CTest under the same name.
add_executable(f32-vsubc-test test/f32-vsubc.cc)
target_link_libraries(f32-vsubc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(f32-vsubc-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-vsubc-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(f32-vsubc-test f32-vsubc-test)
1898
# f32-vrsubc-test: test executable compiled from test/f32-vrsubc.cc and
# registered with CTest under the same name.
add_executable(f32-vrsubc-test test/f32-vrsubc.cc)
target_link_libraries(f32-vrsubc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(f32-vrsubc-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-vrsubc-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(f32-vrsubc-test f32-vrsubc-test)
1907
# q8-avgpool-test: test executable compiled from test/q8-avgpool.cc and
# registered with CTest under the same name.
add_executable(q8-avgpool-test test/q8-avgpool.cc)
target_link_libraries(q8-avgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(q8-avgpool-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-avgpool-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(q8-avgpool-test q8-avgpool-test)
1916
# q8-dwconv-test: test executable compiled from test/q8-dwconv.cc and
# registered with CTest under the same name.
add_executable(q8-dwconv-test test/q8-dwconv.cc)
target_link_libraries(q8-dwconv-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(q8-dwconv-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-dwconv-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(q8-dwconv-test q8-dwconv-test)
1925
# q8-gavgpool-test: test executable compiled from test/q8-gavgpool.cc and
# registered with CTest under the same name.
add_executable(q8-gavgpool-test test/q8-gavgpool.cc)
target_link_libraries(q8-gavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(q8-gavgpool-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-gavgpool-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(q8-gavgpool-test q8-gavgpool-test)
1934
# q8-gemm-test: test executable compiled from test/q8-gemm.cc and
# registered with CTest under the same name.
add_executable(q8-gemm-test test/q8-gemm.cc)
target_link_libraries(q8-gemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(q8-gemm-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-gemm-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(q8-gemm-test q8-gemm-test)
1943
# q8-igemm-test: test executable compiled from test/q8-igemm.cc and
# registered with CTest under the same name.
add_executable(q8-igemm-test test/q8-igemm.cc)
target_link_libraries(q8-igemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(q8-igemm-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-igemm-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(q8-igemm-test q8-igemm-test)
1952
# q8-vadd-test: test executable compiled from test/q8-vadd.cc and
# registered with CTest under the same name.
add_executable(q8-vadd-test test/q8-vadd.cc)
target_link_libraries(q8-vadd-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(q8-vadd-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-vadd-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(q8-vadd-test q8-vadd-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001961
# u8-clamp-test: test executable compiled from test/u8-clamp.cc and
# registered with CTest under the same name.
add_executable(u8-clamp-test test/u8-clamp.cc)
target_link_libraries(u8-clamp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(u8-clamp-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(u8-clamp-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(u8-clamp-test u8-clamp-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001970
# u8-lut32norm-test: test executable compiled from test/u8-lut32norm.cc and
# registered with CTest under the same name.
add_executable(u8-lut32norm-test test/u8-lut32norm.cc)
target_link_libraries(u8-lut32norm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(u8-lut32norm-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(u8-lut32norm-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(u8-lut32norm-test u8-lut32norm-test)
1979
# u8-maxpool-test: test executable compiled from test/u8-maxpool.cc and
# registered with CTest under the same name.
add_executable(u8-maxpool-test test/u8-maxpool.cc)
target_link_libraries(u8-maxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(u8-maxpool-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(u8-maxpool-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(u8-maxpool-test u8-maxpool-test)
1988
# u8-rmax-test: test executable compiled from test/u8-rmax.cc and
# registered with CTest under the same name.
add_executable(u8-rmax-test test/u8-rmax.cc)
target_link_libraries(u8-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(u8-rmax-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(u8-rmax-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(u8-rmax-test u8-rmax-test)
1997
# x32-packx-test: test executable compiled from test/x32-packx.cc and
# registered with CTest under the same name.
add_executable(x32-packx-test test/x32-packx.cc)
target_link_libraries(x32-packx-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(x32-packx-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(x32-packx-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(x32-packx-test x32-packx-test)
2006
# x32-pad-test: test executable compiled from test/x32-pad.cc and
# registered with CTest under the same name.
add_executable(x32-pad-test test/x32-pad.cc)
target_link_libraries(x32-pad-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(x32-pad-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(x32-pad-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(x32-pad-test x32-pad-test)
2015
# x32-unpool-test: test executable compiled from test/x32-unpool.cc and
# registered with CTest under the same name.
add_executable(x32-unpool-test test/x32-unpool.cc)
target_link_libraries(x32-unpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(x32-unpool-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(x32-unpool-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(x32-unpool-test x32-unpool-test)
2024
# x32-zip-test: test executable compiled from test/x32-zip.cc and
# registered with CTest under the same name.
add_executable(x32-zip-test test/x32-zip.cc)
target_link_libraries(x32-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(x32-zip-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(x32-zip-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(x32-zip-test x32-zip-test)
2033
# x8-lut-test: test executable compiled from test/x8-lut.cc and
# registered with CTest under the same name.
add_executable(x8-lut-test test/x8-lut.cc)
target_link_libraries(x8-lut-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(x8-lut-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(x8-lut-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(x8-lut-test x8-lut-test)
2042
# x8-zip-test: test executable compiled from test/x8-zip.cc and
# registered with CTest under the same name.
add_executable(x8-zip-test test/x8-zip.cc)
target_link_libraries(x8-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
target_include_directories(x8-zip-test PRIVATE src test)
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(x8-zip-test PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
add_test(x8-zip-test x8-zip-test)
2051ENDIF()
2052
2053# ---[ XNNPACK microbenchmarks
2054IF(XNNPACK_BUILD_BENCHMARKS)
# ---[ Build google benchmark
# Add the Google Benchmark sources as a subdirectory only when no `benchmark`
# target has been defined yet.
if(NOT TARGET benchmark)
  # Default the BENCHMARK_ENABLE_TESTING cache entry to OFF; a value already
  # present in the cache is left untouched (no FORCE).
  # NOTE(review): presumably read by the Google Benchmark build to skip its own tests - confirm.
  set(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
  add_subdirectory("${GOOGLEBENCHMARK_SOURCE_DIR}" "${CONFU_DEPENDENCIES_BINARY_DIR}/googlebenchmark")
endif()
2062
# bench-utils: helper library compiled from bench/utils.cc and linked into the
# benchmark targets below. No library type is given, so CMake's default
# (BUILD_SHARED_LIBS) decides between static and shared.
add_library(bench-utils bench/utils.cc)
target_link_libraries(bench-utils PRIVATE benchmark cpuinfo)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(bench-utils PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002070
Marat Dukhancb10f262019-11-16 15:52:37 -08002071 # ---[ Build accuracy microbenchmarks
# f32-exp-eval: evaluation executable compiled from eval/f32-exp.cc.
add_executable(f32-exp-eval eval/f32-exp.cc)
target_link_libraries(f32-exp-eval PRIVATE XNNPACK benchmark fp16)
target_include_directories(f32-exp-eval PRIVATE src)
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(f32-exp-eval PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2079
# f32-expminus-eval: evaluation executable compiled from eval/f32-expminus.cc.
add_executable(f32-expminus-eval eval/f32-expminus.cc)
target_link_libraries(f32-expminus-eval PRIVATE XNNPACK benchmark fp16)
target_include_directories(f32-expminus-eval PRIVATE src)
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(f32-expminus-eval PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2087
# f32-extexp-eval: evaluation executable compiled from eval/f32-extexp.cc.
add_executable(f32-extexp-eval eval/f32-extexp.cc)
target_link_libraries(f32-extexp-eval PRIVATE XNNPACK benchmark fp16)
target_include_directories(f32-extexp-eval PRIVATE src)
# C++11 is mandatory; unlike the neighbouring *-eval targets, compiler-specific
# language extensions are enabled here.
set_target_properties(f32-extexp-eval PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2095
# f32-sigmoid-eval: evaluation executable compiled from eval/f32-sigmoid.cc.
add_executable(f32-sigmoid-eval eval/f32-sigmoid.cc)
target_link_libraries(f32-sigmoid-eval PRIVATE XNNPACK benchmark fp16)
target_include_directories(f32-sigmoid-eval PRIVATE src)
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(f32-sigmoid-eval PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2103
Marat Dukhan5f18d262019-10-31 10:24:14 -07002104 # ---[ Build end-to-end microbenchmarks
# bench-models: static library bundling the model sources under models/;
# the end-to-end benchmark executables link against it.
add_library(bench-models STATIC
  models/mobilenet-v1.cc
  models/mobilenet-v2.cc
  models/mobilenet-v3-large.cc
  models/mobilenet-v3-small.cc)
target_link_libraries(bench-models PRIVATE XNNPACK benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(bench-models PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(bench-models PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2116
# end2end-bench: benchmark executable compiled from bench/end2end.cc and
# linked against the bench-models and bench-utils libraries.
add_executable(end2end-bench bench/end2end.cc)
target_link_libraries(end2end-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(end2end-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(end2end-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002124
# f32-dwconv-e2e-bench: benchmark executable compiled from
# bench/f32-dwconv-e2e.cc and linked against bench-models and bench-utils.
add_executable(f32-dwconv-e2e-bench bench/f32-dwconv-e2e.cc)
target_link_libraries(f32-dwconv-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
# Both the directory of this CMakeLists.txt and src/ are on the include path.
target_include_directories(f32-dwconv-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(f32-dwconv-e2e-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
Marat Dukhanef4416e2019-10-31 13:44:40 -07002132
# f32-gemm-e2e-bench: benchmark executable compiled from
# bench/f32-gemm-e2e.cc and linked against bench-models and bench-utils.
add_executable(f32-gemm-e2e-bench bench/f32-gemm-e2e.cc)
target_link_libraries(f32-gemm-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
# Both the directory of this CMakeLists.txt and src/ are on the include path.
target_include_directories(f32-gemm-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(f32-gemm-e2e-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
Marat Dukhan5f18d262019-10-31 10:24:14 -07002140
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002141 # ---[ Build operator-level microbenchmarks
# add-bench: benchmark executable compiled from bench/add.cc.
add_executable(add-bench bench/add.cc)
target_link_libraries(add-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(add-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(add-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2149
# average-pooling-bench: benchmark executable compiled from bench/average-pooling.cc.
add_executable(average-pooling-bench bench/average-pooling.cc)
target_link_libraries(average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(average-pooling-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2157
# channel-shuffle-bench: benchmark executable compiled from bench/channel-shuffle.cc.
add_executable(channel-shuffle-bench bench/channel-shuffle.cc)
target_link_libraries(channel-shuffle-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(channel-shuffle-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(channel-shuffle-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2165
# convolution-bench: benchmark executable compiled from bench/convolution.cc.
add_executable(convolution-bench bench/convolution.cc)
target_link_libraries(convolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(convolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(convolution-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2173
# deconvolution-bench: benchmark executable compiled from bench/deconvolution.cc.
add_executable(deconvolution-bench bench/deconvolution.cc)
target_link_libraries(deconvolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(deconvolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(deconvolution-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2181
# global-average-pooling-bench: benchmark executable compiled from
# bench/global-average-pooling.cc.
add_executable(global-average-pooling-bench bench/global-average-pooling.cc)
target_link_libraries(global-average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(global-average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(global-average-pooling-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2189
# max-pooling-bench: benchmark executable compiled from bench/max-pooling.cc.
add_executable(max-pooling-bench bench/max-pooling.cc)
target_link_libraries(max-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(max-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(max-pooling-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2197
# prelu-bench: benchmark executable compiled from bench/prelu.cc.
add_executable(prelu-bench bench/prelu.cc)
target_link_libraries(prelu-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(prelu-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(prelu-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2205
# sigmoid-bench: benchmark executable compiled from bench/sigmoid.cc.
add_executable(sigmoid-bench bench/sigmoid.cc)
target_link_libraries(sigmoid-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(sigmoid-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(sigmoid-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2213
# softargmax-bench: benchmark executable compiled from bench/softargmax.cc.
add_executable(softargmax-bench bench/softargmax.cc)
target_link_libraries(softargmax-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
# The directory of this CMakeLists.txt is on the include path.
target_include_directories(softargmax-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
# Strict C++11: the standard is mandatory and compiler extensions are disabled.
set_target_properties(softargmax-bench PROPERTIES
  CXX_EXTENSIONS NO
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2221
2222 # ---[ Build microkernel-level microbenchmarks
# f16-gemm-bench: benchmark executable compiled from bench/f16-gemm.cc.
add_executable(f16-gemm-bench bench/f16-gemm.cc)
target_link_libraries(f16-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f16-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f16-gemm-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2231
# f32-conv-hwc-bench: benchmark executable compiled from bench/f32-conv-hwc.cc.
add_executable(f32-conv-hwc-bench bench/f32-conv-hwc.cc)
target_link_libraries(f32-conv-hwc-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-conv-hwc-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-conv-hwc-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2240
# f32-dwconv-spchw-bench: benchmark executable compiled from
# bench/f32-dwconv-spchw.cc.
add_executable(f32-dwconv-spchw-bench bench/f32-dwconv-spchw.cc)
target_link_libraries(f32-dwconv-spchw-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-dwconv-spchw-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-dwconv-spchw-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2249
# f32-dwconv-bench: benchmark executable compiled from bench/f32-dwconv.cc.
add_executable(f32-dwconv-bench bench/f32-dwconv.cc)
target_link_libraries(f32-dwconv-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-dwconv-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-dwconv-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2258
# f32-gemm-bench: benchmark executable compiled from bench/f32-gemm.cc.
add_executable(f32-gemm-bench bench/f32-gemm.cc)
target_link_libraries(f32-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-gemm-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2267
# f32-igemm-bench: benchmark executable compiled from bench/f32-igemm.cc.
add_executable(f32-igemm-bench bench/f32-igemm.cc)
target_link_libraries(f32-igemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-igemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-igemm-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2276
# f32-im2col-gemm-bench: benchmark executable compiled from
# bench/f32-im2col-gemm.cc together with the C source src/im2col.c.
add_executable(f32-im2col-gemm-bench bench/f32-im2col-gemm.cc src/im2col.c)
target_link_libraries(f32-im2col-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-im2col-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# The C source builds as strict C99 (no extensions); the C++ source builds as
# C++11 with compiler-specific language extensions enabled.
set_target_properties(f32-im2col-gemm-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11
  C_EXTENSIONS NO
  C_STANDARD_REQUIRED YES
  C_STANDARD 99)
2288
# f32-rmax-bench: benchmark executable compiled from bench/f32-rmax.cc.
add_executable(f32-rmax-bench bench/f32-rmax.cc)
target_link_libraries(f32-rmax-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-rmax-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-rmax-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2297
# f32-sigmoid-bench: benchmark executable compiled from bench/f32-sigmoid.cc.
# Its link list is shorter than its neighbours': only XNNPACK, benchmark and
# bench-utils.
add_executable(f32-sigmoid-bench bench/f32-sigmoid.cc)
target_link_libraries(f32-sigmoid-bench PRIVATE XNNPACK benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-sigmoid-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-sigmoid-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2306
# f32-spmm-bench: benchmark executable compiled from bench/f32-spmm.cc.
add_executable(f32-spmm-bench bench/f32-spmm.cc)
target_link_libraries(f32-spmm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-spmm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-spmm-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2315
# f32-softargmax-bench: benchmark executable compiled from
# bench/f32-softargmax.cc. Links XNNPACK, fp16, benchmark and bench-utils
# (no cpuinfo in this target's link list).
add_executable(f32-softargmax-bench bench/f32-softargmax.cc)
target_link_libraries(f32-softargmax-bench PRIVATE XNNPACK fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(f32-softargmax-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(f32-softargmax-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07002324
# q8-gemm-bench: benchmark executable compiled from bench/q8-gemm.cc.
add_executable(q8-gemm-bench bench/q8-gemm.cc)
target_link_libraries(q8-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
# src/ first, then the directory of this CMakeLists.txt, on the include path.
target_include_directories(q8-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
# C++11 is mandatory; compiler-specific language extensions stay enabled.
set_target_properties(q8-gemm-bench PROPERTIES
  CXX_EXTENSIONS YES
  CXX_STANDARD_REQUIRED YES
  CXX_STANDARD 11)
2333ENDIF()