# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
8
CMAKE_MINIMUM_REQUIRED(VERSION 3.5 FATAL_ERROR)

# ---[ Project and semantic versioning.
PROJECT(XNNPACK C CXX ASM)

# GNUInstallDirs derives (and caches) the default CMAKE_INSTALL_LIBDIR from the
# target system name and pointer size. Those are only known once PROJECT() has
# enabled a language, so the module must be included after PROJECT().
INCLUDE(GNUInstallDirs)
15
# ---[ Options.
# Boolean switches for the optional test and benchmark builds (both default ON).
OPTION(XNNPACK_BUILD_TESTS "Build XNNPACK unit tests" ON)
OPTION(XNNPACK_BUILD_BENCHMARKS "Build XNNPACK benchmarks" ON)
# Library flavour; the STRINGS property lists the accepted values for GUIs.
SET(XNNPACK_LIBRARY_TYPE "default" CACHE STRING "Type of library (shared, static, or default) to build")
SET_PROPERTY(CACHE XNNPACK_LIBRARY_TYPE PROPERTY STRINGS default static shared)

# ---[ CMake options
# CTest support is only enabled when the unit tests are requested.
IF(XNNPACK_BUILD_TESTS)
  ENABLE_TESTING()
ENDIF()
26
# ---[ Build flags
# Validate the target processor. When CMAKE_SYSTEM_PROCESSOR is set it must be
# one of the recognized x86 / ARM names; when it is not set, only iOS builds
# with exactly one recognized IOS_ARCH entry are accepted.
IF(CMAKE_SYSTEM_PROCESSOR)
  IF(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|armv[5-8].*|aarch64)$")
    MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
  ENDIF()
ELSEIF(NOT IOS)
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
ELSE()
  # iOS: the architecture comes from IOS_ARCH, which must name a single target.
  LIST(LENGTH IOS_ARCH IOS_ARCH_COUNT)
  IF(IOS_ARCH_COUNT GREATER 1)
    MESSAGE(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
      "Specify a single architecture in IOS_ARCH and re-configure. ")
  ENDIF()
  IF(NOT IOS_ARCH MATCHES "^(i386|x86_64|armv7.*|arm64.*)$")
    MESSAGE(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
  ENDIF()
ENDIF()
44
# Validate the target operating system: it must be set and be one of
# Darwin, Linux or Android.
IF(CMAKE_SYSTEM_NAME)
  IF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android)$")
    MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
  ENDIF()
ELSE()
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
ENDIF()
50
# ---[ Download deps
# XNNPACK_DOWNLOAD_DEPENDENCY(<name> <dir-prefix> <script> <source-dir-var>)
#
# Fetches one third-party dependency at configure time unless the caller has
# already defined <source-dir-var>.
#
#   <name>            Human-readable name, used in messages and the cache doc string.
#   <dir-prefix>      Prefix of the "<prefix>-download" / "<prefix>-source"
#                     directories created under CMAKE_BINARY_DIR.
#   <script>          Template under cmake/ that is configured into the download
#                     project's CMakeLists.txt.
#   <source-dir-var>  Cache variable that receives the "<prefix>-source" path.
#
# The download project is configured and then built with the current generator.
# Either step failing aborts the configuration with FATAL_ERROR instead of
# caching a path to a source tree that was never populated.
FUNCTION(XNNPACK_DOWNLOAD_DEPENDENCY XNNPACK_DEP_NAME XNNPACK_DEP_PREFIX XNNPACK_DEP_SCRIPT XNNPACK_DEP_VAR)
  IF(DEFINED ${XNNPACK_DEP_VAR})
    # The user supplied the source directory: nothing to download.
    RETURN()
  ENDIF()

  # Locals carry an XNNPACK_DEP_ prefix so they cannot collide with ${...}
  # references expanded by CONFIGURE_FILE in the download templates.
  SET(XNNPACK_DEP_DOWNLOAD_DIR "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-download")
  SET(XNNPACK_DEP_SOURCE_DIR "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-source")

  MESSAGE(STATUS "Downloading ${XNNPACK_DEP_NAME} to ${XNNPACK_DEP_SOURCE_DIR} (define ${XNNPACK_DEP_VAR} to avoid it)")
  CONFIGURE_FILE("cmake/${XNNPACK_DEP_SCRIPT}" "${XNNPACK_DEP_DOWNLOAD_DIR}/CMakeLists.txt")

  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE XNNPACK_DEP_RESULT
    WORKING_DIRECTORY "${XNNPACK_DEP_DOWNLOAD_DIR}")
  IF(NOT XNNPACK_DEP_RESULT EQUAL 0)
    MESSAGE(FATAL_ERROR "Failed to configure the ${XNNPACK_DEP_NAME} download project in ${XNNPACK_DEP_DOWNLOAD_DIR} (result: ${XNNPACK_DEP_RESULT})")
  ENDIF()

  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE XNNPACK_DEP_RESULT
    WORKING_DIRECTORY "${XNNPACK_DEP_DOWNLOAD_DIR}")
  IF(NOT XNNPACK_DEP_RESULT EQUAL 0)
    MESSAGE(FATAL_ERROR "Failed to download ${XNNPACK_DEP_NAME} in ${XNNPACK_DEP_DOWNLOAD_DIR} (result: ${XNNPACK_DEP_RESULT})")
  ENDIF()

  SET(${XNNPACK_DEP_VAR} "${XNNPACK_DEP_SOURCE_DIR}" CACHE STRING "${XNNPACK_DEP_NAME} source directory")
ENDFUNCTION()

# Dependencies that are always fetched.
XNNPACK_DOWNLOAD_DEPENDENCY("clog" "clog" "DownloadCLog.cmake" CLOG_SOURCE_DIR)
XNNPACK_DOWNLOAD_DEPENDENCY("cpuinfo" "cpuinfo" "DownloadCpuinfo.cmake" CPUINFO_SOURCE_DIR)
XNNPACK_DOWNLOAD_DEPENDENCY("FP16" "FP16" "DownloadFP16.cmake" FP16_SOURCE_DIR)
XNNPACK_DOWNLOAD_DEPENDENCY("FXdiv" "FXdiv" "DownloadFXdiv.cmake" FXDIV_SOURCE_DIR)
XNNPACK_DOWNLOAD_DEPENDENCY("PSimd" "psimd" "DownloadPSimd.cmake" PSIMD_SOURCE_DIR)
XNNPACK_DOWNLOAD_DEPENDENCY("pthreadpool" "pthreadpool" "DownloadPThreadPool.cmake" PTHREADPOOL_SOURCE_DIR)

# Google Test is fetched only when the unit tests are built.
IF(XNNPACK_BUILD_TESTS)
  XNNPACK_DOWNLOAD_DEPENDENCY("Google Test" "googletest" "DownloadGoogleTest.cmake" GOOGLETEST_SOURCE_DIR)
ENDIF()

# Google Benchmark is fetched only when the benchmarks are built.
IF(XNNPACK_BUILD_BENCHMARKS)
  XNNPACK_DOWNLOAD_DEPENDENCY("Google Benchmark" "googlebenchmark" "DownloadGoogleBenchmark.cmake" GOOGLEBENCHMARK_SOURCE_DIR)
ENDIF()
131
132# ---[ XNNPACK library
# Operator implementations: one "src/<operator>.c" file per entry, in the
# order given below.
SET(XNNPACK_OPERATOR_SRCS "")
FOREACH(XNNPACK_OPERATOR_NAME
    add
    argmax-pooling
    average-pooling
    channel-pad
    channel-shuffle
    clamp
    convolution-spnchw
    convolution
    deconvolution
    fully-connected
    global-average-pooling-spnchw
    global-average-pooling
    hardswish
    leaky-relu
    max-pooling
    prelu
    sigmoid
    softargmax
    unpooling)
  LIST(APPEND XNNPACK_OPERATOR_SRCS "src/${XNNPACK_OPERATOR_NAME}.c")
ENDFOREACH()
# Do not leave the loop variable behind in the directory scope.
UNSET(XNNPACK_OPERATOR_NAME)
153
# Cold sources: every operator source followed by init and operator deletion.
SET(XNNPACK_COLD_SRCS ${XNNPACK_OPERATOR_SRCS} src/init.c src/operator-delete.c)
158
# Hot sources: indirection setup and operator execution.
SET(XNNPACK_HOT_SRCS src/indirection.c src/operator-run.c)
162
# Scalar micro-kernels, grouped by the data-type prefix of their directory.
# f32 kernels.
SET(XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/f32-argmaxpool/mp9p8q-scalar.c
  src/f32-argmaxpool/up4-scalar.c
  src/f32-argmaxpool/up9-scalar.c
  src/f32-avgpool/mp9p8q-scalar.c
  src/f32-avgpool/up9-scalar.c
  src/f32-bilinear/scalar-c1.c
  src/f32-bilinear/scalar-c2.c
  src/f32-bilinear/scalar-c4.c
  src/f32-clamp/scalar.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  src/f32-igemm/1x4-scalar.c
  src/f32-igemm/2x4-scalar.c
  src/f32-igemm/4x2-scalar.c
  src/f32-igemm/4x4-scalar.c
  src/f32-dwconv/up1x25-scalar.c
  src/f32-dwconv/up1x4-scalar.c
  src/f32-dwconv/up1x9-scalar.c
  src/f32-dwconv/up1x25-scalar-acc2.c
  src/f32-dwconv/up1x4-scalar-acc2.c
  src/f32-dwconv/up1x9-scalar-acc2.c
  src/f32-dwconv/up2x25-scalar.c
  src/f32-dwconv/up2x4-scalar.c
  src/f32-dwconv/up2x9-scalar.c
  src/f32-dwconv/up2x25-scalar-acc2.c
  src/f32-dwconv/up2x4-scalar-acc2.c
  src/f32-dwconv/up2x9-scalar-acc2.c
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/mp7p7q-scalar.c
  src/f32-gavgpool/up7-scalar.c
  src/f32-gemm/1x4-scalar.c
  src/f32-gemm/2x4-scalar.c
  src/f32-gemm/4x2-scalar.c
  src/f32-gemm/4x4-scalar.c
  src/f32-gemminc/1x4-scalar.c
  src/f32-gemminc/2x4-scalar.c
  src/f32-gemminc/4x4-scalar.c
  src/f32-hswish/scalar.c
  src/f32-maxpool/9p8q-scalar.c
  src/f32-pavgpool/mp9p8q-scalar.c
  src/f32-pavgpool/up9-scalar.c
  src/f32-ppmm/2x4-scalar.c
  src/f32-ppmm/3x3-scalar.c
  src/f32-ppmm/4x2-scalar.c
  src/f32-ppmm/4x4-scalar.c
  src/f32-prelu/scalar-2x1.c
  src/f32-prelu/scalar-2x4.c
  src/f32-rmax/scalar.c
  src/f32-spmm/1x1-scalar-pipelined.c
  src/f32-spmm/1x1-scalar.c
  src/f32-spmm/2x1-scalar-pipelined.c
  src/f32-spmm/2x1-scalar.c
  src/f32-spmm/4x1-scalar-pipelined.c
  src/f32-spmm/4x1-scalar.c
  src/f32-spmm/8x1-scalar-pipelined.c
  src/f32-spmm/8x1-scalar.c
  src/f32-spmm/8x2-scalar.c
  src/f32-spmm/8x4-scalar.c
  src/f32-vadd/scalar.c
  src/f32-vmul/scalar.c
  src/f32-vmulcaddc/c1-scalar-2x.c
  src/f32-vmulcaddc/c2-scalar-2x.c
  src/f32-vmulcaddc/c4-scalar-2x.c
  src/f32-vsub/scalar.c)
# q8 kernels.
LIST(APPEND XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/q8-avgpool/mp9p8q-scalar.c
  src/q8-avgpool/up9-scalar.c
  src/q8-igemm/2x2-scalar.c
  src/q8-dwconv/up1x9-scalar.c
  src/q8-gavgpool/mp7p7q-scalar.c
  src/q8-gavgpool/up7-scalar.c
  src/q8-gemm/2x2-scalar.c
  src/q8-vadd/scalar.c)
# u8 kernels.
LIST(APPEND XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/u8-clamp/scalar.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8q-scalar.c
  src/u8-rmax/scalar.c)
# x32 kernels.
LIST(APPEND XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c)
# x8 kernels.
LIST(APPEND XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c)
255
# psimd micro-kernels, grouped by the data-type prefix of their directory.
# f32 kernels.
SET(XNNPACK_PSIMD_MICROKERNEL_SRCS
  src/f32-argmaxpool/mp9p8q-psimd.c
  src/f32-argmaxpool/up4-psimd.c
  src/f32-argmaxpool/up9-psimd.c
  src/f32-avgpool/mp9p8q-psimd.c
  src/f32-avgpool/up9-psimd.c
  src/f32-bilinear/psimd-c4.c
  src/f32-bilinear/psimd-c8.c
  src/f32-clamp/psimd.c
  src/f32-igemm/1x8-psimd-loadsplat.c
  src/f32-igemm/1x8-psimd-splat.c
  src/f32-igemm/1x8s4-psimd.c
  src/f32-igemm/4x2c4-psimd.c
  src/f32-igemm/4x8-psimd-loadsplat.c
  src/f32-igemm/4x8-psimd-splat.c
  src/f32-igemm/4x8s4-psimd.c
  src/f32-igemm/6x8-psimd-loadsplat.c
  src/f32-igemm/6x8-psimd-splat.c
  src/f32-igemm/6x8s4-psimd.c
  src/f32-dwconv/up4x25-psimd.c
  src/f32-dwconv/up4x4-psimd.c
  src/f32-dwconv/up4x9-psimd.c
  src/f32-dwconv/up4x25-psimd-acc2.c
  src/f32-dwconv/up4x4-psimd-acc2.c
  src/f32-dwconv/up4x9-psimd-acc2.c
  src/f32-dwconv/up8x25-psimd.c
  src/f32-dwconv/up8x4-psimd.c
  src/f32-dwconv/up8x9-psimd.c
  src/f32-dwconv/up8x25-psimd-acc2.c
  src/f32-dwconv/up8x4-psimd-acc2.c
  src/f32-dwconv/up8x9-psimd-acc2.c
  src/f32-gavgpool/mp7p7q-psimd.c
  src/f32-gavgpool/up7-psimd.c
  src/f32-gemm/1x8-psimd-loadsplat.c
  src/f32-gemm/1x8-psimd-splat.c
  src/f32-gemm/1x8s4-psimd.c
  src/f32-gemm/4x8-psimd-loadsplat.c
  src/f32-gemm/4x8-psimd-splat.c
  src/f32-gemm/4x8s4-psimd.c
  src/f32-gemm/6x8-psimd-loadsplat.c
  src/f32-gemm/6x8-psimd-splat.c
  src/f32-gemm/6x8s4-psimd.c
  src/f32-gemminc/1x8-psimd-loadsplat.c
  src/f32-gemminc/1x8-psimd-splat.c
  src/f32-gemminc/1x8s4-psimd.c
  src/f32-gemminc/4x8-psimd-loadsplat.c
  src/f32-gemminc/4x8-psimd-splat.c
  src/f32-gemminc/4x8s4-psimd.c
  src/f32-gemminc/6x8-psimd-loadsplat.c
  src/f32-gemminc/6x8-psimd-splat.c
  src/f32-gemminc/6x8s4-psimd.c
  src/f32-hswish/psimd.c
  src/f32-maxpool/9p8q-psimd.c
  src/f32-pavgpool/mp9p8q-psimd.c
  src/f32-pavgpool/up9-psimd.c
  src/f32-ppmm/4x8-psimd.c
  src/f32-prelu/psimd-2x4.c
  src/f32-prelu/psimd-2x8.c
  src/f32-vadd/psimd.c
  src/f32-vmul/psimd.c
  src/f32-vmulcaddc/c4-psimd-2x.c
  src/f32-vmulcaddc/c8-psimd-2x.c
  src/f32-vsub/psimd.c)
# x32 kernels.
LIST(APPEND XNNPACK_PSIMD_MICROKERNEL_SRCS
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c)
326
# NEON micro-kernels, grouped by the data-type prefix of their directory.
# f32 kernels.
SET(XNNPACK_NEON_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-neon.c
  src/f32-avgpool/up9-neon.c
  src/f32-bilinear/neon-c4.c
  src/f32-bilinear/neon-c8.c
  src/f32-clamp/neon.c
  src/f32-igemm/1x8-neon-ld64.c
  src/f32-igemm/4x2-neon-ld64.c
  src/f32-igemm/4x4-neon-ld64.c
  src/f32-igemm/4x8-neon-ld128.c
  src/f32-igemm/4x8-neon-ld64.c
  src/f32-igemm/6x8-neon-ld64.c
  src/f32-dwconv/up4x9-neon.c
  src/f32-dwconv/up4x9-neon-acc2.c
  src/f32-dwconv/up8x9-neon.c
  src/f32-dwconv/up8x9-neon-acc2.c
  src/f32-gavgpool-spchw/neon-x4.c
  src/f32-gavgpool/mp7p7q-neon.c
  src/f32-gavgpool/up7-neon.c
  src/f32-gemm/1x8-neon-ld64.c
  src/f32-gemm/4x2-neon-ld64.c
  src/f32-gemm/4x8-neon-ld128.c
  src/f32-gemm/4x8-neon-ld64.c
  src/f32-gemm/5x8-neon-ld64.c
  src/f32-gemm/6x8-neon-ld64.c
  src/f32-gemminc/1x8-neon-ld64.c
  src/f32-gemminc/4x8-neon-ld128.c
  src/f32-gemminc/4x8-neon-ld64.c
  src/f32-gemminc/5x8-neon-ld64.c
  src/f32-gemminc/6x8-neon-ld64.c
  src/f32-hswish/neon.c
  src/f32-pavgpool/mp9p8q-neon.c
  src/f32-pavgpool/up9-neon.c
  src/f32-ppmm/4x8-neon.c
  src/f32-ppmm/8x8-neon.c
  src/f32-prelu/neon-2x4.c
  src/f32-prelu/neon-2x8.c
  src/f32-rmax/neon.c
  src/f32-vmulcaddc/c4-neon-2x.c
  src/f32-vmulcaddc/c8-neon-2x.c)
# q8 kernels.
LIST(APPEND XNNPACK_NEON_MICROKERNEL_SRCS
  src/q8-avgpool/mp9p8q-neon.c
  src/q8-avgpool/up9-neon.c
  src/q8-igemm/4x8-neon.c
  src/q8-igemm/8x8-neon.c
  src/q8-dwconv/up8x9-neon.c
  src/q8-gavgpool/mp7p7q-neon.c
  src/q8-gavgpool/up7-neon.c
  src/q8-gemm/4x8-neon.c
  src/q8-gemm/8x8-neon.c
  src/q8-vadd/neon.c)
# u8 kernels.
LIST(APPEND XNNPACK_NEON_MICROKERNEL_SRCS
  src/u8-clamp/neon.c
  src/u8-maxpool/9p8q-neon.c
  src/u8-rmax/neon.c)
# x32 kernels.
LIST(APPEND XNNPACK_NEON_MICROKERNEL_SRCS
  src/x32-packx/x4-neon-st4.c
  src/x32-pad/x2-neon.c
  src/x32-zip/x2-neon.c
  src/x32-zip/x3-neon.c
  src/x32-zip/x4-neon.c
  src/x32-zip/xm-neon.c)
# x8 kernels.
LIST(APPEND XNNPACK_NEON_MICROKERNEL_SRCS
  src/x8-zip/x2-neon.c
  src/x8-zip/x3-neon.c
  src/x8-zip/x4-neon.c
  src/x8-zip/xm-neon.c)
390
# NEON+FMA micro-kernels (all f32).
# Bilinear, indirect GEMM and depthwise convolution kernels.
SET(XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-bilinear/neonfma-c4.c
  src/f32-bilinear/neonfma-c8.c
  src/f32-igemm/1x8-neonfma-ld64.c
  src/f32-igemm/4x2-neonfma-ld64.c
  src/f32-igemm/4x4-neonfma-ld64.c
  src/f32-igemm/4x8-neonfma-ld128.c
  src/f32-igemm/4x8-neonfma-ld64.c
  src/f32-igemm/6x8-neonfma-ld64.c
  src/f32-dwconv/up4x9-neonfma.c
  src/f32-dwconv/up4x9-neonfma-acc2.c
  src/f32-dwconv/up8x9-neonfma.c
  src/f32-dwconv/up8x9-neonfma-acc2.c)
# GEMM and GEMMINC kernels.
LIST(APPEND XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-gemm/1x8-neonfma-ld64.c
  src/f32-gemm/4x2-neonfma-ld64.c
  src/f32-gemm/4x8-neonfma-ld128.c
  src/f32-gemm/4x8-neonfma-ld64.c
  src/f32-gemm/5x8-neonfma-ld64.c
  src/f32-gemm/6x8-neonfma-ld64.c
  src/f32-gemminc/1x8-neonfma-ld64.c
  src/f32-gemminc/4x8-neonfma-ld128.c
  src/f32-gemminc/4x8-neonfma-ld64.c
  src/f32-gemminc/5x8-neonfma-ld64.c
  src/f32-gemminc/6x8-neonfma-ld64.c)
# HSwish, PPMM and VMulCAddC kernels.
LIST(APPEND XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-hswish/neonfma.c
  src/f32-ppmm/4x8-neonfma.c
  src/f32-ppmm/8x8-neonfma.c
  src/f32-vmulcaddc/c4-neonfma-2x.c
  src/f32-vmulcaddc/c8-neonfma-2x.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700420
# NEON+FMA micro-kernels that are only added to AArch64 / arm64 builds.
# Convolution and depthwise-convolution kernels.
SET(AARCH64_XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c)
# SpMM kernels.
LIST(APPEND AARCH64_XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-spmm/12x1-neonfma.c
  src/f32-spmm/12x2-neonfma.c
  src/f32-spmm/12x4-neonfma.c
  src/f32-spmm/16x1-neonfma-pipelined.c
  src/f32-spmm/16x1-neonfma-unroll2.c
  src/f32-spmm/16x1-neonfma.c
  src/f32-spmm/16x2-neonfma.c
  src/f32-spmm/16x4-neonfma.c
  src/f32-spmm/4x1-neonfma-pipelined.c
  src/f32-spmm/4x1-neonfma-unroll2.c
  src/f32-spmm/4x1-neonfma.c
  src/f32-spmm/4x2-neonfma.c
  src/f32-spmm/4x4-neonfma.c
  src/f32-spmm/8x1-neonfma-pipelined.c
  src/f32-spmm/8x1-neonfma-unroll2.c
  src/f32-spmm/8x1-neonfma.c
  src/f32-spmm/8x2-neonfma.c
  src/f32-spmm/8x4-neonfma.c)
447
# f16 GEMM micro-kernels for AArch64 (neonfp16arith variants).
SET(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS "")
LIST(APPEND XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/4x8-neonfp16arith-ld64.c
  src/f16-gemm/6x8-neonfp16arith-ld64.c
  src/f16-gemm/8x8-neonfp16arith-ld64.c)
452
# SSE micro-kernels, grouped by the data-type prefix of their directory.
# f32 kernels.
SET(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-sse.c
  src/f32-avgpool/up9-sse.c
  src/f32-bilinear/sse-c4.c
  src/f32-bilinear/sse-c8.c
  src/f32-clamp/sse.c
  src/f32-igemm/1x8-sse-dup.c
  src/f32-igemm/1x8-sse-load1.c
  src/f32-igemm/1x8s4-sse.c
  src/f32-igemm/4x2c4-sse.c
  src/f32-igemm/4x8-sse-dup.c
  src/f32-igemm/4x8-sse-load1.c
  src/f32-igemm/4x8s4-sse.c
  src/f32-dwconv/up4x25-sse.c
  src/f32-dwconv/up4x4-sse.c
  src/f32-dwconv/up4x9-sse.c
  src/f32-dwconv/up4x25-sse-acc2.c
  src/f32-dwconv/up4x4-sse-acc2.c
  src/f32-dwconv/up4x9-sse-acc2.c
  src/f32-dwconv/up8x25-sse.c
  src/f32-dwconv/up8x4-sse.c
  src/f32-dwconv/up8x9-sse.c
  src/f32-dwconv/up8x25-sse-acc2.c
  src/f32-dwconv/up8x4-sse-acc2.c
  src/f32-dwconv/up8x9-sse-acc2.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/mp7p7q-sse.c
  src/f32-gavgpool/up7-sse.c
  src/f32-gemm/1x8-sse-dup.c
  src/f32-gemm/1x8-sse-load1.c
  src/f32-gemm/1x8s4-sse.c
  src/f32-gemm/4x8-sse-dup.c
  src/f32-gemm/4x8-sse-load1.c
  src/f32-gemm/4x8s4-sse.c
  src/f32-gemminc/1x8-sse-dup.c
  src/f32-gemminc/1x8-sse-load1.c
  src/f32-gemminc/1x8s4-sse.c
  src/f32-gemminc/4x8-sse-dup.c
  src/f32-gemminc/4x8-sse-load1.c
  src/f32-gemminc/4x8s4-sse.c
  src/f32-hswish/sse.c
  src/f32-maxpool/9p8q-sse.c
  src/f32-pavgpool/mp9p8q-sse.c
  src/f32-pavgpool/up9-sse.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-ppmm/4x8-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/4x1-sse.c
  src/f32-spmm/8x1-sse.c
  src/f32-vadd/sse.c
  src/f32-vmul/sse.c
  src/f32-vmulcaddc/c4-sse-2x.c
  src/f32-vmulcaddc/c8-sse-2x.c
  src/f32-vsub/sse.c)
# x32 kernels.
LIST(APPEND XNNPACK_SSE_MICROKERNEL_SRCS
  src/x32-packx/x4-sse.c)
509
# SSE2 micro-kernels, grouped by the data-type prefix of their directory.
# f32 kernels.
SET(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/mp9p8q-sse2.c
  src/f32-argmaxpool/up4-sse2.c
  src/f32-argmaxpool/up9-sse2.c
  src/f32-prelu/sse2-2x4.c
  src/f32-prelu/sse2-2x8.c)
# q8 kernels.
LIST(APPEND XNNPACK_SSE2_MICROKERNEL_SRCS
  src/q8-avgpool/mp9p8q-sse2.c
  src/q8-avgpool/up9-sse2.c
  src/q8-igemm/4x4c2-sse2.c
  src/q8-dwconv/up8x9-sse2.c
  src/q8-gavgpool/mp7p7q-sse2.c
  src/q8-gavgpool/up7-sse2.c
  src/q8-gemm/2x4c8-sse2.c
  src/q8-gemm/4x4c2-sse2.c
  src/q8-vadd/sse2.c)
# u8 kernels.
LIST(APPEND XNNPACK_SSE2_MICROKERNEL_SRCS
  src/u8-clamp/sse2.c
  src/u8-maxpool/9p8q-sse2.c
  src/u8-rmax/sse2.c)
# x32 kernels.
LIST(APPEND XNNPACK_SSE2_MICROKERNEL_SRCS
  src/x32-pad/x2-sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c)
# x8 kernels.
LIST(APPEND XNNPACK_SSE2_MICROKERNEL_SRCS
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c)
537
# SSE4.1 micro-kernels (f32 PReLU only).
SET(XNNPACK_SSE41_MICROKERNEL_SRCS "")
LIST(APPEND XNNPACK_SSE41_MICROKERNEL_SRCS
  src/f32-prelu/sse41-2x4.c
  src/f32-prelu/sse41-2x8.c)
541
# AVX micro-kernels.
SET(XNNPACK_AVX_MICROKERNEL_SRCS "")
LIST(APPEND XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-rmax/avx.c
  src/f32-vscale/avx-unroll32.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700545
# AVX2 micro-kernels.
# f32 kernels.
SET(XNNPACK_AVX2_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/avx2-p5-unroll64.c
  src/f32-raddextexp/avx2-p5-unroll64.c
  src/f32-raddstoreexpminusmax/avx2-p5-unroll64.c
  src/f32-vscaleexpminusmax/avx2-p5-unroll64.c
  src/f32-vscaleextexp/avx2-p5-unroll64.c)
# Sources under src/math.
LIST(APPEND XNNPACK_AVX2_MICROKERNEL_SRCS
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c)
Marat Dukhan6adff4e2019-10-14 18:32:07 -0700556
# AVX512F micro-kernels.
# f32 kernels.
SET(XNNPACK_AVX512F_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-raddextexp/avx512f-p5-scalef-unroll128.c
  src/f32-raddstoreexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-rmax/avx512f.c
  src/f32-vscale/avx512f-unroll64.c
  src/f32-vscaleexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-vscaleextexp/avx512f-p5-scalef-unroll128.c)
# Sources under src/math.
LIST(APPEND XNNPACK_AVX512F_MICROKERNEL_SRCS
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700569
# Assembly micro-kernels for 32-bit ARM.
SET(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS "")
LIST(APPEND XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  src/q8-dwconv/up8x9-aarch32-neon.S)
572
# Assembly micro-kernels for AArch64, grouped by kernel directory.
# f32 depthwise convolution.
SET(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-dwconv/up4x9-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-aarch64-neonfma.S)
# f32 GEMM.
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-gemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/6x8-aarch64-neonfma-ld64.S)
# f32 GEMMINC.
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-gemminc/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemminc/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemminc/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/4x8-aarch64-neonfma-ld128.S
  src/f32-gemminc/4x8-aarch64-neonfma-ld64.S
  src/f32-gemminc/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/6x8-aarch64-neonfma-ld128.S
  src/f32-gemminc/6x8-aarch64-neonfma-ld64.S)
# f32 indirect GEMM.
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-igemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a75.S)
621
# Assemble the micro-kernel sources for the target. The scalar kernels are
# always included; every other group is appended only when its condition holds.
SET(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS ${XNNPACK_PSIMD_MICROKERNEL_SRCS})
ENDIF()
# 32-bit ARM: NEON, NEON+FMA and the AArch32 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
ENDIF()
# 64-bit ARM: NEON, NEON+FMA, the AArch64-only NEON+FMA and FP16 kernels, and
# the AArch64 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${AARCH64_XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
ENDIF()
# x86 / x86-64: every SSE and AVX tier.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
ENDIF()
646
# Create the XNNPACK library target. XNNPACK_LIBRARY_TYPE selects the library
# keyword: "default" passes none, so CMake's own default library type applies.
IF(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  SET(XNNPACK_LIBRARY_KEYWORD "")
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  SET(XNNPACK_LIBRARY_KEYWORD SHARED)
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  SET(XNNPACK_LIBRARY_KEYWORD STATIC)
ELSE()
  MESSAGE(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
ENDIF()
ADD_LIBRARY(XNNPACK ${XNNPACK_LIBRARY_KEYWORD}
  ${XNNPACK_COLD_SRCS}
  ${XNNPACK_HOT_SRCS}
  ${XNNPACK_MICROKERNEL_SRCS})
# Compile the C sources as C99 with compiler extensions enabled.
SET_PROPERTY(TARGET XNNPACK PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET XNNPACK PROPERTY C_EXTENSIONS YES)
# Per-source compile flags for 32-bit ARM builds.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  # Every micro-kernel is compiled with -marm.
  SET_PROPERTY(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  # The psimd and NEON kernels get -mfpu=neon; the NEON+FMA kernels get
  # -mfpu=neon-vfpv4.
  SET_PROPERTY(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEON_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  IF(IOS)
    # On iOS the assembly kernels are given an explicit -arch flag. The list is
    # XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS; the previously referenced
    # XNNPACK_AARCH32_ASM_UKERNELS is never defined in this file, so the flag
    # was applied to no files.
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# Per-source compile flags for 64-bit ARM builds.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  # The f16 kernels are compiled with -march=armv8.2-a+fp16.
  SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  IF(IOS)
    # On iOS the assembly kernels are given an explicit -arch flag. The list is
    # XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS; the previously referenced
    # XNNPACK_AARCH64_ASM_UKERNELS is never defined in this file, so the flag
    # was applied to no files.
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# Per-source compile flags for x86 / x86-64 builds: each micro-kernel group is
# compiled with the instruction-set flag matching its list.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse4.1 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
ENDIF()
682IF(CMAKE_BUILD_TYPE STREQUAL "Debug")
683 TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=5)
684ELSE()
685 TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=0)
686 SET_PROPERTY(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
687 SET_PROPERTY(SOURCE ${XNNPACK_HOT_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
688 SET_PROPERTY(SOURCE ${XNNPACK_COLD_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -Os ")
689ENDIF()
690IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
691 SET_PROPERTY(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 -ffast-math ")
692ENDIF()
693
# include/ is exposed to consumers of XNNPACK; src/ is only used to build it.
TARGET_INCLUDE_DIRECTORIES(XNNPACK
  PUBLIC include
  PRIVATE src)
# Header that is installed through the PUBLIC_HEADER install rule.
SET_PROPERTY(TARGET XNNPACK PROPERTY PUBLIC_HEADER include/XNNPACK.h)
697
# ---[ Configure clog
# Add clog from source unless an enclosing project already provides the target.
IF(NOT TARGET clog)
  SET(CLOG_BUILD_TESTS OFF CACHE BOOL "")
  # NOTE(review): CPUINFO_RUNTIME_TYPE is not set in the visible part of this
  # file; confirm it is defined before this point.
  SET(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
  ADD_SUBDIRECTORY("${CLOG_SOURCE_DIR}/deps/clog" "${CMAKE_BINARY_DIR}/clog")
  # We build static version of clog but a dynamic library may indirectly depend on it
  SET_TARGET_PROPERTIES(clog PROPERTIES POSITION_INDEPENDENT_CODE ON)
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE clog)
709
# ---[ Configure cpuinfo
# Add cpuinfo from source (library only: tools, tests and benchmarks are
# switched off) unless an enclosing project already provides the target.
IF(NOT TARGET cpuinfo)
  SET(CPUINFO_BUILD_TOOLS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_UNIT_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_MOCK_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE cpuinfo)
721
# ---[ Configure pthreadpool
# Add pthreadpool from source unless an enclosing project already provides the
# target. It is linked PUBLIC, so it propagates to consumers of XNNPACK.
IF(NOT TARGET pthreadpool)
  SET(PTHREADPOOL_BUILD_TESTS OFF CACHE BOOL "")
  SET(PTHREADPOOL_BUILD_BENCHMARKS OFF CACHE BOOL "")
  SET(PTHREADPOOL_ALLOW_DEPRECATED_API OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PUBLIC pthreadpool)
732
# ---[ Configure FXdiv
# Add FXdiv from source (without its tests and benchmarks) unless an enclosing
# project already provides the target.
IF(NOT TARGET fxdiv)
  SET(FXDIV_BUILD_TESTS OFF CACHE BOOL "")
  SET(FXDIV_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fxdiv)
742
# ---[ Configure psimd
# Add psimd from source unless an enclosing project already provides the target.
IF(NOT TARGET psimd)
  ADD_SUBDIRECTORY("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE psimd)
750
# ---[ Configure FP16
# Add FP16 from source (without its tests and benchmarks) unless an enclosing
# project already provides the target.
IF(NOT TARGET fp16)
  SET(FP16_BUILD_TESTS OFF CACHE BOOL "")
  SET(FP16_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fp16)
760
# Install the XNNPACK library (shared or static) and its public header into
# the GNUInstallDirs locations.
INSTALL(
  TARGETS XNNPACK
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
765
# ---[ XNNPACK unit tests
# Every test <name> listed below is built from test/<name>.cc into an
# executable target <name>-test and registered with CTest under that same name.
# Generating the targets in a loop keeps the per-target settings identical;
# with hand-copied stanzas the properties of f32-vscaleextexp-test had
# accidentally been applied to f32-vscaleexpminusmax-test instead.
IF(XNNPACK_BUILD_TESTS)
  # ---[ Build google test
  IF(NOT TARGET gtest)
    SET(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
    ADD_SUBDIRECTORY(
      "${GOOGLETEST_SOURCE_DIR}"
      "${CMAKE_BINARY_DIR}/googletest")
  ENDIF()

  # ---[ Build operator-level unit tests
  # Strict C++11 (no compiler extensions); linked against XNNPACK and gtest.
  FOREACH(XNNPACK_TEST_NAME
      add
      argmax-pooling
      average-pooling
      channel-pad
      channel-shuffle
      clamp
      convolution
      convolution-spnchw
      deconvolution
      fully-connected
      global-average-pooling
      global-average-pooling-spnchw
      hardswish
      leaky-relu
      max-pooling
      prelu
      sigmoid
      softargmax
      unpooling)
    ADD_EXECUTABLE(${XNNPACK_TEST_NAME}-test test/${XNNPACK_TEST_NAME}.cc)
    SET_TARGET_PROPERTIES(${XNNPACK_TEST_NAME}-test PROPERTIES
      CXX_STANDARD 11
      CXX_STANDARD_REQUIRED YES
      CXX_EXTENSIONS NO)
    TARGET_INCLUDE_DIRECTORIES(${XNNPACK_TEST_NAME}-test PRIVATE src test)
    TARGET_LINK_LIBRARIES(${XNNPACK_TEST_NAME}-test PRIVATE XNNPACK gtest gtest_main)
    ADD_TEST(${XNNPACK_TEST_NAME}-test ${XNNPACK_TEST_NAME}-test)
  ENDFOREACH()

  # ---[ Build microkernel-level unit tests
  # C++11 with compiler extensions enabled; additionally linked against
  # cpuinfo and fp16.
  FOREACH(XNNPACK_TEST_NAME
      f16-gemm
      f32-argmaxpool
      f32-avgpool
      f32-bilinear
      f32-clamp
      f32-conv-hwc
      f32-conv-hwc2spchw
      f32-dwconv-spchw
      f32-dwconv
      f32-gavgpool-spchw
      f32-gavgpool
      f32-gemm
      f32-gemminc
      f32-hswish
      f32-igemm
      f32-maxpool
      f32-pavgpool
      f32-ppmm
      f32-prelu
      f32-raddexpminusmax
      f32-raddextexp
      f32-raddstoreexpminusmax
      f32-rmax
      f32-spmm
      f32-vadd
      f32-vmul
      f32-vmulcaddc
      f32-vscaleexpminusmax
      f32-vscaleextexp
      f32-vsub
      q8-avgpool
      q8-dwconv
      q8-gavgpool
      q8-gemm
      q8-igemm
      q8-vadd
      u8-clamp
      u8-lut32norm
      u8-maxpool
      u8-rmax
      x32-packx
      x32-pad
      x32-unpool
      x32-zip
      x8-lut
      x8-zip)
    ADD_EXECUTABLE(${XNNPACK_TEST_NAME}-test test/${XNNPACK_TEST_NAME}.cc)
    SET_TARGET_PROPERTIES(${XNNPACK_TEST_NAME}-test PROPERTIES
      CXX_STANDARD 11
      CXX_STANDARD_REQUIRED YES
      CXX_EXTENSIONS YES)
    TARGET_INCLUDE_DIRECTORIES(${XNNPACK_TEST_NAME}-test PRIVATE src test)
    TARGET_LINK_LIBRARIES(${XNNPACK_TEST_NAME}-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
    ADD_TEST(${XNNPACK_TEST_NAME}-test ${XNNPACK_TEST_NAME}-test)
  ENDFOREACH()
ENDIF()
1363
1364# ---[ XNNPACK microbenchmarks
1365IF(XNNPACK_BUILD_BENCHMARKS)
# ---[ Build google benchmark
# Add Google Benchmark from source (with its own tests disabled) unless an
# enclosing project already provides the target. The build tree lives under
# CMAKE_BINARY_DIR like every other bundled dependency; the previous
# CONFU_DEPENDENCIES_BINARY_DIR variable is not defined in the visible part of
# this file, which would make the path expand to "/googlebenchmark".
IF(NOT TARGET benchmark)
  SET(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
  ADD_SUBDIRECTORY(
    "${GOOGLEBENCHMARK_SOURCE_DIR}"
    "${CMAKE_BINARY_DIR}/googlebenchmark")
ENDIF()
1373
# Helper library (bench/utils.cc) that the benchmark executables link against.
ADD_LIBRARY(bench-utils bench/utils.cc)
TARGET_INCLUDE_DIRECTORIES(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(bench-utils PRIVATE benchmark cpuinfo)
# Strict C++11, no compiler extensions.
SET_TARGET_PROPERTIES(bench-utils PROPERTIES CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001381
# ---[ Build end-to-end microbenchmarks
# All three executables compile the MobileNet v1/v2 model definitions together
# with their own driver, as strict C++11 without compiler extensions.

# Whole-model benchmark; only needs the repository root on its include path.
ADD_EXECUTABLE(end2end-bench
  bench/end2end.cc
  models/mobilenet-v1.cc
  models/mobilenet-v2.cc)
TARGET_INCLUDE_DIRECTORIES(end2end-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(end2end-bench PRIVATE XNNPACK benchmark bench-utils)
SET_TARGET_PROPERTIES(end2end-bench PROPERTIES CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)

# DWCONV microkernel benchmark; additionally has src/ on its include path.
ADD_EXECUTABLE(f32-dwconv-e2e-bench
  bench/f32-dwconv-e2e.cc
  models/mobilenet-v1.cc
  models/mobilenet-v2.cc)
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
TARGET_LINK_LIBRARIES(f32-dwconv-e2e-bench PRIVATE XNNPACK benchmark bench-utils)
SET_TARGET_PROPERTIES(f32-dwconv-e2e-bench PROPERTIES CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)

# GEMM microkernel benchmark; additionally has src/ on its include path.
ADD_EXECUTABLE(f32-gemm-e2e-bench
  bench/f32-gemm-e2e.cc
  models/mobilenet-v1.cc
  models/mobilenet-v2.cc)
TARGET_INCLUDE_DIRECTORIES(f32-gemm-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
TARGET_LINK_LIBRARIES(f32-gemm-e2e-bench PRIVATE XNNPACK benchmark bench-utils)
SET_TARGET_PROPERTIES(f32-gemm-e2e-bench PROPERTIES CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhan5f18d262019-10-31 10:24:14 -07001406
# ---[ Build operator-level microbenchmarks
# All operator benchmarks share one configuration: for each <name> below, the
# executable <name>-bench is built from bench/<name>.cc as strict C++11
# (extensions off), sees the source root on its include path, and links
# XNNPACK, cpuinfo, benchmark and bench-utils. Targets are created in the
# order listed.
FOREACH(OPERATOR_BENCH IN ITEMS
    add
    average-pooling
    channel-shuffle
    convolution
    deconvolution
    global-average-pooling
    max-pooling
    prelu
    sigmoid
    softargmax)
  ADD_EXECUTABLE(${OPERATOR_BENCH}-bench bench/${OPERATOR_BENCH}.cc)
  SET_TARGET_PROPERTIES(${OPERATOR_BENCH}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${OPERATOR_BENCH}-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
  TARGET_LINK_LIBRARIES(${OPERATOR_BENCH}-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
ENDFOREACH()
1487
# ---[ Build microkernel-level microbenchmarks
# The benchmarks listed here share one configuration: for each <name>, the
# executable <name>-bench is built from bench/<name>.cc as C++11 with compiler
# extensions enabled, searches src and then the source root for headers, and
# links XNNPACK, cpuinfo, fp16, benchmark and bench-utils. Targets are created
# in the order listed.
FOREACH(UKERNEL_BENCH IN ITEMS
    f16-gemm
    f32-conv-hwc
    f32-dwconv-spchw
    f32-dwconv
    f32-gemm
    f32-igemm)
  ADD_EXECUTABLE(${UKERNEL_BENCH}-bench bench/${UKERNEL_BENCH}.cc)
  SET_TARGET_PROPERTIES(${UKERNEL_BENCH}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${UKERNEL_BENCH}-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
  TARGET_LINK_LIBRARIES(${UKERNEL_BENCH}-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
ENDFOREACH()
1542
# f32-im2col-gemm-bench compiles src/im2col.c directly into the executable
# alongside the C++ benchmark driver, so both C and C++ standards are set.
ADD_EXECUTABLE(f32-im2col-gemm-bench
  bench/f32-im2col-gemm.cc
  src/im2col.c)
# C sources: strict C99 (extensions off).
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_EXTENSIONS NO)
# C++ sources: C++11 with compiler extensions enabled.
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# src is searched before the source root.
TARGET_INCLUDE_DIRECTORIES(f32-im2col-gemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-im2col-gemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1554
# f32-rmax-bench: built from bench/f32-rmax.cc.
ADD_EXECUTABLE(f32-rmax-bench
  bench/f32-rmax.cc)
# C++11 with compiler extensions enabled.
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_EXTENSIONS YES)
# src is searched before the source root.
TARGET_INCLUDE_DIRECTORIES(f32-rmax-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-rmax-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1563
# f32-spmm-bench: built from bench/f32-spmm.cc.
ADD_EXECUTABLE(f32-spmm-bench
  bench/f32-spmm.cc)
# C++11 with compiler extensions enabled.
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_EXTENSIONS YES)
# src is searched before the source root.
TARGET_INCLUDE_DIRECTORIES(f32-spmm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-spmm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1572
# f32-softargmax-bench: built from bench/f32-softargmax.cc.
ADD_EXECUTABLE(f32-softargmax-bench
  bench/f32-softargmax.cc)
# C++11 with compiler extensions enabled.
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_EXTENSIONS YES)
# src is searched before the source root.
TARGET_INCLUDE_DIRECTORIES(f32-softargmax-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
# NOTE(review): cpuinfo is not listed here, while the neighbouring microkernel
# benchmarks link it directly - confirm the omission is intentional.
TARGET_LINK_LIBRARIES(f32-softargmax-bench
  PRIVATE
    XNNPACK
    fp16
    benchmark
    bench-utils)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07001581
# q8-gemm-bench: built from bench/q8-gemm.cc.
ADD_EXECUTABLE(q8-gemm-bench
  bench/q8-gemm.cc)
# C++11 with compiler extensions enabled.
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# src is searched before the source root.
TARGET_INCLUDE_DIRECTORIES(q8-gemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(q8-gemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1590ENDIF()