# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
8
cmake_minimum_required(VERSION 3.5 FATAL_ERROR)

# Supplies the CMAKE_INSTALL_* destination variables consumed by install().
include(GNUInstallDirs)

# ---[ Project and semantic versioning.
# C, C++ and assembly are all enabled: the source lists in this file contain
# .c and .S files, and the unit tests are .cc files.
project(XNNPACK C CXX ASM)
15
# ---[ Options.
# XNNPACK_LIBRARY_TYPE: "static" or "shared" force that kind of library;
# "default" passes no explicit kind to add_library().
set(XNNPACK_LIBRARY_TYPE "default" CACHE STRING "Type of library (shared, static, or default) to build")
set_property(CACHE XNNPACK_LIBRARY_TYPE PROPERTY STRINGS default static shared)
# Both switches default to ON; each also gates the download of its framework.
option(XNNPACK_BUILD_TESTS "Build XNNPACK unit tests" ON)
option(XNNPACK_BUILD_BENCHMARKS "Build XNNPACK benchmarks" ON)
21
# ---[ CMake options
# Test registration is only switched on when the unit tests are being built.
if(XNNPACK_BUILD_TESTS)
  enable_testing()
endif()
26
# ---[ Build flags
# Validate the target architecture. When CMAKE_SYSTEM_PROCESSOR is set it must
# name a recognized x86 or ARM processor. When it is empty, only iOS builds are
# accepted, and those must name exactly one recognized architecture in IOS_ARCH.
if(CMAKE_SYSTEM_PROCESSOR)
  if(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|armv[5-8].*|aarch64)$")
    message(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
  endif()
elseif(NOT IOS)
  message(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
else()
  # More than one entry in IOS_ARCH cannot be handled by this script.
  list(LENGTH IOS_ARCH IOS_ARCH_COUNT)
  if(IOS_ARCH_COUNT GREATER 1)
    message(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
      "Specify a single architecture in IOS_ARCH and re-configure. ")
  endif()
  if(NOT IOS_ARCH MATCHES "^(i386|x86_64|armv7.*|arm64.*)$")
    message(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
  endif()
endif()
44
# Validate the target operating system: only Darwin, Linux and Android pass.
if(CMAKE_SYSTEM_NAME)
  if(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android)$")
    message(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
  endif()
else()
  message(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
endif()
50
# ---[ Download deps
# clog: unless the caller defines CLOG_SOURCE_DIR, instantiate the helper
# project from cmake/DownloadCLog.cmake in the build tree, then configure and
# build it at configure time. CLOG_SOURCE_DIR is then cached as
# ${CMAKE_BINARY_DIR}/clog-source. Either step failing aborts configuration
# immediately instead of surfacing later as a missing source directory.
if(NOT DEFINED CLOG_SOURCE_DIR)
  message(STATUS "Downloading clog to ${CMAKE_BINARY_DIR}/clog-source (define CLOG_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadCLog.cmake "${CMAKE_BINARY_DIR}/clog-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE clog_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/clog-download")
  if(NOT clog_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the clog download project: ${clog_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE clog_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/clog-download")
  if(NOT clog_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the clog download project: ${clog_download_result}")
  endif()
  set(CLOG_SOURCE_DIR "${CMAKE_BINARY_DIR}/clog-source" CACHE STRING "clog source directory")
endif()
61
# cpuinfo: unless the caller defines CPUINFO_SOURCE_DIR, instantiate the helper
# project from cmake/DownloadCpuinfo.cmake, then configure and build it at
# configure time. Either step failing aborts configuration immediately.
if(NOT DEFINED CPUINFO_SOURCE_DIR)
  message(STATUS "Downloading cpuinfo to ${CMAKE_BINARY_DIR}/cpuinfo-source (define CPUINFO_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadCpuinfo.cmake "${CMAKE_BINARY_DIR}/cpuinfo-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE cpuinfo_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/cpuinfo-download")
  if(NOT cpuinfo_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the cpuinfo download project: ${cpuinfo_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE cpuinfo_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/cpuinfo-download")
  if(NOT cpuinfo_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the cpuinfo download project: ${cpuinfo_download_result}")
  endif()
  set(CPUINFO_SOURCE_DIR "${CMAKE_BINARY_DIR}/cpuinfo-source" CACHE STRING "cpuinfo source directory")
endif()
71
# FP16: unless the caller defines FP16_SOURCE_DIR, instantiate the helper
# project from cmake/DownloadFP16.cmake, then configure and build it at
# configure time. Either step failing aborts configuration immediately.
if(NOT DEFINED FP16_SOURCE_DIR)
  message(STATUS "Downloading FP16 to ${CMAKE_BINARY_DIR}/FP16-source (define FP16_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadFP16.cmake "${CMAKE_BINARY_DIR}/FP16-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE fp16_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/FP16-download")
  if(NOT fp16_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the FP16 download project: ${fp16_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE fp16_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/FP16-download")
  if(NOT fp16_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the FP16 download project: ${fp16_download_result}")
  endif()
  set(FP16_SOURCE_DIR "${CMAKE_BINARY_DIR}/FP16-source" CACHE STRING "FP16 source directory")
endif()
81
# FXdiv: unless the caller defines FXDIV_SOURCE_DIR, instantiate the helper
# project from cmake/DownloadFXdiv.cmake, then configure and build it at
# configure time. Either step failing aborts configuration immediately.
if(NOT DEFINED FXDIV_SOURCE_DIR)
  message(STATUS "Downloading FXdiv to ${CMAKE_BINARY_DIR}/FXdiv-source (define FXDIV_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadFXdiv.cmake "${CMAKE_BINARY_DIR}/FXdiv-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE fxdiv_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/FXdiv-download")
  if(NOT fxdiv_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the FXdiv download project: ${fxdiv_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE fxdiv_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/FXdiv-download")
  if(NOT fxdiv_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the FXdiv download project: ${fxdiv_download_result}")
  endif()
  set(FXDIV_SOURCE_DIR "${CMAKE_BINARY_DIR}/FXdiv-source" CACHE STRING "FXdiv source directory")
endif()
91
# PSimd: unless the caller defines PSIMD_SOURCE_DIR, instantiate the helper
# project from cmake/DownloadPSimd.cmake, then configure and build it at
# configure time. Either step failing aborts configuration immediately.
if(NOT DEFINED PSIMD_SOURCE_DIR)
  message(STATUS "Downloading PSimd to ${CMAKE_BINARY_DIR}/psimd-source (define PSIMD_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadPSimd.cmake "${CMAKE_BINARY_DIR}/psimd-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE psimd_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/psimd-download")
  if(NOT psimd_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the PSimd download project: ${psimd_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE psimd_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/psimd-download")
  if(NOT psimd_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the PSimd download project: ${psimd_download_result}")
  endif()
  set(PSIMD_SOURCE_DIR "${CMAKE_BINARY_DIR}/psimd-source" CACHE STRING "PSimd source directory")
endif()
101
# pthreadpool: unless the caller defines PTHREADPOOL_SOURCE_DIR, instantiate
# the helper project from cmake/DownloadPThreadPool.cmake, then configure and
# build it at configure time. Either step failing aborts configuration
# immediately.
if(NOT DEFINED PTHREADPOOL_SOURCE_DIR)
  message(STATUS "Downloading pthreadpool to ${CMAKE_BINARY_DIR}/pthreadpool-source (define PTHREADPOOL_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadPThreadPool.cmake "${CMAKE_BINARY_DIR}/pthreadpool-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE pthreadpool_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/pthreadpool-download")
  if(NOT pthreadpool_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the pthreadpool download project: ${pthreadpool_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE pthreadpool_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/pthreadpool-download")
  if(NOT pthreadpool_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the pthreadpool download project: ${pthreadpool_download_result}")
  endif()
  set(PTHREADPOOL_SOURCE_DIR "${CMAKE_BINARY_DIR}/pthreadpool-source" CACHE STRING "pthreadpool source directory")
endif()
111
# Google Test: only needed when unit tests are built. Unless the caller defines
# GOOGLETEST_SOURCE_DIR, instantiate the helper project from
# cmake/DownloadGoogleTest.cmake, then configure and build it at configure
# time. Either step failing aborts configuration immediately.
if(XNNPACK_BUILD_TESTS AND NOT DEFINED GOOGLETEST_SOURCE_DIR)
  message(STATUS "Downloading Google Test to ${CMAKE_BINARY_DIR}/googletest-source (define GOOGLETEST_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadGoogleTest.cmake "${CMAKE_BINARY_DIR}/googletest-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE googletest_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/googletest-download")
  if(NOT googletest_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the Google Test download project: ${googletest_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE googletest_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/googletest-download")
  if(NOT googletest_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the Google Test download project: ${googletest_download_result}")
  endif()
  set(GOOGLETEST_SOURCE_DIR "${CMAKE_BINARY_DIR}/googletest-source" CACHE STRING "Google Test source directory")
endif()
121
# Google Benchmark: only needed when benchmarks are built. Unless the caller
# defines GOOGLEBENCHMARK_SOURCE_DIR, instantiate the helper project from
# cmake/DownloadGoogleBenchmark.cmake, then configure and build it at configure
# time. Either step failing aborts configuration immediately.
if(XNNPACK_BUILD_BENCHMARKS AND NOT DEFINED GOOGLEBENCHMARK_SOURCE_DIR)
  message(STATUS "Downloading Google Benchmark to ${CMAKE_BINARY_DIR}/googlebenchmark-source (define GOOGLEBENCHMARK_SOURCE_DIR to avoid it)")
  configure_file(cmake/DownloadGoogleBenchmark.cmake "${CMAKE_BINARY_DIR}/googlebenchmark-download/CMakeLists.txt")
  execute_process(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE googlebenchmark_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/googlebenchmark-download")
  if(NOT googlebenchmark_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to configure the Google Benchmark download project: ${googlebenchmark_download_result}")
  endif()
  execute_process(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE googlebenchmark_download_result
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/googlebenchmark-download")
  if(NOT googlebenchmark_download_result EQUAL 0)
    message(FATAL_ERROR "Failed to build the Google Benchmark download project: ${googlebenchmark_download_result}")
  endif()
  set(GOOGLEBENCHMARK_SOURCE_DIR "${CMAKE_BINARY_DIR}/googlebenchmark-source" CACHE STRING "Google Benchmark source directory")
endif()
131
# ---[ XNNPACK library
# Operator sources; they are folded into XNNPACK_COLD_SRCS.
set(XNNPACK_OPERATOR_SRCS
  src/add.c
  src/argmax-pooling.c
  src/average-pooling.c
  src/channel-pad.c
  src/channel-shuffle.c
  src/clamp.c
  src/convolution-spnchw.c
  src/convolution.c
  src/deconvolution.c
  src/fully-connected.c
  src/global-average-pooling-spnchw.c
  src/global-average-pooling.c
  src/hardswish.c
  src/leaky-relu.c
  src/max-pooling.c
  src/prelu.c
  src/sigmoid.c
  src/softargmax.c
  src/unpooling.c
)
153
# Cold sources: every operator source plus init and operator deletion.
# Non-Debug builds compile these with -Os.
set(XNNPACK_COLD_SRCS
  ${XNNPACK_OPERATOR_SRCS}
  src/init.c
  src/operator-delete.c
)
158
# Hot sources: non-Debug builds compile these with -O2.
set(XNNPACK_HOT_SRCS
  src/indirection.c
  src/operator-run.c
)
162
# Scalar micro-kernels: the baseline that XNNPACK_MICROKERNEL_SRCS always starts from.
set(XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/f32-argmaxpool/mp9p8q-scalar.c
  src/f32-argmaxpool/up4-scalar.c
  src/f32-argmaxpool/up9-scalar.c
  src/f32-avgpool/mp9p8q-scalar.c
  src/f32-avgpool/up9-scalar.c
  src/f32-clamp/scalar.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  src/f32-igemm/1x4-scalar.c
  src/f32-igemm/2x4-scalar.c
  src/f32-igemm/4x2-scalar.c
  src/f32-igemm/4x4-scalar.c
  src/f32-dwconv/up1x25-scalar.c
  src/f32-dwconv/up1x4-scalar.c
  src/f32-dwconv/up1x9-scalar.c
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/mp7p7q-scalar.c
  src/f32-gavgpool/up7-scalar.c
  src/f32-gemm/1x4-scalar.c
  src/f32-gemm/2x4-scalar.c
  src/f32-gemm/4x2-scalar.c
  src/f32-gemm/4x4-scalar.c
  src/f32-gemminc/1x4-scalar.c
  src/f32-gemminc/2x4-scalar.c
  src/f32-gemminc/4x4-scalar.c
  src/f32-hswish/scalar.c
  src/f32-maxpool/9p8q-scalar.c
  src/f32-pavgpool/mp9p8q-scalar.c
  src/f32-pavgpool/up9-scalar.c
  src/f32-ppmm/2x4-scalar.c
  src/f32-ppmm/3x3-scalar.c
  src/f32-ppmm/4x2-scalar.c
  src/f32-ppmm/4x4-scalar.c
  src/f32-prelu/x4-scalar.c
  src/f32-rmax/scalar.c
  src/f32-spmm/1x1-scalar-pipelined.c
  src/f32-spmm/1x1-scalar.c
  src/f32-spmm/2x1-scalar-pipelined.c
  src/f32-spmm/2x1-scalar.c
  src/f32-spmm/4x1-scalar-pipelined.c
  src/f32-spmm/4x1-scalar.c
  src/f32-spmm/8x1-scalar-pipelined.c
  src/f32-spmm/8x1-scalar.c
  src/f32-spmm/8x2-scalar.c
  src/f32-spmm/8x4-scalar.c
  src/f32-vadd/scalar.c
  src/f32-vmul/scalar.c
  src/f32-vmulcaddc/c1-scalar-x2.c
  src/f32-vsub/scalar.c
  src/q8-avgpool/mp9p8q-scalar.c
  src/q8-avgpool/up9-scalar.c
  src/q8-igemm/2x2-scalar.c
  src/q8-dwconv/up1x9-scalar.c
  src/q8-gavgpool/mp7p7q-scalar.c
  src/q8-gavgpool/up7-scalar.c
  src/q8-gemm/2x2-scalar.c
  src/q8-vadd/scalar.c
  src/u8-clamp/scalar.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8q-scalar.c
  src/u8-rmax/scalar.c
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c
)
240
# psimd micro-kernels: added to the build on every non-Emscripten system.
set(XNNPACK_PSIMD_MICROKERNEL_SRCS
  src/f32-argmaxpool/mp9p8q-psimd.c
  src/f32-argmaxpool/up4-psimd.c
  src/f32-argmaxpool/up9-psimd.c
  src/f32-avgpool/mp9p8q-psimd.c
  src/f32-avgpool/up9-psimd.c
  src/f32-clamp/psimd.c
  src/f32-igemm/1x8-psimd-loadsplat.c
  src/f32-igemm/1x8-psimd-splat.c
  src/f32-igemm/1x8s4-psimd.c
  src/f32-igemm/4x2c4-psimd.c
  src/f32-igemm/4x8-psimd-loadsplat.c
  src/f32-igemm/4x8-psimd-splat.c
  src/f32-igemm/4x8s4-psimd.c
  src/f32-igemm/6x8-psimd-loadsplat.c
  src/f32-igemm/6x8-psimd-splat.c
  src/f32-igemm/6x8s4-psimd.c
  src/f32-dwconv/up4x25-psimd.c
  src/f32-dwconv/up4x4-psimd.c
  src/f32-dwconv/up4x9-psimd.c
  src/f32-gavgpool/mp7p7q-psimd.c
  src/f32-gavgpool/up7-psimd.c
  src/f32-gemm/1x8-psimd-loadsplat.c
  src/f32-gemm/1x8-psimd-splat.c
  src/f32-gemm/1x8s4-psimd.c
  src/f32-gemm/4x8-psimd-loadsplat.c
  src/f32-gemm/4x8-psimd-splat.c
  src/f32-gemm/4x8s4-psimd.c
  src/f32-gemm/6x8-psimd-loadsplat.c
  src/f32-gemm/6x8-psimd-splat.c
  src/f32-gemm/6x8s4-psimd.c
  src/f32-gemminc/1x8-psimd-loadsplat.c
  src/f32-gemminc/1x8-psimd-splat.c
  src/f32-gemminc/1x8s4-psimd.c
  src/f32-gemminc/4x8-psimd-loadsplat.c
  src/f32-gemminc/4x8-psimd-splat.c
  src/f32-gemminc/4x8s4-psimd.c
  src/f32-gemminc/6x8-psimd-loadsplat.c
  src/f32-gemminc/6x8-psimd-splat.c
  src/f32-gemminc/6x8s4-psimd.c
  src/f32-hswish/psimd.c
  src/f32-maxpool/9p8q-psimd.c
  src/f32-pavgpool/mp9p8q-psimd.c
  src/f32-pavgpool/up9-psimd.c
  src/f32-ppmm/4x8-psimd.c
  src/f32-prelu/x4-psimd.c
  src/f32-vadd/psimd.c
  src/f32-vmul/psimd.c
  src/f32-vmulcaddc/c4-psimd-x2.c
  src/f32-vsub/psimd.c
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c
)
298
# NEON micro-kernels: added for both 32-bit ARM and AArch64 targets.
set(XNNPACK_NEON_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-neon.c
  src/f32-avgpool/up9-neon.c
  src/f32-clamp/neon.c
  src/f32-igemm/1x8-neon-ld64.c
  src/f32-igemm/4x2-neon-ld64.c
  src/f32-igemm/4x4-neon-ld64.c
  src/f32-igemm/4x8-neon-ld128.c
  src/f32-igemm/4x8-neon-ld64.c
  src/f32-igemm/6x8-neon-ld64.c
  src/f32-dwconv/up4x9-neon.c
  src/f32-gavgpool-spchw/neon-x4.c
  src/f32-gavgpool/mp7p7q-neon.c
  src/f32-gavgpool/up7-neon.c
  src/f32-gemm/1x8-neon-ld64.c
  src/f32-gemm/4x2-neon-ld64.c
  src/f32-gemm/4x8-neon-ld128.c
  src/f32-gemm/4x8-neon-ld64.c
  src/f32-gemm/5x8-neon-ld64.c
  src/f32-gemm/6x8-neon-ld64.c
  src/f32-gemminc/1x8-neon-ld64.c
  src/f32-gemminc/4x8-neon-ld128.c
  src/f32-gemminc/4x8-neon-ld64.c
  src/f32-gemminc/5x8-neon-ld64.c
  src/f32-gemminc/6x8-neon-ld64.c
  src/f32-hswish/neon.c
  src/f32-pavgpool/mp9p8q-neon.c
  src/f32-pavgpool/up9-neon.c
  src/f32-ppmm/4x8-neon.c
  src/f32-ppmm/8x8-neon.c
  src/f32-rmax/neon.c
  src/f32-vmulcaddc/c4-neon-x2.c
  src/q8-avgpool/mp9p8q-neon.c
  src/q8-avgpool/up9-neon.c
  src/q8-igemm/4x8-neon.c
  src/q8-igemm/8x8-neon.c
  src/q8-dwconv/up8x9-neon.c
  src/q8-gavgpool/mp7p7q-neon.c
  src/q8-gavgpool/up7-neon.c
  src/q8-gemm/4x8-neon.c
  src/q8-gemm/8x8-neon.c
  src/q8-vadd/neon.c
  src/u8-clamp/neon.c
  src/u8-maxpool/9p8q-neon.c
  src/u8-rmax/neon.c
  src/x32-packx/x4-neon-st4.c
  src/x32-pad/x2-neon.c
  src/x32-zip/x2-neon.c
  src/x32-zip/x3-neon.c
  src/x32-zip/x4-neon.c
  src/x32-zip/xm-neon.c
  src/x8-zip/x2-neon.c
  src/x8-zip/x3-neon.c
  src/x8-zip/x4-neon.c
  src/x8-zip/xm-neon.c
)
354
# NEON+FMA micro-kernels: added for both 32-bit ARM and AArch64 targets.
# On 32-bit ARM they are compiled with -mfpu=neon-vfpv4.
set(XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-igemm/1x8-neonfma-ld64.c
  src/f32-igemm/4x2-neonfma-ld64.c
  src/f32-igemm/4x4-neonfma-ld64.c
  src/f32-igemm/4x8-neonfma-ld128.c
  src/f32-igemm/4x8-neonfma-ld64.c
  src/f32-igemm/6x8-neonfma-ld64.c
  src/f32-dwconv/up4x9-neonfma.c
  src/f32-dwconv/up8x9-neonfma.c
  src/f32-gemm/1x8-neonfma-ld64.c
  src/f32-gemm/4x2-neonfma-ld64.c
  src/f32-gemm/4x8-neonfma-ld128.c
  src/f32-gemm/4x8-neonfma-ld64.c
  src/f32-gemm/5x8-neonfma-ld64.c
  src/f32-gemm/6x8-neonfma-ld64.c
  src/f32-gemminc/1x8-neonfma-ld64.c
  src/f32-gemminc/4x8-neonfma-ld128.c
  src/f32-gemminc/4x8-neonfma-ld64.c
  src/f32-gemminc/5x8-neonfma-ld64.c
  src/f32-gemminc/6x8-neonfma-ld64.c
  src/f32-hswish/neonfma.c
  src/f32-ppmm/4x8-neonfma.c
  src/f32-ppmm/8x8-neonfma.c
  src/f32-vmulcaddc/c4-neonfma-x2.c
)
379
# NEON+FMA micro-kernels that are only added for AArch64 targets.
set(AARCH64_XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c
  src/f32-spmm/12x1-neonfma.c
  src/f32-spmm/12x2-neonfma.c
  src/f32-spmm/12x4-neonfma.c
  src/f32-spmm/16x1-neonfma-pipelined.c
  src/f32-spmm/16x1-neonfma-unroll2.c
  src/f32-spmm/16x1-neonfma.c
  src/f32-spmm/16x2-neonfma.c
  src/f32-spmm/16x4-neonfma.c
  src/f32-spmm/4x1-neonfma-pipelined.c
  src/f32-spmm/4x1-neonfma-unroll2.c
  src/f32-spmm/4x1-neonfma.c
  src/f32-spmm/4x2-neonfma.c
  src/f32-spmm/4x4-neonfma.c
  src/f32-spmm/8x1-neonfma-pipelined.c
  src/f32-spmm/8x1-neonfma-unroll2.c
  src/f32-spmm/8x1-neonfma.c
  src/f32-spmm/8x2-neonfma.c
  src/f32-spmm/8x4-neonfma.c
)
406
# Half-precision GEMM micro-kernels for AArch64; compiled with
# -march=armv8.2-a+fp16.
set(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/4x8-neonfp16arith-ld64.c
  src/f16-gemm/6x8-neonfp16arith-ld64.c
  src/f16-gemm/8x8-neonfp16arith-ld64.c
)
411
# SSE micro-kernels: added for x86 targets and compiled with -msse.
set(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-sse.c
  src/f32-avgpool/up9-sse.c
  src/f32-clamp/sse.c
  src/f32-igemm/1x8-sse-dup.c
  src/f32-igemm/1x8-sse-load1.c
  src/f32-igemm/1x8s4-sse.c
  src/f32-igemm/4x2c4-sse.c
  src/f32-igemm/4x8-sse-dup.c
  src/f32-igemm/4x8-sse-load1.c
  src/f32-igemm/4x8s4-sse.c
  src/f32-dwconv/up4x25-sse.c
  src/f32-dwconv/up4x4-sse.c
  src/f32-dwconv/up4x9-sse.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/mp7p7q-sse.c
  src/f32-gavgpool/up7-sse.c
  src/f32-gemm/1x8-sse-dup.c
  src/f32-gemm/1x8-sse-load1.c
  src/f32-gemm/1x8s4-sse.c
  src/f32-gemm/4x8-sse-dup.c
  src/f32-gemm/4x8-sse-load1.c
  src/f32-gemm/4x8s4-sse.c
  src/f32-gemminc/1x8-sse-dup.c
  src/f32-gemminc/1x8-sse-load1.c
  src/f32-gemminc/1x8s4-sse.c
  src/f32-gemminc/4x8-sse-dup.c
  src/f32-gemminc/4x8-sse-load1.c
  src/f32-gemminc/4x8s4-sse.c
  src/f32-hswish/sse.c
  src/f32-maxpool/9p8q-sse.c
  src/f32-pavgpool/mp9p8q-sse.c
  src/f32-pavgpool/up9-sse.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-ppmm/4x8-sse.c
  src/f32-prelu/x4-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/4x1-sse.c
  src/f32-spmm/8x1-sse.c
  src/f32-vadd/sse.c
  src/f32-vmul/sse.c
  src/f32-vmulcaddc/c4-sse-x2.c
  src/f32-vsub/sse.c
  src/x32-packx/x4-sse.c
)
457
# SSE2 micro-kernels: added for x86 targets and compiled with -msse2.
set(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/mp9p8q-sse2.c
  src/f32-argmaxpool/up4-sse2.c
  src/f32-argmaxpool/up9-sse2.c
  src/q8-avgpool/mp9p8q-sse2.c
  src/q8-avgpool/up9-sse2.c
  src/q8-igemm/4x4c2-sse2.c
  src/q8-dwconv/up8x9-sse2.c
  src/q8-gavgpool/mp7p7q-sse2.c
  src/q8-gavgpool/up7-sse2.c
  src/q8-gemm/2x4c8-sse2.c
  src/q8-gemm/4x4c2-sse2.c
  src/q8-vadd/sse2.c
  src/u8-clamp/sse2.c
  src/u8-maxpool/9p8q-sse2.c
  src/u8-rmax/sse2.c
  src/x32-pad/x2-sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c
)
483
# AVX micro-kernels: added for x86 targets and compiled with -mavx.
set(XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-rmax/avx.c
  src/f32-vscale/avx-unroll32.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700487
# AVX2 micro-kernels: added for x86 targets and compiled with -mfma -mavx2.
set(XNNPACK_AVX2_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/avx2-p5-unroll64.c
  src/f32-raddextexp/avx2-p5-unroll64.c
  src/f32-raddstoreexpminusmax/avx2-p5-unroll64.c
  src/f32-vscaleexpminusmax/avx2-p5-unroll64.c
  src/f32-vscaleextexp/avx2-p5-unroll64.c
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c
)
Marat Dukhan6adff4e2019-10-14 18:32:07 -0700498
# AVX512F micro-kernels: added for x86 targets and compiled with -mavx512f.
set(XNNPACK_AVX512F_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-raddextexp/avx512f-p5-scalef-unroll128.c
  src/f32-raddstoreexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-rmax/avx512f.c
  src/f32-vscale/avx512f-unroll64.c
  src/f32-vscaleexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-vscaleextexp/avx512f-p5-scalef-unroll128.c
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700511
# Assembly micro-kernels that are only added for 32-bit ARM targets.
set(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  src/q8-dwconv/up8x9-aarch32-neon.S
)
514
# Assembly micro-kernels that are only added for AArch64 targets.
set(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-dwconv/up4x9-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-aarch64-neonfma.S
  src/f32-gemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/6x8-aarch64-neonfma-ld64.S
  src/f32-gemminc/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemminc/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemminc/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/4x8-aarch64-neonfma-ld128.S
  src/f32-gemminc/4x8-aarch64-neonfma-ld64.S
  src/f32-gemminc/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemminc/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemminc/6x8-aarch64-neonfma-ld128.S
  src/f32-gemminc/6x8-aarch64-neonfma-ld64.S
  src/f32-igemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a75.S
)
563
# Assemble the micro-kernel sources for the target: the scalar kernels are
# always present, and each matching platform appends its own lists in order.
set(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})
if(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  list(APPEND XNNPACK_MICROKERNEL_SRCS ${XNNPACK_PSIMD_MICROKERNEL_SRCS})
endif()
# 32-bit ARM
if(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  list(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
endif()
# AArch64
if(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  list(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${AARCH64_XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
endif()
# x86 and x86-64
if(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  list(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
endif()
587
# Create the XNNPACK library target. XNNPACK_LIBRARY_TYPE is translated into
# the add_library() kind keyword; "default" passes no keyword at all, and any
# other unknown value is a configuration error.
if(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  set(xnnpack_library_kind "")
elseif(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  set(xnnpack_library_kind SHARED)
elseif(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  set(xnnpack_library_kind STATIC)
else()
  message(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
endif()
add_library(XNNPACK ${xnnpack_library_kind}
  ${XNNPACK_COLD_SRCS}
  ${XNNPACK_HOT_SRCS}
  ${XNNPACK_MICROKERNEL_SRCS})
# The library is built as C99 with compiler extensions enabled.
set_target_properties(XNNPACK PROPERTIES
  C_STANDARD 99
  C_EXTENSIONS YES)
# Per-source compiler flags for 32-bit ARM targets: every micro-kernel gets
# -marm, and each kernel family gets the -mfpu level it needs.
if(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  set_property(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  set_property(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  set_property(SOURCE ${XNNPACK_NEON_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  set_property(SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  if(IOS)
    # The assembly list is XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS; the previously
    # referenced *_ASM_UKERNELS variable is never defined, so the -arch flag
    # was applied to no files.
    set_property(SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  endif()
endif()
# Per-source compiler flags for AArch64 targets: the FP16 arithmetic kernels
# are compiled with -march=armv8.2-a+fp16.
if(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  set_property(SOURCE ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  if(IOS)
    # The assembly list is XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS; the previously
    # referenced *_ASM_UKERNELS variable is never defined, so the -arch flag
    # was applied to no files.
    set_property(SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  endif()
endif()
# Per-source compiler flags for x86 and x86-64 targets: each kernel family is
# compiled with the instruction-set flag matching its name.
if(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  set_property(
    SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
  set_property(
    SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
  set_property(
    SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
  set_property(
    SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
  set_property(
    SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
endif()
# Logging level and optimization flags by build type. Any build type other than
# "Debug" disables logging, compiles micro-kernels and hot sources with -O2,
# and compiles cold sources with -Os.
# NOTE(review): CMAKE_BUILD_TYPE is empty under multi-config generators, so
# such builds always take the non-Debug branch - confirm this is intended.
if(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
  target_compile_definitions(XNNPACK PRIVATE XNN_LOG_LEVEL=0)
  set_property(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  set_property(SOURCE ${XNNPACK_HOT_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  set_property(SOURCE ${XNNPACK_COLD_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -Os ")
else()
  target_compile_definitions(XNNPACK PRIVATE XNN_LOG_LEVEL=5)
endif()
# psimd kernels additionally get -O3 -ffast-math in every build type; the flags
# are appended after any -O2 set above.
if(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  set_property(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 -ffast-math ")
endif()
633
# include/ is exported to consumers of XNNPACK; src/ is visible only while
# building the library itself.
target_include_directories(XNNPACK
  PUBLIC include
  PRIVATE src)
# XNNPACK.h is the public header installed with the library.
set_target_properties(XNNPACK PROPERTIES
  PUBLIC_HEADER include/XNNPACK.h)
637
# ---[ Configure clog
# Add clog from ${CLOG_SOURCE_DIR}/deps/clog unless a clog target already
# exists, then link it privately into XNNPACK.
if(NOT TARGET clog)
  set(CLOG_BUILD_TESTS OFF CACHE BOOL "")
  # NOTE(review): CPUINFO_RUNTIME_TYPE is not set in the visible part of this
  # file - confirm where it is expected to come from.
  set(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
  add_subdirectory(
    "${CLOG_SOURCE_DIR}/deps/clog"
    "${CMAKE_BINARY_DIR}/clog")
  # We build static version of clog but a dynamic library may indirectly depend on it
  set_property(TARGET clog PROPERTY POSITION_INDEPENDENT_CODE ON)
endif()
target_link_libraries(XNNPACK PRIVATE clog)
649
# ---[ Configure cpuinfo
# Add cpuinfo with its tools, tests and benchmarks switched off unless a
# cpuinfo target already exists, then link it privately into XNNPACK.
if(NOT TARGET cpuinfo)
  set(CPUINFO_BUILD_TOOLS OFF CACHE BOOL "")
  set(CPUINFO_BUILD_UNIT_TESTS OFF CACHE BOOL "")
  set(CPUINFO_BUILD_MOCK_TESTS OFF CACHE BOOL "")
  set(CPUINFO_BUILD_BENCHMARKS OFF CACHE BOOL "")
  add_subdirectory("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
endif()
target_link_libraries(XNNPACK PRIVATE cpuinfo)
661
# ---[ Configure pthreadpool
# Add pthreadpool with its tests, benchmarks and deprecated API switched off
# unless a pthreadpool target already exists. It is linked PUBLIC, so targets
# that link XNNPACK also link pthreadpool.
if(NOT TARGET pthreadpool)
  set(PTHREADPOOL_BUILD_TESTS OFF CACHE BOOL "")
  set(PTHREADPOOL_BUILD_BENCHMARKS OFF CACHE BOOL "")
  set(PTHREADPOOL_ALLOW_DEPRECATED_API OFF CACHE BOOL "")
  add_subdirectory("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
endif()
target_link_libraries(XNNPACK PUBLIC pthreadpool)
672
# ---[ Configure FXdiv
# Add FXdiv with its tests and benchmarks switched off unless an fxdiv target
# already exists, then link it privately into XNNPACK.
if(NOT TARGET fxdiv)
  set(FXDIV_BUILD_TESTS OFF CACHE BOOL "")
  set(FXDIV_BUILD_BENCHMARKS OFF CACHE BOOL "")
  add_subdirectory("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
endif()
target_link_libraries(XNNPACK PRIVATE fxdiv)
682
# ---[ Configure psimd
# Add psimd unless a psimd target already exists, then link it privately into
# XNNPACK.
if(NOT TARGET psimd)
  add_subdirectory("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
endif()
target_link_libraries(XNNPACK PRIVATE psimd)
690
# ---[ Configure FP16
# Add FP16 with its tests and benchmarks switched off unless an fp16 target
# already exists, then link it privately into XNNPACK.
if(NOT TARGET fp16)
  set(FP16_BUILD_TESTS OFF CACHE BOOL "")
  set(FP16_BUILD_BENCHMARKS OFF CACHE BOOL "")
  add_subdirectory("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
endif()
target_link_libraries(XNNPACK PRIVATE fp16)
700
# Install the library (shared or static) and its public header into the
# directories supplied by GNUInstallDirs.
install(
  TARGETS XNNPACK
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
705
706# ---[ XNNPACK unit tests
707IF(XNNPACK_BUILD_TESTS)
# ---[ Build google test
# Add Google Test from GOOGLETEST_SOURCE_DIR unless a gtest target already
# exists. gtest_force_shared_crt is forced ON in the cache before the
# subdirectory is processed.
if(NOT TARGET gtest)
  set(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
  add_subdirectory("${GOOGLETEST_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/googletest")
endif()
715
# ---[ Build operator-level unit tests
# add-test: built from test/add.cc as strict C++11 (no extensions), with the
# private src/ and test/ directories on its include path.
add_executable(add-test test/add.cc)
set_target_properties(add-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
target_include_directories(add-test PRIVATE src test)
target_link_libraries(add-test PRIVATE XNNPACK gtest gtest_main)
# NAME/COMMAND signature: the command is resolved from the executable target
# rather than from a bare file name.
add_test(NAME add-test COMMAND add-test)
725
# argmax-pooling-test: built from test/argmax-pooling.cc as strict C++11 (no
# extensions), with the private src/ and test/ directories on its include path.
add_executable(argmax-pooling-test test/argmax-pooling.cc)
set_target_properties(argmax-pooling-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS NO)
target_include_directories(argmax-pooling-test PRIVATE src test)
target_link_libraries(argmax-pooling-test PRIVATE XNNPACK gtest gtest_main)
# NAME/COMMAND signature: the command is resolved from the executable target
# rather than from a bare file name.
add_test(NAME argmax-pooling-test COMMAND argmax-pooling-test)
734
735 ADD_EXECUTABLE(average-pooling-test test/average-pooling.cc)
736 SET_TARGET_PROPERTIES(average-pooling-test PROPERTIES
737 CXX_STANDARD 11
738 CXX_STANDARD_REQUIRED YES
739 CXX_EXTENSIONS NO)
740 TARGET_INCLUDE_DIRECTORIES(average-pooling-test PRIVATE src test)
741 TARGET_LINK_LIBRARIES(average-pooling-test PRIVATE XNNPACK gtest gtest_main)
742 ADD_TEST(average-pooling-test average-pooling-test)
743
744 ADD_EXECUTABLE(channel-pad-test test/channel-pad.cc)
745 SET_TARGET_PROPERTIES(channel-pad-test PROPERTIES
746 CXX_STANDARD 11
747 CXX_STANDARD_REQUIRED YES
748 CXX_EXTENSIONS NO)
749 TARGET_INCLUDE_DIRECTORIES(channel-pad-test PRIVATE src test)
750 TARGET_LINK_LIBRARIES(channel-pad-test PRIVATE XNNPACK gtest gtest_main)
751 ADD_TEST(channel-pad-test channel-pad-test)
752
753 ADD_EXECUTABLE(channel-shuffle-test test/channel-shuffle.cc)
754 SET_TARGET_PROPERTIES(channel-shuffle-test PROPERTIES
755 CXX_STANDARD 11
756 CXX_STANDARD_REQUIRED YES
757 CXX_EXTENSIONS NO)
758 TARGET_INCLUDE_DIRECTORIES(channel-shuffle-test PRIVATE src test)
759 TARGET_LINK_LIBRARIES(channel-shuffle-test PRIVATE XNNPACK gtest gtest_main)
760 ADD_TEST(channel-shuffle-test channel-shuffle-test)
761
762 ADD_EXECUTABLE(clamp-test test/clamp.cc)
763 SET_TARGET_PROPERTIES(clamp-test PROPERTIES
764 CXX_STANDARD 11
765 CXX_STANDARD_REQUIRED YES
766 CXX_EXTENSIONS NO)
767 TARGET_INCLUDE_DIRECTORIES(clamp-test PRIVATE src test)
768 TARGET_LINK_LIBRARIES(clamp-test PRIVATE XNNPACK gtest gtest_main)
769 ADD_TEST(clamp-test clamp-test)
770
771 ADD_EXECUTABLE(convolution-test test/convolution.cc)
772 SET_TARGET_PROPERTIES(convolution-test PROPERTIES
773 CXX_STANDARD 11
774 CXX_STANDARD_REQUIRED YES
775 CXX_EXTENSIONS NO)
776 TARGET_INCLUDE_DIRECTORIES(convolution-test PRIVATE src test)
777 TARGET_LINK_LIBRARIES(convolution-test PRIVATE XNNPACK gtest gtest_main)
778 ADD_TEST(convolution-test convolution-test)
779
780 ADD_EXECUTABLE(convolution-spnchw-test test/convolution-spnchw.cc)
781 SET_TARGET_PROPERTIES(convolution-spnchw-test PROPERTIES
782 CXX_STANDARD 11
783 CXX_STANDARD_REQUIRED YES
784 CXX_EXTENSIONS NO)
785 TARGET_INCLUDE_DIRECTORIES(convolution-spnchw-test PRIVATE src test)
786 TARGET_LINK_LIBRARIES(convolution-spnchw-test PRIVATE XNNPACK gtest gtest_main)
787 ADD_TEST(convolution-spnchw-test convolution-spnchw-test)
788
789 ADD_EXECUTABLE(deconvolution-test test/deconvolution.cc)
790 SET_TARGET_PROPERTIES(deconvolution-test PROPERTIES
791 CXX_STANDARD 11
792 CXX_STANDARD_REQUIRED YES
793 CXX_EXTENSIONS NO)
794 TARGET_INCLUDE_DIRECTORIES(deconvolution-test PRIVATE src test)
795 TARGET_LINK_LIBRARIES(deconvolution-test PRIVATE XNNPACK gtest gtest_main)
796 ADD_TEST(deconvolution-test deconvolution-test)
797
798 ADD_EXECUTABLE(fully-connected-test test/fully-connected.cc)
799 SET_TARGET_PROPERTIES(fully-connected-test PROPERTIES
800 CXX_STANDARD 11
801 CXX_STANDARD_REQUIRED YES
802 CXX_EXTENSIONS NO)
803 TARGET_INCLUDE_DIRECTORIES(fully-connected-test PRIVATE src test)
804 TARGET_LINK_LIBRARIES(fully-connected-test PRIVATE XNNPACK gtest gtest_main)
805 ADD_TEST(fully-connected-test fully-connected-test)
806
807 ADD_EXECUTABLE(global-average-pooling-test test/global-average-pooling.cc)
808 SET_TARGET_PROPERTIES(global-average-pooling-test PROPERTIES
809 CXX_STANDARD 11
810 CXX_STANDARD_REQUIRED YES
811 CXX_EXTENSIONS NO)
812 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-test PRIVATE src test)
813 TARGET_LINK_LIBRARIES(global-average-pooling-test PRIVATE XNNPACK gtest gtest_main)
814 ADD_TEST(global-average-pooling-test global-average-pooling-test)
815
816 ADD_EXECUTABLE(global-average-pooling-spnchw-test test/global-average-pooling-spnchw.cc)
817 SET_TARGET_PROPERTIES(global-average-pooling-spnchw-test PROPERTIES
818 CXX_STANDARD 11
819 CXX_STANDARD_REQUIRED YES
820 CXX_EXTENSIONS NO)
821 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-spnchw-test PRIVATE src test)
822 TARGET_LINK_LIBRARIES(global-average-pooling-spnchw-test PRIVATE XNNPACK gtest gtest_main)
823 ADD_TEST(global-average-pooling-spnchw-test global-average-pooling-spnchw-test)
824
825 ADD_EXECUTABLE(hardswish-test test/hardswish.cc)
826 SET_TARGET_PROPERTIES(hardswish-test PROPERTIES
827 CXX_STANDARD 11
828 CXX_STANDARD_REQUIRED YES
829 CXX_EXTENSIONS NO)
830 TARGET_INCLUDE_DIRECTORIES(hardswish-test PRIVATE src test)
831 TARGET_LINK_LIBRARIES(hardswish-test PRIVATE XNNPACK gtest gtest_main)
832 ADD_TEST(hardswish-test hardswish-test)
833
834 ADD_EXECUTABLE(leaky-relu-test test/leaky-relu.cc)
835 SET_TARGET_PROPERTIES(leaky-relu-test PROPERTIES
836 CXX_STANDARD 11
837 CXX_STANDARD_REQUIRED YES
838 CXX_EXTENSIONS NO)
839 TARGET_INCLUDE_DIRECTORIES(leaky-relu-test PRIVATE src test)
840 TARGET_LINK_LIBRARIES(leaky-relu-test PRIVATE XNNPACK gtest gtest_main)
841 ADD_TEST(leaky-relu-test leaky-relu-test)
842
843 ADD_EXECUTABLE(max-pooling-test test/max-pooling.cc)
844 SET_TARGET_PROPERTIES(max-pooling-test PROPERTIES
845 CXX_STANDARD 11
846 CXX_STANDARD_REQUIRED YES
847 CXX_EXTENSIONS NO)
848 TARGET_INCLUDE_DIRECTORIES(max-pooling-test PRIVATE src test)
849 TARGET_LINK_LIBRARIES(max-pooling-test PRIVATE XNNPACK gtest gtest_main)
850 ADD_TEST(max-pooling-test max-pooling-test)
851
852 ADD_EXECUTABLE(prelu-test test/prelu.cc)
853 SET_TARGET_PROPERTIES(prelu-test PROPERTIES
854 CXX_STANDARD 11
855 CXX_STANDARD_REQUIRED YES
856 CXX_EXTENSIONS NO)
857 TARGET_INCLUDE_DIRECTORIES(prelu-test PRIVATE src test)
858 TARGET_LINK_LIBRARIES(prelu-test PRIVATE XNNPACK gtest gtest_main)
859 ADD_TEST(prelu-test prelu-test)
860
861 ADD_EXECUTABLE(sigmoid-test test/sigmoid.cc)
862 SET_TARGET_PROPERTIES(sigmoid-test PROPERTIES
863 CXX_STANDARD 11
864 CXX_STANDARD_REQUIRED YES
865 CXX_EXTENSIONS NO)
866 TARGET_INCLUDE_DIRECTORIES(sigmoid-test PRIVATE src test)
867 TARGET_LINK_LIBRARIES(sigmoid-test PRIVATE XNNPACK gtest gtest_main)
868 ADD_TEST(sigmoid-test sigmoid-test)
869
870 ADD_EXECUTABLE(softargmax-test test/softargmax.cc)
871 SET_TARGET_PROPERTIES(softargmax-test PROPERTIES
872 CXX_STANDARD 11
873 CXX_STANDARD_REQUIRED YES
874 CXX_EXTENSIONS NO)
875 TARGET_INCLUDE_DIRECTORIES(softargmax-test PRIVATE src test)
876 TARGET_LINK_LIBRARIES(softargmax-test PRIVATE XNNPACK gtest gtest_main)
877 ADD_TEST(softargmax-test softargmax-test)
878
879 ADD_EXECUTABLE(unpooling-test test/unpooling.cc)
880 SET_TARGET_PROPERTIES(unpooling-test PROPERTIES
881 CXX_STANDARD 11
882 CXX_STANDARD_REQUIRED YES
883 CXX_EXTENSIONS NO)
884 TARGET_INCLUDE_DIRECTORIES(unpooling-test PRIVATE src test)
885 TARGET_LINK_LIBRARIES(unpooling-test PRIVATE XNNPACK gtest gtest_main)
886 ADD_TEST(unpooling-test unpooling-test)
887
# ---[ Build microkernel-level unit tests
# Every microkernel <name> listed below is compiled from test/<name>.cc into
# the executable <name>-test (C++11 with compiler extensions enabled), linked
# against XNNPACK, cpuinfo, fp16 and googletest, and registered with CTest
# under the target's name.
FOREACH(XNNPACK_UKERNEL_TEST IN ITEMS
    f16-gemm
    f32-argmaxpool
    f32-avgpool
    f32-clamp
    f32-conv-hwc
    f32-conv-hwc2spchw
    f32-dwconv-spchw
    f32-dwconv
    f32-gavgpool-spchw
    f32-gavgpool
    f32-gemm
    f32-gemminc
    f32-hswish
    f32-igemm
    f32-maxpool
    f32-pavgpool
    f32-ppmm
    f32-prelu
    f32-raddexpminusmax
    f32-raddextexp
    f32-raddstoreexpminusmax
    f32-rmax
    f32-spmm
    f32-vadd
    f32-vmul
    f32-vmulcaddc
    f32-vscaleexpminusmax)
  ADD_EXECUTABLE(${XNNPACK_UKERNEL_TEST}-test test/${XNNPACK_UKERNEL_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_UKERNEL_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_UKERNEL_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_UKERNEL_TEST}-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_UKERNEL_TEST}-test ${XNNPACK_UKERNEL_TEST}-test)
ENDFOREACH()
1131
# Unit test for the f32-vscaleextexp microkernel, built from
# test/f32-vscaleextexp.cc and registered with CTest under the target's name.
ADD_EXECUTABLE(f32-vscaleextexp-test test/f32-vscaleextexp.cc)
# The properties must be set on this target. Naming a different test target
# here would leave this one on the compiler's default C++ standard.
SET_TARGET_PROPERTIES(f32-vscaleextexp-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(f32-vscaleextexp-test PRIVATE src test)
TARGET_LINK_LIBRARIES(f32-vscaleextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
ADD_TEST(f32-vscaleextexp-test f32-vscaleextexp-test)
1140
# Remaining microkernel-level unit tests. Every microkernel <name> listed below
# is compiled from test/<name>.cc into the executable <name>-test (C++11 with
# compiler extensions enabled), linked against XNNPACK, cpuinfo, fp16 and
# googletest, and registered with CTest under the target's name.
FOREACH(XNNPACK_UKERNEL_TEST IN ITEMS
    f32-vsub
    q8-avgpool
    q8-dwconv
    q8-gavgpool
    q8-gemm
    q8-igemm
    q8-vadd
    u8-clamp
    u8-lut32norm
    u8-maxpool
    u8-rmax
    x32-packx
    x32-pad
    x32-unpool
    x32-zip
    x8-lut
    x8-zip)
  ADD_EXECUTABLE(${XNNPACK_UKERNEL_TEST}-test test/${XNNPACK_UKERNEL_TEST}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_UKERNEL_TEST}-test PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_UKERNEL_TEST}-test PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_UKERNEL_TEST}-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_UKERNEL_TEST}-test ${XNNPACK_UKERNEL_TEST}-test)
ENDFOREACH()
1293ENDIF()
1294
1295# ---[ XNNPACK microbenchmarks
1296IF(XNNPACK_BUILD_BENCHMARKS)
# ---[ Build google benchmark
# Add the Google Benchmark sources unless a `benchmark` target already exists.
IF(NOT TARGET benchmark)
  # Switch off the BENCHMARK_ENABLE_TESTING cache option before the
  # subproject is configured.
  SET(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
  # Place the build tree under CMAKE_BINARY_DIR, like the other bundled
  # dependencies. A variable that is unset would make this path expand to
  # "/googlebenchmark" at the filesystem root.
  ADD_SUBDIRECTORY(
    "${GOOGLEBENCHMARK_SOURCE_DIR}"
    "${CMAKE_BINARY_DIR}/googlebenchmark")
ENDIF()
1304
# Helper library built from bench/utils.cc; the benchmark executables in this
# file link against it. Compiled as strict C++11 without compiler extensions.
ADD_LIBRARY(bench-utils bench/utils.cc)
SET_PROPERTY(TARGET bench-utils PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET bench-utils PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET bench-utils PROPERTY CXX_EXTENSIONS NO)
# cpuinfo is linked PRIVATE, so it is not propagated to targets that link bench-utils.
TARGET_LINK_LIBRARIES(bench-utils PRIVATE cpuinfo)
TARGET_INCLUDE_DIRECTORIES(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
1312
# ---[ Build end-to-end microbenchmarks
# end2end-bench compiles bench/end2end.cc together with the MobileNet v1/v2
# model sources; only the project root is on its include path.
ADD_EXECUTABLE(end2end-bench
  bench/end2end.cc
  models/mobilenet-v1.cc
  models/mobilenet-v2.cc)
SET_PROPERTY(TARGET end2end-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET end2end-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET end2end-bench PROPERTY CXX_EXTENSIONS NO)
TARGET_INCLUDE_DIRECTORIES(end2end-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(end2end-bench PRIVATE XNNPACK benchmark bench-utils)

# The <name>-bench targets below compile bench/<name>.cc with the same model
# sources and additionally put `src` on the include path.
FOREACH(XNNPACK_E2E_BENCH IN ITEMS f32-dwconv-e2e f32-gemm-e2e)
  ADD_EXECUTABLE(${XNNPACK_E2E_BENCH}-bench
    bench/${XNNPACK_E2E_BENCH}.cc
    models/mobilenet-v1.cc
    models/mobilenet-v2.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_E2E_BENCH}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_E2E_BENCH}-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
  TARGET_LINK_LIBRARIES(${XNNPACK_E2E_BENCH}-bench PRIVATE XNNPACK benchmark bench-utils)
ENDFOREACH()
Marat Dukhan5f18d262019-10-31 10:24:14 -07001337
# ---[ Build operator-level microbenchmarks
# Every operator <name> listed below is compiled from bench/<name>.cc into the
# executable <name>-bench (strict C++11, no compiler extensions) with the
# project root on its include path, and linked against XNNPACK, cpuinfo,
# Google Benchmark and bench-utils.
FOREACH(XNNPACK_OPERATOR_BENCH IN ITEMS
    add
    average-pooling
    channel-shuffle
    convolution
    deconvolution
    global-average-pooling
    max-pooling
    prelu
    sigmoid
    softargmax)
  ADD_EXECUTABLE(${XNNPACK_OPERATOR_BENCH}-bench bench/${XNNPACK_OPERATOR_BENCH}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_OPERATOR_BENCH}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_OPERATOR_BENCH}-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
  TARGET_LINK_LIBRARIES(${XNNPACK_OPERATOR_BENCH}-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
ENDFOREACH()
1418
1419 # ---[ Build microkernel-level microbenchmarks
# Microkernel-level benchmark executable built from bench/f16-gemm.cc.
ADD_EXECUTABLE(f16-gemm-bench
  bench/f16-gemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f16-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f16-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f16-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f16-gemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f16-gemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1428
# Microkernel-level benchmark executable built from bench/f32-conv-hwc.cc.
ADD_EXECUTABLE(f32-conv-hwc-bench
  bench/f32-conv-hwc.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-conv-hwc-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-conv-hwc-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-conv-hwc-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-conv-hwc-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1437
# Microkernel-level benchmark executable built from bench/f32-dwconv-spchw.cc.
ADD_EXECUTABLE(f32-dwconv-spchw-bench
  bench/f32-dwconv-spchw.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-dwconv-spchw-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-dwconv-spchw-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-dwconv-spchw-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-dwconv-spchw-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1446
# Microkernel-level benchmark executable built from bench/f32-dwconv.cc.
ADD_EXECUTABLE(f32-dwconv-bench
  bench/f32-dwconv.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-dwconv-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-dwconv-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-dwconv-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-dwconv-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1455
# Microkernel-level benchmark executable built from bench/f32-gemm.cc.
ADD_EXECUTABLE(f32-gemm-bench
  bench/f32-gemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-gemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-gemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1464
# Microkernel-level benchmark executable built from bench/f32-igemm.cc.
ADD_EXECUTABLE(f32-igemm-bench
  bench/f32-igemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-igemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-igemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-igemm-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-igemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-igemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1473
# Microkernel-level benchmark executable; compiles the C++ benchmark driver
# together with the C source src/im2col.c.
ADD_EXECUTABLE(f32-im2col-gemm-bench
  bench/f32-im2col-gemm.cc
  src/im2col.c)
# C sources: require C99 with compiler-specific extensions disabled.
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_EXTENSIONS NO)
# C++ sources: require C++11; compiler-specific extensions stay enabled.
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-im2col-gemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-im2col-gemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1485
# Microkernel-level benchmark executable built from bench/f32-rmax.cc.
ADD_EXECUTABLE(f32-rmax-bench
  bench/f32-rmax.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-rmax-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-rmax-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1494
# Microkernel-level benchmark executable built from bench/f32-spmm.cc.
ADD_EXECUTABLE(f32-spmm-bench
  bench/f32-spmm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-spmm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-spmm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1503
# Microkernel-level benchmark executable built from bench/f32-softargmax.cc.
ADD_EXECUTABLE(f32-softargmax-bench
  bench/f32-softargmax.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(f32-softargmax-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
# Link cpuinfo explicitly, like every other benchmark target in this section,
# so this target does not rely on it arriving transitively through another
# dependency.
TARGET_LINK_LIBRARIES(f32-softargmax-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07001512
# Microkernel-level benchmark executable built from bench/q8-gemm.cc.
ADD_EXECUTABLE(q8-gemm-bench
  bench/q8-gemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Search src/ first, then the current source directory, for headers.
TARGET_INCLUDE_DIRECTORIES(q8-gemm-bench
  PRIVATE
    src
    "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(q8-gemm-bench
  PRIVATE
    XNNPACK
    cpuinfo
    fp16
    benchmark
    bench-utils)
1521ENDIF()