blob: b3a81a8201b0f9987699a54cea14de5fe8990cec [file] [log] [blame]
# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
8
# CMake 3.5 is the oldest release this build script accepts.
cmake_minimum_required(VERSION 3.5 FATAL_ERROR)

# ---[ Project and semantic versioning.
project(XNNPACK C CXX ASM)

# GNUInstallDirs picks the default CMAKE_INSTALL_LIBDIR from the target
# platform, so it must be included only after project() has enabled a language.
include(GNUInstallDirs)
15
# ---[ Options.
# XNNPACK_LIBRARY_TYPE: one of "default", "static" or "shared".
set(XNNPACK_LIBRARY_TYPE "default" CACHE STRING "Type of library (shared, static, or default) to build")
set_property(CACHE XNNPACK_LIBRARY_TYPE PROPERTY STRINGS default static shared)
# Both switches below are enabled unless the user turns them off.
option(XNNPACK_BUILD_TESTS "Build XNNPACK unit tests" ON)
option(XNNPACK_BUILD_BENCHMARKS "Build XNNPACK benchmarks" ON)

# ---[ CMake options
# Testing support is switched on only when the unit tests are requested.
if(XNNPACK_BUILD_TESTS)
  enable_testing()
endif()
26
# ---[ Build flags
# Validate the target processor. When CMAKE_SYSTEM_PROCESSOR is empty, only an
# iOS build with exactly one recognized entry in IOS_ARCH is accepted.
if(CMAKE_SYSTEM_PROCESSOR)
  if(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|armv[5-8].*|aarch64)$")
    message(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
  endif()
elseif(NOT IOS)
  message(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
else()
  list(LENGTH IOS_ARCH IOS_ARCH_COUNT)
  if(IOS_ARCH_COUNT GREATER 1)
    message(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
      "Specify a single architecture in IOS_ARCH and re-configure. ")
  endif()
  if(NOT IOS_ARCH MATCHES "^(i386|x86_64|armv7.*|arm64.*)$")
    message(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
  endif()
endif()

# Validate the target operating system: only Darwin, Linux and Android pass.
if(CMAKE_SYSTEM_NAME)
  if(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android)$")
    message(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
  endif()
else()
  message(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
endif()
50
# ---[ Download deps

# xnnpack_download_dependency(<display_name> <dir_prefix> <source_dir_var> <template>)
#
# Fetches one third-party dependency at configure time:
#   1. instantiates cmake/<template> as
#      ${CMAKE_BINARY_DIR}/<dir_prefix>-download/CMakeLists.txt,
#   2. configures that helper project with the current generator,
#   3. builds it,
#   4. caches ${CMAKE_BINARY_DIR}/<dir_prefix>-source in <source_dir_var>.
#
# Arguments:
#   display_name    - human-readable name used in messages and the cache help
#   dir_prefix      - prefix of the "-download" / "-source" directories
#   source_dir_var  - name of the cache variable that receives the source path
#   template        - file name of the download template inside cmake/
#
# Configuration stops with a FATAL_ERROR if either helper step exits with a
# non-zero status, instead of carrying on with a missing source directory.
#
# Example:
#   xnnpack_download_dependency("clog" "clog" CLOG_SOURCE_DIR "DownloadCLog.cmake")
function(xnnpack_download_dependency display_name dir_prefix source_dir_var template)
  set(xnnpack_dep_download_dir "${CMAKE_BINARY_DIR}/${dir_prefix}-download")
  set(xnnpack_dep_source_dir "${CMAKE_BINARY_DIR}/${dir_prefix}-source")

  message(STATUS "Downloading ${display_name} to ${xnnpack_dep_source_dir} (define ${source_dir_var} to avoid it)")
  configure_file("cmake/${template}" "${xnnpack_dep_download_dir}/CMakeLists.txt")

  execute_process(
    COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    WORKING_DIRECTORY "${xnnpack_dep_download_dir}"
    RESULT_VARIABLE xnnpack_dep_status)
  if(NOT xnnpack_dep_status EQUAL 0)
    message(FATAL_ERROR "Failed to configure the ${display_name} download project in ${xnnpack_dep_download_dir} (status: ${xnnpack_dep_status})")
  endif()

  execute_process(
    COMMAND "${CMAKE_COMMAND}" --build .
    WORKING_DIRECTORY "${xnnpack_dep_download_dir}"
    RESULT_VARIABLE xnnpack_dep_status)
  if(NOT xnnpack_dep_status EQUAL 0)
    message(FATAL_ERROR "Failed to download ${display_name} via ${xnnpack_dep_download_dir} (status: ${xnnpack_dep_status})")
  endif()

  set(${source_dir_var} "${xnnpack_dep_source_dir}" CACHE STRING "${display_name} source directory")
endfunction()

# Each dependency is downloaded only when its *_SOURCE_DIR variable has not
# been defined already.
if(NOT DEFINED CLOG_SOURCE_DIR)
  xnnpack_download_dependency("clog" "clog" CLOG_SOURCE_DIR "DownloadCLog.cmake")
endif()

if(NOT DEFINED CPUINFO_SOURCE_DIR)
  xnnpack_download_dependency("cpuinfo" "cpuinfo" CPUINFO_SOURCE_DIR "DownloadCpuinfo.cmake")
endif()

if(NOT DEFINED FP16_SOURCE_DIR)
  xnnpack_download_dependency("FP16" "FP16" FP16_SOURCE_DIR "DownloadFP16.cmake")
endif()

if(NOT DEFINED FXDIV_SOURCE_DIR)
  xnnpack_download_dependency("FXdiv" "FXdiv" FXDIV_SOURCE_DIR "DownloadFXdiv.cmake")
endif()

if(NOT DEFINED PSIMD_SOURCE_DIR)
  xnnpack_download_dependency("PSimd" "psimd" PSIMD_SOURCE_DIR "DownloadPSimd.cmake")
endif()

if(NOT DEFINED PTHREADPOOL_SOURCE_DIR)
  xnnpack_download_dependency("pthreadpool" "pthreadpool" PTHREADPOOL_SOURCE_DIR "DownloadPThreadPool.cmake")
endif()

# Google Test is needed only when the unit tests are built.
if(XNNPACK_BUILD_TESTS AND NOT DEFINED GOOGLETEST_SOURCE_DIR)
  xnnpack_download_dependency("Google Test" "googletest" GOOGLETEST_SOURCE_DIR "DownloadGoogleTest.cmake")
endif()

# Google Benchmark is needed only when the benchmarks are built.
if(XNNPACK_BUILD_BENCHMARKS AND NOT DEFINED GOOGLEBENCHMARK_SOURCE_DIR)
  xnnpack_download_dependency("Google Benchmark" "googlebenchmark" GOOGLEBENCHMARK_SOURCE_DIR "DownloadGoogleBenchmark.cmake")
endif()
131
# ---[ XNNPACK library
# Operator sources: one file per operator, located directly under src/.
set(XNNPACK_OPERATOR_SRCS
  src/add-nc.c
  src/argmax-pooling-nhwc.c
  src/average-pooling-nhwc.c
  src/channel-pad-nc.c
  src/channel-shuffle-nc.c
  src/clamp-nc.c
  src/convolution-nchw.c
  src/convolution-nhwc.c
  src/deconvolution-nhwc.c
  src/fully-connected-nc.c
  src/global-average-pooling-ncw.c
  src/global-average-pooling-nwc.c
  src/hardswish-nc.c
  src/leaky-relu-nc.c
  src/max-pooling-nhwc.c
  src/multiply-nd.c
  src/prelu-nc.c
  src/resize-bilinear-nhwc.c
  src/sigmoid-nc.c
  src/softargmax-nc.c
  src/unpooling-nhwc.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700155
# "Cold" sources: every operator source followed by three more files from src/.
set(XNNPACK_COLD_SRCS
  ${XNNPACK_OPERATOR_SRCS}
  src/init.c
  src/memory.c
  src/operator-delete.c
)
161
# "Hot" sources, kept in a list separate from XNNPACK_COLD_SRCS.
set(XNNPACK_HOT_SRCS
  src/indirection.c
  src/operator-run.c
)
165
# Micro-kernel sources whose file names carry the "scalar" tag.
set(XNNPACK_SCALAR_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-scalar-c1.c
  src/f32-argmaxpool/9p8x-scalar-c1.c
  src/f32-argmaxpool/9x-scalar-c1.c
  src/f32-avgpool/mp9p8q-scalar.c
  src/f32-avgpool/up9-scalar.c
  src/f32-bilinear/gen/scalar-c1.c
  src/f32-bilinear/gen/scalar-c2.c
  src/f32-bilinear/gen/scalar-c4.c
  src/f32-clamp/scalar.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-dwconv-spchw/5x5p2-scalar.c
  src/f32-dwconv-spchw/5x5s2p2-scalar.c
  src/f32-dwconv/gen/up1x25-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-scalar.c
  src/f32-dwconv/gen/up1x4-scalar-acc2.c
  src/f32-dwconv/gen/up1x4-scalar.c
  src/f32-dwconv/gen/up1x9-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-scalar.c
  src/f32-dwconv/gen/up2x25-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-scalar.c
  src/f32-dwconv/gen/up2x4-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-scalar.c
  src/f32-dwconv/gen/up2x9-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-scalar.c
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/mp7p7q-scalar.c
  src/f32-gavgpool/up7-scalar.c
  src/f32-gemm/gen/1x4-scalar.c
  src/f32-gemm/gen/2x4-scalar.c
  src/f32-gemm/gen/4x2-scalar.c
  src/f32-gemm/gen/4x4-scalar.c
  src/f32-gemm/gen-inc/1x4-scalar.c
  src/f32-gemm/gen-inc/2x4-scalar.c
  src/f32-gemm/gen-inc/4x4-scalar.c
  src/f32-hswish/scalar.c
  src/f32-igemm/gen/1x4-scalar.c
  src/f32-igemm/gen/2x4-scalar.c
  src/f32-igemm/gen/4x2-scalar.c
  src/f32-igemm/gen/4x4-scalar.c
  src/f32-maxpool/9p8x-scalar-c1.c
  src/f32-pavgpool/mp9p8q-scalar.c
  src/f32-pavgpool/up9-scalar.c
  src/f32-ppmm/gen/2x4-scalar.c
  src/f32-ppmm/gen/3x3-scalar.c
  src/f32-ppmm/gen/4x2-scalar.c
  src/f32-ppmm/gen/4x4-scalar.c
  src/f32-prelu/gen/scalar-2x1.c
  src/f32-prelu/gen/scalar-2x4.c
  src/f32-rmax/scalar.c
  src/f32-spmm/gen/1x1-scalar-pipelined.c
  src/f32-spmm/gen/1x1-scalar.c
  src/f32-spmm/gen/2x1-scalar-pipelined.c
  src/f32-spmm/gen/2x1-scalar.c
  src/f32-spmm/gen/4x1-scalar-pipelined.c
  src/f32-spmm/gen/4x1-scalar.c
  src/f32-spmm/gen/8x1-scalar-pipelined.c
  src/f32-spmm/gen/8x1-scalar.c
  src/f32-spmm/gen/8x2-scalar.c
  src/f32-spmm/gen/8x4-scalar.c
  src/f32-vbinary/gen/vadd-scalar-x1.c
  src/f32-vbinary/gen/vadd-scalar-x2.c
  src/f32-vbinary/gen/vadd-scalar-x4.c
  src/f32-vbinary/gen/vaddc-scalar-x1.c
  src/f32-vbinary/gen/vaddc-scalar-x2.c
  src/f32-vbinary/gen/vaddc-scalar-x4.c
  src/f32-vbinary/gen/vmul-scalar-x1.c
  src/f32-vbinary/gen/vmul-scalar-x2.c
  src/f32-vbinary/gen/vmul-scalar-x4.c
  src/f32-vbinary/gen/vmulc-scalar-x1.c
  src/f32-vbinary/gen/vmulc-scalar-x2.c
  src/f32-vbinary/gen/vmulc-scalar-x4.c
  src/f32-vbinary/gen/vrsubc-scalar-x1.c
  src/f32-vbinary/gen/vrsubc-scalar-x2.c
  src/f32-vbinary/gen/vrsubc-scalar-x4.c
  src/f32-vbinary/gen/vsub-scalar-x1.c
  src/f32-vbinary/gen/vsub-scalar-x2.c
  src/f32-vbinary/gen/vsub-scalar-x4.c
  src/f32-vbinary/gen/vsubc-scalar-x1.c
  src/f32-vbinary/gen/vsubc-scalar-x2.c
  src/f32-vbinary/gen/vsubc-scalar-x4.c
  src/f32-vmulcaddc/gen/c1-scalar-2x.c
  src/f32-vmulcaddc/gen/c2-scalar-2x.c
  src/f32-vmulcaddc/gen/c4-scalar-2x.c
  src/q8-avgpool/mp9p8q-scalar.c
  src/q8-avgpool/up9-scalar.c
  src/q8-dwconv/up1x9-scalar.c
  src/q8-gavgpool/mp7p7q-scalar.c
  src/q8-gavgpool/up7-scalar.c
  src/q8-gemm/2x2-scalar.c
  src/q8-igemm/2x2-scalar.c
  src/q8-vadd/scalar.c
  src/u8-clamp/scalar.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8x-scalar-c1.c
  src/u8-rmax/scalar.c
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c
)
278
# Micro-kernel sources whose file names carry the "psimd" tag.
set(XNNPACK_PSIMD_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-psimd-c4.c
  src/f32-argmaxpool/9p8x-psimd-c4.c
  src/f32-argmaxpool/9x-psimd-c4.c
  src/f32-avgpool/mp9p8q-psimd.c
  src/f32-avgpool/up9-psimd.c
  src/f32-bilinear/gen/psimd-c4.c
  src/f32-bilinear/gen/psimd-c8.c
  src/f32-clamp/psimd.c
  src/f32-dwconv/gen/up4x25-psimd-acc2.c
  src/f32-dwconv/gen/up4x25-psimd.c
  src/f32-dwconv/gen/up4x4-psimd-acc2.c
  src/f32-dwconv/gen/up4x4-psimd.c
  src/f32-dwconv/gen/up4x9-psimd-acc2.c
  src/f32-dwconv/gen/up4x9-psimd.c
  src/f32-dwconv/gen/up8x25-psimd-acc2.c
  src/f32-dwconv/gen/up8x25-psimd.c
  src/f32-dwconv/gen/up8x4-psimd-acc2.c
  src/f32-dwconv/gen/up8x4-psimd.c
  src/f32-dwconv/gen/up8x9-psimd-acc2.c
  src/f32-dwconv/gen/up8x9-psimd.c
  src/f32-gavgpool/mp7p7q-psimd.c
  src/f32-gavgpool/up7-psimd.c
  src/f32-gemm/gen/1x8-psimd-loadsplat.c
  src/f32-gemm/gen/1x8-psimd-splat.c
  src/f32-gemm/gen/1x8s4-psimd.c
  src/f32-gemm/gen/4x8-psimd-loadsplat.c
  src/f32-gemm/gen/4x8-psimd-splat.c
  src/f32-gemm/gen/4x8s4-psimd.c
  src/f32-gemm/gen/6x8-psimd-loadsplat.c
  src/f32-gemm/gen/6x8-psimd-splat.c
  src/f32-gemm/gen/6x8s4-psimd.c
  src/f32-gemm/gen-inc/1x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/1x8-psimd-splat.c
  src/f32-gemm/gen-inc/1x8s4-psimd.c
  src/f32-gemm/gen-inc/4x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/4x8-psimd-splat.c
  src/f32-gemm/gen-inc/4x8s4-psimd.c
  src/f32-gemm/gen-inc/6x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/6x8-psimd-splat.c
  src/f32-gemm/gen-inc/6x8s4-psimd.c
  src/f32-hswish/psimd.c
  src/f32-igemm/gen/1x8-psimd-loadsplat.c
  src/f32-igemm/gen/1x8-psimd-splat.c
  src/f32-igemm/gen/1x8s4-psimd.c
  src/f32-igemm/gen/4x2c4-psimd.c
  src/f32-igemm/gen/4x8-psimd-loadsplat.c
  src/f32-igemm/gen/4x8-psimd-splat.c
  src/f32-igemm/gen/4x8s4-psimd.c
  src/f32-igemm/gen/6x8-psimd-loadsplat.c
  src/f32-igemm/gen/6x8-psimd-splat.c
  src/f32-igemm/gen/6x8s4-psimd.c
  src/f32-maxpool/9p8x-psimd-c4.c
  src/f32-pavgpool/mp9p8q-psimd.c
  src/f32-pavgpool/up9-psimd.c
  src/f32-ppmm/gen/4x8-psimd.c
  src/f32-prelu/gen/psimd-2x4.c
  src/f32-prelu/gen/psimd-2x8.c
  src/f32-vbinary/gen/vadd-psimd-x4.c
  src/f32-vbinary/gen/vadd-psimd-x8.c
  src/f32-vbinary/gen/vaddc-psimd-x4.c
  src/f32-vbinary/gen/vaddc-psimd-x8.c
  src/f32-vbinary/gen/vmul-psimd-x4.c
  src/f32-vbinary/gen/vmul-psimd-x8.c
  src/f32-vbinary/gen/vmulc-psimd-x4.c
  src/f32-vbinary/gen/vmulc-psimd-x8.c
  src/f32-vbinary/gen/vrsubc-psimd-x4.c
  src/f32-vbinary/gen/vrsubc-psimd-x8.c
  src/f32-vbinary/gen/vsub-psimd-x4.c
  src/f32-vbinary/gen/vsub-psimd-x8.c
  src/f32-vbinary/gen/vsubc-psimd-x4.c
  src/f32-vbinary/gen/vsubc-psimd-x8.c
  src/f32-vmulcaddc/gen/c4-psimd-2x.c
  src/f32-vmulcaddc/gen/c8-psimd-2x.c
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c
)
360
# Micro-kernel sources whose file names carry the "neon" tag.
set(XNNPACK_NEON_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-neon.c
  src/f32-avgpool/up9-neon.c
  src/f32-bilinear/gen/neon-c4.c
  src/f32-bilinear/gen/neon-c8.c
  src/f32-clamp/neon.c
  src/f32-dwconv/gen/up4x9-neon.c
  src/f32-dwconv/gen/up4x9-neon-acc2.c
  src/f32-dwconv/gen/up8x9-neon.c
  src/f32-dwconv/gen/up8x9-neon-acc2.c
  src/f32-gavgpool-spchw/neon-x4.c
  src/f32-gavgpool/mp7p7q-neon.c
  src/f32-gavgpool/up7-neon.c
  src/f32-gemm/gen/1x8-neon-lane-ld64.c
  src/f32-gemm/gen/4x2-neon-lane-ld64.c
  src/f32-gemm/gen/4x8-neon-lane-ld128.c
  src/f32-gemm/gen/4x8-neon-lane-ld64.c
  src/f32-gemm/gen/5x8-neon-lane-ld64.c
  src/f32-gemm/gen/6x8-neon-lane-ld64.c
  src/f32-gemm/gen/6x8-neon-lane-ld128.c
  src/f32-gemm/gen/1x8-neon-dup-ld64.c
  src/f32-gemm/gen/4x8-neon-dup-ld128.c
  src/f32-gemm/gen/4x8-neon-dup-ld64.c
  src/f32-gemm/gen/6x8-neon-dup-ld64.c
  src/f32-gemm/gen/6x8-neon-dup-ld128.c
  src/f32-gemm/gen/1x8s4-neon.c
  src/f32-gemm/gen/4x8s4-neon.c
  src/f32-gemm/gen/6x8s4-neon.c
  src/f32-gemm/gen/8x8s4-neon.c
  src/f32-gemm/gen-inc/1x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/4x8-neon-lane-ld128.c
  src/f32-gemm/gen-inc/4x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/5x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-lane-ld128.c
  src/f32-gemm/gen-inc/1x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/4x8-neon-dup-ld128.c
  src/f32-gemm/gen-inc/4x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4-neon.c
  src/f32-gemm/gen-inc/4x8s4-neon.c
  src/f32-gemm/gen-inc/6x8s4-neon.c
  src/f32-gemm/gen-inc/8x8s4-neon.c
  src/f32-hswish/neon.c
  src/f32-igemm/gen/1x8-neon-lane-ld64.c
  src/f32-igemm/gen/4x2-neon-lane-ld64.c
  src/f32-igemm/gen/4x4-neon-lane-ld64.c
  src/f32-igemm/gen/4x8-neon-lane-ld128.c
  src/f32-igemm/gen/4x8-neon-lane-ld64.c
  src/f32-igemm/gen/6x8-neon-lane-ld64.c
  src/f32-igemm/gen/6x8-neon-lane-ld128.c
  src/f32-igemm/gen/1x8-neon-dup-ld64.c
  src/f32-igemm/gen/4x8-neon-dup-ld128.c
  src/f32-igemm/gen/4x8-neon-dup-ld64.c
  src/f32-igemm/gen/6x8-neon-dup-ld64.c
  src/f32-igemm/gen/6x8-neon-dup-ld128.c
  src/f32-igemm/gen/1x8s4-neon.c
  src/f32-igemm/gen/4x8s4-neon.c
  src/f32-igemm/gen/6x8s4-neon.c
  src/f32-igemm/gen/8x8s4-neon.c
  src/f32-pavgpool/mp9p8q-neon.c
  src/f32-pavgpool/up9-neon.c
  src/f32-ppmm/gen/4x8-neon.c
  src/f32-ppmm/gen/8x8-neon.c
  src/f32-prelu/gen/neon-2x4.c
  src/f32-prelu/gen/neon-2x8.c
  src/f32-rmax/neon.c
  src/f32-sigmoid/gen/neon-frac-p9-p10-nr1recps-x16.c
  src/f32-vbinary/gen/vadd-neon-x4.c
  src/f32-vbinary/gen/vadd-neon-x8.c
  src/f32-vbinary/gen/vaddc-neon-x4.c
  src/f32-vbinary/gen/vaddc-neon-x8.c
  src/f32-vbinary/gen/vmul-neon-x4.c
  src/f32-vbinary/gen/vmul-neon-x8.c
  src/f32-vbinary/gen/vmulc-neon-x4.c
  src/f32-vbinary/gen/vmulc-neon-x8.c
  src/f32-vbinary/gen/vrsubc-neon-x4.c
  src/f32-vbinary/gen/vrsubc-neon-x8.c
  src/f32-vbinary/gen/vsub-neon-x4.c
  src/f32-vbinary/gen/vsub-neon-x8.c
  src/f32-vbinary/gen/vsubc-neon-x4.c
  src/f32-vbinary/gen/vsubc-neon-x8.c
  src/f32-vmulcaddc/gen/c4-neon-2x.c
  src/f32-vmulcaddc/gen/c8-neon-2x.c
  src/q8-avgpool/mp9p8q-neon.c
  src/q8-avgpool/up9-neon.c
  src/q8-dwconv/up8x9-neon.c
  src/q8-gavgpool/mp7p7q-neon.c
  src/q8-gavgpool/up7-neon.c
  src/q8-gemm/4x8-neon.c
  src/q8-gemm/8x8-neon.c
  src/q8-igemm/4x8-neon.c
  src/q8-igemm/8x8-neon.c
  src/q8-vadd/neon.c
  src/u8-clamp/neon.c
  src/u8-maxpool/9p8x-neon-c16.c
  src/u8-rmax/neon.c
  src/x32-packx/x4-neon-st4.c
  src/x32-pad/x2-neon.c
  src/x32-zip/x2-neon.c
  src/x32-zip/x3-neon.c
  src/x32-zip/x4-neon.c
  src/x32-zip/xm-neon.c
  src/x8-zip/x2-neon.c
  src/x8-zip/x3-neon.c
  src/x8-zip/x4-neon.c
  src/x8-zip/xm-neon.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700469
# Micro-kernel and math sources whose file names carry the "neonfma" tag.
set(XNNPACK_NEONFMA_MICROKERNEL_SRCS
  src/f32-bilinear/gen/neonfma-c4.c
  src/f32-bilinear/gen/neonfma-c8.c
  src/f32-igemm/gen/1x8-neonfma-dup-ld64.c
  src/f32-igemm/gen/4x8-neonfma-dup-ld128.c
  src/f32-igemm/gen/4x8-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-neonfma-dup-ld64.c
  src/f32-igemm/gen/6x8-neonfma-dup-ld128.c
  src/f32-igemm/gen/1x8s4-neonfma.c
  src/f32-igemm/gen/4x8s4-neonfma.c
  src/f32-igemm/gen/6x8s4-neonfma.c
  src/f32-igemm/gen/8x8s4-neonfma.c
  src/f32-dwconv/gen/up4x9-neonfma.c
  src/f32-dwconv/gen/up4x9-neonfma-acc2.c
  src/f32-dwconv/gen/up8x9-neonfma.c
  src/f32-dwconv/gen/up8x9-neonfma-acc2.c
  src/f32-gemm/gen/1x8-neonfma-dup-ld64.c
  src/f32-gemm/gen/4x8-neonfma-dup-ld128.c
  src/f32-gemm/gen/4x8-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-neonfma-dup-ld64.c
  src/f32-gemm/gen/6x8-neonfma-dup-ld128.c
  src/f32-gemm/gen/1x8s4-neonfma.c
  src/f32-gemm/gen/4x8s4-neonfma.c
  src/f32-gemm/gen/6x8s4-neonfma.c
  src/f32-gemm/gen/8x8s4-neonfma.c
  src/f32-gemm/gen-inc/1x8-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/4x8-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/4x8-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4-neonfma.c
  src/f32-gemm/gen-inc/4x8s4-neonfma.c
  src/f32-gemm/gen-inc/6x8s4-neonfma.c
  src/f32-gemm/gen-inc/8x8s4-neonfma.c
  src/f32-hswish/neonfma.c
  src/f32-ppmm/gen/4x8-neonfma.c
  src/f32-ppmm/gen/8x8-neonfma.c
  src/f32-sigmoid/gen/neonfma-p5-nr2fma-x16.c
  src/f32-vmulcaddc/gen/c4-neonfma-2x.c
  src/f32-vmulcaddc/gen/c8-neonfma-2x.c
  src/math/exp-neonfma-lut2048-p1.c
  src/math/exp-neonfma-lut64-p2.c
  src/math/exp-neonfma-p5.c
  src/math/expminus-neonfma-lut64-p2.c
  src/math/expminus-neonfma-p5.c
  src/math/sigmoid-neonfma-lut2048-p1-nr1recps1fma.c
  src/math/sigmoid-neonfma-lut2048-p1-nr2fma.c
  src/math/sigmoid-neonfma-lut2048-p1-nr2recps.c
  src/math/sigmoid-neonfma-p5-nr1recps1fma.c
  src/math/sigmoid-neonfma-p5-nr2fma.c
  src/math/sigmoid-neonfma-p5-nr2recps.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700521
# "neonfma" sources kept in a separate list whose name is prefixed AARCH64.
set(XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS
  src/f32-gemm/gen/1x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x2-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x8-neonfma-lane-ld128.c
  src/f32-gemm/gen/4x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/5x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/1x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/4x8-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/4x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/5x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-lane-ld128.c
  src/f32-igemm/gen/1x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x2-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x4-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x8-neonfma-lane-ld128.c
  src/f32-igemm/gen/4x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-neonfma-lane-ld128.c
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c
  src/f32-spmm/gen/12x1-neonfma.c
  src/f32-spmm/gen/12x2-neonfma.c
  src/f32-spmm/gen/12x4-neonfma.c
  src/f32-spmm/gen/16x1-neonfma-pipelined.c
  src/f32-spmm/gen/16x1-neonfma-unroll2.c
  src/f32-spmm/gen/16x1-neonfma.c
  src/f32-spmm/gen/16x2-neonfma.c
  src/f32-spmm/gen/16x4-neonfma.c
  src/f32-spmm/gen/4x1-neonfma-pipelined.c
  src/f32-spmm/gen/4x1-neonfma-unroll2.c
  src/f32-spmm/gen/4x1-neonfma.c
  src/f32-spmm/gen/4x2-neonfma.c
  src/f32-spmm/gen/4x4-neonfma.c
  src/f32-spmm/gen/8x1-neonfma-pipelined.c
  src/f32-spmm/gen/8x1-neonfma-unroll2.c
  src/f32-spmm/gen/8x1-neonfma.c
  src/f32-spmm/gen/8x2-neonfma.c
  src/f32-spmm/gen/8x4-neonfma.c
  src/math/sigmoid-neonfma-lut2048-p1-div.c
  src/math/sigmoid-neonfma-p5-div.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700570
# f16 GEMM micro-kernel sources whose file names carry the "neonfp16arith" tag.
set(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/gen/4x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/6x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/8x8-neonfp16arith-ld64.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700575
# Micro-kernel sources whose file names carry the "sse" tag.
set(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-sse.c
  src/f32-avgpool/up9-sse.c
  src/f32-bilinear/gen/sse-c4.c
  src/f32-bilinear/gen/sse-c8.c
  src/f32-clamp/sse.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-dwconv/gen/up4x25-sse-acc2.c
  src/f32-dwconv/gen/up4x25-sse.c
  src/f32-dwconv/gen/up4x4-sse-acc2.c
  src/f32-dwconv/gen/up4x4-sse.c
  src/f32-dwconv/gen/up4x9-sse-acc2.c
  src/f32-dwconv/gen/up4x9-sse.c
  src/f32-dwconv/gen/up8x25-sse-acc2.c
  src/f32-dwconv/gen/up8x25-sse.c
  src/f32-dwconv/gen/up8x4-sse-acc2.c
  src/f32-dwconv/gen/up8x4-sse.c
  src/f32-dwconv/gen/up8x9-sse-acc2.c
  src/f32-dwconv/gen/up8x9-sse.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/mp7p7q-sse.c
  src/f32-gavgpool/up7-sse.c
  src/f32-gemm/gen/1x8-sse-dup.c
  src/f32-gemm/gen/1x8-sse-load1.c
  src/f32-gemm/gen/1x8s4-sse.c
  src/f32-gemm/gen/4x8-sse-dup.c
  src/f32-gemm/gen/4x8-sse-load1.c
  src/f32-gemm/gen/4x8s4-sse.c
  src/f32-gemm/gen-inc/1x8-sse-dup.c
  src/f32-gemm/gen-inc/1x8-sse-load1.c
  src/f32-gemm/gen-inc/1x8s4-sse.c
  src/f32-gemm/gen-inc/4x8-sse-dup.c
  src/f32-gemm/gen-inc/4x8-sse-load1.c
  src/f32-gemm/gen-inc/4x8s4-sse.c
  src/f32-hswish/sse.c
  src/f32-igemm/gen/1x8-sse-dup.c
  src/f32-igemm/gen/1x8-sse-load1.c
  src/f32-igemm/gen/1x8s4-sse.c
  src/f32-igemm/gen/4x2c4-sse.c
  src/f32-igemm/gen/4x8-sse-dup.c
  src/f32-igemm/gen/4x8-sse-load1.c
  src/f32-igemm/gen/4x8s4-sse.c
  src/f32-maxpool/9p8x-sse-c4.c
  src/f32-pavgpool/mp9p8q-sse.c
  src/f32-pavgpool/up9-sse.c
  src/f32-ppmm/gen/4x8-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/gen/4x1-sse.c
  src/f32-spmm/gen/8x1-sse.c
  src/f32-vbinary/gen/vadd-sse-x4.c
  src/f32-vbinary/gen/vadd-sse-x8.c
  src/f32-vbinary/gen/vaddc-sse-x4.c
  src/f32-vbinary/gen/vaddc-sse-x8.c
  src/f32-vbinary/gen/vmul-sse-x4.c
  src/f32-vbinary/gen/vmul-sse-x8.c
  src/f32-vbinary/gen/vmulc-sse-x4.c
  src/f32-vbinary/gen/vmulc-sse-x8.c
  src/f32-vbinary/gen/vrsubc-sse-x4.c
  src/f32-vbinary/gen/vrsubc-sse-x8.c
  src/f32-vbinary/gen/vsub-sse-x4.c
  src/f32-vbinary/gen/vsub-sse-x8.c
  src/f32-vbinary/gen/vsubc-sse-x4.c
  src/f32-vbinary/gen/vsubc-sse-x8.c
  src/f32-vmulcaddc/gen/c4-sse-2x.c
  src/f32-vmulcaddc/gen/c8-sse-2x.c
  src/x32-packx/x4-sse.c
)
643
# Micro-kernel and math sources whose file names carry the "sse2" tag.
set(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-sse2-c4.c
  src/f32-argmaxpool/9p8x-sse2-c4.c
  src/f32-argmaxpool/9x-sse2-c4.c
  src/f32-prelu/gen/sse2-2x4.c
  src/f32-prelu/gen/sse2-2x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x16.c
  src/q8-avgpool/mp9p8q-sse2.c
  src/q8-avgpool/up9-sse2.c
  src/q8-igemm/4x4c2-sse2.c
  src/q8-dwconv/up8x9-sse2.c
  src/q8-gavgpool/mp7p7q-sse2.c
  src/q8-gavgpool/up7-sse2.c
  src/q8-gemm/2x4c8-sse2.c
  src/q8-gemm/4x4c2-sse2.c
  src/q8-vadd/sse2.c
  src/u8-clamp/sse2.c
  src/u8-maxpool/9p8x-sse2-c16.c
  src/u8-rmax/sse2.c
  src/x32-pad/x2-sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c
  src/math/exp-sse2-p5.c
  src/math/expminus-sse2-p5.c
  src/math/sigmoid-sse2-p5-div.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700676
# SSE4.1 micro-kernel sources. On x86 targets these files are added to the
# library and compiled with -msse4.1.
SET(XNNPACK_SSE41_MICROKERNEL_SRCS
  src/f32-prelu/gen/sse41-2x4.c
  src/f32-prelu/gen/sse41-2x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x16.c
)
Marat Dukhan69c3f2c2019-11-06 12:30:01 -0800682
# AVX micro-kernel sources. On x86 targets these files are added to the
# library and compiled with -mavx.
SET(XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-clamp/avx.c
  src/f32-dwconv/gen/up16x4-avx-acc2.c
  src/f32-dwconv/gen/up16x4-avx.c
  src/f32-dwconv/gen/up8x4-avx-acc2.c
  src/f32-dwconv/gen/up8x4-avx.c
  src/f32-dwconv/gen/up16x9-avx-acc2.c
  src/f32-dwconv/gen/up16x9-avx.c
  src/f32-dwconv/gen/up8x9-avx-acc2.c
  src/f32-dwconv/gen/up8x9-avx.c
  src/f32-dwconv/gen/up16x25-avx-acc2.c
  src/f32-dwconv/gen/up16x25-avx.c
  src/f32-dwconv/gen/up8x25-avx-acc2.c
  src/f32-dwconv/gen/up8x25-avx.c
  src/f32-gemm/gen/1x8-avx-broadcast.c
  src/f32-gemm/gen/4x8-avx-broadcast.c
  src/f32-gemm/gen/5x8-avx-broadcast.c
  src/f32-gemm/gen/6x8-avx-broadcast.c
  src/f32-gemm/gen/7x8-avx-broadcast.c
  src/f32-gemm/gen-inc/1x8-avx-broadcast.c
  src/f32-gemm/gen-inc/4x8-avx-broadcast.c
  src/f32-gemm/gen-inc/5x8-avx-broadcast.c
  src/f32-gemm/gen-inc/6x8-avx-broadcast.c
  src/f32-gemm/gen-inc/7x8-avx-broadcast.c
  src/f32-igemm/gen/1x8-avx-broadcast.c
  src/f32-igemm/gen/4x8-avx-broadcast.c
  src/f32-igemm/gen/5x8-avx-broadcast.c
  src/f32-igemm/gen/6x8-avx-broadcast.c
  src/f32-igemm/gen/7x8-avx-broadcast.c
  src/f32-rmax/avx.c
  src/f32-vscale/avx-unroll32.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700714
# FMA3 micro-kernel sources. On x86 targets these files are added to the
# library and compiled with -mfma.
SET(XNNPACK_FMA3_MICROKERNEL_SRCS
  src/f32-dwconv/gen/up16x4-fma3-acc2.c
  src/f32-dwconv/gen/up16x4-fma3.c
  src/f32-dwconv/gen/up8x4-fma3-acc2.c
  src/f32-dwconv/gen/up8x4-fma3.c
  src/f32-dwconv/gen/up16x9-fma3-acc2.c
  src/f32-dwconv/gen/up16x9-fma3.c
  src/f32-dwconv/gen/up8x9-fma3-acc2.c
  src/f32-dwconv/gen/up8x9-fma3.c
  src/f32-dwconv/gen/up16x25-fma3-acc2.c
  src/f32-dwconv/gen/up16x25-fma3.c
  src/f32-dwconv/gen/up8x25-fma3-acc2.c
  src/f32-dwconv/gen/up8x25-fma3.c
  src/f32-gemm/gen/1x8-fma3-broadcast.c
  src/f32-gemm/gen/4x8-fma3-broadcast.c
  src/f32-gemm/gen/5x8-fma3-broadcast.c
  src/f32-gemm/gen/6x8-fma3-broadcast.c
  src/f32-gemm/gen/7x8-fma3-broadcast.c
  src/f32-gemm/gen/8x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/6x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/7x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/8x8-fma3-broadcast.c
  src/f32-igemm/gen/1x8-fma3-broadcast.c
  src/f32-igemm/gen/4x8-fma3-broadcast.c
  src/f32-igemm/gen/5x8-fma3-broadcast.c
  src/f32-igemm/gen/6x8-fma3-broadcast.c
  src/f32-igemm/gen/7x8-fma3-broadcast.c
  src/f32-igemm/gen/8x8-fma3-broadcast.c
)
Marat Dukhanfda12b82019-11-21 12:27:59 -0800746
# AVX2 micro-kernel sources. On x86 targets these files are added to the
# library and compiled with -mfma -mavx2.
SET(XNNPACK_AVX2_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/avx2-p5-unroll64.c
  src/f32-raddextexp/avx2-p5-unroll64.c
  src/f32-raddstoreexpminusmax/avx2-p5-unroll64.c
  src/f32-vscaleexpminusmax/avx2-p5-unroll64.c
  src/f32-vscaleextexp/avx2-p5-unroll64.c
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c
  src/math/extexp-avx2-p5.c
)
Marat Dukhan6adff4e2019-10-14 18:32:07 -0700758
# AVX512F micro-kernel sources. On x86 targets these files are added to the
# library and compiled with -mavx512f.
SET(XNNPACK_AVX512F_MICROKERNEL_SRCS
  src/f32-clamp/avx512f.c
  src/f32-dwconv/gen/up32x4-avx512f-acc2.c
  src/f32-dwconv/gen/up32x4-avx512f.c
  src/f32-dwconv/gen/up16x4-avx512f-acc2.c
  src/f32-dwconv/gen/up16x4-avx512f.c
  src/f32-dwconv/gen/up32x9-avx512f-acc2.c
  src/f32-dwconv/gen/up32x9-avx512f.c
  src/f32-dwconv/gen/up16x9-avx512f-acc2.c
  src/f32-dwconv/gen/up16x9-avx512f.c
  src/f32-dwconv/gen/up32x25-avx512f-acc2.c
  src/f32-dwconv/gen/up32x25-avx512f.c
  src/f32-dwconv/gen/up16x25-avx512f-acc2.c
  src/f32-dwconv/gen/up16x25-avx512f.c
  src/f32-gemm/gen/1x16-avx512f-broadcast.c
  src/f32-gemm/gen/4x16-avx512f-broadcast.c
  src/f32-gemm/gen/5x16-avx512f-broadcast.c
  src/f32-gemm/gen/6x16-avx512f-broadcast.c
  src/f32-gemm/gen/7x16-avx512f-broadcast.c
  src/f32-gemm/gen/8x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/1x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/4x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/5x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/6x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/7x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/8x16-avx512f-broadcast.c
  src/f32-igemm/gen/1x16-avx512f-broadcast.c
  src/f32-igemm/gen/4x16-avx512f-broadcast.c
  src/f32-igemm/gen/5x16-avx512f-broadcast.c
  src/f32-igemm/gen/6x16-avx512f-broadcast.c
  src/f32-igemm/gen/7x16-avx512f-broadcast.c
  src/f32-igemm/gen/8x16-avx512f-broadcast.c
  src/f32-raddexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-raddextexp/avx512f-p5-scalef-unroll128.c
  src/f32-raddstoreexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-rmax/avx512f.c
  src/f32-vscale/avx512f-unroll64.c
  src/f32-vscaleexpminusmax/avx512f-p5-scalef-unroll128.c
  src/f32-vscaleextexp/avx512f-p5-scalef-unroll128.c
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c
  src/math/extexp-avx512f-p5.c
)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700803
# Hand-written assembly micro-kernels for 32-bit ARM; added to the library
# only on armv5-armv8 / iOS armv7 targets.
SET(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  src/q8-dwconv/up8x9-aarch32-neon.S
)
806
# Hand-written assembly micro-kernels for 64-bit ARM; added to the library
# only on aarch64 / iOS arm64 targets.
SET(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-dwconv/up4x9-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-aarch64-neonfma.S
  src/f32-gemm/gen/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-ld64.S
  src/f32-igemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a75.S
)
855
# Collect the micro-kernel sources to build for the target architecture.
# Scalar kernels are always included; every other group is appended only when
# the target system/processor matches.
SET(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})

# Portable SIMD (psimd) kernels: everywhere except Emscripten.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS ${XNNPACK_PSIMD_MICROKERNEL_SRCS})
ENDIF()

# 32-bit ARM: NEON, NEON+FMA and AArch32 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
ENDIF()

# 64-bit ARM: NEON, NEON+FMA, AArch64-only intrinsics and AArch64 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
ENDIF()

# x86 / x86-64: every SSE..AVX512F kernel group.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
ENDIF()
881
# Create the XNNPACK library target from the cold, hot and micro-kernel
# sources. XNNPACK_LIBRARY_TYPE selects the library kind: "default" leaves the
# choice to CMake, "shared"/"static" force it, anything else is a fatal error.
SET(XNNPACK_LIBRARY_SRCS
  ${XNNPACK_COLD_SRCS}
  ${XNNPACK_HOT_SRCS}
  ${XNNPACK_MICROKERNEL_SRCS})
IF(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  ADD_LIBRARY(XNNPACK ${XNNPACK_LIBRARY_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  ADD_LIBRARY(XNNPACK SHARED ${XNNPACK_LIBRARY_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  ADD_LIBRARY(XNNPACK STATIC ${XNNPACK_LIBRARY_SRCS})
ELSE()
  MESSAGE(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
ENDIF()

# C sources are built as C99 with compiler extensions enabled.
SET_PROPERTY(TARGET XNNPACK PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET XNNPACK PROPERTY C_EXTENSIONS YES)
# Per-source instruction-set flags. Each micro-kernel group is compiled with
# the flag for the ISA it targets, appended to the COMPILE_FLAGS source
# property of the files in that group.

# 32-bit ARM
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  SET_PROPERTY(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  SET_PROPERTY(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEON_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  IF(IOS)
    # Pass the target architecture explicitly to the AArch32 assembly sources.
    # The list variable must be the one the .S files are declared in
    # (XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS); an undefined name expands to
    # nothing and the flag would silently apply to no file.
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()

# 64-bit ARM
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  IF(IOS)
    # Same as above, for the AArch64 assembly sources
    # (XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS).
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()

# x86 / x86-64
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  SET_PROPERTY(SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
  SET_PROPERTY(SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
  SET_PROPERTY(SOURCE ${XNNPACK_SSE41_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -msse4.1 ")
  SET_PROPERTY(SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
  SET_PROPERTY(SOURCE ${XNNPACK_FMA3_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma ")
  SET_PROPERTY(SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
  SET_PROPERTY(SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
ENDIF()
# Logging level and optimization flags by build type.
# Non-Debug builds disable logging, optimize micro-kernels and hot sources
# with -O2, and optimize cold sources for size; Debug builds enable logging
# at level 5 and add no optimization flags here.
IF(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=0)
  SET_PROPERTY(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(SOURCE ${XNNPACK_HOT_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(SOURCE ${XNNPACK_COLD_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -Os ")
ELSE()
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=5)
ENDIF()

# psimd kernels get -O3 -ffast-math in every build type. This is appended
# after the flags above, so it follows any -O2 already set on these files.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  SET_PROPERTY(SOURCE ${XNNPACK_PSIMD_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 -ffast-math ")
ENDIF()
929
# include/ is exposed to consumers of XNNPACK; src/ is only used to build it.
TARGET_INCLUDE_DIRECTORIES(XNNPACK
  PUBLIC include
  PRIVATE src)
# Header installed through the PUBLIC_HEADER destination of INSTALL(TARGETS).
SET_PROPERTY(TARGET XNNPACK PROPERTY PUBLIC_HEADER include/XNNPACK.h)
933
# ---[ Configure clog
# Add clog from ${CLOG_SOURCE_DIR}/deps/clog unless a clog target already
# exists, then link it privately into XNNPACK.
IF(NOT TARGET clog)
  SET(CLOG_BUILD_TESTS OFF CACHE BOOL "")
  SET(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
  ADD_SUBDIRECTORY("${CLOG_SOURCE_DIR}/deps/clog" "${CMAKE_BINARY_DIR}/clog")
  # We build static version of clog but a dynamic library may indirectly depend on it
  SET_TARGET_PROPERTIES(clog PROPERTIES POSITION_INDEPENDENT_CODE ON)
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE clog)
945
# ---[ Configure cpuinfo
# Add cpuinfo (tools, tests and benchmarks disabled) unless a cpuinfo target
# already exists, then link it privately into XNNPACK.
IF(NOT TARGET cpuinfo)
  SET(CPUINFO_BUILD_TOOLS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_UNIT_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_MOCK_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE cpuinfo)
957
# ---[ Configure pthreadpool
# Add pthreadpool (tests, benchmarks and deprecated API disabled) unless a
# pthreadpool target already exists. Linked PUBLIC, so it propagates to
# targets that link XNNPACK.
IF(NOT TARGET pthreadpool)
  SET(PTHREADPOOL_BUILD_TESTS OFF CACHE BOOL "")
  SET(PTHREADPOOL_BUILD_BENCHMARKS OFF CACHE BOOL "")
  SET(PTHREADPOOL_ALLOW_DEPRECATED_API OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PUBLIC pthreadpool)
968
# ---[ Configure FXdiv
# Add FXdiv (tests and benchmarks disabled) unless an fxdiv target already
# exists, then link it privately into XNNPACK.
IF(NOT TARGET fxdiv)
  SET(FXDIV_BUILD_TESTS OFF CACHE BOOL "")
  SET(FXDIV_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fxdiv)
978
# ---[ Configure psimd
# Add psimd unless a psimd target already exists, then link it privately
# into XNNPACK.
IF(NOT TARGET psimd)
  ADD_SUBDIRECTORY("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE psimd)
986
# ---[ Configure FP16
# Add FP16 (tests and benchmarks disabled) unless an fp16 target already
# exists, then link it privately into XNNPACK.
IF(NOT TARGET fp16)
  SET(FP16_BUILD_TESTS OFF CACHE BOOL "")
  SET(FP16_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fp16)
996
# Install rules: the library (shared or static) goes to the GNUInstallDirs
# library directory, the public header to the include directory.
INSTALL(TARGETS XNNPACK
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
1001
1002# ---[ XNNPACK unit tests
1003IF(XNNPACK_BUILD_TESTS)
1004 # ---[ Build google test
1005 IF(NOT TARGET gtest)
1006 SET(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
1007 ADD_SUBDIRECTORY(
1008 "${GOOGLETEST_SOURCE_DIR}"
1009 "${CMAKE_BINARY_DIR}/googletest")
1010 ENDIF()
1011
1012 # ---[ Build operator-level unit tests
Marat Dukhanefc47b82019-11-18 09:25:38 -08001013 ADD_EXECUTABLE(add-nc-test test/add-nc.cc)
1014 SET_TARGET_PROPERTIES(add-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001015 CXX_STANDARD 11
1016 CXX_STANDARD_REQUIRED YES
1017 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001018 TARGET_INCLUDE_DIRECTORIES(add-nc-test PRIVATE src test)
1019 TARGET_LINK_LIBRARIES(add-nc-test PRIVATE XNNPACK gtest gtest_main)
1020 ADD_TEST(add-nc-test add-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001021
Marat Dukhanefc47b82019-11-18 09:25:38 -08001022 ADD_EXECUTABLE(argmax-pooling-nhwc-test test/argmax-pooling-nhwc.cc)
1023 SET_TARGET_PROPERTIES(argmax-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001024 CXX_STANDARD 11
1025 CXX_STANDARD_REQUIRED YES
1026 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001027 TARGET_INCLUDE_DIRECTORIES(argmax-pooling-nhwc-test PRIVATE src test)
1028 TARGET_LINK_LIBRARIES(argmax-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1029 ADD_TEST(argmax-pooling-nhwc-test argmax-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001030
Marat Dukhanefc47b82019-11-18 09:25:38 -08001031 ADD_EXECUTABLE(average-pooling-nhwc-test test/average-pooling-nhwc.cc)
1032 SET_TARGET_PROPERTIES(average-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001033 CXX_STANDARD 11
1034 CXX_STANDARD_REQUIRED YES
1035 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001036 TARGET_INCLUDE_DIRECTORIES(average-pooling-nhwc-test PRIVATE src test)
1037 TARGET_LINK_LIBRARIES(average-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1038 ADD_TEST(average-pooling-nhwc-test average-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001039
Marat Dukhanefc47b82019-11-18 09:25:38 -08001040 ADD_EXECUTABLE(channel-pad-nc-test test/channel-pad-nc.cc)
1041 SET_TARGET_PROPERTIES(channel-pad-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001042 CXX_STANDARD 11
1043 CXX_STANDARD_REQUIRED YES
1044 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001045 TARGET_INCLUDE_DIRECTORIES(channel-pad-nc-test PRIVATE src test)
1046 TARGET_LINK_LIBRARIES(channel-pad-nc-test PRIVATE XNNPACK gtest gtest_main)
1047 ADD_TEST(channel-pad-nc-test channel-pad-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001048
Marat Dukhanefc47b82019-11-18 09:25:38 -08001049 ADD_EXECUTABLE(channel-shuffle-nc-test test/channel-shuffle-nc.cc)
1050 SET_TARGET_PROPERTIES(channel-shuffle-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001051 CXX_STANDARD 11
1052 CXX_STANDARD_REQUIRED YES
1053 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001054 TARGET_INCLUDE_DIRECTORIES(channel-shuffle-nc-test PRIVATE src test)
1055 TARGET_LINK_LIBRARIES(channel-shuffle-nc-test PRIVATE XNNPACK gtest gtest_main)
1056 ADD_TEST(channel-shuffle-nc-test channel-shuffle-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001057
Marat Dukhanefc47b82019-11-18 09:25:38 -08001058 ADD_EXECUTABLE(clamp-nc-test test/clamp-nc.cc)
1059 SET_TARGET_PROPERTIES(clamp-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001060 CXX_STANDARD 11
1061 CXX_STANDARD_REQUIRED YES
1062 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001063 TARGET_INCLUDE_DIRECTORIES(clamp-nc-test PRIVATE src test)
1064 TARGET_LINK_LIBRARIES(clamp-nc-test PRIVATE XNNPACK gtest gtest_main)
1065 ADD_TEST(clamp-nc-test clamp-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001066
Marat Dukhanefc47b82019-11-18 09:25:38 -08001067 ADD_EXECUTABLE(convolution-nhwc-test test/convolution-nhwc.cc)
1068 SET_TARGET_PROPERTIES(convolution-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001069 CXX_STANDARD 11
1070 CXX_STANDARD_REQUIRED YES
1071 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001072 TARGET_INCLUDE_DIRECTORIES(convolution-nhwc-test PRIVATE src test)
1073 TARGET_LINK_LIBRARIES(convolution-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1074 ADD_TEST(convolution-nhwc-test convolution-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001075
Marat Dukhanefc47b82019-11-18 09:25:38 -08001076 ADD_EXECUTABLE(convolution-nchw-test test/convolution-nchw.cc)
1077 SET_TARGET_PROPERTIES(convolution-nchw-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001078 CXX_STANDARD 11
1079 CXX_STANDARD_REQUIRED YES
1080 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001081 TARGET_INCLUDE_DIRECTORIES(convolution-nchw-test PRIVATE src test)
1082 TARGET_LINK_LIBRARIES(convolution-nchw-test PRIVATE XNNPACK gtest gtest_main)
1083 ADD_TEST(convolution-nchw-test convolution-nchw-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001084
Marat Dukhanefc47b82019-11-18 09:25:38 -08001085 ADD_EXECUTABLE(deconvolution-nhwc-test test/deconvolution-nhwc.cc)
1086 SET_TARGET_PROPERTIES(deconvolution-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001087 CXX_STANDARD 11
1088 CXX_STANDARD_REQUIRED YES
1089 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001090 TARGET_INCLUDE_DIRECTORIES(deconvolution-nhwc-test PRIVATE src test)
1091 TARGET_LINK_LIBRARIES(deconvolution-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1092 ADD_TEST(deconvolution-nhwc-test deconvolution-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001093
Marat Dukhanefc47b82019-11-18 09:25:38 -08001094 ADD_EXECUTABLE(fully-connected-nc-test test/fully-connected-nc.cc)
1095 SET_TARGET_PROPERTIES(fully-connected-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001096 CXX_STANDARD 11
1097 CXX_STANDARD_REQUIRED YES
1098 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001099 TARGET_INCLUDE_DIRECTORIES(fully-connected-nc-test PRIVATE src test)
1100 TARGET_LINK_LIBRARIES(fully-connected-nc-test PRIVATE XNNPACK gtest gtest_main)
1101 ADD_TEST(fully-connected-nc-test fully-connected-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001102
Marat Dukhanefc47b82019-11-18 09:25:38 -08001103 ADD_EXECUTABLE(global-average-pooling-nwc-test test/global-average-pooling-nwc.cc)
1104 SET_TARGET_PROPERTIES(global-average-pooling-nwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001105 CXX_STANDARD 11
1106 CXX_STANDARD_REQUIRED YES
1107 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001108 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-nwc-test PRIVATE src test)
1109 TARGET_LINK_LIBRARIES(global-average-pooling-nwc-test PRIVATE XNNPACK gtest gtest_main)
1110 ADD_TEST(global-average-pooling-nwc-test global-average-pooling-nwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001111
Marat Dukhanefc47b82019-11-18 09:25:38 -08001112 ADD_EXECUTABLE(global-average-pooling-ncw-test test/global-average-pooling-ncw.cc)
1113 SET_TARGET_PROPERTIES(global-average-pooling-ncw-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001114 CXX_STANDARD 11
1115 CXX_STANDARD_REQUIRED YES
1116 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001117 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-ncw-test PRIVATE src test)
1118 TARGET_LINK_LIBRARIES(global-average-pooling-ncw-test PRIVATE XNNPACK gtest gtest_main)
1119 ADD_TEST(global-average-pooling-ncw-test global-average-pooling-ncw-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001120
Marat Dukhanefc47b82019-11-18 09:25:38 -08001121 ADD_EXECUTABLE(hardswish-nc-test test/hardswish-nc.cc)
1122 SET_TARGET_PROPERTIES(hardswish-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001123 CXX_STANDARD 11
1124 CXX_STANDARD_REQUIRED YES
1125 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001126 TARGET_INCLUDE_DIRECTORIES(hardswish-nc-test PRIVATE src test)
1127 TARGET_LINK_LIBRARIES(hardswish-nc-test PRIVATE XNNPACK gtest gtest_main)
1128 ADD_TEST(hardswish-nc-test hardswish-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001129
Marat Dukhanefc47b82019-11-18 09:25:38 -08001130 ADD_EXECUTABLE(leaky-relu-nc-test test/leaky-relu-nc.cc)
1131 SET_TARGET_PROPERTIES(leaky-relu-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001132 CXX_STANDARD 11
1133 CXX_STANDARD_REQUIRED YES
1134 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001135 TARGET_INCLUDE_DIRECTORIES(leaky-relu-nc-test PRIVATE src test)
1136 TARGET_LINK_LIBRARIES(leaky-relu-nc-test PRIVATE XNNPACK gtest gtest_main)
1137 ADD_TEST(leaky-relu-nc-test leaky-relu-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001138
Marat Dukhanefc47b82019-11-18 09:25:38 -08001139 ADD_EXECUTABLE(max-pooling-nhwc-test test/max-pooling-nhwc.cc)
1140 SET_TARGET_PROPERTIES(max-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001141 CXX_STANDARD 11
1142 CXX_STANDARD_REQUIRED YES
1143 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001144 TARGET_INCLUDE_DIRECTORIES(max-pooling-nhwc-test PRIVATE src test)
1145 TARGET_LINK_LIBRARIES(max-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1146 ADD_TEST(max-pooling-nhwc-test max-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001147
Marat Dukhanefc47b82019-11-18 09:25:38 -08001148 ADD_EXECUTABLE(multiply-nd-test test/multiply-nd.cc)
1149 SET_TARGET_PROPERTIES(multiply-nd-test PROPERTIES
Marat Dukhan9d501d52019-11-16 02:30:50 -08001150 CXX_STANDARD 11
1151 CXX_STANDARD_REQUIRED YES
1152 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001153 TARGET_INCLUDE_DIRECTORIES(multiply-nd-test PRIVATE src test)
1154 TARGET_LINK_LIBRARIES(multiply-nd-test PRIVATE XNNPACK gtest gtest_main)
1155 ADD_TEST(multiply-nd-test multiply-nd-test)
Marat Dukhan9d501d52019-11-16 02:30:50 -08001156
Marat Dukhanefc47b82019-11-18 09:25:38 -08001157 ADD_EXECUTABLE(prelu-nc-test test/prelu-nc.cc)
1158 SET_TARGET_PROPERTIES(prelu-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001159 CXX_STANDARD 11
1160 CXX_STANDARD_REQUIRED YES
1161 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001162 TARGET_INCLUDE_DIRECTORIES(prelu-nc-test PRIVATE src test)
1163 TARGET_LINK_LIBRARIES(prelu-nc-test PRIVATE XNNPACK gtest gtest_main)
1164 ADD_TEST(prelu-nc-test prelu-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001165
Marat Dukhanefc47b82019-11-18 09:25:38 -08001166 ADD_EXECUTABLE(resize-bilinear-nhwc-test test/resize-bilinear-nhwc.cc)
1167 SET_TARGET_PROPERTIES(resize-bilinear-nhwc-test PROPERTIES
Marat Dukhan69722492019-11-11 19:55:50 -08001168 CXX_STANDARD 11
1169 CXX_STANDARD_REQUIRED YES
1170 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001171 TARGET_INCLUDE_DIRECTORIES(resize-bilinear-nhwc-test PRIVATE src test)
1172 TARGET_LINK_LIBRARIES(resize-bilinear-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1173 ADD_TEST(resize-bilinear-nhwc-test resize-bilinear-nhwc-test)
Marat Dukhan69722492019-11-11 19:55:50 -08001174
Marat Dukhanefc47b82019-11-18 09:25:38 -08001175 ADD_EXECUTABLE(sigmoid-nc-test test/sigmoid-nc.cc)
1176 SET_TARGET_PROPERTIES(sigmoid-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001177 CXX_STANDARD 11
1178 CXX_STANDARD_REQUIRED YES
1179 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001180 TARGET_INCLUDE_DIRECTORIES(sigmoid-nc-test PRIVATE src test)
1181 TARGET_LINK_LIBRARIES(sigmoid-nc-test PRIVATE XNNPACK gtest gtest_main)
1182 ADD_TEST(sigmoid-nc-test sigmoid-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001183
Marat Dukhanefc47b82019-11-18 09:25:38 -08001184 ADD_EXECUTABLE(softargmax-nc-test test/softargmax-nc.cc)
1185 SET_TARGET_PROPERTIES(softargmax-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001186 CXX_STANDARD 11
1187 CXX_STANDARD_REQUIRED YES
1188 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001189 TARGET_INCLUDE_DIRECTORIES(softargmax-nc-test PRIVATE src test)
1190 TARGET_LINK_LIBRARIES(softargmax-nc-test PRIVATE XNNPACK gtest gtest_main)
1191 ADD_TEST(softargmax-nc-test softargmax-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001192
Marat Dukhanefc47b82019-11-18 09:25:38 -08001193 ADD_EXECUTABLE(unpooling-nhwc-test test/unpooling-nhwc.cc)
1194 SET_TARGET_PROPERTIES(unpooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001195 CXX_STANDARD 11
1196 CXX_STANDARD_REQUIRED YES
1197 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001198 TARGET_INCLUDE_DIRECTORIES(unpooling-nhwc-test PRIVATE src test)
1199 TARGET_LINK_LIBRARIES(unpooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1200 ADD_TEST(unpooling-nhwc-test unpooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001201
# ---[ Build microkernel-level unit tests
# Every target listed here is built the same way: a single source file
# test/<kernel>.cc, C++11 with compiler extensions enabled, include paths
# src and test, linked against XNNPACK, cpuinfo, fp16, gtest and gtest_main,
# and registered with CTest under the target's own name.
# <kernel> is the target name with its "-test" (or "-nc-test") suffix removed.
FOREACH(XNNPACK_UKERNEL_TEST
    f16-gemm-test
    f32-argmaxpool-test
    f32-avgpool-test
    f32-bilinear-test
    f32-clamp-nc-test
    f32-conv-hwc-test
    f32-conv-hwc2spchw-test
    f32-dwconv-spchw-test
    f32-dwconv-test
    f32-gavgpool-spchw-test
    f32-gavgpool-test
    f32-gemm-test
    f32-gemminc-test
    f32-hswish-test
    f32-igemm-test
    f32-maxpool-test
    f32-pavgpool-test
    f32-ppmm-test
    f32-prelu-nc-test
    f32-raddexpminusmax-test
    f32-raddextexp-test
    f32-raddstoreexpminusmax-test
    f32-rmax-test
    f32-sigmoid-test
    f32-spmm-test
    f32-vadd-nc-test
    f32-vaddc-test
    f32-vmul-test
    f32-vmulc-test
    f32-vmulcaddc-test
    f32-vscaleexpminusmax-test)
  # Map e.g. f32-gemm-test -> f32-gemm and f32-clamp-nc-test -> f32-clamp.
  STRING(REGEX REPLACE "(-nc)?-test$" "" XNNPACK_UKERNEL_STEM "${XNNPACK_UKERNEL_TEST}")
  ADD_EXECUTABLE(${XNNPACK_UKERNEL_TEST} test/${XNNPACK_UKERNEL_STEM}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_UKERNEL_TEST} PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_UKERNEL_TEST} PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_UKERNEL_TEST} PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_UKERNEL_TEST} ${XNNPACK_UKERNEL_TEST})
ENDFOREACH()
# Do not leave the scratch variable behind in directory scope.
UNSET(XNNPACK_UKERNEL_STEM)
1481
# f32-vscaleextexp microkernel unit test, built from test/f32-vscaleextexp.cc.
# The language-standard properties are applied to f32-vscaleextexp-test itself
# so that it is compiled as C++11 (extensions enabled) like every other
# microkernel test, rather than with the compiler's default dialect.
ADD_EXECUTABLE(f32-vscaleextexp-test test/f32-vscaleextexp.cc)
SET_TARGET_PROPERTIES(f32-vscaleextexp-test PROPERTIES
  CXX_STANDARD 11
  CXX_STANDARD_REQUIRED YES
  CXX_EXTENSIONS YES)
TARGET_INCLUDE_DIRECTORIES(f32-vscaleextexp-test PRIVATE src test)
TARGET_LINK_LIBRARIES(f32-vscaleextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
# Register the executable with CTest under the same name as the target.
ADD_TEST(f32-vscaleextexp-test f32-vscaleextexp-test)
1490
# Remaining microkernel-level unit tests (f32 subtraction, q8, u8, x32, x8).
# Every target listed here is built the same way: a single source file
# test/<kernel>.cc, C++11 with compiler extensions enabled, include paths
# src and test, linked against XNNPACK, cpuinfo, fp16, gtest and gtest_main,
# and registered with CTest under the target's own name.
# <kernel> is the target name with its "-test" (or "-nc-test") suffix removed.
FOREACH(XNNPACK_UKERNEL_TEST
    f32-vsub-test
    f32-vsubc-test
    f32-vrsubc-test
    q8-avgpool-test
    q8-dwconv-test
    q8-gavgpool-test
    q8-gemm-test
    q8-igemm-test
    q8-vadd-nc-test
    u8-clamp-nc-test
    u8-lut32norm-test
    u8-maxpool-test
    u8-rmax-test
    x32-packx-test
    x32-pad-test
    x32-unpool-test
    x32-zip-test
    x8-lut-test
    x8-zip-test)
  # Map e.g. q8-gemm-test -> q8-gemm and q8-vadd-nc-test -> q8-vadd.
  STRING(REGEX REPLACE "(-nc)?-test$" "" XNNPACK_UKERNEL_STEM "${XNNPACK_UKERNEL_TEST}")
  ADD_EXECUTABLE(${XNNPACK_UKERNEL_TEST} test/${XNNPACK_UKERNEL_STEM}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_UKERNEL_TEST} PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_UKERNEL_TEST} PRIVATE src test)
  TARGET_LINK_LIBRARIES(${XNNPACK_UKERNEL_TEST} PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
  ADD_TEST(${XNNPACK_UKERNEL_TEST} ${XNNPACK_UKERNEL_TEST})
ENDFOREACH()
# Do not leave the scratch variable behind in directory scope.
UNSET(XNNPACK_UKERNEL_STEM)
1661ENDIF()
1662
1663# ---[ XNNPACK microbenchmarks
1664IF(XNNPACK_BUILD_BENCHMARKS)
# ---[ Build google benchmark
# Skipped when a `benchmark` target already exists. Otherwise the
# BENCHMARK_ENABLE_TESTING cache entry is created as OFF (an existing cache
# value is left untouched, since FORCE is not used) and the sources from
# GOOGLEBENCHMARK_SOURCE_DIR are built under CONFU_DEPENDENCIES_BINARY_DIR.
IF(NOT TARGET benchmark)
  SET(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${GOOGLEBENCHMARK_SOURCE_DIR}" "${CONFU_DEPENDENCIES_BINARY_DIR}/googlebenchmark")
ENDIF()
1672
# Helper library built from bench/utils.cc and linked into the benchmark
# executables. Compiled as strict C++11 (no compiler extensions); the project
# root is on its include path, and it links against benchmark and cpuinfo.
ADD_LIBRARY(bench-utils bench/utils.cc)
TARGET_INCLUDE_DIRECTORIES(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(bench-utils PRIVATE benchmark cpuinfo)
SET_TARGET_PROPERTIES(bench-utils PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS NO)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001680
# ---[ Build accuracy microbenchmarks
# One executable <name>-eval per eval/<name>.cc, compiled as C++11 with src on
# the include path and linked against XNNPACK, benchmark and fp16.
FOREACH(XNNPACK_EVAL_NAME f32-exp f32-expminus f32-extexp f32-sigmoid)
  ADD_EXECUTABLE(${XNNPACK_EVAL_NAME}-eval eval/${XNNPACK_EVAL_NAME}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_EVAL_NAME}-eval PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_EVAL_NAME}-eval PRIVATE src)
  TARGET_LINK_LIBRARIES(${XNNPACK_EVAL_NAME}-eval PRIVATE XNNPACK benchmark fp16)
ENDFOREACH()
# f32-extexp-eval is the only one of the four built with compiler extensions enabled.
SET_TARGET_PROPERTIES(f32-extexp-eval PROPERTIES CXX_EXTENSIONS YES)
1713
# ---[ Build end-to-end microbenchmarks
# Each executable <name>-bench is built from bench/<name>.cc together with the
# two MobileNet model sources, as strict C++11, with the project root on the
# include path, and linked against XNNPACK, benchmark and bench-utils.
FOREACH(XNNPACK_E2E_NAME end2end f32-dwconv-e2e f32-gemm-e2e)
  ADD_EXECUTABLE(${XNNPACK_E2E_NAME}-bench
    bench/${XNNPACK_E2E_NAME}.cc
    models/mobilenet-v1.cc
    models/mobilenet-v2.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_E2E_NAME}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_E2E_NAME}-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
  TARGET_LINK_LIBRARIES(${XNNPACK_E2E_NAME}-bench PRIVATE XNNPACK benchmark bench-utils)
ENDFOREACH()
# The f32-dwconv and f32-gemm variants additionally add src to their include path.
TARGET_INCLUDE_DIRECTORIES(f32-dwconv-e2e-bench PRIVATE src)
TARGET_INCLUDE_DIRECTORIES(f32-gemm-e2e-bench PRIVATE src)
Marat Dukhan5f18d262019-10-31 10:24:14 -07001738
# ---[ Build operator-level microbenchmarks
# Each executable <name>-bench is built from bench/<name>.cc as strict C++11,
# with the project root on the include path, and linked against XNNPACK,
# cpuinfo, benchmark and bench-utils.
FOREACH(XNNPACK_OPERATOR_NAME
    add
    average-pooling
    channel-shuffle
    convolution
    deconvolution
    global-average-pooling
    max-pooling
    prelu
    sigmoid
    softargmax)
  ADD_EXECUTABLE(${XNNPACK_OPERATOR_NAME}-bench bench/${XNNPACK_OPERATOR_NAME}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_OPERATOR_NAME}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS NO)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_OPERATOR_NAME}-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
  TARGET_LINK_LIBRARIES(${XNNPACK_OPERATOR_NAME}-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
ENDFOREACH()
1819
# ---[ Build microkernel-level microbenchmarks
# Each executable <kernel>-bench is built from bench/<kernel>.cc as C++11 with
# compiler extensions enabled, with src and the project root on the include
# path, and linked against XNNPACK, cpuinfo, fp16, benchmark and bench-utils.
FOREACH(XNNPACK_UKERNEL_NAME
    f16-gemm
    f32-conv-hwc
    f32-dwconv-spchw
    f32-dwconv
    f32-gemm
    f32-igemm)
  ADD_EXECUTABLE(${XNNPACK_UKERNEL_NAME}-bench bench/${XNNPACK_UKERNEL_NAME}.cc)
  SET_TARGET_PROPERTIES(${XNNPACK_UKERNEL_NAME}-bench PROPERTIES
    CXX_STANDARD 11
    CXX_STANDARD_REQUIRED YES
    CXX_EXTENSIONS YES)
  TARGET_INCLUDE_DIRECTORIES(${XNNPACK_UKERNEL_NAME}-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
  TARGET_LINK_LIBRARIES(${XNNPACK_UKERNEL_NAME}-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
ENDFOREACH()
1874
# f32-im2col-gemm microkernel benchmark. Besides its C++ driver it compiles
# src/im2col.c directly into the executable, so a C dialect (C99, extensions
# off) is configured alongside the C++ one (C++11, extensions on).
ADD_EXECUTABLE(f32-im2col-gemm-bench
  bench/f32-im2col-gemm.cc
  src/im2col.c)
TARGET_INCLUDE_DIRECTORIES(f32-im2col-gemm-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-im2col-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
SET_TARGET_PROPERTIES(f32-im2col-gemm-bench PROPERTIES
  C_STANDARD 99 C_STANDARD_REQUIRED YES C_EXTENSIONS NO
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
1886
# f32-rmax microkernel benchmark: C++11 with compiler extensions, src and the
# project root on the include path.
ADD_EXECUTABLE(f32-rmax-bench bench/f32-rmax.cc)
TARGET_INCLUDE_DIRECTORIES(f32-rmax-bench PRIVATE src "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-rmax-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
SET_TARGET_PROPERTIES(f32-rmax-bench PROPERTIES
  CXX_STANDARD 11 CXX_STANDARD_REQUIRED YES CXX_EXTENSIONS YES)
1895
# f32-sigmoid-bench: benchmark executable built from bench/f32-sigmoid.cc.
ADD_EXECUTABLE(f32-sigmoid-bench
  bench/f32-sigmoid.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-sigmoid-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-sigmoid-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-sigmoid-bench PROPERTY CXX_EXTENSIONS YES)
# Header search order: src/ first, then the current source directory.
TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
# This target links neither cpuinfo nor fp16, unlike most neighbouring benchmarks.
TARGET_LINK_LIBRARIES(f32-sigmoid-bench PRIVATE
  XNNPACK
  benchmark
  bench-utils)
1904
# f32-spmm-bench: benchmark executable built from bench/f32-spmm.cc.
ADD_EXECUTABLE(f32-spmm-bench
  bench/f32-spmm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_EXTENSIONS YES)
# Header search order: src/ first, then the current source directory.
TARGET_INCLUDE_DIRECTORIES(f32-spmm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-spmm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
1913
# f32-softargmax-bench: benchmark executable built from bench/f32-softargmax.cc.
ADD_EXECUTABLE(f32-softargmax-bench
  bench/f32-softargmax.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_EXTENSIONS YES)
# Header search order: src/ first, then the current source directory.
TARGET_INCLUDE_DIRECTORIES(f32-softargmax-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
# This target links fp16 but not cpuinfo.
TARGET_LINK_LIBRARIES(f32-softargmax-bench PRIVATE
  XNNPACK
  fp16
  benchmark
  bench-utils)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07001922
# q8-gemm-bench: benchmark executable built from bench/q8-gemm.cc.
ADD_EXECUTABLE(q8-gemm-bench
  bench/q8-gemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Header search order: src/ first, then the current source directory.
TARGET_INCLUDE_DIRECTORIES(q8-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(q8-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
1931ENDIF()