blob: 944f4a6951680a69d8d61b23cc4955b16f2f08cb [file] [log] [blame]
# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.
#
# Copyright 2019 Google LLC
#
# This source code is licensed under the BSD-style license found in the
# LICENSE file in the root directory of this source tree.
8
# Oldest CMake release this build script supports.
CMAKE_MINIMUM_REQUIRED(VERSION 3.5 FATAL_ERROR)

# Provides the standard CMAKE_INSTALL_* directory variables.
INCLUDE(GNUInstallDirs)

# ---[ Project and semantic versioning.
# C, C++ and assembly are all enabled for this project.
PROJECT(XNNPACK C CXX ASM)

# ---[ Options.
# Library flavour selector; the STRINGS property lists the accepted values
# so that cmake-gui / ccmake can offer them as a drop-down.
SET(XNNPACK_LIBRARY_TYPE
  "default"
  CACHE STRING
  "Type of library (shared, static, or default) to build")
SET_PROPERTY(
  CACHE XNNPACK_LIBRARY_TYPE
  PROPERTY STRINGS default static shared)

# Unit tests and benchmarks are both enabled unless the user turns them off.
OPTION(XNNPACK_BUILD_TESTS "Build XNNPACK unit tests" ON)
OPTION(XNNPACK_BUILD_BENCHMARKS "Build XNNPACK benchmarks" ON)

# ---[ CMake options
# CTest support is only switched on when unit tests are requested.
IF(XNNPACK_BUILD_TESTS)
  ENABLE_TESTING()
ENDIF()
26
# ---[ Build flags
# Validate the target processor. When CMAKE_SYSTEM_PROCESSOR is set it must
# match one of the recognized architectures; when it is not set, only iOS
# builds are accepted, and those must name exactly one recognized IOS_ARCH.
IF(CMAKE_SYSTEM_PROCESSOR)
  IF(NOT CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64|armv[5-8].*|aarch64)$")
    MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_PROCESSOR = ${CMAKE_SYSTEM_PROCESSOR}")
  ENDIF()
ELSEIF(IOS)
  # Multi-architecture iOS builds are rejected outright.
  LIST(LENGTH IOS_ARCH IOS_ARCH_COUNT)
  IF(IOS_ARCH_COUNT GREATER 1)
    MESSAGE(FATAL_ERROR "Unsupported XNNPACK build with multiple iOS architectures (${IOS_ARCH}). "
      "Specify a single architecture in IOS_ARCH and re-configure. ")
  ENDIF()
  IF(NOT IOS_ARCH MATCHES "^(i386|x86_64|armv7.*|arm64.*)$")
    MESSAGE(FATAL_ERROR "Unrecognized IOS_ARCH = ${IOS_ARCH}")
  ENDIF()
ELSE()
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_PROCESSOR is not defined")
ENDIF()

# Validate the target operating system: it must be set and be one of
# Darwin, Linux or Android.
IF(CMAKE_SYSTEM_NAME)
  IF(NOT CMAKE_SYSTEM_NAME MATCHES "^(Darwin|Linux|Android)$")
    MESSAGE(FATAL_ERROR "Unrecognized CMAKE_SYSTEM_NAME = ${CMAKE_SYSTEM_NAME}")
  ENDIF()
ELSE()
  MESSAGE(FATAL_ERROR "CMAKE_SYSTEM_NAME not defined")
ENDIF()
50
# ---[ Download deps

# XNNPACK_DOWNLOAD_DEPENDENCY(<var> <name> <prefix> <script>)
#
# Fetches one third-party dependency at configure time unless the caller has
# already defined <var>.
#
#   XNNPACK_DEP_VAR    - variable that holds the dependency's source directory
#                        (e.g. CLOG_SOURCE_DIR); nothing is done if it is
#                        already defined.
#   XNNPACK_DEP_NAME   - human-readable name used in the status message and in
#                        the cache entry's help string.
#   XNNPACK_DEP_PREFIX - directory prefix; the helper project is generated in
#                        ${CMAKE_BINARY_DIR}/<prefix>-download and <var> is
#                        set to ${CMAKE_BINARY_DIR}/<prefix>-source.
#   XNNPACK_DEP_SCRIPT - file name of the template under cmake/ that is
#                        configured into the helper project's CMakeLists.txt.
#
# The helper project is configured with the current generator and then built.
# A non-zero exit status from either step aborts configuration immediately
# instead of being silently ignored.
#
# NOTE(review): the templates are expanded by CONFIGURE_FILE in this function's
# scope, so the XNNPACK_DEP_* names are visible to them -- presumably the
# templates reference none of these names; confirm.
FUNCTION(XNNPACK_DOWNLOAD_DEPENDENCY XNNPACK_DEP_VAR XNNPACK_DEP_NAME XNNPACK_DEP_PREFIX XNNPACK_DEP_SCRIPT)
  IF(DEFINED ${XNNPACK_DEP_VAR})
    RETURN()
  ENDIF()

  MESSAGE(STATUS "Downloading ${XNNPACK_DEP_NAME} to ${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-source (define ${XNNPACK_DEP_VAR} to avoid it)")
  CONFIGURE_FILE("cmake/${XNNPACK_DEP_SCRIPT}" "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-download/CMakeLists.txt")

  # Step 1: generate the helper project.
  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" -G "${CMAKE_GENERATOR}" .
    RESULT_VARIABLE XNNPACK_DEP_RESULT
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-download")
  IF(NOT XNNPACK_DEP_RESULT EQUAL 0)
    MESSAGE(FATAL_ERROR "Failed to configure the ${XNNPACK_DEP_NAME} download project: ${XNNPACK_DEP_RESULT}")
  ENDIF()

  # Step 2: build the helper project.
  EXECUTE_PROCESS(COMMAND "${CMAKE_COMMAND}" --build .
    RESULT_VARIABLE XNNPACK_DEP_RESULT
    WORKING_DIRECTORY "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-download")
  IF(NOT XNNPACK_DEP_RESULT EQUAL 0)
    MESSAGE(FATAL_ERROR "Failed to build the ${XNNPACK_DEP_NAME} download project: ${XNNPACK_DEP_RESULT}")
  ENDIF()

  # Cache entries are global, so the result is visible to the caller.
  SET(${XNNPACK_DEP_VAR} "${CMAKE_BINARY_DIR}/${XNNPACK_DEP_PREFIX}-source" CACHE STRING "${XNNPACK_DEP_NAME} source directory")
ENDFUNCTION()

# Dependencies that are always fetched.
XNNPACK_DOWNLOAD_DEPENDENCY(CLOG_SOURCE_DIR "clog" "clog" "DownloadCLog.cmake")
XNNPACK_DOWNLOAD_DEPENDENCY(CPUINFO_SOURCE_DIR "cpuinfo" "cpuinfo" "DownloadCpuinfo.cmake")
XNNPACK_DOWNLOAD_DEPENDENCY(FP16_SOURCE_DIR "FP16" "FP16" "DownloadFP16.cmake")
XNNPACK_DOWNLOAD_DEPENDENCY(FXDIV_SOURCE_DIR "FXdiv" "FXdiv" "DownloadFXdiv.cmake")
XNNPACK_DOWNLOAD_DEPENDENCY(PSIMD_SOURCE_DIR "PSimd" "psimd" "DownloadPSimd.cmake")
XNNPACK_DOWNLOAD_DEPENDENCY(PTHREADPOOL_SOURCE_DIR "pthreadpool" "pthreadpool" "DownloadPThreadPool.cmake")

# Google Test is fetched only when unit tests are built.
IF(XNNPACK_BUILD_TESTS)
  XNNPACK_DOWNLOAD_DEPENDENCY(GOOGLETEST_SOURCE_DIR "Google Test" "googletest" "DownloadGoogleTest.cmake")
ENDIF()

# Google Benchmark is fetched only when benchmarks are built.
IF(XNNPACK_BUILD_BENCHMARKS)
  XNNPACK_DOWNLOAD_DEPENDENCY(GOOGLEBENCHMARK_SOURCE_DIR "Google Benchmark" "googlebenchmark" "DownloadGoogleBenchmark.cmake")
ENDIF()
131
# ---[ XNNPACK library
# Operator source files, one per operator.
SET(XNNPACK_OPERATOR_SRCS
  # Element-wise and per-channel operators
  src/add-nc.c
  src/argmax-pooling-nhwc.c
  src/average-pooling-nhwc.c
  src/binary-elementwise-nd.c
  src/channel-pad-nc.c
  src/channel-shuffle-nc.c
  src/clamp-nc.c
  # Convolution family and fully-connected
  src/convolution-nchw.c
  src/convolution-nhwc.c
  src/deconvolution-nhwc.c
  src/fully-connected-nc.c
  # Global pooling
  src/global-average-pooling-ncw.c
  src/global-average-pooling-nwc.c
  # Remaining operators
  src/hardswish-nc.c
  src/leaky-relu-nc.c
  src/max-pooling-nhwc.c
  src/prelu-nc.c
  src/resize-bilinear-nhwc.c
  src/sigmoid-nc.c
  src/softargmax-nc.c
  src/unpooling-nhwc.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700155
# Cold sources: every operator source followed by initialization, memory and
# operator-deletion code.
SET(XNNPACK_COLD_SRCS
  ${XNNPACK_OPERATOR_SRCS}
  src/init.c
  src/memory.c
  src/operator-delete.c)
161
# Hot sources: indirection-buffer setup and operator execution.
SET(XNNPACK_HOT_SRCS src/indirection.c src/operator-run.c)
165
# Lookup-table sources under src/tables.
SET(XNNPACK_TABLE_SRCS src/tables/exp2-k-over-64.c src/tables/exp2-k-over-2048.c)
169
# Scalar micro-kernel sources, grouped by source directory.
SET(XNNPACK_SCALAR_MICROKERNEL_SRCS
  # f32-argmaxpool
  src/f32-argmaxpool/4x-scalar-c1.c
  src/f32-argmaxpool/9p8x-scalar-c1.c
  src/f32-argmaxpool/9x-scalar-c1.c
  # f32-avgpool
  src/f32-avgpool/mp9p8q-scalar.c
  src/f32-avgpool/up9-scalar.c
  # f32-bilinear
  src/f32-bilinear/gen/scalar-c1.c
  src/f32-bilinear/gen/scalar-c2.c
  src/f32-bilinear/gen/scalar-c4.c
  # f32-clamp
  src/f32-clamp/scalar.c
  # f32-conv-hwc, f32-conv-hwc2spchw
  src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c
  src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-scalar-1x1.c
  # f32-dwconv-spchw
  src/f32-dwconv-spchw/3x3p1-scalar.c
  src/f32-dwconv-spchw/3x3s2p1-scalar.c
  src/f32-dwconv-spchw/5x5p2-scalar.c
  src/f32-dwconv-spchw/5x5s2p2-scalar.c
  # f32-dwconv
  src/f32-dwconv/gen/up1x25-scalar-acc2.c
  src/f32-dwconv/gen/up1x25-scalar.c
  src/f32-dwconv/gen/up1x4-scalar-acc2.c
  src/f32-dwconv/gen/up1x4-scalar.c
  src/f32-dwconv/gen/up1x9-scalar-acc2.c
  src/f32-dwconv/gen/up1x9-scalar.c
  src/f32-dwconv/gen/up2x25-scalar-acc2.c
  src/f32-dwconv/gen/up2x25-scalar.c
  src/f32-dwconv/gen/up2x4-scalar-acc2.c
  src/f32-dwconv/gen/up2x4-scalar.c
  src/f32-dwconv/gen/up2x9-scalar-acc2.c
  src/f32-dwconv/gen/up2x9-scalar.c
  # f32-gavgpool-spchw, f32-gavgpool
  src/f32-gavgpool-spchw/scalar-x1.c
  src/f32-gavgpool/mp7p7q-scalar.c
  src/f32-gavgpool/up7-scalar.c
  # f32-gemm
  src/f32-gemm/gen/1x4-scalar.c
  src/f32-gemm/gen/2x4-scalar.c
  src/f32-gemm/gen/4x2-scalar.c
  src/f32-gemm/gen/4x4-scalar.c
  src/f32-gemm/gen-inc/1x4-scalar.c
  src/f32-gemm/gen-inc/2x4-scalar.c
  src/f32-gemm/gen-inc/4x4-scalar.c
  # f32-hswish
  src/f32-hswish/gen/scalar-x1.c
  src/f32-hswish/gen/scalar-x2.c
  src/f32-hswish/gen/scalar-x4.c
  # f32-igemm
  src/f32-igemm/gen/1x4-scalar.c
  src/f32-igemm/gen/2x4-scalar.c
  src/f32-igemm/gen/4x2-scalar.c
  src/f32-igemm/gen/4x4-scalar.c
  # f32-maxpool
  src/f32-maxpool/9p8x-scalar-c1.c
  # f32-pavgpool
  src/f32-pavgpool/mp9p8q-scalar.c
  src/f32-pavgpool/up9-scalar.c
  # f32-ppmm
  src/f32-ppmm/gen/2x4-scalar.c
  src/f32-ppmm/gen/3x3-scalar.c
  src/f32-ppmm/gen/4x2-scalar.c
  src/f32-ppmm/gen/4x4-scalar.c
  # f32-prelu
  src/f32-prelu/gen/scalar-2x1.c
  src/f32-prelu/gen/scalar-2x4.c
  # f32-rmax
  src/f32-rmax/scalar.c
  # f32-sigmoid
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x1.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x2.c
  src/f32-sigmoid/gen/scalar-lut2048-p1-div-x4.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x1.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x2.c
  src/f32-sigmoid/gen/scalar-lut64-p2-div-x4.c
  src/f32-sigmoid/gen/scalar-p5-div-x1.c
  src/f32-sigmoid/gen/scalar-p5-div-x2.c
  src/f32-sigmoid/gen/scalar-p5-div-x4.c
  # f32-spmm
  src/f32-spmm/gen/1x1-scalar-pipelined.c
  src/f32-spmm/gen/1x1-scalar.c
  src/f32-spmm/gen/2x1-scalar-pipelined.c
  src/f32-spmm/gen/2x1-scalar.c
  src/f32-spmm/gen/4x1-scalar-pipelined.c
  src/f32-spmm/gen/4x1-scalar.c
  src/f32-spmm/gen/8x1-scalar-pipelined.c
  src/f32-spmm/gen/8x1-scalar.c
  src/f32-spmm/gen/8x2-scalar.c
  src/f32-spmm/gen/8x4-scalar.c
  # f32-vbinary
  src/f32-vbinary/gen/vadd-scalar-x1.c
  src/f32-vbinary/gen/vadd-scalar-x2.c
  src/f32-vbinary/gen/vadd-scalar-x4.c
  src/f32-vbinary/gen/vaddc-scalar-x1.c
  src/f32-vbinary/gen/vaddc-scalar-x2.c
  src/f32-vbinary/gen/vaddc-scalar-x4.c
  src/f32-vbinary/gen/vdiv-scalar-x1.c
  src/f32-vbinary/gen/vdiv-scalar-x2.c
  src/f32-vbinary/gen/vdiv-scalar-x4.c
  src/f32-vbinary/gen/vdivc-scalar-x1.c
  src/f32-vbinary/gen/vdivc-scalar-x2.c
  src/f32-vbinary/gen/vdivc-scalar-x4.c
  src/f32-vbinary/gen/vmax-scalar-x1.c
  src/f32-vbinary/gen/vmax-scalar-x2.c
  src/f32-vbinary/gen/vmax-scalar-x4.c
  src/f32-vbinary/gen/vmaxc-scalar-x1.c
  src/f32-vbinary/gen/vmaxc-scalar-x2.c
  src/f32-vbinary/gen/vmaxc-scalar-x4.c
  src/f32-vbinary/gen/vmin-scalar-x1.c
  src/f32-vbinary/gen/vmin-scalar-x2.c
  src/f32-vbinary/gen/vmin-scalar-x4.c
  src/f32-vbinary/gen/vminc-scalar-x1.c
  src/f32-vbinary/gen/vminc-scalar-x2.c
  src/f32-vbinary/gen/vminc-scalar-x4.c
  src/f32-vbinary/gen/vmul-scalar-x1.c
  src/f32-vbinary/gen/vmul-scalar-x2.c
  src/f32-vbinary/gen/vmul-scalar-x4.c
  src/f32-vbinary/gen/vmulc-scalar-x1.c
  src/f32-vbinary/gen/vmulc-scalar-x2.c
  src/f32-vbinary/gen/vmulc-scalar-x4.c
  src/f32-vbinary/gen/vrdivc-scalar-x1.c
  src/f32-vbinary/gen/vrdivc-scalar-x2.c
  src/f32-vbinary/gen/vrdivc-scalar-x4.c
  src/f32-vbinary/gen/vrsubc-scalar-x1.c
  src/f32-vbinary/gen/vrsubc-scalar-x2.c
  src/f32-vbinary/gen/vrsubc-scalar-x4.c
  src/f32-vbinary/gen/vsub-scalar-x1.c
  src/f32-vbinary/gen/vsub-scalar-x2.c
  src/f32-vbinary/gen/vsub-scalar-x4.c
  src/f32-vbinary/gen/vsubc-scalar-x1.c
  src/f32-vbinary/gen/vsubc-scalar-x2.c
  src/f32-vbinary/gen/vsubc-scalar-x4.c
  # f32-vmulcaddc
  src/f32-vmulcaddc/gen/c1-scalar-2x.c
  src/f32-vmulcaddc/gen/c2-scalar-2x.c
  src/f32-vmulcaddc/gen/c4-scalar-2x.c
  # math
  src/math/expminus-scalar-lut2048-p1.c
  src/math/expminus-scalar-lut64-p2.c
  src/math/expminus-scalar-p5.c
  src/math/sigmoid-scalar-lut2048-p1-div.c
  src/math/sigmoid-scalar-lut64-p2-div.c
  src/math/sigmoid-scalar-p5-div.c
  # q8-*
  src/q8-avgpool/mp9p8q-scalar.c
  src/q8-avgpool/up9-scalar.c
  src/q8-dwconv/up1x9-scalar.c
  src/q8-gavgpool/mp7p7q-scalar.c
  src/q8-gavgpool/up7-scalar.c
  src/q8-gemm/2x2-scalar.c
  src/q8-igemm/2x2-scalar.c
  src/q8-vadd/scalar.c
  # u8-*
  src/u8-clamp/scalar.c
  src/u8-lut32norm/scalar.c
  src/u8-maxpool/9p8x-scalar-c1.c
  src/u8-rmax/scalar.c
  # x32-*
  src/x32-packx/x2-scalar.c
  src/x32-packx/x3-scalar.c
  src/x32-packx/x4-scalar.c
  src/x32-pad/x2-scalar.c
  src/x32-unpool/scalar.c
  src/x32-zip/x2-scalar.c
  src/x32-zip/x3-scalar.c
  src/x32-zip/x4-scalar.c
  src/x32-zip/xm-scalar.c
  # x8-*
  src/x8-lut/scalar.c
  src/x8-zip/x2-scalar.c
  src/x8-zip/x3-scalar.c
  src/x8-zip/x4-scalar.c
  src/x8-zip/xm-scalar.c)
322
# PSIMD micro-kernel sources in the "fastmath" group, grouped by source
# directory.
SET(XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS
  # f32-argmaxpool
  src/f32-argmaxpool/4x-psimd-c4.c
  src/f32-argmaxpool/9p8x-psimd-c4.c
  src/f32-argmaxpool/9x-psimd-c4.c
  # f32-avgpool
  src/f32-avgpool/mp9p8q-psimd.c
  src/f32-avgpool/up9-psimd.c
  # f32-bilinear
  src/f32-bilinear/gen/psimd-c4.c
  src/f32-bilinear/gen/psimd-c8.c
  # f32-clamp
  src/f32-clamp/psimd.c
  # f32-dwconv
  src/f32-dwconv/gen/up4x25-psimd-acc2.c
  src/f32-dwconv/gen/up4x25-psimd.c
  src/f32-dwconv/gen/up4x4-psimd-acc2.c
  src/f32-dwconv/gen/up4x4-psimd.c
  src/f32-dwconv/gen/up4x9-psimd-acc2.c
  src/f32-dwconv/gen/up4x9-psimd.c
  src/f32-dwconv/gen/up8x25-psimd-acc2.c
  src/f32-dwconv/gen/up8x25-psimd.c
  src/f32-dwconv/gen/up8x4-psimd-acc2.c
  src/f32-dwconv/gen/up8x4-psimd.c
  src/f32-dwconv/gen/up8x9-psimd-acc2.c
  src/f32-dwconv/gen/up8x9-psimd.c
  # f32-gavgpool
  src/f32-gavgpool/mp7p7q-psimd.c
  src/f32-gavgpool/up7-psimd.c
  # f32-gemm
  src/f32-gemm/gen/1x8-psimd-loadsplat.c
  src/f32-gemm/gen/1x8-psimd-splat.c
  src/f32-gemm/gen/1x8s4-psimd.c
  src/f32-gemm/gen/4x8-psimd-loadsplat.c
  src/f32-gemm/gen/4x8-psimd-splat.c
  src/f32-gemm/gen/4x8s4-psimd.c
  src/f32-gemm/gen/6x8-psimd-loadsplat.c
  src/f32-gemm/gen/6x8-psimd-splat.c
  src/f32-gemm/gen/6x8s4-psimd.c
  src/f32-gemm/gen-inc/1x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/1x8-psimd-splat.c
  src/f32-gemm/gen-inc/1x8s4-psimd.c
  src/f32-gemm/gen-inc/4x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/4x8-psimd-splat.c
  src/f32-gemm/gen-inc/4x8s4-psimd.c
  src/f32-gemm/gen-inc/6x8-psimd-loadsplat.c
  src/f32-gemm/gen-inc/6x8-psimd-splat.c
  src/f32-gemm/gen-inc/6x8s4-psimd.c
  # f32-hswish
  src/f32-hswish/gen/psimd-x4.c
  src/f32-hswish/gen/psimd-x8.c
  # f32-igemm
  src/f32-igemm/gen/1x8-psimd-loadsplat.c
  src/f32-igemm/gen/1x8-psimd-splat.c
  src/f32-igemm/gen/1x8s4-psimd.c
  src/f32-igemm/gen/4x2c4-psimd.c
  src/f32-igemm/gen/4x8-psimd-loadsplat.c
  src/f32-igemm/gen/4x8-psimd-splat.c
  src/f32-igemm/gen/4x8s4-psimd.c
  src/f32-igemm/gen/6x8-psimd-loadsplat.c
  src/f32-igemm/gen/6x8-psimd-splat.c
  src/f32-igemm/gen/6x8s4-psimd.c
  # f32-maxpool
  src/f32-maxpool/9p8x-psimd-c4.c
  # f32-pavgpool
  src/f32-pavgpool/mp9p8q-psimd.c
  src/f32-pavgpool/up9-psimd.c
  # f32-ppmm
  src/f32-ppmm/gen/4x8-psimd.c
  # f32-prelu
  src/f32-prelu/gen/psimd-2x4.c
  src/f32-prelu/gen/psimd-2x8.c
  # f32-vbinary
  src/f32-vbinary/gen/vadd-psimd-x4.c
  src/f32-vbinary/gen/vadd-psimd-x8.c
  src/f32-vbinary/gen/vaddc-psimd-x4.c
  src/f32-vbinary/gen/vaddc-psimd-x8.c
  src/f32-vbinary/gen/vdiv-psimd-x4.c
  src/f32-vbinary/gen/vdiv-psimd-x8.c
  src/f32-vbinary/gen/vdivc-psimd-x4.c
  src/f32-vbinary/gen/vdivc-psimd-x8.c
  src/f32-vbinary/gen/vmax-psimd-x4.c
  src/f32-vbinary/gen/vmax-psimd-x8.c
  src/f32-vbinary/gen/vmaxc-psimd-x4.c
  src/f32-vbinary/gen/vmaxc-psimd-x8.c
  src/f32-vbinary/gen/vmin-psimd-x4.c
  src/f32-vbinary/gen/vmin-psimd-x8.c
  src/f32-vbinary/gen/vminc-psimd-x4.c
  src/f32-vbinary/gen/vminc-psimd-x8.c
  src/f32-vbinary/gen/vmul-psimd-x4.c
  src/f32-vbinary/gen/vmul-psimd-x8.c
  src/f32-vbinary/gen/vmulc-psimd-x4.c
  src/f32-vbinary/gen/vmulc-psimd-x8.c
  src/f32-vbinary/gen/vrdivc-psimd-x4.c
  src/f32-vbinary/gen/vrdivc-psimd-x8.c
  src/f32-vbinary/gen/vrsubc-psimd-x4.c
  src/f32-vbinary/gen/vrsubc-psimd-x8.c
  src/f32-vbinary/gen/vsub-psimd-x4.c
  src/f32-vbinary/gen/vsub-psimd-x8.c
  src/f32-vbinary/gen/vsubc-psimd-x4.c
  src/f32-vbinary/gen/vsubc-psimd-x8.c
  # f32-vmulcaddc
  src/f32-vmulcaddc/gen/c4-psimd-2x.c
  src/f32-vmulcaddc/gen/c8-psimd-2x.c
  # x32-*
  src/x32-packx/x4-psimd.c
  src/x32-pad/x2-psimd.c
  src/x32-unpool/psimd.c
  src/x32-zip/x2-psimd.c
  src/x32-zip/x3-psimd.c
  src/x32-zip/x4-psimd.c
  src/x32-zip/xm-psimd.c)
419
# PSIMD micro-kernel sources in the "accmath" group: the sigmoid kernels and
# their src/math counterpart.
SET(XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS
  # f32-sigmoid
  src/f32-sigmoid/gen/psimd-p5-div-x4.c
  src/f32-sigmoid/gen/psimd-p5-div-x8.c
  src/f32-sigmoid/gen/psimd-p5-div-x12.c
  src/f32-sigmoid/gen/psimd-p5-div-x16.c
  src/f32-sigmoid/gen/psimd-p5-div-x20.c
  src/f32-sigmoid/gen/psimd-p5-div-x24.c
  # math
  src/math/sigmoid-psimd-p5-div.c)
428
# NEON micro-kernel sources, grouped by source directory.
SET(XNNPACK_NEON_MICROKERNEL_SRCS
  # f32-avgpool
  src/f32-avgpool/mp9p8q-neon.c
  src/f32-avgpool/up9-neon.c
  # f32-bilinear
  src/f32-bilinear/gen/neon-c4.c
  src/f32-bilinear/gen/neon-c8.c
  # f32-clamp
  src/f32-clamp/neon.c
  # f32-dwconv
  src/f32-dwconv/gen/up4x9-neon.c
  src/f32-dwconv/gen/up4x9-neon-acc2.c
  src/f32-dwconv/gen/up8x9-neon.c
  src/f32-dwconv/gen/up8x9-neon-acc2.c
  # f32-gavgpool-spchw, f32-gavgpool
  src/f32-gavgpool-spchw/neon-x4.c
  src/f32-gavgpool/mp7p7q-neon.c
  src/f32-gavgpool/up7-neon.c
  # f32-gemm (gen)
  src/f32-gemm/gen/1x8-neon-lane-ld64.c
  src/f32-gemm/gen/4x2-neon-lane-ld64.c
  src/f32-gemm/gen/4x8-neon-lane-ld128.c
  src/f32-gemm/gen/4x8-neon-lane-ld64.c
  src/f32-gemm/gen/5x8-neon-lane-ld64.c
  src/f32-gemm/gen/6x8-neon-lane-ld64.c
  src/f32-gemm/gen/6x8-neon-lane-ld128.c
  src/f32-gemm/gen/1x8-neon-dup-ld64.c
  src/f32-gemm/gen/4x8-neon-dup-ld128.c
  src/f32-gemm/gen/4x8-neon-dup-ld64.c
  src/f32-gemm/gen/6x8-neon-dup-ld64.c
  src/f32-gemm/gen/6x8-neon-dup-ld128.c
  src/f32-gemm/gen/1x8s4-neon.c
  src/f32-gemm/gen/4x8s4-neon.c
  src/f32-gemm/gen/6x8s4-neon.c
  src/f32-gemm/gen/8x8s4-neon.c
  # f32-gemm (gen-inc)
  src/f32-gemm/gen-inc/1x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/4x8-neon-lane-ld128.c
  src/f32-gemm/gen-inc/4x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/5x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-lane-ld128.c
  src/f32-gemm/gen-inc/1x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/4x8-neon-dup-ld128.c
  src/f32-gemm/gen-inc/4x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-dup-ld64.c
  src/f32-gemm/gen-inc/6x8-neon-dup-ld128.c
  src/f32-gemm/gen-inc/1x8s4-neon.c
  src/f32-gemm/gen-inc/4x8s4-neon.c
  src/f32-gemm/gen-inc/6x8s4-neon.c
  src/f32-gemm/gen-inc/8x8s4-neon.c
  # f32-hswish
  src/f32-hswish/gen/neon-x4.c
  src/f32-hswish/gen/neon-x8.c
  # f32-igemm
  src/f32-igemm/gen/1x8-neon-lane-ld64.c
  src/f32-igemm/gen/4x2-neon-lane-ld64.c
  src/f32-igemm/gen/4x4-neon-lane-ld64.c
  src/f32-igemm/gen/4x8-neon-lane-ld128.c
  src/f32-igemm/gen/4x8-neon-lane-ld64.c
  src/f32-igemm/gen/6x8-neon-lane-ld64.c
  src/f32-igemm/gen/6x8-neon-lane-ld128.c
  src/f32-igemm/gen/1x8-neon-dup-ld64.c
  src/f32-igemm/gen/4x8-neon-dup-ld128.c
  src/f32-igemm/gen/4x8-neon-dup-ld64.c
  src/f32-igemm/gen/6x8-neon-dup-ld64.c
  src/f32-igemm/gen/6x8-neon-dup-ld128.c
  src/f32-igemm/gen/1x8s4-neon.c
  src/f32-igemm/gen/4x8s4-neon.c
  src/f32-igemm/gen/6x8s4-neon.c
  src/f32-igemm/gen/8x8s4-neon.c
  # f32-pavgpool
  src/f32-pavgpool/mp9p8q-neon.c
  src/f32-pavgpool/up9-neon.c
  # f32-ppmm
  src/f32-ppmm/gen/4x8-neon.c
  src/f32-ppmm/gen/8x8-neon.c
  # f32-prelu
  src/f32-prelu/gen/neon-2x4.c
  src/f32-prelu/gen/neon-2x8.c
  # f32-rmax
  src/f32-rmax/neon.c
  # f32-sigmoid
  src/f32-sigmoid/gen/neon-frac-p9-p10-nr1recps-x16.c
  src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x4.c
  src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x8.c
  src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x12.c
  src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x16.c
  src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x20.c
  src/f32-sigmoid/gen/neon-rr2-p5-nr2recps-x24.c
  src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x4.c
  src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x8.c
  src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x12.c
  src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x16.c
  src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x20.c
  src/f32-sigmoid/gen/neon-rr2-lut64-p2-nr2recps-x24.c
  src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x4.c
  src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x8.c
  src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x12.c
  src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x16.c
  src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x20.c
  src/f32-sigmoid/gen/neon-rr2-lut2048-p1-nr2recps-x24.c
  # f32-vbinary
  src/f32-vbinary/gen/vadd-neon-x4.c
  src/f32-vbinary/gen/vadd-neon-x8.c
  src/f32-vbinary/gen/vaddc-neon-x4.c
  src/f32-vbinary/gen/vaddc-neon-x8.c
  src/f32-vbinary/gen/vmax-neon-x4.c
  src/f32-vbinary/gen/vmax-neon-x8.c
  src/f32-vbinary/gen/vmaxc-neon-x4.c
  src/f32-vbinary/gen/vmaxc-neon-x8.c
  src/f32-vbinary/gen/vmin-neon-x4.c
  src/f32-vbinary/gen/vmin-neon-x8.c
  src/f32-vbinary/gen/vminc-neon-x4.c
  src/f32-vbinary/gen/vminc-neon-x8.c
  src/f32-vbinary/gen/vmul-neon-x4.c
  src/f32-vbinary/gen/vmul-neon-x8.c
  src/f32-vbinary/gen/vmulc-neon-x4.c
  src/f32-vbinary/gen/vmulc-neon-x8.c
  src/f32-vbinary/gen/vrsubc-neon-x4.c
  src/f32-vbinary/gen/vrsubc-neon-x8.c
  src/f32-vbinary/gen/vsub-neon-x4.c
  src/f32-vbinary/gen/vsub-neon-x8.c
  src/f32-vbinary/gen/vsubc-neon-x4.c
  src/f32-vbinary/gen/vsubc-neon-x8.c
  # f32-vmulcaddc
  src/f32-vmulcaddc/gen/c4-neon-2x.c
  src/f32-vmulcaddc/gen/c8-neon-2x.c
  # q8-*
  src/q8-avgpool/mp9p8q-neon.c
  src/q8-avgpool/up9-neon.c
  src/q8-dwconv/up8x9-neon.c
  src/q8-gavgpool/mp7p7q-neon.c
  src/q8-gavgpool/up7-neon.c
  src/q8-gemm/4x8-neon.c
  src/q8-gemm/8x8-neon.c
  src/q8-igemm/4x8-neon.c
  src/q8-igemm/8x8-neon.c
  src/q8-vadd/neon.c
  # u8-*
  src/u8-clamp/neon.c
  src/u8-maxpool/9p8x-neon-c16.c
  src/u8-rmax/neon.c
  # x32-*
  src/x32-packx/x4-neon-st4.c
  src/x32-pad/x2-neon.c
  src/x32-zip/x2-neon.c
  src/x32-zip/x3-neon.c
  src/x32-zip/x4-neon.c
  src/x32-zip/xm-neon.c
  # x8-*
  src/x8-zip/x2-neon.c
  src/x8-zip/x3-neon.c
  src/x8-zip/x4-neon.c
  src/x8-zip/xm-neon.c
  # math
  src/math/sigmoid-neon-frac-p9-p10-nr1recps.c
  src/math/sigmoid-neon-rr1-lut2048-p1-nr2recps.c
  src/math/sigmoid-neon-rr1-lut64-p2-nr2recps.c
  src/math/sigmoid-neon-rr1-p5-nr2recps.c
  src/math/sigmoid-neon-rr2-lut2048-p1-nr2recps.c
  src/math/sigmoid-neon-rr2-lut64-p2-nr2recps.c
  src/math/sigmoid-neon-rr2-p5-nr2recps.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700571
572SET(XNNPACK_NEONFMA_MICROKERNEL_SRCS
Marat Dukhan40a672f2019-11-25 03:08:22 -0800573 src/f32-bilinear/gen/neonfma-c4.c
574 src/f32-bilinear/gen/neonfma-c8.c
575 src/f32-igemm/gen/1x8-neonfma-dup-ld64.c
576 src/f32-igemm/gen/4x8-neonfma-dup-ld128.c
577 src/f32-igemm/gen/4x8-neonfma-dup-ld64.c
578 src/f32-igemm/gen/6x8-neonfma-dup-ld64.c
Frank Barchard69172d92019-11-26 16:22:39 -0800579 src/f32-igemm/gen/6x8-neonfma-dup-ld128.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800580 src/f32-igemm/gen/1x8s4-neonfma.c
581 src/f32-igemm/gen/4x8s4-neonfma.c
582 src/f32-igemm/gen/6x8s4-neonfma.c
583 src/f32-igemm/gen/8x8s4-neonfma.c
584 src/f32-dwconv/gen/up4x9-neonfma.c
585 src/f32-dwconv/gen/up4x9-neonfma-acc2.c
586 src/f32-dwconv/gen/up8x9-neonfma.c
587 src/f32-dwconv/gen/up8x9-neonfma-acc2.c
588 src/f32-gemm/gen/1x8-neonfma-dup-ld64.c
589 src/f32-gemm/gen/4x8-neonfma-dup-ld128.c
590 src/f32-gemm/gen/4x8-neonfma-dup-ld64.c
591 src/f32-gemm/gen/6x8-neonfma-dup-ld64.c
Frank Barchard69172d92019-11-26 16:22:39 -0800592 src/f32-gemm/gen/6x8-neonfma-dup-ld128.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800593 src/f32-gemm/gen/1x8s4-neonfma.c
594 src/f32-gemm/gen/4x8s4-neonfma.c
595 src/f32-gemm/gen/6x8s4-neonfma.c
596 src/f32-gemm/gen/8x8s4-neonfma.c
597 src/f32-gemm/gen-inc/1x8-neonfma-dup-ld64.c
598 src/f32-gemm/gen-inc/4x8-neonfma-dup-ld128.c
599 src/f32-gemm/gen-inc/4x8-neonfma-dup-ld64.c
600 src/f32-gemm/gen-inc/6x8-neonfma-dup-ld64.c
Frank Barchard69172d92019-11-26 16:22:39 -0800601 src/f32-gemm/gen-inc/6x8-neonfma-dup-ld128.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800602 src/f32-gemm/gen-inc/1x8s4-neonfma.c
603 src/f32-gemm/gen-inc/4x8s4-neonfma.c
604 src/f32-gemm/gen-inc/6x8s4-neonfma.c
605 src/f32-gemm/gen-inc/8x8s4-neonfma.c
Marat Dukhan662faa02019-12-09 22:48:16 -0800606 src/f32-hswish/gen/neonfma-x4.c
607 src/f32-hswish/gen/neonfma-x8.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800608 src/f32-ppmm/gen/4x8-neonfma.c
609 src/f32-ppmm/gen/8x8-neonfma.c
Marat Dukhan4a24a582020-01-06 13:30:00 -0800610 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x4.c
611 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x8.c
612 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x12.c
613 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x16.c
614 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x20.c
615 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2fma-x24.c
616 src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x4.c
617 src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x8.c
618 src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x12.c
619 src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x16.c
620 src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x20.c
621 src/f32-sigmoid/gen/neonfma-rr1-p5-nr1recps1fma-x24.c
622 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x4.c
623 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x8.c
624 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x12.c
625 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x16.c
626 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x20.c
627 src/f32-sigmoid/gen/neonfma-rr1-p5-nr2recps-x24.c
628 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x4.c
629 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x8.c
630 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x12.c
631 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x16.c
632 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x20.c
633 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2fma-x24.c
634 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x4.c
635 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x8.c
636 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x12.c
637 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x16.c
638 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x20.c
639 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr1recps1fma-x24.c
640 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x4.c
641 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x8.c
642 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x12.c
643 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x16.c
644 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x20.c
645 src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-nr2recps-x24.c
646 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x4.c
647 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x8.c
648 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x12.c
649 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x16.c
650 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x20.c
651 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2fma-x24.c
652 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x4.c
653 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x8.c
654 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x12.c
655 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x16.c
656 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x20.c
657 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr1recps1fma-x24.c
658 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x4.c
659 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x8.c
660 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x12.c
661 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x16.c
662 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x20.c
663 src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-nr2recps-x24.c
Marat Dukhan40a672f2019-11-25 03:08:22 -0800664 src/f32-vmulcaddc/gen/c4-neonfma-2x.c
665 src/f32-vmulcaddc/gen/c8-neonfma-2x.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800666 src/math/exp-neonfma-lut64-p2.c
667 src/math/exp-neonfma-p5.c
Marat Dukhan191e5cd2019-11-28 00:52:01 -0800668 src/math/expminus-neonfma-lut2048-p1.c
Marat Dukhan189ae802019-11-26 11:28:44 -0800669 src/math/expminus-neonfma-lut64-p2.c
Marat Dukhan36aecb52019-11-22 17:21:49 -0800670 src/math/expminus-neonfma-p5.c
Marat Dukhan77221d32020-01-06 10:04:39 -0800671 src/math/sigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma.c
672 src/math/sigmoid-neonfma-rr1-lut2048-p1-nr2fma.c
673 src/math/sigmoid-neonfma-rr1-lut2048-p1-nr2recps.c
674 src/math/sigmoid-neonfma-rr1-lut64-p2-nr1recps1fma.c
675 src/math/sigmoid-neonfma-rr1-lut64-p2-nr2fma.c
676 src/math/sigmoid-neonfma-rr1-lut64-p2-nr2recps.c
677 src/math/sigmoid-neonfma-rr1-p5-nr1recps1fma.c
678 src/math/sigmoid-neonfma-rr1-p5-nr2fma.c
679 src/math/sigmoid-neonfma-rr1-p5-nr2recps.c
680 src/math/sigmoid-neonfma-rr2-lut2048-p1-nr1recps1fma.c
681 src/math/sigmoid-neonfma-rr2-lut2048-p1-nr2fma.c
682 src/math/sigmoid-neonfma-rr2-lut2048-p1-nr2recps.c
683 src/math/sigmoid-neonfma-rr2-lut64-p2-nr1recps1fma.c
684 src/math/sigmoid-neonfma-rr2-lut64-p2-nr2fma.c
685 src/math/sigmoid-neonfma-rr2-lut64-p2-nr2recps.c
686 src/math/sigmoid-neonfma-rr2-p5-nr1recps1fma.c
687 src/math/sigmoid-neonfma-rr2-p5-nr2fma.c
688 src/math/sigmoid-neonfma-rr2-p5-nr2recps.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700689
# ---[ Source list: XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS
# C sources gathered under the AArch64 + NEON FMA variable. All paths are
# relative ("src/..."). The variable is consumed outside this section.
# NOTE(review): the vdiv/vdivc/vrdivc entries carry a plain "-neon" suffix and
# the sigmoid entries are the "-div" variants; presumably they live in this
# AArch64-only list because they rely on vector division -- confirm.
SET(XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS
  src/f32-vbinary/gen/vdiv-neon-x4.c
  src/f32-vbinary/gen/vdiv-neon-x8.c
  src/f32-vbinary/gen/vdivc-neon-x4.c
  src/f32-vbinary/gen/vdivc-neon-x8.c
  src/f32-vbinary/gen/vrdivc-neon-x4.c
  src/f32-vbinary/gen/vrdivc-neon-x8.c
  src/f32-gemm/gen/1x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x2-neonfma-lane-ld64.c
  src/f32-gemm/gen/4x8-neonfma-lane-ld128.c
  src/f32-gemm/gen/4x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/5x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-neonfma-lane-ld64.c
  src/f32-gemm/gen/6x8-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/1x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/4x8-neonfma-lane-ld128.c
  src/f32-gemm/gen-inc/4x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/5x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-lane-ld64.c
  src/f32-gemm/gen-inc/6x8-neonfma-lane-ld128.c
  src/f32-igemm/gen/1x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x2-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x4-neonfma-lane-ld64.c
  src/f32-igemm/gen/4x8-neonfma-lane-ld128.c
  src/f32-igemm/gen/4x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-neonfma-lane-ld64.c
  src/f32-igemm/gen/6x8-neonfma-lane-ld128.c
  src/f32-conv-hwc/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-conv-hwc/3x3s2p1c3x8-neonfma-2x2.c
  src/f32-conv-hwc2spchw/3x3s2p1c3x4-neonfma-2x2.c
  src/f32-dwconv-spchw/3x3p1-neonfma.c
  src/f32-dwconv-spchw/5x5p2-neonfma.c
  src/f32-dwconv-spchw/3x3s2p1-neonfma.c
  src/f32-dwconv-spchw/5x5s2p2-neonfma.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-p5-div-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut64-p2-div-x24.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x4.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x8.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x12.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x16.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x20.c
  src/f32-sigmoid/gen/neonfma-rr1-lut2048-p1-div-x24.c
  src/f32-spmm/gen/12x1-neonfma.c
  src/f32-spmm/gen/12x2-neonfma.c
  src/f32-spmm/gen/12x4-neonfma.c
  src/f32-spmm/gen/16x1-neonfma-pipelined.c
  src/f32-spmm/gen/16x1-neonfma-unroll2.c
  src/f32-spmm/gen/16x1-neonfma.c
  src/f32-spmm/gen/16x2-neonfma.c
  src/f32-spmm/gen/16x4-neonfma.c
  src/f32-spmm/gen/4x1-neonfma-pipelined.c
  src/f32-spmm/gen/4x1-neonfma-unroll2.c
  src/f32-spmm/gen/4x1-neonfma.c
  src/f32-spmm/gen/4x2-neonfma.c
  src/f32-spmm/gen/4x4-neonfma.c
  src/f32-spmm/gen/8x1-neonfma-pipelined.c
  src/f32-spmm/gen/8x1-neonfma-unroll2.c
  src/f32-spmm/gen/8x1-neonfma.c
  src/f32-spmm/gen/8x2-neonfma.c
  src/f32-spmm/gen/8x4-neonfma.c
  src/math/sigmoid-neonfma-rr1-lut2048-p1-div.c
  src/math/sigmoid-neonfma-rr1-lut64-p2-div.c
  src/math/sigmoid-neonfma-rr1-p5-div.c
  src/math/sigmoid-neonfma-rr2-lut2048-p1-div.c
  src/math/sigmoid-neonfma-rr2-lut64-p2-div.c
  src/math/sigmoid-neonfma-rr2-p5-div.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700766
# ---[ Source list: XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
# The three f16 GEMM sources whose file names carry the "neonfp16arith" tag.
# The variable is consumed outside this section.
SET(XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS
  src/f16-gemm/gen/4x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/6x8-neonfp16arith-ld64.c
  src/f16-gemm/gen/8x8-neonfp16arith-ld64.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700771
# ---[ Source list: XNNPACK_SSE_MICROKERNEL_SRCS
# C sources whose file names carry the "sse" tag (f32 and x32 kernels).
# All paths are relative ("src/..."). The variable is consumed outside this
# section.
SET(XNNPACK_SSE_MICROKERNEL_SRCS
  src/f32-avgpool/mp9p8q-sse.c
  src/f32-avgpool/up9-sse.c
  src/f32-bilinear/gen/sse-c4.c
  src/f32-bilinear/gen/sse-c8.c
  src/f32-clamp/sse.c
  src/f32-dwconv-spchw/3x3p1-sse.c
  src/f32-dwconv-spchw/3x3s2p1-sse.c
  src/f32-dwconv/gen/up4x25-sse-acc2.c
  src/f32-dwconv/gen/up4x25-sse.c
  src/f32-dwconv/gen/up4x4-sse-acc2.c
  src/f32-dwconv/gen/up4x4-sse.c
  src/f32-dwconv/gen/up4x9-sse-acc2.c
  src/f32-dwconv/gen/up4x9-sse.c
  src/f32-dwconv/gen/up8x25-sse-acc2.c
  src/f32-dwconv/gen/up8x25-sse.c
  src/f32-dwconv/gen/up8x4-sse-acc2.c
  src/f32-dwconv/gen/up8x4-sse.c
  src/f32-dwconv/gen/up8x9-sse-acc2.c
  src/f32-dwconv/gen/up8x9-sse.c
  src/f32-gavgpool-spchw/sse-x4.c
  src/f32-gavgpool/mp7p7q-sse.c
  src/f32-gavgpool/up7-sse.c
  src/f32-gemm/gen/1x8-sse-dup.c
  src/f32-gemm/gen/1x8-sse-load1.c
  src/f32-gemm/gen/1x8s4-sse.c
  src/f32-gemm/gen/4x8-sse-dup.c
  src/f32-gemm/gen/4x8-sse-load1.c
  src/f32-gemm/gen/4x8s4-sse.c
  src/f32-gemm/gen-inc/1x8-sse-dup.c
  src/f32-gemm/gen-inc/1x8-sse-load1.c
  src/f32-gemm/gen-inc/1x8s4-sse.c
  src/f32-gemm/gen-inc/4x8-sse-dup.c
  src/f32-gemm/gen-inc/4x8-sse-load1.c
  src/f32-gemm/gen-inc/4x8s4-sse.c
  src/f32-hswish/gen/sse-x4.c
  src/f32-hswish/gen/sse-x8.c
  src/f32-igemm/gen/1x8-sse-dup.c
  src/f32-igemm/gen/1x8-sse-load1.c
  src/f32-igemm/gen/1x8s4-sse.c
  src/f32-igemm/gen/4x2c4-sse.c
  src/f32-igemm/gen/4x8-sse-dup.c
  src/f32-igemm/gen/4x8-sse-load1.c
  src/f32-igemm/gen/4x8s4-sse.c
  src/f32-maxpool/9p8x-sse-c4.c
  src/f32-pavgpool/mp9p8q-sse.c
  src/f32-pavgpool/up9-sse.c
  src/f32-ppmm/gen/4x8-sse.c
  src/f32-rmax/sse.c
  src/f32-spmm/gen/4x1-sse.c
  src/f32-spmm/gen/8x1-sse.c
  src/f32-vbinary/gen/vadd-sse-x4.c
  src/f32-vbinary/gen/vadd-sse-x8.c
  src/f32-vbinary/gen/vaddc-sse-x4.c
  src/f32-vbinary/gen/vaddc-sse-x8.c
  src/f32-vbinary/gen/vdiv-sse-x4.c
  src/f32-vbinary/gen/vdiv-sse-x8.c
  src/f32-vbinary/gen/vdivc-sse-x4.c
  src/f32-vbinary/gen/vdivc-sse-x8.c
  src/f32-vbinary/gen/vmax-sse-x4.c
  src/f32-vbinary/gen/vmax-sse-x8.c
  src/f32-vbinary/gen/vmaxc-sse-x4.c
  src/f32-vbinary/gen/vmaxc-sse-x8.c
  src/f32-vbinary/gen/vmin-sse-x4.c
  src/f32-vbinary/gen/vmin-sse-x8.c
  src/f32-vbinary/gen/vminc-sse-x4.c
  src/f32-vbinary/gen/vminc-sse-x8.c
  src/f32-vbinary/gen/vmul-sse-x4.c
  src/f32-vbinary/gen/vmul-sse-x8.c
  src/f32-vbinary/gen/vmulc-sse-x4.c
  src/f32-vbinary/gen/vmulc-sse-x8.c
  src/f32-vbinary/gen/vrdivc-sse-x4.c
  src/f32-vbinary/gen/vrdivc-sse-x8.c
  src/f32-vbinary/gen/vrsubc-sse-x4.c
  src/f32-vbinary/gen/vrsubc-sse-x8.c
  src/f32-vbinary/gen/vsub-sse-x4.c
  src/f32-vbinary/gen/vsub-sse-x8.c
  src/f32-vbinary/gen/vsubc-sse-x4.c
  src/f32-vbinary/gen/vsubc-sse-x8.c
  src/f32-vmulcaddc/gen/c4-sse-2x.c
  src/f32-vmulcaddc/gen/c8-sse-2x.c
  src/x32-packx/x4-sse.c)
854
# ---[ Source list: XNNPACK_SSE2_MICROKERNEL_SRCS
# C sources whose file names carry the "sse2" tag: f32, q8, u8, x32 and x8
# kernels plus the src/math reference routines. The variable is consumed
# outside this section.
SET(XNNPACK_SSE2_MICROKERNEL_SRCS
  src/f32-argmaxpool/4x-sse2-c4.c
  src/f32-argmaxpool/9p8x-sse2-c4.c
  src/f32-argmaxpool/9x-sse2-c4.c
  src/f32-prelu/gen/sse2-2x4.c
  src/f32-prelu/gen/sse2-2x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x4.c
  src/f32-sigmoid/gen/sse2-p5-div-x8.c
  src/f32-sigmoid/gen/sse2-p5-div-x12.c
  src/f32-sigmoid/gen/sse2-p5-div-x16.c
  src/f32-sigmoid/gen/sse2-p5-div-x20.c
  src/f32-sigmoid/gen/sse2-p5-div-x24.c
  src/q8-avgpool/mp9p8q-sse2.c
  src/q8-avgpool/up9-sse2.c
  src/q8-igemm/4x4c2-sse2.c
  src/q8-dwconv/up8x9-sse2.c
  src/q8-gavgpool/mp7p7q-sse2.c
  src/q8-gavgpool/up7-sse2.c
  src/q8-gemm/2x4c8-sse2.c
  src/q8-gemm/4x4c2-sse2.c
  src/q8-vadd/sse2.c
  src/u8-clamp/sse2.c
  src/u8-maxpool/9p8x-sse2-c16.c
  src/u8-rmax/sse2.c
  src/x32-pad/x2-sse2.c
  src/x32-zip/x2-sse2.c
  src/x32-zip/x3-sse2.c
  src/x32-zip/x4-sse2.c
  src/x32-zip/xm-sse2.c
  src/x8-zip/x2-sse2.c
  src/x8-zip/x3-sse2.c
  src/x8-zip/x4-sse2.c
  src/x8-zip/xm-sse2.c
  src/math/exp-sse2-p5.c
  src/math/expminus-sse2-p5.c
  src/math/sigmoid-sse2-p5-div.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700891
# ---[ Source list: XNNPACK_SSE41_MICROKERNEL_SRCS
# f32 PReLU and sigmoid sources whose file names carry the "sse41" tag.
# The variable is consumed outside this section.
SET(XNNPACK_SSE41_MICROKERNEL_SRCS
  src/f32-prelu/gen/sse41-2x4.c
  src/f32-prelu/gen/sse41-2x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x4.c
  src/f32-sigmoid/gen/sse41-p5-div-x8.c
  src/f32-sigmoid/gen/sse41-p5-div-x12.c
  src/f32-sigmoid/gen/sse41-p5-div-x16.c
  src/f32-sigmoid/gen/sse41-p5-div-x20.c
  src/f32-sigmoid/gen/sse41-p5-div-x24.c)
Marat Dukhan69c3f2c2019-11-06 12:30:01 -0800901
# ---[ Source list: XNNPACK_AVX_MICROKERNEL_SRCS
# f32 C sources whose file names carry the "avx" tag. All paths are relative
# ("src/..."). The variable is consumed outside this section.
SET(XNNPACK_AVX_MICROKERNEL_SRCS
  src/f32-clamp/avx.c
  src/f32-dwconv/gen/up16x4-avx-acc2.c
  src/f32-dwconv/gen/up16x4-avx.c
  src/f32-dwconv/gen/up8x4-avx-acc2.c
  src/f32-dwconv/gen/up8x4-avx.c
  src/f32-dwconv/gen/up16x9-avx-acc2.c
  src/f32-dwconv/gen/up16x9-avx.c
  src/f32-dwconv/gen/up8x9-avx-acc2.c
  src/f32-dwconv/gen/up8x9-avx.c
  src/f32-dwconv/gen/up16x25-avx-acc2.c
  src/f32-dwconv/gen/up16x25-avx.c
  src/f32-dwconv/gen/up8x25-avx-acc2.c
  src/f32-dwconv/gen/up8x25-avx.c
  src/f32-gemm/gen/1x8-avx-broadcast.c
  src/f32-gemm/gen/4x8-avx-broadcast.c
  src/f32-gemm/gen/5x8-avx-broadcast.c
  src/f32-gemm/gen/6x8-avx-broadcast.c
  src/f32-gemm/gen/7x8-avx-broadcast.c
  src/f32-gemm/gen/1x16-avx-broadcast.c
  src/f32-gemm/gen/3x16-avx-broadcast.c
  src/f32-gemm/gen/4x16-avx-broadcast.c
  src/f32-gemm/gen/5x16-avx-broadcast.c
  src/f32-gemm/gen-inc/1x8-avx-broadcast.c
  src/f32-gemm/gen-inc/4x8-avx-broadcast.c
  src/f32-gemm/gen-inc/5x8-avx-broadcast.c
  src/f32-gemm/gen-inc/6x8-avx-broadcast.c
  src/f32-gemm/gen-inc/7x8-avx-broadcast.c
  src/f32-gemm/gen-inc/1x16-avx-broadcast.c
  src/f32-gemm/gen-inc/3x16-avx-broadcast.c
  src/f32-gemm/gen-inc/4x16-avx-broadcast.c
  src/f32-gemm/gen-inc/5x16-avx-broadcast.c
  src/f32-hswish/gen/avx-x8.c
  src/f32-hswish/gen/avx-x16.c
  src/f32-igemm/gen/1x8-avx-broadcast.c
  src/f32-igemm/gen/4x8-avx-broadcast.c
  src/f32-igemm/gen/5x8-avx-broadcast.c
  src/f32-igemm/gen/6x8-avx-broadcast.c
  src/f32-igemm/gen/7x8-avx-broadcast.c
  src/f32-igemm/gen/1x16-avx-broadcast.c
  src/f32-igemm/gen/3x16-avx-broadcast.c
  src/f32-igemm/gen/4x16-avx-broadcast.c
  src/f32-igemm/gen/5x16-avx-broadcast.c
  src/f32-rmax/avx.c
  src/f32-vbinary/gen/vadd-avx-x8.c
  src/f32-vbinary/gen/vadd-avx-x16.c
  src/f32-vbinary/gen/vaddc-avx-x8.c
  src/f32-vbinary/gen/vaddc-avx-x16.c
  src/f32-vbinary/gen/vdiv-avx-x8.c
  src/f32-vbinary/gen/vdiv-avx-x16.c
  src/f32-vbinary/gen/vdivc-avx-x8.c
  src/f32-vbinary/gen/vdivc-avx-x16.c
  src/f32-vbinary/gen/vmax-avx-x8.c
  src/f32-vbinary/gen/vmax-avx-x16.c
  src/f32-vbinary/gen/vmaxc-avx-x8.c
  src/f32-vbinary/gen/vmaxc-avx-x16.c
  src/f32-vbinary/gen/vmin-avx-x8.c
  src/f32-vbinary/gen/vmin-avx-x16.c
  src/f32-vbinary/gen/vminc-avx-x8.c
  src/f32-vbinary/gen/vminc-avx-x16.c
  src/f32-vbinary/gen/vmul-avx-x8.c
  src/f32-vbinary/gen/vmul-avx-x16.c
  src/f32-vbinary/gen/vmulc-avx-x8.c
  src/f32-vbinary/gen/vmulc-avx-x16.c
  src/f32-vbinary/gen/vrdivc-avx-x8.c
  src/f32-vbinary/gen/vrdivc-avx-x16.c
  src/f32-vbinary/gen/vrsubc-avx-x8.c
  src/f32-vbinary/gen/vrsubc-avx-x16.c
  src/f32-vbinary/gen/vsub-avx-x8.c
  src/f32-vbinary/gen/vsub-avx-x16.c
  src/f32-vbinary/gen/vsubc-avx-x8.c
  src/f32-vbinary/gen/vsubc-avx-x16.c
  src/f32-vscale/avx-unroll32.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -0700975
# ---[ Source list: XNNPACK_FMA3_MICROKERNEL_SRCS
# f32 C sources whose file names carry the "fma3" tag (dwconv, gemm, gemm-inc,
# hswish and igemm kernels). The variable is consumed outside this section.
SET(XNNPACK_FMA3_MICROKERNEL_SRCS
  src/f32-dwconv/gen/up16x4-fma3-acc2.c
  src/f32-dwconv/gen/up16x4-fma3.c
  src/f32-dwconv/gen/up8x4-fma3-acc2.c
  src/f32-dwconv/gen/up8x4-fma3.c
  src/f32-dwconv/gen/up16x9-fma3-acc2.c
  src/f32-dwconv/gen/up16x9-fma3.c
  src/f32-dwconv/gen/up8x9-fma3-acc2.c
  src/f32-dwconv/gen/up8x9-fma3.c
  src/f32-dwconv/gen/up16x25-fma3-acc2.c
  src/f32-dwconv/gen/up16x25-fma3.c
  src/f32-dwconv/gen/up8x25-fma3-acc2.c
  src/f32-dwconv/gen/up8x25-fma3.c
  src/f32-gemm/gen/1x8-fma3-broadcast.c
  src/f32-gemm/gen/4x8-fma3-broadcast.c
  src/f32-gemm/gen/5x8-fma3-broadcast.c
  src/f32-gemm/gen/6x8-fma3-broadcast.c
  src/f32-gemm/gen/7x8-fma3-broadcast.c
  src/f32-gemm/gen/8x8-fma3-broadcast.c
  src/f32-gemm/gen/1x16-fma3-broadcast.c
  src/f32-gemm/gen/3x16-fma3-broadcast.c
  src/f32-gemm/gen/4x16-fma3-broadcast.c
  src/f32-gemm/gen/5x16-fma3-broadcast.c
  src/f32-gemm/gen/1x16s4-fma3-broadcast.c
  src/f32-gemm/gen/3x16s4-fma3-broadcast.c
  src/f32-gemm/gen/4x16s4-fma3-broadcast.c
  src/f32-gemm/gen/5x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/6x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/7x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/8x8-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16-fma3-broadcast.c
  src/f32-gemm/gen-inc/1x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/3x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/4x16s4-fma3-broadcast.c
  src/f32-gemm/gen-inc/5x16s4-fma3-broadcast.c
  src/f32-hswish/gen/fma3-x8.c
  src/f32-hswish/gen/fma3-x16.c
  src/f32-igemm/gen/1x8-fma3-broadcast.c
  src/f32-igemm/gen/4x8-fma3-broadcast.c
  src/f32-igemm/gen/5x8-fma3-broadcast.c
  src/f32-igemm/gen/6x8-fma3-broadcast.c
  src/f32-igemm/gen/7x8-fma3-broadcast.c
  src/f32-igemm/gen/8x8-fma3-broadcast.c
  src/f32-igemm/gen/1x16-fma3-broadcast.c
  src/f32-igemm/gen/3x16-fma3-broadcast.c
  src/f32-igemm/gen/4x16-fma3-broadcast.c
  src/f32-igemm/gen/5x16-fma3-broadcast.c
  src/f32-igemm/gen/1x16s4-fma3-broadcast.c
  src/f32-igemm/gen/3x16s4-fma3-broadcast.c
  src/f32-igemm/gen/4x16s4-fma3-broadcast.c
  src/f32-igemm/gen/5x16s4-fma3-broadcast.c)
Marat Dukhanfda12b82019-11-21 12:27:59 -08001033
# ---[ Source list: XNNPACK_AVX2_MICROKERNEL_SRCS
# f32 C sources whose file names carry the "avx2" tag: the radd*/vscale*
# exp-based kernels, sigmoid kernels, and the src/math reference routines.
# The variable is consumed outside this section.
SET(XNNPACK_AVX2_MICROKERNEL_SRCS
  src/f32-raddexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddexpminusmax/gen/avx2-p5-x96-acc6.c
  src/f32-raddextexp/gen/avx2-p5-x64.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x64-acc4.c
  src/f32-raddextexp/gen/avx2-p5-x72.c
  src/f32-raddextexp/gen/avx2-p5-x72-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x80.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x80-acc5.c
  src/f32-raddextexp/gen/avx2-p5-x96.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc2.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc3.c
  src/f32-raddextexp/gen/avx2-p5-x96-acc6.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x64-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x72-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x80-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx2-p5-x96-acc6.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-div-x80.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr1fma-x80.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x8.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x16.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x24.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x32.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x40.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x48.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x56.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x64.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x72.c
  src/f32-sigmoid/gen/avx2-rr1-p5-nr2fma-x80.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x8.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x16.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x24.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x32.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x40.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x48.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x56.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x64.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x72.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x80.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x88.c
  src/f32-vscaleexpminusmax/gen/avx2-p5-x96.c
  src/f32-vscaleextexp/gen/avx2-p5-x8.c
  src/f32-vscaleextexp/gen/avx2-p5-x16.c
  src/f32-vscaleextexp/gen/avx2-p5-x24.c
  src/f32-vscaleextexp/gen/avx2-p5-x32.c
  src/f32-vscaleextexp/gen/avx2-p5-x40.c
  src/f32-vscaleextexp/gen/avx2-p5-x48.c
  src/f32-vscaleextexp/gen/avx2-p5-x56.c
  src/f32-vscaleextexp/gen/avx2-p5-x64.c
  src/f32-vscaleextexp/gen/avx2-p5-x72.c
  src/f32-vscaleextexp/gen/avx2-p5-x80.c
  src/f32-vscaleextexp/gen/avx2-p5-x88.c
  src/f32-vscaleextexp/gen/avx2-p5-x96.c
  src/math/exp-avx2-p5.c
  src/math/exp-avx2-perm-p3.c
  src/math/exp-avx2-perm-p4.c
  src/math/expminus-avx2-p5.c
  src/math/extexp-avx2-p5.c
  src/math/sigmoid-avx2-rr2-p5-div.c
  src/math/sigmoid-avx2-rr1-p5-div.c
  src/math/sigmoid-avx2-rr2-p5-nr2fma.c
  src/math/sigmoid-avx2-rr1-p5-nr2fma.c
  src/math/sigmoid-avx2-rr2-p5-nr1fma.c
  src/math/sigmoid-avx2-rr1-p5-nr1fma.c)
Marat Dukhan6adff4e2019-10-14 18:32:07 -07001136
# ---[ Source list: XNNPACK_AVX512F_MICROKERNEL_SRCS
# f32 C sources whose file names carry the "avx512f" tag, followed by the
# src/math reference routines. All paths are relative ("src/..."). The
# variable is consumed outside this section.
SET(XNNPACK_AVX512F_MICROKERNEL_SRCS
  src/f32-clamp/avx512f.c
  src/f32-dwconv/gen/up32x4-avx512f-acc2.c
  src/f32-dwconv/gen/up32x4-avx512f.c
  src/f32-dwconv/gen/up16x4-avx512f-acc2.c
  src/f32-dwconv/gen/up16x4-avx512f.c
  src/f32-dwconv/gen/up32x9-avx512f-acc2.c
  src/f32-dwconv/gen/up32x9-avx512f.c
  src/f32-dwconv/gen/up16x9-avx512f-acc2.c
  src/f32-dwconv/gen/up16x9-avx512f.c
  src/f32-dwconv/gen/up32x25-avx512f-acc2.c
  src/f32-dwconv/gen/up32x25-avx512f.c
  src/f32-dwconv/gen/up16x25-avx512f-acc2.c
  src/f32-dwconv/gen/up16x25-avx512f.c
  src/f32-gemm/gen/1x16-avx512f-broadcast.c
  src/f32-gemm/gen/4x16-avx512f-broadcast.c
  src/f32-gemm/gen/5x16-avx512f-broadcast.c
  src/f32-gemm/gen/6x16-avx512f-broadcast.c
  src/f32-gemm/gen/7x16-avx512f-broadcast.c
  src/f32-gemm/gen/8x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/1x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/4x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/5x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/6x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/7x16-avx512f-broadcast.c
  src/f32-gemm/gen-inc/8x16-avx512f-broadcast.c
  src/f32-hswish/gen/avx512f-x16.c
  src/f32-hswish/gen/avx512f-x32.c
  src/f32-igemm/gen/1x16-avx512f-broadcast.c
  src/f32-igemm/gen/4x16-avx512f-broadcast.c
  src/f32-igemm/gen/5x16-avx512f-broadcast.c
  src/f32-igemm/gen/6x16-avx512f-broadcast.c
  src/f32-igemm/gen/7x16-avx512f-broadcast.c
  src/f32-igemm/gen/8x16-avx512f-broadcast.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc6.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c
  src/f32-raddstoreexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c
  src/f32-rmax/avx512f.c
  src/f32-vbinary/gen/vadd-avx512f-x16.c
  src/f32-vbinary/gen/vadd-avx512f-x32.c
  src/f32-vbinary/gen/vaddc-avx512f-x16.c
  src/f32-vbinary/gen/vaddc-avx512f-x32.c
  src/f32-vbinary/gen/vdiv-avx512f-x16.c
  src/f32-vbinary/gen/vdiv-avx512f-x32.c
  src/f32-vbinary/gen/vdivc-avx512f-x16.c
  src/f32-vbinary/gen/vdivc-avx512f-x32.c
  src/f32-vbinary/gen/vmax-avx512f-x16.c
  src/f32-vbinary/gen/vmax-avx512f-x32.c
  src/f32-vbinary/gen/vmaxc-avx512f-x16.c
  src/f32-vbinary/gen/vmaxc-avx512f-x32.c
  src/f32-vbinary/gen/vmin-avx512f-x16.c
  src/f32-vbinary/gen/vmin-avx512f-x32.c
  src/f32-vbinary/gen/vminc-avx512f-x16.c
  src/f32-vbinary/gen/vminc-avx512f-x32.c
  src/f32-vbinary/gen/vmul-avx512f-x16.c
  src/f32-vbinary/gen/vmul-avx512f-x32.c
  src/f32-vbinary/gen/vmulc-avx512f-x16.c
  src/f32-vbinary/gen/vmulc-avx512f-x32.c
  src/f32-vbinary/gen/vrdivc-avx512f-x16.c
  src/f32-vbinary/gen/vrdivc-avx512f-x32.c
  src/f32-vbinary/gen/vrsubc-avx512f-x16.c
  src/f32-vbinary/gen/vrsubc-avx512f-x32.c
  src/f32-vbinary/gen/vsub-avx512f-x16.c
  src/f32-vbinary/gen/vsub-avx512f-x32.c
  src/f32-vbinary/gen/vsubc-avx512f-x16.c
  src/f32-vbinary/gen/vsubc-avx512f-x32.c
  src/f32-vscale/avx512f-unroll64.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x192.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x16.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x32.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x48.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x64.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x80.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x96.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x112.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x128.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x144.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x160.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x176.c
  src/f32-vscaleextexp/gen/avx512f-p5-scalef-x192.c
  src/math/exp-avx512f-p5-scalef.c
  src/math/exp-avx512f-p5.c
  src/math/exp-avx512f-perm-p3.c
  src/math/exp-avx512f-perm2-p2.c
  src/math/extexp-avx512f-p5.c)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001266
# AArch32 assembly (.S) micro-kernel sources, grouped by kernel family.
# The relative order of the entries is kept exactly as before.
SET(XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  src/q8-dwconv/up8x9-aarch32-neon.S)
LIST(APPEND XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS
  src/f32-gemm/4x8-aarch32-neon-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch32-neon-cortex-a75.S
  src/f32-gemm/gen/4x8-aarch32-neon-pld-cortex-a75.S
  src/f32-gemm/4x8-aarch32-neon-ld64.S)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001273
# AArch64 assembly (.S) micro-kernel sources, built up one kernel family at a
# time. The resulting list has the same entries in the same order as before.

# f32 depthwise convolution
SET(XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-dwconv/up4x9-aarch64-neonfma-cortex-a55.S
  src/f32-dwconv/up4x9-aarch64-neonfma.S)

# f32 GEMM
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-gemm/gen/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen/5x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen/6x8-aarch64-neonfma-ld64.S)

# f32 GEMM ("gen-inc" variants)
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-gemm/gen-inc/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/4x8-aarch64-neonfma-ld64.S
  src/f32-gemm/gen-inc/5x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-cortex-a75.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-ld128.S
  src/f32-gemm/gen-inc/6x8-aarch64-neonfma-ld64.S)

# f32 IGEMM
LIST(APPEND XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS
  src/f32-igemm/1x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/1x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/gen/1x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/1x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/4x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/4x12-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/gen/4x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/4x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/gen/5x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/5x8-aarch64-neonfma-cortex-a75.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a53.S
  src/f32-igemm/6x8-aarch64-neonfma-cortex-a73.S
  src/f32-igemm/gen/6x8-aarch64-neonfma-cortex-a57.S
  src/f32-igemm/gen/6x8-aarch64-neonfma-cortex-a75.S)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001327
# Assemble the list of micro-kernel sources compiled into the library.
# Scalar kernels are always included; the remaining groups are appended
# according to the target system / processor.
SET(XNNPACK_MICROKERNEL_SRCS ${XNNPACK_SCALAR_MICROKERNEL_SRCS})

# psimd kernels: every target except Emscripten.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
    ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS})
ENDIF()

# 32-bit ARM (including iOS armv7): NEON, NEON-FMA and AArch32 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS})
ENDIF()

# 64-bit ARM (including iOS arm64*): NEON, NEON-FMA, AArch64-only C kernels
# and AArch64 assembly kernels.
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_NEON_MICROKERNEL_SRCS}
    ${XNNPACK_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFMA_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS}
    ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS})
ENDIF()

# x86 / x86-64 (including the iOS simulator architectures): SSE through AVX512F.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  LIST(APPEND XNNPACK_MICROKERNEL_SRCS
    ${XNNPACK_SSE_MICROKERNEL_SRCS}
    ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    ${XNNPACK_AVX_MICROKERNEL_SRCS}
    ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    ${XNNPACK_AVX512F_MICROKERNEL_SRCS})
ENDIF()
1354
# Create the XNNPACK library target. XNNPACK_LIBRARY_TYPE selects an explicit
# SHARED or STATIC library; "default" omits the keyword from ADD_LIBRARY.
# Any other value is a configuration error.
SET(XNNPACK_LIBRARY_SRCS
  ${XNNPACK_COLD_SRCS}
  ${XNNPACK_HOT_SRCS}
  ${XNNPACK_TABLE_SRCS}
  ${XNNPACK_MICROKERNEL_SRCS})
IF(XNNPACK_LIBRARY_TYPE STREQUAL "default")
  ADD_LIBRARY(XNNPACK ${XNNPACK_LIBRARY_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "shared")
  ADD_LIBRARY(XNNPACK SHARED ${XNNPACK_LIBRARY_SRCS})
ELSEIF(XNNPACK_LIBRARY_TYPE STREQUAL "static")
  ADD_LIBRARY(XNNPACK STATIC ${XNNPACK_LIBRARY_SRCS})
ELSE()
  MESSAGE(FATAL_ERROR "Unsupported XNNPACK library type \"${XNNPACK_LIBRARY_TYPE}\". Must be \"static\", \"shared\", or \"default\"")
ENDIF()

# Compile the C sources as C99 with compiler extensions enabled.
SET_PROPERTY(TARGET XNNPACK PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET XNNPACK PROPERTY C_EXTENSIONS YES)
# Per-source compile flags for 32-bit ARM targets (including iOS armv7).
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^armv[5-8]" OR IOS_ARCH MATCHES "^armv7")
  # All micro-kernels are built with -marm.
  SET_PROPERTY(SOURCE ${XNNPACK_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -marm ")
  # Select the FPU required by each kernel group.
  SET_PROPERTY(SOURCE ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS} ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEON_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon ")
  SET_PROPERTY(SOURCE ${XNNPACK_NEONFMA_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -mfpu=neon-vfpv4 ")
  IF(IOS)
    # Pass the target architecture explicitly when assembling the .S kernels.
    # The list is XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS; the previously used
    # XNNPACK_AARCH32_ASM_UKERNELS name expands to nothing, so the flag was
    # never applied.
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH32_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# Per-source compile flags for 64-bit ARM targets (including iOS arm64*).
IF(CMAKE_SYSTEM_PROCESSOR STREQUAL "aarch64" OR IOS_ARCH MATCHES "^arm64.*")
  # The FP16-arithmetic kernels need the ARMv8.2-A half-precision extension.
  SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -march=armv8.2-a+fp16 ")
  IF(IOS)
    # Pass the target architecture explicitly when assembling the .S kernels.
    # The list is XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS; the previously used
    # XNNPACK_AARCH64_ASM_UKERNELS name expands to nothing, so the flag was
    # never applied.
    SET_PROPERTY(SOURCE ${XNNPACK_AARCH64_ASM_MICROKERNEL_SRCS} APPEND_STRING PROPERTY COMPILE_FLAGS " -arch ${IOS_ARCH} ")
  ENDIF()
ENDIF()
# Per-source instruction-set flags for x86 / x86-64 targets (including the
# iOS simulator architectures). Each kernel group is compiled with the flag(s)
# for the ISA extension it uses.
IF(CMAKE_SYSTEM_PROCESSOR MATCHES "^(i[3-6]86|x86_64)$" OR IOS_ARCH MATCHES "^(i386|x86_64)$")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_SSE41_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -msse4.1 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_FMA3_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX2_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mfma -mavx2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_AVX512F_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -mavx512f ")
ENDIF()
# Logging level and optimisation flags depend on CMAKE_BUILD_TYPE:
#  - anything other than "Debug": XNN_LOG_LEVEL=0, -O2 for micro-kernels and
#    hot sources, -Os for cold sources;
#  - "Debug": XNN_LOG_LEVEL=5 and no extra optimisation flags.
IF(NOT CMAKE_BUILD_TYPE STREQUAL "Debug")
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=0)
  SET_PROPERTY(
    SOURCE ${XNNPACK_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_HOT_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O2 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_COLD_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -Os ")
ELSE()
  TARGET_COMPILE_DEFINITIONS(XNNPACK PRIVATE XNN_LOG_LEVEL=5)
ENDIF()
# psimd kernels are compiled with -O3 on every target except Emscripten,
# regardless of build type; the "fastmath" group additionally gets -ffast-math.
IF(NOT CMAKE_SYSTEM_NAME STREQUAL "Emscripten")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_ACCMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 ")
  SET_PROPERTY(
    SOURCE ${XNNPACK_PSIMD_FASTMATH_MICROKERNEL_SRCS}
    APPEND_STRING PROPERTY COMPILE_FLAGS " -O3 -ffast-math ")
ENDIF()
1403
# "include" is part of the public interface; "src" is only needed to build the
# library itself. include/xnnpack.h is the header installed with the target.
TARGET_INCLUDE_DIRECTORIES(XNNPACK
  PUBLIC include
  PRIVATE src)
SET_PROPERTY(TARGET XNNPACK PROPERTY PUBLIC_HEADER include/xnnpack.h)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001407
# ---[ Configure clog
# Build clog from ${CLOG_SOURCE_DIR}/deps/clog unless a "clog" target already
# exists (e.g. provided by a parent project).
IF(NOT TARGET clog)
  SET(CLOG_BUILD_TESTS OFF CACHE BOOL "")
  SET(CLOG_RUNTIME_TYPE "${CPUINFO_RUNTIME_TYPE}" CACHE STRING "")
  ADD_SUBDIRECTORY("${CLOG_SOURCE_DIR}/deps/clog" "${CMAKE_BINARY_DIR}/clog")
  # We build static version of clog but a dynamic library may indirectly depend on it
  SET_TARGET_PROPERTIES(clog PROPERTIES POSITION_INDEPENDENT_CODE ON)
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE clog)
1419
# ---[ Configure cpuinfo
# Build cpuinfo from CPUINFO_SOURCE_DIR unless a "cpuinfo" target already
# exists; its tools, tests and benchmarks are switched off.
IF(NOT TARGET cpuinfo)
  SET(CPUINFO_BUILD_TOOLS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_UNIT_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_MOCK_TESTS OFF CACHE BOOL "")
  SET(CPUINFO_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${CPUINFO_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/cpuinfo")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE cpuinfo)
1431
# ---[ Configure pthreadpool
# Build pthreadpool from PTHREADPOOL_SOURCE_DIR unless a "pthreadpool" target
# already exists. It is linked PUBLIC, so targets linking XNNPACK link it too.
IF(NOT TARGET pthreadpool)
  SET(PTHREADPOOL_BUILD_TESTS OFF CACHE BOOL "")
  SET(PTHREADPOOL_BUILD_BENCHMARKS OFF CACHE BOOL "")
  SET(PTHREADPOOL_ALLOW_DEPRECATED_API OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${PTHREADPOOL_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/pthreadpool")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PUBLIC pthreadpool)
1442
# ---[ Configure FXdiv
# Build FXdiv from FXDIV_SOURCE_DIR unless an "fxdiv" target already exists;
# its tests and benchmarks are switched off.
IF(NOT TARGET fxdiv)
  SET(FXDIV_BUILD_TESTS OFF CACHE BOOL "")
  SET(FXDIV_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FXDIV_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FXdiv")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fxdiv)
1452
# ---[ Configure psimd
# Build psimd from PSIMD_SOURCE_DIR unless a "psimd" target already exists.
IF(NOT TARGET psimd)
  ADD_SUBDIRECTORY("${PSIMD_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/psimd")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE psimd)
1460
# ---[ Configure FP16
# Build FP16 from FP16_SOURCE_DIR unless an "fp16" target already exists;
# its tests and benchmarks are switched off.
IF(NOT TARGET fp16)
  SET(FP16_BUILD_TESTS OFF CACHE BOOL "")
  SET(FP16_BUILD_BENCHMARKS OFF CACHE BOOL "")
  ADD_SUBDIRECTORY("${FP16_SOURCE_DIR}" "${CMAKE_BINARY_DIR}/FP16")
ENDIF()
TARGET_LINK_LIBRARIES(XNNPACK PRIVATE fp16)
1470
# Install the library (static archive or shared object) into the GNU-standard
# library directory and the public header into the include directory.
INSTALL(
  TARGETS XNNPACK
  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}
  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}
  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})
1475
1476# ---[ XNNPACK unit tests
1477IF(XNNPACK_BUILD_TESTS)
1478 # ---[ Build google test
1479 IF(NOT TARGET gtest)
1480 SET(gtest_force_shared_crt ON CACHE BOOL "" FORCE)
1481 ADD_SUBDIRECTORY(
1482 "${GOOGLETEST_SOURCE_DIR}"
1483 "${CMAKE_BINARY_DIR}/googletest")
1484 ENDIF()
1485
1486 # ---[ Build operator-level unit tests
Marat Dukhanefc47b82019-11-18 09:25:38 -08001487 ADD_EXECUTABLE(add-nc-test test/add-nc.cc)
1488 SET_TARGET_PROPERTIES(add-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001489 CXX_STANDARD 11
1490 CXX_STANDARD_REQUIRED YES
1491 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001492 TARGET_INCLUDE_DIRECTORIES(add-nc-test PRIVATE src test)
1493 TARGET_LINK_LIBRARIES(add-nc-test PRIVATE XNNPACK gtest gtest_main)
1494 ADD_TEST(add-nc-test add-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001495
Marat Dukhanb1a0fc32019-12-02 19:32:02 -08001496 ADD_EXECUTABLE(add-nd-test test/add-nd.cc)
1497 SET_TARGET_PROPERTIES(add-nd-test PROPERTIES
1498 CXX_STANDARD 11
1499 CXX_STANDARD_REQUIRED YES
1500 CXX_EXTENSIONS NO)
1501 TARGET_INCLUDE_DIRECTORIES(add-nd-test PRIVATE src test)
1502 TARGET_LINK_LIBRARIES(add-nd-test PRIVATE XNNPACK gtest gtest_main)
1503 ADD_TEST(add-nd-test add-nd-test)
1504
Marat Dukhanefc47b82019-11-18 09:25:38 -08001505 ADD_EXECUTABLE(argmax-pooling-nhwc-test test/argmax-pooling-nhwc.cc)
1506 SET_TARGET_PROPERTIES(argmax-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001507 CXX_STANDARD 11
1508 CXX_STANDARD_REQUIRED YES
1509 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001510 TARGET_INCLUDE_DIRECTORIES(argmax-pooling-nhwc-test PRIVATE src test)
1511 TARGET_LINK_LIBRARIES(argmax-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1512 ADD_TEST(argmax-pooling-nhwc-test argmax-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001513
Marat Dukhanefc47b82019-11-18 09:25:38 -08001514 ADD_EXECUTABLE(average-pooling-nhwc-test test/average-pooling-nhwc.cc)
1515 SET_TARGET_PROPERTIES(average-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001516 CXX_STANDARD 11
1517 CXX_STANDARD_REQUIRED YES
1518 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001519 TARGET_INCLUDE_DIRECTORIES(average-pooling-nhwc-test PRIVATE src test)
1520 TARGET_LINK_LIBRARIES(average-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1521 ADD_TEST(average-pooling-nhwc-test average-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001522
Marat Dukhanefc47b82019-11-18 09:25:38 -08001523 ADD_EXECUTABLE(channel-pad-nc-test test/channel-pad-nc.cc)
1524 SET_TARGET_PROPERTIES(channel-pad-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001525 CXX_STANDARD 11
1526 CXX_STANDARD_REQUIRED YES
1527 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001528 TARGET_INCLUDE_DIRECTORIES(channel-pad-nc-test PRIVATE src test)
1529 TARGET_LINK_LIBRARIES(channel-pad-nc-test PRIVATE XNNPACK gtest gtest_main)
1530 ADD_TEST(channel-pad-nc-test channel-pad-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001531
Marat Dukhanefc47b82019-11-18 09:25:38 -08001532 ADD_EXECUTABLE(channel-shuffle-nc-test test/channel-shuffle-nc.cc)
1533 SET_TARGET_PROPERTIES(channel-shuffle-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001534 CXX_STANDARD 11
1535 CXX_STANDARD_REQUIRED YES
1536 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001537 TARGET_INCLUDE_DIRECTORIES(channel-shuffle-nc-test PRIVATE src test)
1538 TARGET_LINK_LIBRARIES(channel-shuffle-nc-test PRIVATE XNNPACK gtest gtest_main)
1539 ADD_TEST(channel-shuffle-nc-test channel-shuffle-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001540
Marat Dukhanefc47b82019-11-18 09:25:38 -08001541 ADD_EXECUTABLE(clamp-nc-test test/clamp-nc.cc)
1542 SET_TARGET_PROPERTIES(clamp-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001543 CXX_STANDARD 11
1544 CXX_STANDARD_REQUIRED YES
1545 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001546 TARGET_INCLUDE_DIRECTORIES(clamp-nc-test PRIVATE src test)
1547 TARGET_LINK_LIBRARIES(clamp-nc-test PRIVATE XNNPACK gtest gtest_main)
1548 ADD_TEST(clamp-nc-test clamp-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001549
Marat Dukhanefc47b82019-11-18 09:25:38 -08001550 ADD_EXECUTABLE(convolution-nhwc-test test/convolution-nhwc.cc)
1551 SET_TARGET_PROPERTIES(convolution-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001552 CXX_STANDARD 11
1553 CXX_STANDARD_REQUIRED YES
1554 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001555 TARGET_INCLUDE_DIRECTORIES(convolution-nhwc-test PRIVATE src test)
1556 TARGET_LINK_LIBRARIES(convolution-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1557 ADD_TEST(convolution-nhwc-test convolution-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001558
Marat Dukhanefc47b82019-11-18 09:25:38 -08001559 ADD_EXECUTABLE(convolution-nchw-test test/convolution-nchw.cc)
1560 SET_TARGET_PROPERTIES(convolution-nchw-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001561 CXX_STANDARD 11
1562 CXX_STANDARD_REQUIRED YES
1563 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001564 TARGET_INCLUDE_DIRECTORIES(convolution-nchw-test PRIVATE src test)
1565 TARGET_LINK_LIBRARIES(convolution-nchw-test PRIVATE XNNPACK gtest gtest_main)
1566 ADD_TEST(convolution-nchw-test convolution-nchw-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001567
Marat Dukhanefc47b82019-11-18 09:25:38 -08001568 ADD_EXECUTABLE(deconvolution-nhwc-test test/deconvolution-nhwc.cc)
1569 SET_TARGET_PROPERTIES(deconvolution-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001570 CXX_STANDARD 11
1571 CXX_STANDARD_REQUIRED YES
1572 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001573 TARGET_INCLUDE_DIRECTORIES(deconvolution-nhwc-test PRIVATE src test)
1574 TARGET_LINK_LIBRARIES(deconvolution-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1575 ADD_TEST(deconvolution-nhwc-test deconvolution-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001576
Marat Dukhan69180502019-12-06 15:00:31 -08001577 ADD_EXECUTABLE(divide-nd-test test/divide-nd.cc)
1578 SET_TARGET_PROPERTIES(divide-nd-test PROPERTIES
1579 CXX_STANDARD 11
1580 CXX_STANDARD_REQUIRED YES
1581 CXX_EXTENSIONS NO)
1582 TARGET_INCLUDE_DIRECTORIES(divide-nd-test PRIVATE src test)
1583 TARGET_LINK_LIBRARIES(divide-nd-test PRIVATE XNNPACK gtest gtest_main)
1584 ADD_TEST(divide-nd-test divide-nd-test)
1585
Marat Dukhanefc47b82019-11-18 09:25:38 -08001586 ADD_EXECUTABLE(fully-connected-nc-test test/fully-connected-nc.cc)
1587 SET_TARGET_PROPERTIES(fully-connected-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001588 CXX_STANDARD 11
1589 CXX_STANDARD_REQUIRED YES
1590 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001591 TARGET_INCLUDE_DIRECTORIES(fully-connected-nc-test PRIVATE src test)
1592 TARGET_LINK_LIBRARIES(fully-connected-nc-test PRIVATE XNNPACK gtest gtest_main)
1593 ADD_TEST(fully-connected-nc-test fully-connected-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001594
Marat Dukhanefc47b82019-11-18 09:25:38 -08001595 ADD_EXECUTABLE(global-average-pooling-nwc-test test/global-average-pooling-nwc.cc)
1596 SET_TARGET_PROPERTIES(global-average-pooling-nwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001597 CXX_STANDARD 11
1598 CXX_STANDARD_REQUIRED YES
1599 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001600 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-nwc-test PRIVATE src test)
1601 TARGET_LINK_LIBRARIES(global-average-pooling-nwc-test PRIVATE XNNPACK gtest gtest_main)
1602 ADD_TEST(global-average-pooling-nwc-test global-average-pooling-nwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001603
Marat Dukhanefc47b82019-11-18 09:25:38 -08001604 ADD_EXECUTABLE(global-average-pooling-ncw-test test/global-average-pooling-ncw.cc)
1605 SET_TARGET_PROPERTIES(global-average-pooling-ncw-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001606 CXX_STANDARD 11
1607 CXX_STANDARD_REQUIRED YES
1608 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001609 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-ncw-test PRIVATE src test)
1610 TARGET_LINK_LIBRARIES(global-average-pooling-ncw-test PRIVATE XNNPACK gtest gtest_main)
1611 ADD_TEST(global-average-pooling-ncw-test global-average-pooling-ncw-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001612
Marat Dukhanefc47b82019-11-18 09:25:38 -08001613 ADD_EXECUTABLE(hardswish-nc-test test/hardswish-nc.cc)
1614 SET_TARGET_PROPERTIES(hardswish-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001615 CXX_STANDARD 11
1616 CXX_STANDARD_REQUIRED YES
1617 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001618 TARGET_INCLUDE_DIRECTORIES(hardswish-nc-test PRIVATE src test)
1619 TARGET_LINK_LIBRARIES(hardswish-nc-test PRIVATE XNNPACK gtest gtest_main)
1620 ADD_TEST(hardswish-nc-test hardswish-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001621
Marat Dukhanefc47b82019-11-18 09:25:38 -08001622 ADD_EXECUTABLE(leaky-relu-nc-test test/leaky-relu-nc.cc)
1623 SET_TARGET_PROPERTIES(leaky-relu-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001624 CXX_STANDARD 11
1625 CXX_STANDARD_REQUIRED YES
1626 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001627 TARGET_INCLUDE_DIRECTORIES(leaky-relu-nc-test PRIVATE src test)
1628 TARGET_LINK_LIBRARIES(leaky-relu-nc-test PRIVATE XNNPACK gtest gtest_main)
1629 ADD_TEST(leaky-relu-nc-test leaky-relu-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001630
Marat Dukhanefc47b82019-11-18 09:25:38 -08001631 ADD_EXECUTABLE(max-pooling-nhwc-test test/max-pooling-nhwc.cc)
1632 SET_TARGET_PROPERTIES(max-pooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001633 CXX_STANDARD 11
1634 CXX_STANDARD_REQUIRED YES
1635 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001636 TARGET_INCLUDE_DIRECTORIES(max-pooling-nhwc-test PRIVATE src test)
1637 TARGET_LINK_LIBRARIES(max-pooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1638 ADD_TEST(max-pooling-nhwc-test max-pooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001639
Marat Dukhan79e7f842019-12-05 14:35:50 -08001640 ADD_EXECUTABLE(maximum-nd-test test/multiply-nd.cc)
1641 SET_TARGET_PROPERTIES(maximum-nd-test PROPERTIES
1642 CXX_STANDARD 11
1643 CXX_STANDARD_REQUIRED YES
1644 CXX_EXTENSIONS NO)
1645 TARGET_INCLUDE_DIRECTORIES(maximum-nd-test PRIVATE src test)
1646 TARGET_LINK_LIBRARIES(maximum-nd-test PRIVATE XNNPACK gtest gtest_main)
1647 ADD_TEST(maximum-nd-test maximum-nd-test)
1648
1649 ADD_EXECUTABLE(minimum-nd-test test/multiply-nd.cc)
1650 SET_TARGET_PROPERTIES(minimum-nd-test PROPERTIES
1651 CXX_STANDARD 11
1652 CXX_STANDARD_REQUIRED YES
1653 CXX_EXTENSIONS NO)
1654 TARGET_INCLUDE_DIRECTORIES(minimum-nd-test PRIVATE src test)
1655 TARGET_LINK_LIBRARIES(minimum-nd-test PRIVATE XNNPACK gtest gtest_main)
1656 ADD_TEST(minimum-nd-test minimum-nd-test)
1657
Marat Dukhanefc47b82019-11-18 09:25:38 -08001658 ADD_EXECUTABLE(multiply-nd-test test/multiply-nd.cc)
1659 SET_TARGET_PROPERTIES(multiply-nd-test PROPERTIES
Marat Dukhan9d501d52019-11-16 02:30:50 -08001660 CXX_STANDARD 11
1661 CXX_STANDARD_REQUIRED YES
1662 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001663 TARGET_INCLUDE_DIRECTORIES(multiply-nd-test PRIVATE src test)
1664 TARGET_LINK_LIBRARIES(multiply-nd-test PRIVATE XNNPACK gtest gtest_main)
1665 ADD_TEST(multiply-nd-test multiply-nd-test)
Marat Dukhan9d501d52019-11-16 02:30:50 -08001666
Marat Dukhanefc47b82019-11-18 09:25:38 -08001667 ADD_EXECUTABLE(prelu-nc-test test/prelu-nc.cc)
1668 SET_TARGET_PROPERTIES(prelu-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001669 CXX_STANDARD 11
1670 CXX_STANDARD_REQUIRED YES
1671 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001672 TARGET_INCLUDE_DIRECTORIES(prelu-nc-test PRIVATE src test)
1673 TARGET_LINK_LIBRARIES(prelu-nc-test PRIVATE XNNPACK gtest gtest_main)
1674 ADD_TEST(prelu-nc-test prelu-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001675
Marat Dukhanefc47b82019-11-18 09:25:38 -08001676 ADD_EXECUTABLE(resize-bilinear-nhwc-test test/resize-bilinear-nhwc.cc)
1677 SET_TARGET_PROPERTIES(resize-bilinear-nhwc-test PROPERTIES
Marat Dukhan69722492019-11-11 19:55:50 -08001678 CXX_STANDARD 11
1679 CXX_STANDARD_REQUIRED YES
1680 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001681 TARGET_INCLUDE_DIRECTORIES(resize-bilinear-nhwc-test PRIVATE src test)
1682 TARGET_LINK_LIBRARIES(resize-bilinear-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1683 ADD_TEST(resize-bilinear-nhwc-test resize-bilinear-nhwc-test)
Marat Dukhan69722492019-11-11 19:55:50 -08001684
Marat Dukhanefc47b82019-11-18 09:25:38 -08001685 ADD_EXECUTABLE(sigmoid-nc-test test/sigmoid-nc.cc)
1686 SET_TARGET_PROPERTIES(sigmoid-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001687 CXX_STANDARD 11
1688 CXX_STANDARD_REQUIRED YES
1689 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001690 TARGET_INCLUDE_DIRECTORIES(sigmoid-nc-test PRIVATE src test)
1691 TARGET_LINK_LIBRARIES(sigmoid-nc-test PRIVATE XNNPACK gtest gtest_main)
1692 ADD_TEST(sigmoid-nc-test sigmoid-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001693
Marat Dukhanefc47b82019-11-18 09:25:38 -08001694 ADD_EXECUTABLE(softargmax-nc-test test/softargmax-nc.cc)
1695 SET_TARGET_PROPERTIES(softargmax-nc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001696 CXX_STANDARD 11
1697 CXX_STANDARD_REQUIRED YES
1698 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001699 TARGET_INCLUDE_DIRECTORIES(softargmax-nc-test PRIVATE src test)
1700 TARGET_LINK_LIBRARIES(softargmax-nc-test PRIVATE XNNPACK gtest gtest_main)
1701 ADD_TEST(softargmax-nc-test softargmax-nc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001702
Marat Dukhan05f3f6d2019-12-03 15:13:53 -08001703 ADD_EXECUTABLE(subtract-nd-test test/subtract-nd.cc)
1704 SET_TARGET_PROPERTIES(subtract-nd-test PROPERTIES
1705 CXX_STANDARD 11
1706 CXX_STANDARD_REQUIRED YES
1707 CXX_EXTENSIONS NO)
1708 TARGET_INCLUDE_DIRECTORIES(subtract-nd-test PRIVATE src test)
1709 TARGET_LINK_LIBRARIES(subtract-nd-test PRIVATE XNNPACK gtest gtest_main)
1710 ADD_TEST(subtract-nd-test subtract-nd-test)
1711
Marat Dukhanefc47b82019-11-18 09:25:38 -08001712 ADD_EXECUTABLE(unpooling-nhwc-test test/unpooling-nhwc.cc)
1713 SET_TARGET_PROPERTIES(unpooling-nhwc-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001714 CXX_STANDARD 11
1715 CXX_STANDARD_REQUIRED YES
1716 CXX_EXTENSIONS NO)
Marat Dukhanefc47b82019-11-18 09:25:38 -08001717 TARGET_INCLUDE_DIRECTORIES(unpooling-nhwc-test PRIVATE src test)
1718 TARGET_LINK_LIBRARIES(unpooling-nhwc-test PRIVATE XNNPACK gtest gtest_main)
1719 ADD_TEST(unpooling-nhwc-test unpooling-nhwc-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001720
1721 # ---[ Build microkernel-level unit tests
1722 ADD_EXECUTABLE(f16-gemm-test test/f16-gemm.cc)
1723 SET_TARGET_PROPERTIES(f16-gemm-test PROPERTIES
1724 CXX_STANDARD 11
1725 CXX_STANDARD_REQUIRED YES
1726 CXX_EXTENSIONS YES)
1727 TARGET_INCLUDE_DIRECTORIES(f16-gemm-test PRIVATE src test)
1728 TARGET_LINK_LIBRARIES(f16-gemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1729 ADD_TEST(f16-gemm-test f16-gemm-test)
1730
1731 ADD_EXECUTABLE(f32-argmaxpool-test test/f32-argmaxpool.cc)
1732 SET_TARGET_PROPERTIES(f32-argmaxpool-test PROPERTIES
1733 CXX_STANDARD 11
1734 CXX_STANDARD_REQUIRED YES
1735 CXX_EXTENSIONS YES)
1736 TARGET_INCLUDE_DIRECTORIES(f32-argmaxpool-test PRIVATE src test)
1737 TARGET_LINK_LIBRARIES(f32-argmaxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1738 ADD_TEST(f32-argmaxpool-test f32-argmaxpool-test)
1739
1740 ADD_EXECUTABLE(f32-avgpool-test test/f32-avgpool.cc)
1741 SET_TARGET_PROPERTIES(f32-avgpool-test PROPERTIES
1742 CXX_STANDARD 11
1743 CXX_STANDARD_REQUIRED YES
1744 CXX_EXTENSIONS YES)
1745 TARGET_INCLUDE_DIRECTORIES(f32-avgpool-test PRIVATE src test)
1746 TARGET_LINK_LIBRARIES(f32-avgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1747 ADD_TEST(f32-avgpool-test f32-avgpool-test)
1748
Marat Dukhanc465fc22019-11-07 19:20:28 -08001749 ADD_EXECUTABLE(f32-bilinear-test test/f32-bilinear.cc)
1750 SET_TARGET_PROPERTIES(f32-bilinear-test PROPERTIES
1751 CXX_STANDARD 11
1752 CXX_STANDARD_REQUIRED YES
1753 CXX_EXTENSIONS YES)
1754 TARGET_INCLUDE_DIRECTORIES(f32-bilinear-test PRIVATE src test)
1755 TARGET_LINK_LIBRARIES(f32-bilinear-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1756 ADD_TEST(f32-bilinear-test f32-bilinear-test)
1757
Marat Dukhan53873d02019-12-06 17:21:30 -08001758 ADD_EXECUTABLE(f32-clamp-test test/f32-clamp.cc)
1759 SET_TARGET_PROPERTIES(f32-clamp-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001760 CXX_STANDARD 11
1761 CXX_STANDARD_REQUIRED YES
1762 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08001763 TARGET_INCLUDE_DIRECTORIES(f32-clamp-test PRIVATE src test)
1764 TARGET_LINK_LIBRARIES(f32-clamp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1765 ADD_TEST(f32-clamp-test f32-clamp-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001766
1767 ADD_EXECUTABLE(f32-conv-hwc-test test/f32-conv-hwc.cc)
1768 SET_TARGET_PROPERTIES(f32-conv-hwc-test PROPERTIES
1769 CXX_STANDARD 11
1770 CXX_STANDARD_REQUIRED YES
1771 CXX_EXTENSIONS YES)
1772 TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-test PRIVATE src test)
1773 TARGET_LINK_LIBRARIES(f32-conv-hwc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1774 ADD_TEST(f32-conv-hwc-test f32-conv-hwc-test)
1775
1776 ADD_EXECUTABLE(f32-conv-hwc2spchw-test test/f32-conv-hwc2spchw.cc)
1777 SET_TARGET_PROPERTIES(f32-conv-hwc2spchw-test PROPERTIES
1778 CXX_STANDARD 11
1779 CXX_STANDARD_REQUIRED YES
1780 CXX_EXTENSIONS YES)
1781 TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc2spchw-test PRIVATE src test)
1782 TARGET_LINK_LIBRARIES(f32-conv-hwc2spchw-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1783 ADD_TEST(f32-conv-hwc2spchw-test f32-conv-hwc2spchw-test)
1784
1785 ADD_EXECUTABLE(f32-dwconv-spchw-test test/f32-dwconv-spchw.cc)
1786 SET_TARGET_PROPERTIES(f32-dwconv-spchw-test PROPERTIES
1787 CXX_STANDARD 11
1788 CXX_STANDARD_REQUIRED YES
1789 CXX_EXTENSIONS YES)
1790 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-test PRIVATE src test)
1791 TARGET_LINK_LIBRARIES(f32-dwconv-spchw-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1792 ADD_TEST(f32-dwconv-spchw-test f32-dwconv-spchw-test)
1793
1794 ADD_EXECUTABLE(f32-dwconv-test test/f32-dwconv.cc)
1795 SET_TARGET_PROPERTIES(f32-dwconv-test PROPERTIES
1796 CXX_STANDARD 11
1797 CXX_STANDARD_REQUIRED YES
1798 CXX_EXTENSIONS YES)
1799 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-test PRIVATE src test)
1800 TARGET_LINK_LIBRARIES(f32-dwconv-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1801 ADD_TEST(f32-dwconv-test f32-dwconv-test)
1802
1803 ADD_EXECUTABLE(f32-gavgpool-spchw-test test/f32-gavgpool-spchw.cc)
1804 SET_TARGET_PROPERTIES(f32-gavgpool-spchw-test PROPERTIES
1805 CXX_STANDARD 11
1806 CXX_STANDARD_REQUIRED YES
1807 CXX_EXTENSIONS YES)
1808 TARGET_INCLUDE_DIRECTORIES(f32-gavgpool-spchw-test PRIVATE src test)
1809 TARGET_LINK_LIBRARIES(f32-gavgpool-spchw-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1810 ADD_TEST(f32-gavgpool-spchw-test f32-gavgpool-spchw-test)
1811
1812 ADD_EXECUTABLE(f32-gavgpool-test test/f32-gavgpool.cc)
1813 SET_TARGET_PROPERTIES(f32-gavgpool-test PROPERTIES
1814 CXX_STANDARD 11
1815 CXX_STANDARD_REQUIRED YES
1816 CXX_EXTENSIONS YES)
1817 TARGET_INCLUDE_DIRECTORIES(f32-gavgpool-test PRIVATE src test)
1818 TARGET_LINK_LIBRARIES(f32-gavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1819 ADD_TEST(f32-gavgpool-test f32-gavgpool-test)
1820
1821 ADD_EXECUTABLE(f32-gemm-test test/f32-gemm.cc)
1822 SET_TARGET_PROPERTIES(f32-gemm-test PROPERTIES
1823 CXX_STANDARD 11
1824 CXX_STANDARD_REQUIRED YES
1825 CXX_EXTENSIONS YES)
1826 TARGET_INCLUDE_DIRECTORIES(f32-gemm-test PRIVATE src test)
1827 TARGET_LINK_LIBRARIES(f32-gemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1828 ADD_TEST(f32-gemm-test f32-gemm-test)
1829
1830 ADD_EXECUTABLE(f32-gemminc-test test/f32-gemminc.cc)
1831 SET_TARGET_PROPERTIES(f32-gemminc-test PROPERTIES
1832 CXX_STANDARD 11
1833 CXX_STANDARD_REQUIRED YES
1834 CXX_EXTENSIONS YES)
1835 TARGET_INCLUDE_DIRECTORIES(f32-gemminc-test PRIVATE src test)
1836 TARGET_LINK_LIBRARIES(f32-gemminc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1837 ADD_TEST(f32-gemminc-test f32-gemminc-test)
1838
1839 ADD_EXECUTABLE(f32-hswish-test test/f32-hswish.cc)
1840 SET_TARGET_PROPERTIES(f32-hswish-test PROPERTIES
1841 CXX_STANDARD 11
1842 CXX_STANDARD_REQUIRED YES
1843 CXX_EXTENSIONS YES)
1844 TARGET_INCLUDE_DIRECTORIES(f32-hswish-test PRIVATE src test)
1845 TARGET_LINK_LIBRARIES(f32-hswish-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1846 ADD_TEST(f32-hswish-test f32-hswish-test)
1847
1848 ADD_EXECUTABLE(f32-igemm-test test/f32-igemm.cc)
1849 SET_TARGET_PROPERTIES(f32-igemm-test PROPERTIES
1850 CXX_STANDARD 11
1851 CXX_STANDARD_REQUIRED YES
1852 CXX_EXTENSIONS YES)
1853 TARGET_INCLUDE_DIRECTORIES(f32-igemm-test PRIVATE src test)
1854 TARGET_LINK_LIBRARIES(f32-igemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1855 ADD_TEST(f32-igemm-test f32-igemm-test)
1856
1857 ADD_EXECUTABLE(f32-maxpool-test test/f32-maxpool.cc)
1858 SET_TARGET_PROPERTIES(f32-maxpool-test PROPERTIES
1859 CXX_STANDARD 11
1860 CXX_STANDARD_REQUIRED YES
1861 CXX_EXTENSIONS YES)
1862 TARGET_INCLUDE_DIRECTORIES(f32-maxpool-test PRIVATE src test)
1863 TARGET_LINK_LIBRARIES(f32-maxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1864 ADD_TEST(f32-maxpool-test f32-maxpool-test)
1865
1866 ADD_EXECUTABLE(f32-pavgpool-test test/f32-pavgpool.cc)
1867 SET_TARGET_PROPERTIES(f32-pavgpool-test PROPERTIES
1868 CXX_STANDARD 11
1869 CXX_STANDARD_REQUIRED YES
1870 CXX_EXTENSIONS YES)
1871 TARGET_INCLUDE_DIRECTORIES(f32-pavgpool-test PRIVATE src test)
1872 TARGET_LINK_LIBRARIES(f32-pavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1873 ADD_TEST(f32-pavgpool-test f32-pavgpool-test)
1874
1875 ADD_EXECUTABLE(f32-ppmm-test test/f32-ppmm.cc)
1876 SET_TARGET_PROPERTIES(f32-ppmm-test PROPERTIES
1877 CXX_STANDARD 11
1878 CXX_STANDARD_REQUIRED YES
1879 CXX_EXTENSIONS YES)
1880 TARGET_INCLUDE_DIRECTORIES(f32-ppmm-test PRIVATE src test)
1881 TARGET_LINK_LIBRARIES(f32-ppmm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1882 ADD_TEST(f32-ppmm-test f32-ppmm-test)
1883
Marat Dukhan53873d02019-12-06 17:21:30 -08001884 ADD_EXECUTABLE(f32-prelu-test test/f32-prelu.cc)
1885 SET_TARGET_PROPERTIES(f32-prelu-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001886 CXX_STANDARD 11
1887 CXX_STANDARD_REQUIRED YES
1888 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08001889 TARGET_INCLUDE_DIRECTORIES(f32-prelu-test PRIVATE src test)
1890 TARGET_LINK_LIBRARIES(f32-prelu-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1891 ADD_TEST(f32-prelu-test f32-prelu-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001892
Marat Dukhan97579532019-10-18 16:40:39 -07001893 ADD_EXECUTABLE(f32-raddexpminusmax-test test/f32-raddexpminusmax.cc)
1894 SET_TARGET_PROPERTIES(f32-raddexpminusmax-test PROPERTIES
1895 CXX_STANDARD 11
1896 CXX_STANDARD_REQUIRED YES
1897 CXX_EXTENSIONS YES)
1898 TARGET_INCLUDE_DIRECTORIES(f32-raddexpminusmax-test PRIVATE src test)
1899 TARGET_LINK_LIBRARIES(f32-raddexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1900 ADD_TEST(f32-raddexpminusmax-test f32-raddexpminusmax-test)
1901
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07001902 ADD_EXECUTABLE(f32-raddextexp-test test/f32-raddextexp.cc)
1903 SET_TARGET_PROPERTIES(f32-raddextexp-test PROPERTIES
1904 CXX_STANDARD 11
1905 CXX_STANDARD_REQUIRED YES
1906 CXX_EXTENSIONS YES)
1907 TARGET_INCLUDE_DIRECTORIES(f32-raddextexp-test PRIVATE src test)
Marat Dukhana5977df2019-10-30 22:02:15 -07001908 TARGET_LINK_LIBRARIES(f32-raddextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07001909 ADD_TEST(f32-raddextexp-test f32-raddextexp-test)
1910
Marat Dukhan97579532019-10-18 16:40:39 -07001911 ADD_EXECUTABLE(f32-raddstoreexpminusmax-test test/f32-raddstoreexpminusmax.cc)
1912 SET_TARGET_PROPERTIES(f32-raddstoreexpminusmax-test PROPERTIES
1913 CXX_STANDARD 11
1914 CXX_STANDARD_REQUIRED YES
1915 CXX_EXTENSIONS YES)
1916 TARGET_INCLUDE_DIRECTORIES(f32-raddstoreexpminusmax-test PRIVATE src test)
1917 TARGET_LINK_LIBRARIES(f32-raddstoreexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1918 ADD_TEST(f32-raddstoreexpminusmax-test f32-raddstoreexpminusmax-test)
1919
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001920 ADD_EXECUTABLE(f32-rmax-test test/f32-rmax.cc)
1921 SET_TARGET_PROPERTIES(f32-rmax-test PROPERTIES
1922 CXX_STANDARD 11
1923 CXX_STANDARD_REQUIRED YES
1924 CXX_EXTENSIONS YES)
1925 TARGET_INCLUDE_DIRECTORIES(f32-rmax-test PRIVATE src test)
1926 TARGET_LINK_LIBRARIES(f32-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1927 ADD_TEST(f32-rmax-test f32-rmax-test)
1928
Marat Dukhan581c1ac2019-11-18 14:57:54 -08001929 ADD_EXECUTABLE(f32-sigmoid-test test/f32-sigmoid.cc)
1930 SET_TARGET_PROPERTIES(f32-sigmoid-test PROPERTIES
1931 CXX_STANDARD 11
1932 CXX_STANDARD_REQUIRED YES
1933 CXX_EXTENSIONS YES)
1934 TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-test PRIVATE src test)
1935 TARGET_LINK_LIBRARIES(f32-sigmoid-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1936 ADD_TEST(f32-sigmoid-test f32-sigmoid-test)
1937
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001938 ADD_EXECUTABLE(f32-spmm-test test/f32-spmm.cc)
1939 SET_TARGET_PROPERTIES(f32-spmm-test PROPERTIES
1940 CXX_STANDARD 11
1941 CXX_STANDARD_REQUIRED YES
1942 CXX_EXTENSIONS YES)
1943 TARGET_INCLUDE_DIRECTORIES(f32-spmm-test PRIVATE src test)
1944 TARGET_LINK_LIBRARIES(f32-spmm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1945 ADD_TEST(f32-spmm-test f32-spmm-test)
1946
Marat Dukhan53873d02019-12-06 17:21:30 -08001947 ADD_EXECUTABLE(f32-vadd-test test/f32-vadd.cc)
1948 SET_TARGET_PROPERTIES(f32-vadd-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001949 CXX_STANDARD 11
1950 CXX_STANDARD_REQUIRED YES
1951 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08001952 TARGET_INCLUDE_DIRECTORIES(f32-vadd-test PRIVATE src test)
1953 TARGET_LINK_LIBRARIES(f32-vadd-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1954 ADD_TEST(f32-vadd-test f32-vadd-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07001955
Marat Dukhanc76065f2019-11-14 18:13:33 -08001956 ADD_EXECUTABLE(f32-vaddc-test test/f32-vaddc.cc)
1957 SET_TARGET_PROPERTIES(f32-vaddc-test PROPERTIES
1958 CXX_STANDARD 11
1959 CXX_STANDARD_REQUIRED YES
1960 CXX_EXTENSIONS YES)
1961 TARGET_INCLUDE_DIRECTORIES(f32-vaddc-test PRIVATE src test)
1962 TARGET_LINK_LIBRARIES(f32-vaddc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1963 ADD_TEST(f32-vaddc-test f32-vaddc-test)
1964
Marat Dukhan77ca6302019-12-06 12:48:15 -08001965 ADD_EXECUTABLE(f32-vdiv-test test/f32-vdiv.cc)
1966 SET_TARGET_PROPERTIES(f32-vdiv-test PROPERTIES
1967 CXX_STANDARD 11
1968 CXX_STANDARD_REQUIRED YES
1969 CXX_EXTENSIONS YES)
1970 TARGET_INCLUDE_DIRECTORIES(f32-vdiv-test PRIVATE src test)
1971 TARGET_LINK_LIBRARIES(f32-vdiv-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1972 ADD_TEST(f32-vdiv-test f32-vdiv-test)
1973
1974 ADD_EXECUTABLE(f32-vdivc-test test/f32-vdivc.cc)
1975 SET_TARGET_PROPERTIES(f32-vdivc-test PROPERTIES
1976 CXX_STANDARD 11
1977 CXX_STANDARD_REQUIRED YES
1978 CXX_EXTENSIONS YES)
1979 TARGET_INCLUDE_DIRECTORIES(f32-vdivc-test PRIVATE src test)
1980 TARGET_LINK_LIBRARIES(f32-vdivc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1981 ADD_TEST(f32-vdivc-test f32-vdivc-test)
1982
1983 ADD_EXECUTABLE(f32-vrdivc-test test/f32-vrdivc.cc)
1984 SET_TARGET_PROPERTIES(f32-vrdivc-test PROPERTIES
1985 CXX_STANDARD 11
1986 CXX_STANDARD_REQUIRED YES
1987 CXX_EXTENSIONS YES)
1988 TARGET_INCLUDE_DIRECTORIES(f32-vrdivc-test PRIVATE src test)
1989 TARGET_LINK_LIBRARIES(f32-vrdivc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1990 ADD_TEST(f32-vrdivc-test f32-vrdivc-test)
1991
Marat Dukhan403b7d42019-12-05 12:49:11 -08001992 ADD_EXECUTABLE(f32-vmax-test test/f32-vmax.cc)
1993 SET_TARGET_PROPERTIES(f32-vmax-test PROPERTIES
1994 CXX_STANDARD 11
1995 CXX_STANDARD_REQUIRED YES
1996 CXX_EXTENSIONS YES)
1997 TARGET_INCLUDE_DIRECTORIES(f32-vmax-test PRIVATE src test)
1998 TARGET_LINK_LIBRARIES(f32-vmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
1999 ADD_TEST(f32-vmax-test f32-vmax-test)
2000
2001 ADD_EXECUTABLE(f32-vmaxc-test test/f32-vmaxc.cc)
2002 SET_TARGET_PROPERTIES(f32-vmaxc-test PROPERTIES
2003 CXX_STANDARD 11
2004 CXX_STANDARD_REQUIRED YES
2005 CXX_EXTENSIONS YES)
2006 TARGET_INCLUDE_DIRECTORIES(f32-vmaxc-test PRIVATE src test)
2007 TARGET_LINK_LIBRARIES(f32-vmaxc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2008 ADD_TEST(f32-vmaxc-test f32-vmaxc-test)
2009
2010 ADD_EXECUTABLE(f32-vmin-test test/f32-vmin.cc)
2011 SET_TARGET_PROPERTIES(f32-vmin-test PROPERTIES
2012 CXX_STANDARD 11
2013 CXX_STANDARD_REQUIRED YES
2014 CXX_EXTENSIONS YES)
2015 TARGET_INCLUDE_DIRECTORIES(f32-vmin-test PRIVATE src test)
2016 TARGET_LINK_LIBRARIES(f32-vmin-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2017 ADD_TEST(f32-vmin-test f32-vmin-test)
2018
2019 ADD_EXECUTABLE(f32-vminc-test test/f32-vminc.cc)
2020 SET_TARGET_PROPERTIES(f32-vminc-test PROPERTIES
2021 CXX_STANDARD 11
2022 CXX_STANDARD_REQUIRED YES
2023 CXX_EXTENSIONS YES)
2024 TARGET_INCLUDE_DIRECTORIES(f32-vminc-test PRIVATE src test)
2025 TARGET_LINK_LIBRARIES(f32-vminc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2026 ADD_TEST(f32-vminc-test f32-vminc-test)
2027
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002028 ADD_EXECUTABLE(f32-vmul-test test/f32-vmul.cc)
2029 SET_TARGET_PROPERTIES(f32-vmul-test PROPERTIES
2030 CXX_STANDARD 11
2031 CXX_STANDARD_REQUIRED YES
2032 CXX_EXTENSIONS YES)
2033 TARGET_INCLUDE_DIRECTORIES(f32-vmul-test PRIVATE src test)
2034 TARGET_LINK_LIBRARIES(f32-vmul-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2035 ADD_TEST(f32-vmul-test f32-vmul-test)
2036
Marat Dukhanc76065f2019-11-14 18:13:33 -08002037 ADD_EXECUTABLE(f32-vmulc-test test/f32-vmulc.cc)
2038 SET_TARGET_PROPERTIES(f32-vmulc-test PROPERTIES
2039 CXX_STANDARD 11
2040 CXX_STANDARD_REQUIRED YES
2041 CXX_EXTENSIONS YES)
2042 TARGET_INCLUDE_DIRECTORIES(f32-vmulc-test PRIVATE src test)
2043 TARGET_LINK_LIBRARIES(f32-vmulc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2044 ADD_TEST(f32-vmulc-test f32-vmulc-test)
2045
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002046 ADD_EXECUTABLE(f32-vmulcaddc-test test/f32-vmulcaddc.cc)
2047 SET_TARGET_PROPERTIES(f32-vmulcaddc-test PROPERTIES
2048 CXX_STANDARD 11
2049 CXX_STANDARD_REQUIRED YES
2050 CXX_EXTENSIONS YES)
2051 TARGET_INCLUDE_DIRECTORIES(f32-vmulcaddc-test PRIVATE src test)
2052 TARGET_LINK_LIBRARIES(f32-vmulcaddc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2053 ADD_TEST(f32-vmulcaddc-test f32-vmulcaddc-test)
2054
Marat Dukhan97579532019-10-18 16:40:39 -07002055 ADD_EXECUTABLE(f32-vscaleexpminusmax-test test/f32-vscaleexpminusmax.cc)
2056 SET_TARGET_PROPERTIES(f32-vscaleexpminusmax-test PROPERTIES
2057 CXX_STANDARD 11
2058 CXX_STANDARD_REQUIRED YES
2059 CXX_EXTENSIONS YES)
2060 TARGET_INCLUDE_DIRECTORIES(f32-vscaleexpminusmax-test PRIVATE src test)
2061 TARGET_LINK_LIBRARIES(f32-vscaleexpminusmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2062 ADD_TEST(f32-vscaleexpminusmax-test f32-vscaleexpminusmax-test)
2063
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002064 ADD_EXECUTABLE(f32-vscaleextexp-test test/f32-vscaleextexp.cc)
2065 SET_TARGET_PROPERTIES(f32-vscaleexpminusmax-test PROPERTIES
2066 CXX_STANDARD 11
2067 CXX_STANDARD_REQUIRED YES
2068 CXX_EXTENSIONS YES)
2069 TARGET_INCLUDE_DIRECTORIES(f32-vscaleextexp-test PRIVATE src test)
Marat Dukhana5977df2019-10-30 22:02:15 -07002070 TARGET_LINK_LIBRARIES(f32-vscaleextexp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
Marat Dukhan6f8d4d32019-10-25 17:07:09 -07002071 ADD_TEST(f32-vscaleextexp-test f32-vscaleextexp-test)
2072
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002073 ADD_EXECUTABLE(f32-vsub-test test/f32-vsub.cc)
2074 SET_TARGET_PROPERTIES(f32-vsub-test PROPERTIES
2075 CXX_STANDARD 11
2076 CXX_STANDARD_REQUIRED YES
2077 CXX_EXTENSIONS YES)
2078 TARGET_INCLUDE_DIRECTORIES(f32-vsub-test PRIVATE src test)
2079 TARGET_LINK_LIBRARIES(f32-vsub-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2080 ADD_TEST(f32-vsub-test f32-vsub-test)
2081
Marat Dukhanc76065f2019-11-14 18:13:33 -08002082 ADD_EXECUTABLE(f32-vsubc-test test/f32-vsubc.cc)
2083 SET_TARGET_PROPERTIES(f32-vsubc-test PROPERTIES
2084 CXX_STANDARD 11
2085 CXX_STANDARD_REQUIRED YES
2086 CXX_EXTENSIONS YES)
2087 TARGET_INCLUDE_DIRECTORIES(f32-vsubc-test PRIVATE src test)
2088 TARGET_LINK_LIBRARIES(f32-vsubc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2089 ADD_TEST(f32-vsubc-test f32-vsubc-test)
2090
2091 ADD_EXECUTABLE(f32-vrsubc-test test/f32-vrsubc.cc)
2092 SET_TARGET_PROPERTIES(f32-vrsubc-test PROPERTIES
2093 CXX_STANDARD 11
2094 CXX_STANDARD_REQUIRED YES
2095 CXX_EXTENSIONS YES)
2096 TARGET_INCLUDE_DIRECTORIES(f32-vrsubc-test PRIVATE src test)
2097 TARGET_LINK_LIBRARIES(f32-vrsubc-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2098 ADD_TEST(f32-vrsubc-test f32-vrsubc-test)
2099
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002100 ADD_EXECUTABLE(q8-avgpool-test test/q8-avgpool.cc)
2101 SET_TARGET_PROPERTIES(q8-avgpool-test PROPERTIES
2102 CXX_STANDARD 11
2103 CXX_STANDARD_REQUIRED YES
2104 CXX_EXTENSIONS YES)
2105 TARGET_INCLUDE_DIRECTORIES(q8-avgpool-test PRIVATE src test)
2106 TARGET_LINK_LIBRARIES(q8-avgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2107 ADD_TEST(q8-avgpool-test q8-avgpool-test)
2108
2109 ADD_EXECUTABLE(q8-dwconv-test test/q8-dwconv.cc)
2110 SET_TARGET_PROPERTIES(q8-dwconv-test PROPERTIES
2111 CXX_STANDARD 11
2112 CXX_STANDARD_REQUIRED YES
2113 CXX_EXTENSIONS YES)
2114 TARGET_INCLUDE_DIRECTORIES(q8-dwconv-test PRIVATE src test)
2115 TARGET_LINK_LIBRARIES(q8-dwconv-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2116 ADD_TEST(q8-dwconv-test q8-dwconv-test)
2117
2118 ADD_EXECUTABLE(q8-gavgpool-test test/q8-gavgpool.cc)
2119 SET_TARGET_PROPERTIES(q8-gavgpool-test PROPERTIES
2120 CXX_STANDARD 11
2121 CXX_STANDARD_REQUIRED YES
2122 CXX_EXTENSIONS YES)
2123 TARGET_INCLUDE_DIRECTORIES(q8-gavgpool-test PRIVATE src test)
2124 TARGET_LINK_LIBRARIES(q8-gavgpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2125 ADD_TEST(q8-gavgpool-test q8-gavgpool-test)
2126
2127 ADD_EXECUTABLE(q8-gemm-test test/q8-gemm.cc)
2128 SET_TARGET_PROPERTIES(q8-gemm-test PROPERTIES
2129 CXX_STANDARD 11
2130 CXX_STANDARD_REQUIRED YES
2131 CXX_EXTENSIONS YES)
2132 TARGET_INCLUDE_DIRECTORIES(q8-gemm-test PRIVATE src test)
2133 TARGET_LINK_LIBRARIES(q8-gemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2134 ADD_TEST(q8-gemm-test q8-gemm-test)
2135
2136 ADD_EXECUTABLE(q8-igemm-test test/q8-igemm.cc)
2137 SET_TARGET_PROPERTIES(q8-igemm-test PROPERTIES
2138 CXX_STANDARD 11
2139 CXX_STANDARD_REQUIRED YES
2140 CXX_EXTENSIONS YES)
2141 TARGET_INCLUDE_DIRECTORIES(q8-igemm-test PRIVATE src test)
2142 TARGET_LINK_LIBRARIES(q8-igemm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2143 ADD_TEST(q8-igemm-test q8-igemm-test)
2144
Marat Dukhan53873d02019-12-06 17:21:30 -08002145 ADD_EXECUTABLE(q8-vadd-test test/q8-vadd.cc)
2146 SET_TARGET_PROPERTIES(q8-vadd-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002147 CXX_STANDARD 11
2148 CXX_STANDARD_REQUIRED YES
2149 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08002150 TARGET_INCLUDE_DIRECTORIES(q8-vadd-test PRIVATE src test)
2151 TARGET_LINK_LIBRARIES(q8-vadd-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2152 ADD_TEST(q8-vadd-test q8-vadd-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002153
Marat Dukhan53873d02019-12-06 17:21:30 -08002154 ADD_EXECUTABLE(u8-clamp-test test/u8-clamp.cc)
2155 SET_TARGET_PROPERTIES(u8-clamp-test PROPERTIES
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002156 CXX_STANDARD 11
2157 CXX_STANDARD_REQUIRED YES
2158 CXX_EXTENSIONS YES)
Marat Dukhan53873d02019-12-06 17:21:30 -08002159 TARGET_INCLUDE_DIRECTORIES(u8-clamp-test PRIVATE src test)
2160 TARGET_LINK_LIBRARIES(u8-clamp-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2161 ADD_TEST(u8-clamp-test u8-clamp-test)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002162
2163 ADD_EXECUTABLE(u8-lut32norm-test test/u8-lut32norm.cc)
2164 SET_TARGET_PROPERTIES(u8-lut32norm-test PROPERTIES
2165 CXX_STANDARD 11
2166 CXX_STANDARD_REQUIRED YES
2167 CXX_EXTENSIONS YES)
2168 TARGET_INCLUDE_DIRECTORIES(u8-lut32norm-test PRIVATE src test)
2169 TARGET_LINK_LIBRARIES(u8-lut32norm-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2170 ADD_TEST(u8-lut32norm-test u8-lut32norm-test)
2171
2172 ADD_EXECUTABLE(u8-maxpool-test test/u8-maxpool.cc)
2173 SET_TARGET_PROPERTIES(u8-maxpool-test PROPERTIES
2174 CXX_STANDARD 11
2175 CXX_STANDARD_REQUIRED YES
2176 CXX_EXTENSIONS YES)
2177 TARGET_INCLUDE_DIRECTORIES(u8-maxpool-test PRIVATE src test)
2178 TARGET_LINK_LIBRARIES(u8-maxpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2179 ADD_TEST(u8-maxpool-test u8-maxpool-test)
2180
2181 ADD_EXECUTABLE(u8-rmax-test test/u8-rmax.cc)
2182 SET_TARGET_PROPERTIES(u8-rmax-test PROPERTIES
2183 CXX_STANDARD 11
2184 CXX_STANDARD_REQUIRED YES
2185 CXX_EXTENSIONS YES)
2186 TARGET_INCLUDE_DIRECTORIES(u8-rmax-test PRIVATE src test)
2187 TARGET_LINK_LIBRARIES(u8-rmax-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2188 ADD_TEST(u8-rmax-test u8-rmax-test)
2189
2190 ADD_EXECUTABLE(x32-packx-test test/x32-packx.cc)
2191 SET_TARGET_PROPERTIES(x32-packx-test PROPERTIES
2192 CXX_STANDARD 11
2193 CXX_STANDARD_REQUIRED YES
2194 CXX_EXTENSIONS YES)
2195 TARGET_INCLUDE_DIRECTORIES(x32-packx-test PRIVATE src test)
2196 TARGET_LINK_LIBRARIES(x32-packx-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2197 ADD_TEST(x32-packx-test x32-packx-test)
2198
2199 ADD_EXECUTABLE(x32-pad-test test/x32-pad.cc)
2200 SET_TARGET_PROPERTIES(x32-pad-test PROPERTIES
2201 CXX_STANDARD 11
2202 CXX_STANDARD_REQUIRED YES
2203 CXX_EXTENSIONS YES)
2204 TARGET_INCLUDE_DIRECTORIES(x32-pad-test PRIVATE src test)
2205 TARGET_LINK_LIBRARIES(x32-pad-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2206 ADD_TEST(x32-pad-test x32-pad-test)
2207
2208 ADD_EXECUTABLE(x32-unpool-test test/x32-unpool.cc)
2209 SET_TARGET_PROPERTIES(x32-unpool-test PROPERTIES
2210 CXX_STANDARD 11
2211 CXX_STANDARD_REQUIRED YES
2212 CXX_EXTENSIONS YES)
2213 TARGET_INCLUDE_DIRECTORIES(x32-unpool-test PRIVATE src test)
2214 TARGET_LINK_LIBRARIES(x32-unpool-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2215 ADD_TEST(x32-unpool-test x32-unpool-test)
2216
2217 ADD_EXECUTABLE(x32-zip-test test/x32-zip.cc)
2218 SET_TARGET_PROPERTIES(x32-zip-test PROPERTIES
2219 CXX_STANDARD 11
2220 CXX_STANDARD_REQUIRED YES
2221 CXX_EXTENSIONS YES)
2222 TARGET_INCLUDE_DIRECTORIES(x32-zip-test PRIVATE src test)
2223 TARGET_LINK_LIBRARIES(x32-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2224 ADD_TEST(x32-zip-test x32-zip-test)
2225
2226 ADD_EXECUTABLE(x8-lut-test test/x8-lut.cc)
2227 SET_TARGET_PROPERTIES(x8-lut-test PROPERTIES
2228 CXX_STANDARD 11
2229 CXX_STANDARD_REQUIRED YES
2230 CXX_EXTENSIONS YES)
2231 TARGET_INCLUDE_DIRECTORIES(x8-lut-test PRIVATE src test)
2232 TARGET_LINK_LIBRARIES(x8-lut-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2233 ADD_TEST(x8-lut-test x8-lut-test)
2234
2235 ADD_EXECUTABLE(x8-zip-test test/x8-zip.cc)
2236 SET_TARGET_PROPERTIES(x8-zip-test PROPERTIES
2237 CXX_STANDARD 11
2238 CXX_STANDARD_REQUIRED YES
2239 CXX_EXTENSIONS YES)
2240 TARGET_INCLUDE_DIRECTORIES(x8-zip-test PRIVATE src test)
2241 TARGET_LINK_LIBRARIES(x8-zip-test PRIVATE XNNPACK cpuinfo fp16 gtest gtest_main)
2242 ADD_TEST(x8-zip-test x8-zip-test)
2243ENDIF()
2244
2245# ---[ XNNPACK microbenchmarks
2246IF(XNNPACK_BUILD_BENCHMARKS)
2247 # ---[ Build google benchmark
2248 IF(NOT TARGET benchmark)
2249 SET(BENCHMARK_ENABLE_TESTING OFF CACHE BOOL "")
2250 ADD_SUBDIRECTORY(
2251 "${GOOGLEBENCHMARK_SOURCE_DIR}"
2252 "${CONFU_DEPENDENCIES_BINARY_DIR}/googlebenchmark")
2253 ENDIF()
2254
2255 ADD_LIBRARY(bench-utils bench/utils.cc)
2256 SET_TARGET_PROPERTIES(bench-utils PROPERTIES
2257 CXX_STANDARD 11
2258 CXX_STANDARD_REQUIRED YES
2259 CXX_EXTENSIONS NO)
2260 TARGET_INCLUDE_DIRECTORIES(bench-utils PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
Marat Dukhanbad48fe2019-11-04 10:35:22 -08002261 TARGET_LINK_LIBRARIES(bench-utils PRIVATE benchmark cpuinfo)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002262
Marat Dukhancb10f262019-11-16 15:52:37 -08002263 # ---[ Build accuracy microbenchmarks
2264 ADD_EXECUTABLE(f32-exp-eval eval/f32-exp.cc)
2265 SET_TARGET_PROPERTIES(f32-exp-eval PROPERTIES
2266 CXX_STANDARD 11
2267 CXX_STANDARD_REQUIRED YES
2268 CXX_EXTENSIONS NO)
2269 TARGET_INCLUDE_DIRECTORIES(f32-exp-eval PRIVATE src)
2270 TARGET_LINK_LIBRARIES(f32-exp-eval PRIVATE XNNPACK benchmark fp16)
2271
2272 ADD_EXECUTABLE(f32-expminus-eval eval/f32-expminus.cc)
2273 SET_TARGET_PROPERTIES(f32-expminus-eval PROPERTIES
2274 CXX_STANDARD 11
2275 CXX_STANDARD_REQUIRED YES
2276 CXX_EXTENSIONS NO)
2277 TARGET_INCLUDE_DIRECTORIES(f32-expminus-eval PRIVATE src)
2278 TARGET_LINK_LIBRARIES(f32-expminus-eval PRIVATE XNNPACK benchmark fp16)
2279
2280 ADD_EXECUTABLE(f32-extexp-eval eval/f32-extexp.cc)
2281 SET_TARGET_PROPERTIES(f32-extexp-eval PROPERTIES
2282 CXX_STANDARD 11
2283 CXX_STANDARD_REQUIRED YES
2284 CXX_EXTENSIONS YES)
2285 TARGET_INCLUDE_DIRECTORIES(f32-extexp-eval PRIVATE src)
2286 TARGET_LINK_LIBRARIES(f32-extexp-eval PRIVATE XNNPACK benchmark fp16)
2287
2288 ADD_EXECUTABLE(f32-sigmoid-eval eval/f32-sigmoid.cc)
2289 SET_TARGET_PROPERTIES(f32-sigmoid-eval PROPERTIES
2290 CXX_STANDARD 11
2291 CXX_STANDARD_REQUIRED YES
2292 CXX_EXTENSIONS NO)
2293 TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-eval PRIVATE src)
2294 TARGET_LINK_LIBRARIES(f32-sigmoid-eval PRIVATE XNNPACK benchmark fp16)
2295
Marat Dukhan5f18d262019-10-31 10:24:14 -07002296 # ---[ Build end-to-end microbenchmarks
Marat Dukhan17e16282019-12-10 12:09:35 -08002297 ADD_LIBRARY(bench-models STATIC
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002298 models/mobilenet-v1.cc
2299 models/mobilenet-v2.cc
2300 models/mobilenet-v3-large.cc
2301 models/mobilenet-v3-small.cc)
2302 SET_TARGET_PROPERTIES(bench-models PROPERTIES
2303 CXX_STANDARD 11
2304 CXX_STANDARD_REQUIRED YES
2305 CXX_EXTENSIONS YES)
2306 TARGET_INCLUDE_DIRECTORIES(bench-models PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2307 TARGET_LINK_LIBRARIES(bench-models PRIVATE XNNPACK benchmark bench-utils)
2308
2309 ADD_EXECUTABLE(end2end-bench bench/end2end.cc)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002310 SET_TARGET_PROPERTIES(end2end-bench PROPERTIES
2311 CXX_STANDARD 11
2312 CXX_STANDARD_REQUIRED YES
2313 CXX_EXTENSIONS NO)
2314 TARGET_INCLUDE_DIRECTORIES(end2end-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002315 TARGET_LINK_LIBRARIES(end2end-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002316
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002317 ADD_EXECUTABLE(f32-dwconv-e2e-bench bench/f32-dwconv-e2e.cc)
Marat Dukhanef4416e2019-10-31 13:44:40 -07002318 SET_TARGET_PROPERTIES(f32-dwconv-e2e-bench PROPERTIES
2319 CXX_STANDARD 11
2320 CXX_STANDARD_REQUIRED YES
2321 CXX_EXTENSIONS NO)
Marat Dukhanc9d2f3f2019-10-31 14:02:07 -07002322 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002323 TARGET_LINK_LIBRARIES(f32-dwconv-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
Marat Dukhanef4416e2019-10-31 13:44:40 -07002324
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002325 ADD_EXECUTABLE(f32-gemm-e2e-bench bench/f32-gemm-e2e.cc)
Marat Dukhan0a5a53f2019-10-31 10:58:31 -07002326 SET_TARGET_PROPERTIES(f32-gemm-e2e-bench PROPERTIES
Marat Dukhan5f18d262019-10-31 10:24:14 -07002327 CXX_STANDARD 11
2328 CXX_STANDARD_REQUIRED YES
2329 CXX_EXTENSIONS NO)
Marat Dukhanc9d2f3f2019-10-31 14:02:07 -07002330 TARGET_INCLUDE_DIRECTORIES(f32-gemm-e2e-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}" src)
Marat Dukhanc08cdf52019-12-09 09:17:51 -08002331 TARGET_LINK_LIBRARIES(f32-gemm-e2e-bench PRIVATE XNNPACK benchmark bench-models bench-utils)
Marat Dukhan5f18d262019-10-31 10:24:14 -07002332
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002333 # ---[ Build operator-level microbenchmarks
2334 ADD_EXECUTABLE(add-bench bench/add.cc)
2335 SET_TARGET_PROPERTIES(add-bench PROPERTIES
2336 CXX_STANDARD 11
2337 CXX_STANDARD_REQUIRED YES
2338 CXX_EXTENSIONS NO)
2339 TARGET_INCLUDE_DIRECTORIES(add-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2340 TARGET_LINK_LIBRARIES(add-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2341
2342 ADD_EXECUTABLE(average-pooling-bench bench/average-pooling.cc)
2343 SET_TARGET_PROPERTIES(average-pooling-bench PROPERTIES
2344 CXX_STANDARD 11
2345 CXX_STANDARD_REQUIRED YES
2346 CXX_EXTENSIONS NO)
2347 TARGET_INCLUDE_DIRECTORIES(average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2348 TARGET_LINK_LIBRARIES(average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2349
2350 ADD_EXECUTABLE(channel-shuffle-bench bench/channel-shuffle.cc)
2351 SET_TARGET_PROPERTIES(channel-shuffle-bench PROPERTIES
2352 CXX_STANDARD 11
2353 CXX_STANDARD_REQUIRED YES
2354 CXX_EXTENSIONS NO)
2355 TARGET_INCLUDE_DIRECTORIES(channel-shuffle-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2356 TARGET_LINK_LIBRARIES(channel-shuffle-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2357
2358 ADD_EXECUTABLE(convolution-bench bench/convolution.cc)
2359 SET_TARGET_PROPERTIES(convolution-bench PROPERTIES
2360 CXX_STANDARD 11
2361 CXX_STANDARD_REQUIRED YES
2362 CXX_EXTENSIONS NO)
2363 TARGET_INCLUDE_DIRECTORIES(convolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2364 TARGET_LINK_LIBRARIES(convolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2365
2366 ADD_EXECUTABLE(deconvolution-bench bench/deconvolution.cc)
2367 SET_TARGET_PROPERTIES(deconvolution-bench PROPERTIES
2368 CXX_STANDARD 11
2369 CXX_STANDARD_REQUIRED YES
2370 CXX_EXTENSIONS NO)
2371 TARGET_INCLUDE_DIRECTORIES(deconvolution-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2372 TARGET_LINK_LIBRARIES(deconvolution-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2373
2374 ADD_EXECUTABLE(global-average-pooling-bench bench/global-average-pooling.cc)
2375 SET_TARGET_PROPERTIES(global-average-pooling-bench PROPERTIES
2376 CXX_STANDARD 11
2377 CXX_STANDARD_REQUIRED YES
2378 CXX_EXTENSIONS NO)
2379 TARGET_INCLUDE_DIRECTORIES(global-average-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2380 TARGET_LINK_LIBRARIES(global-average-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2381
2382 ADD_EXECUTABLE(max-pooling-bench bench/max-pooling.cc)
2383 SET_TARGET_PROPERTIES(max-pooling-bench PROPERTIES
2384 CXX_STANDARD 11
2385 CXX_STANDARD_REQUIRED YES
2386 CXX_EXTENSIONS NO)
2387 TARGET_INCLUDE_DIRECTORIES(max-pooling-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2388 TARGET_LINK_LIBRARIES(max-pooling-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2389
Marat Dukhan95b22432019-10-30 16:30:14 -07002390 ADD_EXECUTABLE(prelu-bench bench/prelu.cc)
2391 SET_TARGET_PROPERTIES(prelu-bench PROPERTIES
2392 CXX_STANDARD 11
2393 CXX_STANDARD_REQUIRED YES
2394 CXX_EXTENSIONS NO)
2395 TARGET_INCLUDE_DIRECTORIES(prelu-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2396 TARGET_LINK_LIBRARIES(prelu-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2397
Marat Dukhan2dbdc2f2019-10-08 16:36:23 -07002398 ADD_EXECUTABLE(sigmoid-bench bench/sigmoid.cc)
2399 SET_TARGET_PROPERTIES(sigmoid-bench PROPERTIES
2400 CXX_STANDARD 11
2401 CXX_STANDARD_REQUIRED YES
2402 CXX_EXTENSIONS NO)
2403 TARGET_INCLUDE_DIRECTORIES(sigmoid-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2404 TARGET_LINK_LIBRARIES(sigmoid-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2405
2406 ADD_EXECUTABLE(softargmax-bench bench/softargmax.cc)
2407 SET_TARGET_PROPERTIES(softargmax-bench PROPERTIES
2408 CXX_STANDARD 11
2409 CXX_STANDARD_REQUIRED YES
2410 CXX_EXTENSIONS NO)
2411 TARGET_INCLUDE_DIRECTORIES(softargmax-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2412 TARGET_LINK_LIBRARIES(softargmax-bench PRIVATE XNNPACK cpuinfo benchmark bench-utils)
2413
2414 # ---[ Build microkernel-level microbenchmarks
2415 ADD_EXECUTABLE(f16-gemm-bench bench/f16-gemm.cc)
2416 SET_TARGET_PROPERTIES(f16-gemm-bench PROPERTIES
2417 CXX_STANDARD 11
2418 CXX_STANDARD_REQUIRED YES
2419 CXX_EXTENSIONS YES)
2420 TARGET_INCLUDE_DIRECTORIES(f16-gemm-bench PRIVATE src)
2421 TARGET_INCLUDE_DIRECTORIES(f16-gemm-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2422 TARGET_LINK_LIBRARIES(f16-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
2423
2424 ADD_EXECUTABLE(f32-conv-hwc-bench bench/f32-conv-hwc.cc)
2425 SET_TARGET_PROPERTIES(f32-conv-hwc-bench PROPERTIES
2426 CXX_STANDARD 11
2427 CXX_STANDARD_REQUIRED YES
2428 CXX_EXTENSIONS YES)
2429 TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-bench PRIVATE src)
2430 TARGET_INCLUDE_DIRECTORIES(f32-conv-hwc-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2431 TARGET_LINK_LIBRARIES(f32-conv-hwc-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
2432
2433 ADD_EXECUTABLE(f32-dwconv-spchw-bench bench/f32-dwconv-spchw.cc)
2434 SET_TARGET_PROPERTIES(f32-dwconv-spchw-bench PROPERTIES
2435 CXX_STANDARD 11
2436 CXX_STANDARD_REQUIRED YES
2437 CXX_EXTENSIONS YES)
2438 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-bench PRIVATE src)
2439 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-spchw-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2440 TARGET_LINK_LIBRARIES(f32-dwconv-spchw-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
2441
2442 ADD_EXECUTABLE(f32-dwconv-bench bench/f32-dwconv.cc)
2443 SET_TARGET_PROPERTIES(f32-dwconv-bench PROPERTIES
2444 CXX_STANDARD 11
2445 CXX_STANDARD_REQUIRED YES
2446 CXX_EXTENSIONS YES)
2447 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-bench PRIVATE src)
2448 TARGET_INCLUDE_DIRECTORIES(f32-dwconv-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2449 TARGET_LINK_LIBRARIES(f32-dwconv-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
2450
2451 ADD_EXECUTABLE(f32-gemm-bench bench/f32-gemm.cc)
2452 SET_TARGET_PROPERTIES(f32-gemm-bench PROPERTIES
2453 CXX_STANDARD 11
2454 CXX_STANDARD_REQUIRED YES
2455 CXX_EXTENSIONS YES)
2456 TARGET_INCLUDE_DIRECTORIES(f32-gemm-bench PRIVATE src)
2457 TARGET_INCLUDE_DIRECTORIES(f32-gemm-bench PRIVATE "${CMAKE_CURRENT_SOURCE_DIR}")
2458 TARGET_LINK_LIBRARIES(f32-gemm-bench PRIVATE XNNPACK cpuinfo fp16 benchmark bench-utils)
2459
# f32-igemm-bench: benchmark executable built from bench/f32-igemm.cc.
ADD_EXECUTABLE(f32-igemm-bench bench/f32-igemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-igemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-igemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-igemm-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-igemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-igemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
2468
# f32-im2col-gemm-bench: benchmark executable built from one C++ source
# (bench/f32-im2col-gemm.cc) and one C source (src/im2col.c).
ADD_EXECUTABLE(f32-im2col-gemm-bench
  bench/f32-im2col-gemm.cc
  src/im2col.c)
# C sources: require C99 with compiler extensions disabled.
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_STANDARD 99)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY C_EXTENSIONS NO)
# C++ sources: require C++11 with compiler extensions enabled.
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-im2col-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-im2col-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-im2col-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
2480
# f32-rmax-bench: benchmark executable built from bench/f32-rmax.cc.
ADD_EXECUTABLE(f32-rmax-bench bench/f32-rmax.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-rmax-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-rmax-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-rmax-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
2489
# f32-sigmoid-bench: benchmark executable built from bench/f32-sigmoid.cc.
ADD_EXECUTABLE(f32-sigmoid-bench bench/f32-sigmoid.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-sigmoid-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-sigmoid-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-sigmoid-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-sigmoid-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
# NOTE(review): unlike most sibling benchmarks, cpuinfo and fp16 are not
# linked directly here -- confirm this is intentional.
TARGET_LINK_LIBRARIES(f32-sigmoid-bench PRIVATE
  XNNPACK
  benchmark
  bench-utils)
2498
# f32-spmm-bench: benchmark executable built from bench/f32-spmm.cc.
ADD_EXECUTABLE(f32-spmm-bench bench/f32-spmm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-spmm-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-spmm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(f32-spmm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
2507
# f32-softargmax-bench: benchmark executable built from bench/f32-softargmax.cc.
ADD_EXECUTABLE(f32-softargmax-bench bench/f32-softargmax.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET f32-softargmax-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(f32-softargmax-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
# NOTE(review): unlike most sibling benchmarks, cpuinfo is not linked
# directly here -- confirm this is intentional.
TARGET_LINK_LIBRARIES(f32-softargmax-bench PRIVATE
  XNNPACK
  fp16
  benchmark
  bench-utils)
Marat Dukhan4a4a7fa2019-10-21 13:46:14 -07002516
# q8-gemm-bench: benchmark executable built from bench/q8-gemm.cc.
ADD_EXECUTABLE(q8-gemm-bench bench/q8-gemm.cc)
# Require C++11; compiler-specific language extensions stay enabled.
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD 11)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_STANDARD_REQUIRED YES)
SET_PROPERTY(TARGET q8-gemm-bench PROPERTY CXX_EXTENSIONS YES)
# Header search path: src/ first, then the directory holding this CMakeLists.txt.
TARGET_INCLUDE_DIRECTORIES(q8-gemm-bench PRIVATE
  src
  "${CMAKE_CURRENT_SOURCE_DIR}")
TARGET_LINK_LIBRARIES(q8-gemm-bench PRIVATE
  XNNPACK
  cpuinfo
  fp16
  benchmark
  bench-utils)
2525ENDIF()