xref: /aosp_15_r20/external/XNNPACK/Android.bp (revision 4bdc94577ba0e567308109d787f7fec7b531ce36)
1// Copyright (C) 2020 The Android Open Source Project
2//
3// Licensed under the Apache License, Version 2.0 (the "License");
4// you may not use this file except in compliance with the License.
5// You may obtain a copy of the License at
6//
7//      http://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS,
11// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12// See the License for the specific language governing permissions and
13// limitations under the License.
14
// Package-level settings for this Android.bp: every module declared here is
// covered by the "external_XNNPACK_license" license module by default.
15package {
16    default_applicable_licenses: ["external_XNNPACK_license"],
17}
18
19// Added automatically by a large-scale-change
20// See: http://go/android-license-faq
// License module named by the package block's default_applicable_licenses.
21license {
22    name: "external_XNNPACK_license",
      // Restricts references to this license module to subpackages.
23    visibility: [":__subpackages__"],
24    license_kinds: [
25        "SPDX-license-identifier-BSD",
26    ],
      // Path of the license text file, relative to this Android.bp.
27    license_text: [
28        "LICENSE",
29    ],
30}
31
// Operator sources: the three shared src/operator-*.c files followed by the
// per-operator files under src/operators/.
// NOTE(review): the modules that consume this variable are outside the part
// of the file visible here.
32OPERATOR_SRCS = [
33    "src/operator-delete.c",
34    "src/operator-run.c",
35    "src/operator-utils.c",
36    "src/operators/argmax-pooling-nhwc.c",
37    "src/operators/average-pooling-nhwc.c",
38    "src/operators/binary-elementwise-nd.c",
39    "src/operators/channel-shuffle-nc.c",
40    "src/operators/constant-pad-nd.c",
41    "src/operators/convolution-nchw.c",
42    "src/operators/convolution-nhwc.c",
43    "src/operators/deconvolution-nhwc.c",
44    "src/operators/fully-connected-nc.c",
45    "src/operators/global-average-pooling-ncw.c",
46    "src/operators/global-average-pooling-nwc.c",
47    "src/operators/lut-elementwise-nc.c",
48    "src/operators/max-pooling-nhwc.c",
49    "src/operators/prelu-nc.c",
50    "src/operators/resize-bilinear-nchw.c",
51    "src/operators/resize-bilinear-nhwc.c",
52    "src/operators/softmax-nc.c",
53    "src/operators/transpose-nd.c",
54    "src/operators/unary-elementwise-nc.c",
55    "src/operators/unpooling-nhwc.c",
56]
57
// Sources grouped under the logging name: src/log.c together with
// node-type.c and the *-strings.c files.
// NOTE(review): consumers of this variable are not visible in this part of
// the file.
58LOGGING_SRCS = [
59    "src/datatype-strings.c",
60    "src/log.c",
61    "src/node-type.c",
62    "src/operator-strings.c",
63    "src/ukernel-strings.c",
64]
65
// Subgraph sources: the top-level memory-planner.c, runtime.c, subgraph.c
// and tensor.c, plus the per-node files under src/subgraph/.
// NOTE(review): consumers of this variable are not visible in this part of
// the file.
66SUBGRAPH_SRCS = [
67    "src/memory-planner.c",
68    "src/runtime.c",
69    "src/subgraph.c",
70    "src/subgraph/abs.c",
71    "src/subgraph/add2.c",
72    "src/subgraph/argmax-pooling-2d.c",
73    "src/subgraph/average-pooling-2d.c",
74    "src/subgraph/bankers-rounding.c",
75    "src/subgraph/ceiling.c",
76    "src/subgraph/clamp.c",
77    "src/subgraph/concatenate.c",
78    "src/subgraph/convert.c",
79    "src/subgraph/convolution-2d.c",
80    "src/subgraph/deconvolution-2d.c",
81    "src/subgraph/depth-to-space.c",
82    "src/subgraph/depthwise-convolution-2d.c",
83    "src/subgraph/divide.c",
84    "src/subgraph/elu.c",
85    "src/subgraph/even-split.c",
86    "src/subgraph/floor.c",
87    "src/subgraph/fully-connected.c",
88    "src/subgraph/global-average-pooling.c",
89    "src/subgraph/hardswish.c",
90    "src/subgraph/leaky-relu.c",
91    "src/subgraph/max-pooling-2d.c",
92    "src/subgraph/maximum2.c",
93    "src/subgraph/minimum2.c",
94    "src/subgraph/multiply2.c",
95    "src/subgraph/negate.c",
96    "src/subgraph/prelu.c",
97    "src/subgraph/sigmoid.c",
98    "src/subgraph/softmax.c",
99    "src/subgraph/square-root.c",
100    "src/subgraph/square.c",
101    "src/subgraph/squared-difference.c",
102    "src/subgraph/static-constant-pad.c",
103    "src/subgraph/static-reshape.c",
104    "src/subgraph/static-resize-bilinear-2d.c",
105    "src/subgraph/static-transpose.c",
106    "src/subgraph/subtract.c",
107    "src/subgraph/unpooling-2d.c",
108    "src/subgraph/validation.c",
109    "src/tensor.c",
110]
111
// Sources under src/tables/. Within each name prefix the entries are ordered
// by their numeric suffix (e.g. -64 before -2048), not lexicographically.
112TABLE_SRCS = [
113    "src/tables/exp2-k-over-64.c",
114    "src/tables/exp2-k-over-2048.c",
115    "src/tables/exp2minus-k-over-4.c",
116    "src/tables/exp2minus-k-over-8.c",
117    "src/tables/exp2minus-k-over-16.c",
118    "src/tables/exp2minus-k-over-64.c",
119    "src/tables/exp2minus-k-over-2048.c",
120    "src/tables/vlog.c",
121]
122
// Microkernel sources in the "portable" scalar list: u8-lut32norm, xx-copy,
// xx-transpose and x8-lut.
// NOTE(review): presumably built for every target regardless of
// architecture; the consuming modules are not visible here, so confirm.
123PROD_SCALAR_PORTABLE_MICROKERNEL_SRCS = [
124    "src/u8-lut32norm/scalar.c",
125    "src/xx-copy/memcpy.c",
126    "src/xx-transpose/1x1-memcpy.c",
127    "src/x8-lut/gen/lut-scalar-x4.c",
128]
129
// Scalar microkernel sources selected for the AARCH32 list.
// The quantized (qc8/qs8/qu8) dwconv, gemm and igemm entries in this list are
// the "fp32-scalar-fmagic" variants; the WASM and RISCV lists in this file
// pick "imagic" and "lrintf" variants respectively.
// NOTE(review): unlike the WASM and RISCV lists, this list has no
// qs8-vcvt / qu8-vcvt / qs8-vlrelu / qu8-vlrelu entries; presumably those are
// covered by non-scalar kernels on this architecture. Confirm.
130PROD_SCALAR_AARCH32_MICROKERNEL_SRCS = [
131    "src/f16-f32-vcvt/gen/vcvt-scalar-x4.c",
132    "src/f32-argmaxpool/4x-scalar-c1.c",
133    "src/f32-argmaxpool/9p8x-scalar-c1.c",
134    "src/f32-argmaxpool/9x-scalar-c1.c",
135    "src/f32-avgpool/9p8x-minmax-scalar-c1.c",
136    "src/f32-avgpool/9x-minmax-scalar-c1.c",
137    "src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c",
138    "src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c",
139    "src/f32-conv-hwc2chw/3x3s2p1c3x4-scalar-1x1.c",
140    "src/f32-dwconv/gen/up1x3-minmax-scalar-acc2.c",
141    "src/f32-dwconv/gen/up1x3-scalar-acc2.c",
142    "src/f32-dwconv/gen/up1x4-minmax-scalar-acc2.c",
143    "src/f32-dwconv/gen/up1x4-scalar-acc2.c",
144    "src/f32-dwconv/gen/up1x9-minmax-scalar-acc2.c",
145    "src/f32-dwconv/gen/up1x9-scalar-acc2.c",
146    "src/f32-dwconv/gen/up1x25-minmax-scalar-acc2.c",
147    "src/f32-dwconv/gen/up1x25-scalar-acc2.c",
148    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-4x1.c",
149    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-2x1-acc2.c",
150    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-2x1-acc2.c",
151    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-2x1-acc2.c",
152    "src/f32-f16-vcvt/gen/vcvt-scalar-fabsf-x2.c",
153    "src/f32-gavgpool-cw/scalar-x1.c",
154    "src/f32-gavgpool/7p7x-minmax-scalar-c1.c",
155    "src/f32-gavgpool/7x-minmax-scalar-c1.c",
156    "src/f32-gemm/gen/1x4-minmax-scalar.c",
157    "src/f32-gemm/gen/1x4-relu-scalar.c",
158    "src/f32-gemm/gen/1x4-scalar.c",
159    "src/f32-gemm/gen/4x2-minmax-scalar.c",
160    "src/f32-gemm/gen/4x2-scalar.c",
161    "src/f32-gemm/gen/4x4-minmax-scalar.c",
162    "src/f32-gemm/gen/4x4-relu-scalar.c",
163    "src/f32-gemm/gen/4x4-scalar.c",
164    "src/f32-ibilinear-chw/gen/scalar-p4.c",
165    "src/f32-ibilinear/gen/scalar-c2.c",
166    "src/f32-igemm/gen/1x4-minmax-scalar.c",
167    "src/f32-igemm/gen/1x4-relu-scalar.c",
168    "src/f32-igemm/gen/1x4-scalar.c",
169    "src/f32-igemm/gen/4x2-minmax-scalar.c",
170    "src/f32-igemm/gen/4x2-scalar.c",
171    "src/f32-igemm/gen/4x4-minmax-scalar.c",
172    "src/f32-igemm/gen/4x4-relu-scalar.c",
173    "src/f32-igemm/gen/4x4-scalar.c",
174    "src/f32-maxpool/9p8x-minmax-scalar-c1.c",
175    "src/f32-pavgpool/9p8x-minmax-scalar-c1.c",
176    "src/f32-pavgpool/9x-minmax-scalar-c1.c",
177    "src/f32-prelu/gen/scalar-2x4.c",
178    "src/f32-qs8-vcvt/gen/vcvt-scalar-imagic-x4.c",
179    "src/f32-qu8-vcvt/gen/vcvt-scalar-imagic-x4.c",
180    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x4-acc2.c",
181    "src/f32-rmax/scalar.c",
182    "src/f32-spmm/gen/8x1-minmax-scalar.c",
183    "src/f32-spmm/gen/8x2-minmax-scalar.c",
184    "src/f32-spmm/gen/8x4-minmax-scalar.c",
185    "src/f32-vbinary/gen/vadd-minmax-scalar-x8.c",
186    "src/f32-vbinary/gen/vaddc-minmax-scalar-x8.c",
187    "src/f32-vbinary/gen/vdiv-minmax-scalar-x2.c",
188    "src/f32-vbinary/gen/vdivc-minmax-scalar-x2.c",
189    "src/f32-vbinary/gen/vmax-scalar-x8.c",
190    "src/f32-vbinary/gen/vmaxc-scalar-x8.c",
191    "src/f32-vbinary/gen/vmin-scalar-x8.c",
192    "src/f32-vbinary/gen/vminc-scalar-x8.c",
193    "src/f32-vbinary/gen/vmul-minmax-scalar-x8.c",
194    "src/f32-vbinary/gen/vmulc-minmax-scalar-x8.c",
195    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x2.c",
196    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x8.c",
197    "src/f32-vbinary/gen/vsqrdiff-scalar-x8.c",
198    "src/f32-vbinary/gen/vsqrdiffc-scalar-x8.c",
199    "src/f32-vbinary/gen/vsub-minmax-scalar-x8.c",
200    "src/f32-vbinary/gen/vsubc-minmax-scalar-x8.c",
201    "src/f32-vclamp/gen/vclamp-scalar-x4.c",
202    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x4.c",
203    "src/f32-vhswish/gen/vhswish-scalar-x4.c",
204    "src/f32-vlrelu/gen/vlrelu-scalar-x4.c",
205    "src/f32-vmulcaddc/gen/c1-minmax-scalar-2x.c",
206    "src/f32-vrelu/gen/vrelu-scalar-x8.c",
207    "src/f32-vrnd/gen/vrndd-scalar-libm-x1.c",
208    "src/f32-vrnd/gen/vrndne-scalar-libm-x1.c",
209    "src/f32-vrnd/gen/vrndu-scalar-libm-x1.c",
210    "src/f32-vrnd/gen/vrndz-scalar-libm-x1.c",
211    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut64-p2-div-x2.c",
212    "src/f32-vsqrt/gen/scalar-sqrt-x1.c",
213    "src/f32-vunary/gen/vabs-scalar-x4.c",
214    "src/f32-vunary/gen/vneg-scalar-x4.c",
215    "src/f32-vunary/gen/vsqr-scalar-x4.c",
216    "src/qc8-dwconv/gen/up1x3-minmax-fp32-scalar-fmagic.c",
217    "src/qc8-dwconv/gen/up1x9-minmax-fp32-scalar-fmagic.c",
218    "src/qc8-dwconv/gen/up1x25-minmax-fp32-scalar-fmagic.c",
219    "src/qc8-gemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
220    "src/qc8-gemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
221    "src/qc8-igemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
222    "src/qc8-igemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
223    "src/qs8-dwconv/gen/up1x9-minmax-fp32-scalar-fmagic.c",
224    "src/qs8-dwconv/gen/up1x25-minmax-fp32-scalar-fmagic.c",
225    "src/qs8-f32-vcvt/gen/vcvt-scalar-x4.c",
226    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c1.c",
227    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c1.c",
228    "src/qs8-gemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
229    "src/qs8-gemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
230    "src/qs8-igemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
231    "src/qs8-igemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
232    "src/qs8-vadd/gen/minmax-scalar-x1.c",
233    "src/qs8-vaddc/gen/minmax-scalar-x1.c",
234    "src/qs8-vmul/gen/minmax-fp32-scalar-x4.c",
235    "src/qs8-vmulc/gen/minmax-fp32-scalar-x4.c",
236    "src/qu8-avgpool/9p8x-minmax-scalar-c1.c",
237    "src/qu8-avgpool/9x-minmax-scalar-c1.c",
238    "src/qu8-dwconv/gen/up1x9-minmax-fp32-scalar-fmagic.c",
239    "src/qu8-dwconv/gen/up1x25-minmax-fp32-scalar-fmagic.c",
240    "src/qu8-f32-vcvt/gen/vcvt-scalar-x4.c",
241    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c1.c",
242    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c1.c",
243    "src/qu8-gemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
244    "src/qu8-gemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
245    "src/qu8-igemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
246    "src/qu8-igemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
247    "src/qu8-vadd/gen/minmax-scalar-x1.c",
248    "src/qu8-vaddc/gen/minmax-scalar-x1.c",
249    "src/qu8-vmul/gen/minmax-fp32-scalar-x4.c",
250    "src/qu8-vmulc/gen/minmax-fp32-scalar-x4.c",
251    "src/s8-ibilinear/gen/scalar-c1.c",
252    "src/s8-maxpool/9p8x-minmax-scalar-c1.c",
253    "src/s8-vclamp/scalar-x4.c",
254    "src/u8-ibilinear/gen/scalar-c1.c",
255    "src/u8-maxpool/9p8x-minmax-scalar-c1.c",
256    "src/u8-rmax/scalar.c",
257    "src/u8-vclamp/scalar-x4.c",
258    "src/xx-fill/scalar-x16.c",
259    "src/xx-pad/scalar.c",
260    "src/x8-transposec/gen/2x4-scalar-int.c",
261    "src/x8-zip/xm-scalar.c",
262    "src/x8-zip/x2-scalar.c",
263    "src/x8-zip/x3-scalar.c",
264    "src/x8-zip/x4-scalar.c",
265    "src/x16-transposec/gen/2x4-scalar-int.c",
266    "src/x32-packx/x2-scalar.c",
267    "src/x32-packx/x3-scalar.c",
268    "src/x32-packx/x4-scalar.c",
269    "src/x32-transposec/gen/2x4-scalar-int.c",
270    "src/x32-unpool/scalar.c",
271    "src/x32-zip/xm-scalar.c",
272    "src/x32-zip/x2-scalar.c",
273    "src/x32-zip/x3-scalar.c",
274    "src/x32-zip/x4-scalar.c",
275]
276
// Scalar microkernel sources selected for the WASM list.
// The quantized (qc8/qs8/qu8) dwconv, gemm and igemm entries in this list are
// the "fp32-scalar-imagic" variants. For f32-gemm/f32-igemm only the 2x4
// tile has minmax and relu variants listed; the 1x4, 4x2 and 4x4 tiles are
// listed in their plain form only.
// The qs8-vcvt / qu8-vcvt entries appear at both x1 and x4, and the
// qs8-vlrelu / qu8-vlrelu entries appear in both "andxor" and "select" forms.
277PROD_SCALAR_WASM_MICROKERNEL_SRCS = [
278    "src/f16-f32-vcvt/gen/vcvt-scalar-x1.c",
279    "src/f32-argmaxpool/4x-scalar-c1.c",
280    "src/f32-argmaxpool/9p8x-scalar-c1.c",
281    "src/f32-argmaxpool/9x-scalar-c1.c",
282    "src/f32-avgpool/9p8x-minmax-scalar-c1.c",
283    "src/f32-avgpool/9x-minmax-scalar-c1.c",
284    "src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c",
285    "src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c",
286    "src/f32-conv-hwc2chw/3x3s2p1c3x4-scalar-1x1.c",
287    "src/f32-dwconv/gen/up1x3-minmax-scalar-acc2.c",
288    "src/f32-dwconv/gen/up1x3-scalar-acc2.c",
289    "src/f32-dwconv/gen/up1x4-minmax-scalar-acc2.c",
290    "src/f32-dwconv/gen/up1x4-scalar-acc2.c",
291    "src/f32-dwconv/gen/up1x9-minmax-scalar-acc2.c",
292    "src/f32-dwconv/gen/up1x9-scalar-acc2.c",
293    "src/f32-dwconv/gen/up1x25-minmax-scalar-acc2.c",
294    "src/f32-dwconv/gen/up1x25-scalar-acc2.c",
295    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-2x1-acc2.c",
296    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-1x1-acc2.c",
297    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1-acc5.c",
298    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1-acc5.c",
299    "src/f32-f16-vcvt/gen/vcvt-scalar-bitcast-x4.c",
300    "src/f32-gavgpool-cw/scalar-x1.c",
301    "src/f32-gavgpool/7p7x-minmax-scalar-c1.c",
302    "src/f32-gavgpool/7x-minmax-scalar-c1.c",
303    "src/f32-gemm/gen/1x4-scalar.c",
304    "src/f32-gemm/gen/2x4-minmax-scalar.c",
305    "src/f32-gemm/gen/2x4-relu-scalar.c",
306    "src/f32-gemm/gen/2x4-scalar.c",
307    "src/f32-gemm/gen/4x2-scalar.c",
308    "src/f32-gemm/gen/4x4-scalar.c",
309    "src/f32-ibilinear-chw/gen/scalar-p4.c",
310    "src/f32-ibilinear/gen/scalar-c2.c",
311    "src/f32-igemm/gen/1x4-scalar.c",
312    "src/f32-igemm/gen/2x4-minmax-scalar.c",
313    "src/f32-igemm/gen/2x4-relu-scalar.c",
314    "src/f32-igemm/gen/2x4-scalar.c",
315    "src/f32-igemm/gen/4x2-scalar.c",
316    "src/f32-igemm/gen/4x4-scalar.c",
317    "src/f32-maxpool/9p8x-minmax-scalar-c1.c",
318    "src/f32-pavgpool/9p8x-minmax-scalar-c1.c",
319    "src/f32-pavgpool/9x-minmax-scalar-c1.c",
320    "src/f32-prelu/gen/scalar-2x4.c",
321    "src/f32-qs8-vcvt/gen/vcvt-scalar-imagic-x1.c",
322    "src/f32-qu8-vcvt/gen/vcvt-scalar-imagic-x1.c",
323    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x4-acc2.c",
324    "src/f32-rmax/scalar.c",
325    "src/f32-spmm/gen/8x1-minmax-scalar.c",
326    "src/f32-spmm/gen/8x2-minmax-scalar.c",
327    "src/f32-spmm/gen/8x4-minmax-scalar.c",
328    "src/f32-vbinary/gen/vadd-minmax-scalar-x8.c",
329    "src/f32-vbinary/gen/vaddc-minmax-scalar-x8.c",
330    "src/f32-vbinary/gen/vdiv-minmax-scalar-x8.c",
331    "src/f32-vbinary/gen/vdivc-minmax-scalar-x8.c",
332    "src/f32-vbinary/gen/vmax-scalar-x8.c",
333    "src/f32-vbinary/gen/vmaxc-scalar-x8.c",
334    "src/f32-vbinary/gen/vmin-scalar-x8.c",
335    "src/f32-vbinary/gen/vminc-scalar-x8.c",
336    "src/f32-vbinary/gen/vmul-minmax-scalar-x8.c",
337    "src/f32-vbinary/gen/vmulc-minmax-scalar-x8.c",
338    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x8.c",
339    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x8.c",
340    "src/f32-vbinary/gen/vsqrdiff-scalar-x8.c",
341    "src/f32-vbinary/gen/vsqrdiffc-scalar-x8.c",
342    "src/f32-vbinary/gen/vsub-minmax-scalar-x8.c",
343    "src/f32-vbinary/gen/vsubc-minmax-scalar-x8.c",
344    "src/f32-vclamp/gen/vclamp-scalar-x4.c",
345    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x2.c",
346    "src/f32-vhswish/gen/vhswish-scalar-x4.c",
347    "src/f32-vlrelu/gen/vlrelu-scalar-x4.c",
348    "src/f32-vmulcaddc/gen/c1-minmax-scalar-2x.c",
349    "src/f32-vrelu/gen/vrelu-scalar-x8.c",
350    "src/f32-vrnd/gen/vrndd-scalar-libm-x4.c",
351    "src/f32-vrnd/gen/vrndne-scalar-libm-x4.c",
352    "src/f32-vrnd/gen/vrndu-scalar-libm-x4.c",
353    "src/f32-vrnd/gen/vrndz-scalar-libm-x4.c",
354    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut64-p2-div-x2.c",
355    "src/f32-vsqrt/gen/scalar-sqrt-x1.c",
356    "src/f32-vunary/gen/vabs-scalar-x4.c",
357    "src/f32-vunary/gen/vneg-scalar-x4.c",
358    "src/f32-vunary/gen/vsqr-scalar-x4.c",
359    "src/qc8-dwconv/gen/up1x25-minmax-fp32-scalar-imagic.c",
360    "src/qc8-dwconv/gen/up2x3-minmax-fp32-scalar-imagic.c",
361    "src/qc8-dwconv/gen/up2x9-minmax-fp32-scalar-imagic.c",
362    "src/qc8-gemm/gen/1x2-minmax-fp32-scalar-imagic.c",
363    "src/qc8-gemm/gen/2x2-minmax-fp32-scalar-imagic.c",
364    "src/qc8-igemm/gen/1x2-minmax-fp32-scalar-imagic.c",
365    "src/qc8-igemm/gen/2x2-minmax-fp32-scalar-imagic.c",
366    "src/qs8-dwconv/gen/up1x25-minmax-fp32-scalar-imagic.c",
367    "src/qs8-dwconv/gen/up2x9-minmax-fp32-scalar-imagic.c",
368    "src/qs8-f32-vcvt/gen/vcvt-scalar-x1.c",
369    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c4.c",
370    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c4.c",
371    "src/qs8-gemm/gen/1x2-minmax-fp32-scalar-imagic.c",
372    "src/qs8-gemm/gen/2x2-minmax-fp32-scalar-imagic.c",
373    "src/qs8-igemm/gen/1x2-minmax-fp32-scalar-imagic.c",
374    "src/qs8-igemm/gen/2x2-minmax-fp32-scalar-imagic.c",
375    "src/qs8-vadd/gen/minmax-scalar-x4.c",
376    "src/qs8-vaddc/gen/minmax-scalar-x4.c",
377    "src/qs8-vcvt/gen/vcvt-scalar-x1.c",
378    "src/qs8-vcvt/gen/vcvt-scalar-x4.c",
379    "src/qs8-vlrelu/gen/vlrelu-scalar-andxor-x4.c",
380    "src/qs8-vlrelu/gen/vlrelu-scalar-select-x4.c",
381    "src/qs8-vmul/gen/minmax-fp32-scalar-x4.c",
382    "src/qs8-vmulc/gen/minmax-fp32-scalar-x4.c",
383    "src/qu8-avgpool/9p8x-minmax-scalar-c1.c",
384    "src/qu8-avgpool/9x-minmax-scalar-c1.c",
385    "src/qu8-dwconv/gen/up1x25-minmax-fp32-scalar-imagic.c",
386    "src/qu8-dwconv/gen/up2x9-minmax-fp32-scalar-imagic.c",
387    "src/qu8-f32-vcvt/gen/vcvt-scalar-x1.c",
388    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c4.c",
389    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c4.c",
390    "src/qu8-gemm/gen/1x2-minmax-fp32-scalar-imagic.c",
391    "src/qu8-gemm/gen/2x2-minmax-fp32-scalar-imagic.c",
392    "src/qu8-igemm/gen/1x2-minmax-fp32-scalar-imagic.c",
393    "src/qu8-igemm/gen/2x2-minmax-fp32-scalar-imagic.c",
394    "src/qu8-vadd/gen/minmax-scalar-x4.c",
395    "src/qu8-vaddc/gen/minmax-scalar-x4.c",
396    "src/qu8-vcvt/gen/vcvt-scalar-x1.c",
397    "src/qu8-vcvt/gen/vcvt-scalar-x4.c",
398    "src/qu8-vlrelu/gen/vlrelu-scalar-andxor-x4.c",
399    "src/qu8-vlrelu/gen/vlrelu-scalar-select-x4.c",
400    "src/qu8-vmul/gen/minmax-fp32-scalar-x4.c",
401    "src/qu8-vmulc/gen/minmax-fp32-scalar-x4.c",
402    "src/s8-ibilinear/gen/scalar-c1.c",
403    "src/s8-maxpool/9p8x-minmax-scalar-c1.c",
404    "src/s8-vclamp/scalar-x4.c",
405    "src/u8-ibilinear/gen/scalar-c1.c",
406    "src/u8-maxpool/9p8x-minmax-scalar-c1.c",
407    "src/u8-rmax/scalar.c",
408    "src/u8-vclamp/scalar-x4.c",
409    "src/xx-fill/scalar-x16.c",
410    "src/xx-pad/scalar.c",
411    "src/x8-transposec/gen/2x4-scalar-int.c",
412    "src/x8-zip/xm-scalar.c",
413    "src/x8-zip/x2-scalar.c",
414    "src/x8-zip/x3-scalar.c",
415    "src/x8-zip/x4-scalar.c",
416    "src/x16-transposec/gen/2x4-scalar-int.c",
417    "src/x32-packx/x2-scalar.c",
418    "src/x32-packx/x3-scalar.c",
419    "src/x32-packx/x4-scalar.c",
420    "src/x32-transposec/gen/2x4-scalar-int.c",
421    "src/x32-unpool/scalar.c",
422    "src/x32-zip/xm-scalar.c",
423    "src/x32-zip/x2-scalar.c",
424    "src/x32-zip/x3-scalar.c",
425    "src/x32-zip/x4-scalar.c",
426]
427
// Scalar microkernel sources selected for the RISCV list.
// The quantized (qc8/qs8/qu8) dwconv, gemm and igemm entries in this list are
// the "fp32-scalar-lrintf" variants, with 1x4 and 3x4 gemm/igemm tiles; the
// f32-qs8-vcvt / f32-qu8-vcvt entries are likewise the "lrintf" variants.
// The qs8/qu8 gavgpool entries remain "imagic".
428PROD_SCALAR_RISCV_MICROKERNEL_SRCS = [
429    "src/f16-f32-vcvt/gen/vcvt-scalar-x4.c",
430    "src/f32-argmaxpool/4x-scalar-c1.c",
431    "src/f32-argmaxpool/9p8x-scalar-c1.c",
432    "src/f32-argmaxpool/9x-scalar-c1.c",
433    "src/f32-avgpool/9p8x-minmax-scalar-c1.c",
434    "src/f32-avgpool/9x-minmax-scalar-c1.c",
435    "src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c",
436    "src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c",
437    "src/f32-conv-hwc2chw/3x3s2p1c3x4-scalar-1x1.c",
438    "src/f32-dwconv/gen/up1x3-minmax-scalar-acc2.c",
439    "src/f32-dwconv/gen/up1x3-scalar-acc2.c",
440    "src/f32-dwconv/gen/up1x4-minmax-scalar-acc2.c",
441    "src/f32-dwconv/gen/up1x4-scalar-acc2.c",
442    "src/f32-dwconv/gen/up1x9-minmax-scalar-acc2.c",
443    "src/f32-dwconv/gen/up1x9-scalar-acc2.c",
444    "src/f32-dwconv/gen/up1x25-minmax-scalar-acc2.c",
445    "src/f32-dwconv/gen/up1x25-scalar-acc2.c",
446    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-2x1-acc2.c",
447    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-1x1-acc2.c",
448    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1-acc5.c",
449    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1-acc5.c",
450    "src/f32-f16-vcvt/gen/vcvt-scalar-fabsf-x2.c",
451    "src/f32-gavgpool-cw/scalar-x1.c",
452    "src/f32-gavgpool/7p7x-minmax-scalar-c1.c",
453    "src/f32-gavgpool/7x-minmax-scalar-c1.c",
454    "src/f32-gemm/gen/1x4-minmax-scalar.c",
455    "src/f32-gemm/gen/1x4-relu-scalar.c",
456    "src/f32-gemm/gen/1x4-scalar.c",
457    "src/f32-gemm/gen/4x2-minmax-scalar.c",
458    "src/f32-gemm/gen/4x2-scalar.c",
459    "src/f32-gemm/gen/4x4-minmax-scalar.c",
460    "src/f32-gemm/gen/4x4-relu-scalar.c",
461    "src/f32-gemm/gen/4x4-scalar.c",
462    "src/f32-ibilinear-chw/gen/scalar-p4.c",
463    "src/f32-ibilinear/gen/scalar-c2.c",
464    "src/f32-igemm/gen/1x4-minmax-scalar.c",
465    "src/f32-igemm/gen/1x4-relu-scalar.c",
466    "src/f32-igemm/gen/1x4-scalar.c",
467    "src/f32-igemm/gen/4x2-minmax-scalar.c",
468    "src/f32-igemm/gen/4x2-scalar.c",
469    "src/f32-igemm/gen/4x4-minmax-scalar.c",
470    "src/f32-igemm/gen/4x4-relu-scalar.c",
471    "src/f32-igemm/gen/4x4-scalar.c",
472    "src/f32-maxpool/9p8x-minmax-scalar-c1.c",
473    "src/f32-pavgpool/9p8x-minmax-scalar-c1.c",
474    "src/f32-pavgpool/9x-minmax-scalar-c1.c",
475    "src/f32-prelu/gen/scalar-2x4.c",
476    "src/f32-qs8-vcvt/gen/vcvt-scalar-lrintf-x4.c",
477    "src/f32-qu8-vcvt/gen/vcvt-scalar-lrintf-x4.c",
478    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x4-acc2.c",
479    "src/f32-rmax/scalar.c",
480    "src/f32-spmm/gen/8x1-minmax-scalar.c",
481    "src/f32-spmm/gen/8x2-minmax-scalar.c",
482    "src/f32-spmm/gen/8x4-minmax-scalar.c",
483    "src/f32-vbinary/gen/vadd-minmax-scalar-x8.c",
484    "src/f32-vbinary/gen/vaddc-minmax-scalar-x8.c",
485    "src/f32-vbinary/gen/vdiv-minmax-scalar-x2.c",
486    "src/f32-vbinary/gen/vdivc-minmax-scalar-x2.c",
487    "src/f32-vbinary/gen/vmax-scalar-x8.c",
488    "src/f32-vbinary/gen/vmaxc-scalar-x8.c",
489    "src/f32-vbinary/gen/vmin-scalar-x8.c",
490    "src/f32-vbinary/gen/vminc-scalar-x8.c",
491    "src/f32-vbinary/gen/vmul-minmax-scalar-x8.c",
492    "src/f32-vbinary/gen/vmulc-minmax-scalar-x8.c",
493    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x2.c",
494    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x8.c",
495    "src/f32-vbinary/gen/vsqrdiff-scalar-x8.c",
496    "src/f32-vbinary/gen/vsqrdiffc-scalar-x8.c",
497    "src/f32-vbinary/gen/vsub-minmax-scalar-x8.c",
498    "src/f32-vbinary/gen/vsubc-minmax-scalar-x8.c",
499    "src/f32-vclamp/gen/vclamp-scalar-x4.c",
500    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x4.c",
501    "src/f32-vhswish/gen/vhswish-scalar-x4.c",
502    "src/f32-vlrelu/gen/vlrelu-scalar-x4.c",
503    "src/f32-vmulcaddc/gen/c1-minmax-scalar-2x.c",
504    "src/f32-vrelu/gen/vrelu-scalar-x8.c",
505    "src/f32-vrnd/gen/vrndd-scalar-libm-x1.c",
506    "src/f32-vrnd/gen/vrndne-scalar-libm-x1.c",
507    "src/f32-vrnd/gen/vrndu-scalar-libm-x1.c",
508    "src/f32-vrnd/gen/vrndz-scalar-libm-x1.c",
509    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut64-p2-div-x2.c",
510    "src/f32-vsqrt/gen/scalar-sqrt-x1.c",
511    "src/f32-vunary/gen/vabs-scalar-x4.c",
512    "src/f32-vunary/gen/vneg-scalar-x4.c",
513    "src/f32-vunary/gen/vsqr-scalar-x4.c",
514    "src/qc8-dwconv/gen/up2x3-minmax-fp32-scalar-lrintf.c",
515    "src/qc8-dwconv/gen/up2x9-minmax-fp32-scalar-lrintf.c",
516    "src/qc8-dwconv/gen/up2x25-minmax-fp32-scalar-lrintf.c",
517    "src/qc8-gemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
518    "src/qc8-gemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
519    "src/qc8-igemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
520    "src/qc8-igemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
521    "src/qs8-dwconv/gen/up2x9-minmax-fp32-scalar-lrintf.c",
522    "src/qs8-dwconv/gen/up2x25-minmax-fp32-scalar-lrintf.c",
523    "src/qs8-f32-vcvt/gen/vcvt-scalar-x4.c",
524    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c1.c",
525    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c1.c",
526    "src/qs8-gemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
527    "src/qs8-gemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
528    "src/qs8-igemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
529    "src/qs8-igemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
530    "src/qs8-vadd/gen/minmax-scalar-x4.c",
531    "src/qs8-vaddc/gen/minmax-scalar-x4.c",
532    "src/qs8-vcvt/gen/vcvt-scalar-x4.c",
533    "src/qs8-vlrelu/gen/vlrelu-scalar-andxor-x4.c",
534    "src/qs8-vmul/gen/minmax-fp32-scalar-x4.c",
535    "src/qs8-vmulc/gen/minmax-fp32-scalar-x4.c",
536    "src/qu8-avgpool/9p8x-minmax-scalar-c1.c",
537    "src/qu8-avgpool/9x-minmax-scalar-c1.c",
538    "src/qu8-dwconv/gen/up2x9-minmax-fp32-scalar-lrintf.c",
539    "src/qu8-dwconv/gen/up2x25-minmax-fp32-scalar-lrintf.c",
540    "src/qu8-f32-vcvt/gen/vcvt-scalar-x4.c",
541    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c1.c",
542    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c1.c",
543    "src/qu8-gemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
544    "src/qu8-gemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
545    "src/qu8-igemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
546    "src/qu8-igemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
547    "src/qu8-vadd/gen/minmax-scalar-x4.c",
548    "src/qu8-vaddc/gen/minmax-scalar-x4.c",
549    "src/qu8-vcvt/gen/vcvt-scalar-x4.c",
550    "src/qu8-vlrelu/gen/vlrelu-scalar-andxor-x4.c",
551    "src/qu8-vmul/gen/minmax-fp32-scalar-x4.c",
552    "src/qu8-vmulc/gen/minmax-fp32-scalar-x4.c",
553    "src/s8-ibilinear/gen/scalar-c1.c",
554    "src/s8-maxpool/9p8x-minmax-scalar-c1.c",
555    "src/s8-vclamp/scalar-x4.c",
556    "src/u8-ibilinear/gen/scalar-c1.c",
557    "src/u8-maxpool/9p8x-minmax-scalar-c1.c",
558    "src/u8-rmax/scalar.c",
559    "src/u8-vclamp/scalar-x4.c",
560    "src/xx-fill/scalar-x16.c",
561    "src/xx-pad/scalar.c",
562    "src/x8-transposec/gen/2x4-scalar-int.c",
563    "src/x8-zip/xm-scalar.c",
564    "src/x8-zip/x2-scalar.c",
565    "src/x8-zip/x3-scalar.c",
566    "src/x8-zip/x4-scalar.c",
567    "src/x16-transposec/gen/2x4-scalar-int.c",
568    "src/x32-packx/x2-scalar.c",
569    "src/x32-packx/x3-scalar.c",
570    "src/x32-packx/x4-scalar.c",
571    "src/x32-transposec/gen/2x4-scalar-int.c",
572    "src/x32-unpool/scalar.c",
573    "src/x32-zip/xm-scalar.c",
574    "src/x32-zip/x2-scalar.c",
575    "src/x32-zip/x3-scalar.c",
576    "src/x32-zip/x4-scalar.c",
577]
578
579ALL_SCALAR_MICROKERNEL_SRCS = [
580    "src/cs16-bfly4/gen/scalar-x1.c",
581    "src/cs16-bfly4/gen/scalar-x2.c",
582    "src/cs16-bfly4/gen/scalar-x3.c",
583    "src/cs16-bfly4/gen/scalar-x4.c",
584    "src/cs16-bfly4/samples1-scalar.c",
585    "src/cs16-fftr/gen/scalar-x1.c",
586    "src/cs16-fftr/gen/scalar-x2.c",
587    "src/cs16-fftr/gen/scalar-x3.c",
588    "src/cs16-fftr/gen/scalar-x4.c",
589    "src/cs16-vsquareabs/gen/scalar-x1.c",
590    "src/cs16-vsquareabs/gen/scalar-x2.c",
591    "src/cs16-vsquareabs/gen/scalar-x3.c",
592    "src/cs16-vsquareabs/gen/scalar-x4.c",
593    "src/f16-f32-vcvt/gen/vcvt-scalar-x1.c",
594    "src/f16-f32-vcvt/gen/vcvt-scalar-x2.c",
595    "src/f16-f32-vcvt/gen/vcvt-scalar-x3.c",
596    "src/f16-f32-vcvt/gen/vcvt-scalar-x4.c",
597    "src/f32-argmaxpool/4x-scalar-c1.c",
598    "src/f32-argmaxpool/9p8x-scalar-c1.c",
599    "src/f32-argmaxpool/9x-scalar-c1.c",
600    "src/f32-avgpool/9p8x-minmax-scalar-c1.c",
601    "src/f32-avgpool/9x-minmax-scalar-c1.c",
602    "src/f32-conv-hwc/3x3s2p0p1c3x4-scalar-1x1.c",
603    "src/f32-conv-hwc/3x3s2p1c3x4-scalar-1x1.c",
604    "src/f32-conv-hwc2chw/3x3s2p1c3x4-scalar-1x1.c",
605    "src/f32-dwconv/gen/up1x3-minmax-scalar-acc2.c",
606    "src/f32-dwconv/gen/up1x3-minmax-scalar.c",
607    "src/f32-dwconv/gen/up1x3-scalar-acc2.c",
608    "src/f32-dwconv/gen/up1x3-scalar.c",
609    "src/f32-dwconv/gen/up1x4-minmax-scalar-acc2.c",
610    "src/f32-dwconv/gen/up1x4-minmax-scalar.c",
611    "src/f32-dwconv/gen/up1x4-scalar-acc2.c",
612    "src/f32-dwconv/gen/up1x4-scalar.c",
613    "src/f32-dwconv/gen/up1x9-minmax-scalar-acc2.c",
614    "src/f32-dwconv/gen/up1x9-minmax-scalar.c",
615    "src/f32-dwconv/gen/up1x9-scalar-acc2.c",
616    "src/f32-dwconv/gen/up1x9-scalar.c",
617    "src/f32-dwconv/gen/up1x25-minmax-scalar-acc2.c",
618    "src/f32-dwconv/gen/up1x25-minmax-scalar.c",
619    "src/f32-dwconv/gen/up1x25-scalar-acc2.c",
620    "src/f32-dwconv/gen/up1x25-scalar.c",
621    "src/f32-dwconv/gen/up2x3-minmax-scalar-acc2.c",
622    "src/f32-dwconv/gen/up2x3-minmax-scalar.c",
623    "src/f32-dwconv/gen/up2x3-scalar-acc2.c",
624    "src/f32-dwconv/gen/up2x3-scalar.c",
625    "src/f32-dwconv/gen/up2x4-minmax-scalar-acc2.c",
626    "src/f32-dwconv/gen/up2x4-minmax-scalar.c",
627    "src/f32-dwconv/gen/up2x4-scalar-acc2.c",
628    "src/f32-dwconv/gen/up2x4-scalar.c",
629    "src/f32-dwconv/gen/up2x9-minmax-scalar-acc2.c",
630    "src/f32-dwconv/gen/up2x9-minmax-scalar.c",
631    "src/f32-dwconv/gen/up2x9-scalar-acc2.c",
632    "src/f32-dwconv/gen/up2x9-scalar.c",
633    "src/f32-dwconv/gen/up2x25-minmax-scalar-acc2.c",
634    "src/f32-dwconv/gen/up2x25-minmax-scalar.c",
635    "src/f32-dwconv/gen/up2x25-scalar-acc2.c",
636    "src/f32-dwconv/gen/up2x25-scalar.c",
637    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1-acc2.c",
638    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1-acc3.c",
639    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1-acc4.c",
640    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-1x1.c",
641    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-2x1-acc2.c",
642    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-2x1.c",
643    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-3x1.c",
644    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-4x1.c",
645    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-5x1.c",
646    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-scalar-6x1.c",
647    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-1x1-acc2.c",
648    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-1x1-acc3.c",
649    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-1x1-acc4.c",
650    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-1x1.c",
651    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-2x1-acc2.c",
652    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-2x1.c",
653    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-3x1.c",
654    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-scalar-4x1.c",
655    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1-acc2.c",
656    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1-acc3.c",
657    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1-acc4.c",
658    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1-acc5.c",
659    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-1x1.c",
660    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-2x1-acc2.c",
661    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-2x1-acc3.c",
662    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-2x1.c",
663    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-3x1-acc2.c",
664    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-scalar-3x1.c",
665    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1-acc2.c",
666    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1-acc3.c",
667    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1-acc4.c",
668    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1-acc5.c",
669    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-1x1.c",
670    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-2x1-acc2.c",
671    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-2x1-acc3.c",
672    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-2x1.c",
673    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-3x1-acc2.c",
674    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-scalar-3x1.c",
675    "src/f32-f16-vcvt/gen/vcvt-scalar-bitcast-x1.c",
676    "src/f32-f16-vcvt/gen/vcvt-scalar-bitcast-x2.c",
677    "src/f32-f16-vcvt/gen/vcvt-scalar-bitcast-x3.c",
678    "src/f32-f16-vcvt/gen/vcvt-scalar-bitcast-x4.c",
679    "src/f32-f16-vcvt/gen/vcvt-scalar-fabsf-x1.c",
680    "src/f32-f16-vcvt/gen/vcvt-scalar-fabsf-x2.c",
681    "src/f32-f16-vcvt/gen/vcvt-scalar-fabsf-x3.c",
682    "src/f32-f16-vcvt/gen/vcvt-scalar-fabsf-x4.c",
683    "src/f32-gavgpool-cw/scalar-x1.c",
684    "src/f32-gavgpool/7p7x-minmax-scalar-c1.c",
685    "src/f32-gavgpool/7x-minmax-scalar-c1.c",
686    "src/f32-gemm/gen-inc/1x4inc-minmax-scalar.c",
687    "src/f32-gemm/gen-inc/2x4inc-minmax-scalar.c",
688    "src/f32-gemm/gen-inc/4x4inc-minmax-scalar.c",
689    "src/f32-gemm/gen/1x4-minmax-scalar.c",
690    "src/f32-gemm/gen/1x4-relu-scalar.c",
691    "src/f32-gemm/gen/1x4-scalar.c",
692    "src/f32-gemm/gen/2x4-minmax-scalar.c",
693    "src/f32-gemm/gen/2x4-relu-scalar.c",
694    "src/f32-gemm/gen/2x4-scalar.c",
695    "src/f32-gemm/gen/4x2-minmax-scalar.c",
696    "src/f32-gemm/gen/4x2-relu-scalar.c",
697    "src/f32-gemm/gen/4x2-scalar.c",
698    "src/f32-gemm/gen/4x4-minmax-scalar.c",
699    "src/f32-gemm/gen/4x4-relu-scalar.c",
700    "src/f32-gemm/gen/4x4-scalar.c",
701    "src/f32-ibilinear-chw/gen/scalar-p1.c",
702    "src/f32-ibilinear-chw/gen/scalar-p2.c",
703    "src/f32-ibilinear-chw/gen/scalar-p4.c",
704    "src/f32-ibilinear/gen/scalar-c1.c",
705    "src/f32-ibilinear/gen/scalar-c2.c",
706    "src/f32-ibilinear/gen/scalar-c4.c",
707    "src/f32-igemm/gen/1x4-minmax-scalar.c",
708    "src/f32-igemm/gen/1x4-relu-scalar.c",
709    "src/f32-igemm/gen/1x4-scalar.c",
710    "src/f32-igemm/gen/2x4-minmax-scalar.c",
711    "src/f32-igemm/gen/2x4-relu-scalar.c",
712    "src/f32-igemm/gen/2x4-scalar.c",
713    "src/f32-igemm/gen/4x2-minmax-scalar.c",
714    "src/f32-igemm/gen/4x2-relu-scalar.c",
715    "src/f32-igemm/gen/4x2-scalar.c",
716    "src/f32-igemm/gen/4x4-minmax-scalar.c",
717    "src/f32-igemm/gen/4x4-relu-scalar.c",
718    "src/f32-igemm/gen/4x4-scalar.c",
719    "src/f32-maxpool/9p8x-minmax-scalar-c1.c",
720    "src/f32-pavgpool/9p8x-minmax-scalar-c1.c",
721    "src/f32-pavgpool/9x-minmax-scalar-c1.c",
722    "src/f32-ppmm/gen/2x4-minmax-scalar.c",
723    "src/f32-ppmm/gen/3x3-minmax-scalar.c",
724    "src/f32-ppmm/gen/4x2-minmax-scalar.c",
725    "src/f32-ppmm/gen/4x4-minmax-scalar.c",
726    "src/f32-prelu/gen/scalar-2x1.c",
727    "src/f32-prelu/gen/scalar-2x4.c",
728    "src/f32-qs8-vcvt/gen/vcvt-scalar-fmagic-x1.c",
729    "src/f32-qs8-vcvt/gen/vcvt-scalar-fmagic-x2.c",
730    "src/f32-qs8-vcvt/gen/vcvt-scalar-fmagic-x3.c",
731    "src/f32-qs8-vcvt/gen/vcvt-scalar-fmagic-x4.c",
732    "src/f32-qs8-vcvt/gen/vcvt-scalar-imagic-x1.c",
733    "src/f32-qs8-vcvt/gen/vcvt-scalar-imagic-x2.c",
734    "src/f32-qs8-vcvt/gen/vcvt-scalar-imagic-x3.c",
735    "src/f32-qs8-vcvt/gen/vcvt-scalar-imagic-x4.c",
736    "src/f32-qs8-vcvt/gen/vcvt-scalar-lrintf-x1.c",
737    "src/f32-qs8-vcvt/gen/vcvt-scalar-lrintf-x2.c",
738    "src/f32-qs8-vcvt/gen/vcvt-scalar-lrintf-x3.c",
739    "src/f32-qs8-vcvt/gen/vcvt-scalar-lrintf-x4.c",
740    "src/f32-qu8-vcvt/gen/vcvt-scalar-fmagic-x1.c",
741    "src/f32-qu8-vcvt/gen/vcvt-scalar-fmagic-x2.c",
742    "src/f32-qu8-vcvt/gen/vcvt-scalar-fmagic-x3.c",
743    "src/f32-qu8-vcvt/gen/vcvt-scalar-fmagic-x4.c",
744    "src/f32-qu8-vcvt/gen/vcvt-scalar-imagic-x1.c",
745    "src/f32-qu8-vcvt/gen/vcvt-scalar-imagic-x2.c",
746    "src/f32-qu8-vcvt/gen/vcvt-scalar-imagic-x3.c",
747    "src/f32-qu8-vcvt/gen/vcvt-scalar-imagic-x4.c",
748    "src/f32-qu8-vcvt/gen/vcvt-scalar-lrintf-x1.c",
749    "src/f32-qu8-vcvt/gen/vcvt-scalar-lrintf-x2.c",
750    "src/f32-qu8-vcvt/gen/vcvt-scalar-lrintf-x3.c",
751    "src/f32-qu8-vcvt/gen/vcvt-scalar-lrintf-x4.c",
752    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-lut64-p2-x1.c",
753    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-lut64-p2-x2-acc2.c",
754    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-lut64-p2-x2.c",
755    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-lut64-p2-x4-acc2.c",
756    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-lut64-p2-x4-acc4.c",
757    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-lut64-p2-x4.c",
758    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x1.c",
759    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x2-acc2.c",
760    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x2.c",
761    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x4-acc2.c",
762    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x4-acc4.c",
763    "src/f32-raddstoreexpminusmax/gen/scalar-rr2-p5-x4.c",
764    "src/f32-rmax/scalar.c",
765    "src/f32-spmm/gen/1x1-minmax-scalar-pipelined.c",
766    "src/f32-spmm/gen/1x1-minmax-scalar.c",
767    "src/f32-spmm/gen/2x1-minmax-scalar-pipelined.c",
768    "src/f32-spmm/gen/2x1-minmax-scalar.c",
769    "src/f32-spmm/gen/4x1-minmax-scalar-pipelined.c",
770    "src/f32-spmm/gen/4x1-minmax-scalar.c",
771    "src/f32-spmm/gen/8x1-minmax-scalar-pipelined.c",
772    "src/f32-spmm/gen/8x1-minmax-scalar.c",
773    "src/f32-spmm/gen/8x2-minmax-scalar.c",
774    "src/f32-spmm/gen/8x4-minmax-scalar.c",
775    "src/f32-vbinary/gen/vadd-minmax-scalar-x1.c",
776    "src/f32-vbinary/gen/vadd-minmax-scalar-x2.c",
777    "src/f32-vbinary/gen/vadd-minmax-scalar-x4.c",
778    "src/f32-vbinary/gen/vadd-minmax-scalar-x8.c",
779    "src/f32-vbinary/gen/vadd-relu-scalar-x1.c",
780    "src/f32-vbinary/gen/vadd-relu-scalar-x2.c",
781    "src/f32-vbinary/gen/vadd-relu-scalar-x4.c",
782    "src/f32-vbinary/gen/vadd-relu-scalar-x8.c",
783    "src/f32-vbinary/gen/vadd-scalar-x1.c",
784    "src/f32-vbinary/gen/vadd-scalar-x2.c",
785    "src/f32-vbinary/gen/vadd-scalar-x4.c",
786    "src/f32-vbinary/gen/vadd-scalar-x8.c",
787    "src/f32-vbinary/gen/vaddc-minmax-scalar-x1.c",
788    "src/f32-vbinary/gen/vaddc-minmax-scalar-x2.c",
789    "src/f32-vbinary/gen/vaddc-minmax-scalar-x4.c",
790    "src/f32-vbinary/gen/vaddc-minmax-scalar-x8.c",
791    "src/f32-vbinary/gen/vaddc-relu-scalar-x1.c",
792    "src/f32-vbinary/gen/vaddc-relu-scalar-x2.c",
793    "src/f32-vbinary/gen/vaddc-relu-scalar-x4.c",
794    "src/f32-vbinary/gen/vaddc-relu-scalar-x8.c",
795    "src/f32-vbinary/gen/vaddc-scalar-x1.c",
796    "src/f32-vbinary/gen/vaddc-scalar-x2.c",
797    "src/f32-vbinary/gen/vaddc-scalar-x4.c",
798    "src/f32-vbinary/gen/vaddc-scalar-x8.c",
799    "src/f32-vbinary/gen/vdiv-minmax-scalar-x1.c",
800    "src/f32-vbinary/gen/vdiv-minmax-scalar-x2.c",
801    "src/f32-vbinary/gen/vdiv-minmax-scalar-x4.c",
802    "src/f32-vbinary/gen/vdiv-minmax-scalar-x8.c",
803    "src/f32-vbinary/gen/vdiv-relu-scalar-x1.c",
804    "src/f32-vbinary/gen/vdiv-relu-scalar-x2.c",
805    "src/f32-vbinary/gen/vdiv-relu-scalar-x4.c",
806    "src/f32-vbinary/gen/vdiv-relu-scalar-x8.c",
807    "src/f32-vbinary/gen/vdiv-scalar-x1.c",
808    "src/f32-vbinary/gen/vdiv-scalar-x2.c",
809    "src/f32-vbinary/gen/vdiv-scalar-x4.c",
810    "src/f32-vbinary/gen/vdiv-scalar-x8.c",
811    "src/f32-vbinary/gen/vdivc-minmax-scalar-x1.c",
812    "src/f32-vbinary/gen/vdivc-minmax-scalar-x2.c",
813    "src/f32-vbinary/gen/vdivc-minmax-scalar-x4.c",
814    "src/f32-vbinary/gen/vdivc-minmax-scalar-x8.c",
815    "src/f32-vbinary/gen/vdivc-relu-scalar-x1.c",
816    "src/f32-vbinary/gen/vdivc-relu-scalar-x2.c",
817    "src/f32-vbinary/gen/vdivc-relu-scalar-x4.c",
818    "src/f32-vbinary/gen/vdivc-relu-scalar-x8.c",
819    "src/f32-vbinary/gen/vdivc-scalar-x1.c",
820    "src/f32-vbinary/gen/vdivc-scalar-x2.c",
821    "src/f32-vbinary/gen/vdivc-scalar-x4.c",
822    "src/f32-vbinary/gen/vdivc-scalar-x8.c",
823    "src/f32-vbinary/gen/vmax-scalar-x1.c",
824    "src/f32-vbinary/gen/vmax-scalar-x2.c",
825    "src/f32-vbinary/gen/vmax-scalar-x4.c",
826    "src/f32-vbinary/gen/vmax-scalar-x8.c",
827    "src/f32-vbinary/gen/vmaxc-scalar-x1.c",
828    "src/f32-vbinary/gen/vmaxc-scalar-x2.c",
829    "src/f32-vbinary/gen/vmaxc-scalar-x4.c",
830    "src/f32-vbinary/gen/vmaxc-scalar-x8.c",
831    "src/f32-vbinary/gen/vmin-scalar-x1.c",
832    "src/f32-vbinary/gen/vmin-scalar-x2.c",
833    "src/f32-vbinary/gen/vmin-scalar-x4.c",
834    "src/f32-vbinary/gen/vmin-scalar-x8.c",
835    "src/f32-vbinary/gen/vminc-scalar-x1.c",
836    "src/f32-vbinary/gen/vminc-scalar-x2.c",
837    "src/f32-vbinary/gen/vminc-scalar-x4.c",
838    "src/f32-vbinary/gen/vminc-scalar-x8.c",
839    "src/f32-vbinary/gen/vmul-minmax-scalar-x1.c",
840    "src/f32-vbinary/gen/vmul-minmax-scalar-x2.c",
841    "src/f32-vbinary/gen/vmul-minmax-scalar-x4.c",
842    "src/f32-vbinary/gen/vmul-minmax-scalar-x8.c",
843    "src/f32-vbinary/gen/vmul-relu-scalar-x1.c",
844    "src/f32-vbinary/gen/vmul-relu-scalar-x2.c",
845    "src/f32-vbinary/gen/vmul-relu-scalar-x4.c",
846    "src/f32-vbinary/gen/vmul-relu-scalar-x8.c",
847    "src/f32-vbinary/gen/vmul-scalar-x1.c",
848    "src/f32-vbinary/gen/vmul-scalar-x2.c",
849    "src/f32-vbinary/gen/vmul-scalar-x4.c",
850    "src/f32-vbinary/gen/vmul-scalar-x8.c",
851    "src/f32-vbinary/gen/vmulc-minmax-scalar-x1.c",
852    "src/f32-vbinary/gen/vmulc-minmax-scalar-x2.c",
853    "src/f32-vbinary/gen/vmulc-minmax-scalar-x4.c",
854    "src/f32-vbinary/gen/vmulc-minmax-scalar-x8.c",
855    "src/f32-vbinary/gen/vmulc-relu-scalar-x1.c",
856    "src/f32-vbinary/gen/vmulc-relu-scalar-x2.c",
857    "src/f32-vbinary/gen/vmulc-relu-scalar-x4.c",
858    "src/f32-vbinary/gen/vmulc-relu-scalar-x8.c",
859    "src/f32-vbinary/gen/vmulc-scalar-x1.c",
860    "src/f32-vbinary/gen/vmulc-scalar-x2.c",
861    "src/f32-vbinary/gen/vmulc-scalar-x4.c",
862    "src/f32-vbinary/gen/vmulc-scalar-x8.c",
863    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x1.c",
864    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x2.c",
865    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x4.c",
866    "src/f32-vbinary/gen/vrdivc-minmax-scalar-x8.c",
867    "src/f32-vbinary/gen/vrdivc-relu-scalar-x1.c",
868    "src/f32-vbinary/gen/vrdivc-relu-scalar-x2.c",
869    "src/f32-vbinary/gen/vrdivc-relu-scalar-x4.c",
870    "src/f32-vbinary/gen/vrdivc-relu-scalar-x8.c",
871    "src/f32-vbinary/gen/vrdivc-scalar-x1.c",
872    "src/f32-vbinary/gen/vrdivc-scalar-x2.c",
873    "src/f32-vbinary/gen/vrdivc-scalar-x4.c",
874    "src/f32-vbinary/gen/vrdivc-scalar-x8.c",
875    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x1.c",
876    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x2.c",
877    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x4.c",
878    "src/f32-vbinary/gen/vrsubc-minmax-scalar-x8.c",
879    "src/f32-vbinary/gen/vrsubc-relu-scalar-x1.c",
880    "src/f32-vbinary/gen/vrsubc-relu-scalar-x2.c",
881    "src/f32-vbinary/gen/vrsubc-relu-scalar-x4.c",
882    "src/f32-vbinary/gen/vrsubc-relu-scalar-x8.c",
883    "src/f32-vbinary/gen/vrsubc-scalar-x1.c",
884    "src/f32-vbinary/gen/vrsubc-scalar-x2.c",
885    "src/f32-vbinary/gen/vrsubc-scalar-x4.c",
886    "src/f32-vbinary/gen/vrsubc-scalar-x8.c",
887    "src/f32-vbinary/gen/vsqrdiff-scalar-x1.c",
888    "src/f32-vbinary/gen/vsqrdiff-scalar-x2.c",
889    "src/f32-vbinary/gen/vsqrdiff-scalar-x4.c",
890    "src/f32-vbinary/gen/vsqrdiff-scalar-x8.c",
891    "src/f32-vbinary/gen/vsqrdiffc-scalar-x1.c",
892    "src/f32-vbinary/gen/vsqrdiffc-scalar-x2.c",
893    "src/f32-vbinary/gen/vsqrdiffc-scalar-x4.c",
894    "src/f32-vbinary/gen/vsqrdiffc-scalar-x8.c",
895    "src/f32-vbinary/gen/vsub-minmax-scalar-x1.c",
896    "src/f32-vbinary/gen/vsub-minmax-scalar-x2.c",
897    "src/f32-vbinary/gen/vsub-minmax-scalar-x4.c",
898    "src/f32-vbinary/gen/vsub-minmax-scalar-x8.c",
899    "src/f32-vbinary/gen/vsub-relu-scalar-x1.c",
900    "src/f32-vbinary/gen/vsub-relu-scalar-x2.c",
901    "src/f32-vbinary/gen/vsub-relu-scalar-x4.c",
902    "src/f32-vbinary/gen/vsub-relu-scalar-x8.c",
903    "src/f32-vbinary/gen/vsub-scalar-x1.c",
904    "src/f32-vbinary/gen/vsub-scalar-x2.c",
905    "src/f32-vbinary/gen/vsub-scalar-x4.c",
906    "src/f32-vbinary/gen/vsub-scalar-x8.c",
907    "src/f32-vbinary/gen/vsubc-minmax-scalar-x1.c",
908    "src/f32-vbinary/gen/vsubc-minmax-scalar-x2.c",
909    "src/f32-vbinary/gen/vsubc-minmax-scalar-x4.c",
910    "src/f32-vbinary/gen/vsubc-minmax-scalar-x8.c",
911    "src/f32-vbinary/gen/vsubc-relu-scalar-x1.c",
912    "src/f32-vbinary/gen/vsubc-relu-scalar-x2.c",
913    "src/f32-vbinary/gen/vsubc-relu-scalar-x4.c",
914    "src/f32-vbinary/gen/vsubc-relu-scalar-x8.c",
915    "src/f32-vbinary/gen/vsubc-scalar-x1.c",
916    "src/f32-vbinary/gen/vsubc-scalar-x2.c",
917    "src/f32-vbinary/gen/vsubc-scalar-x4.c",
918    "src/f32-vbinary/gen/vsubc-scalar-x8.c",
919    "src/f32-vclamp/gen/vclamp-scalar-x1.c",
920    "src/f32-vclamp/gen/vclamp-scalar-x2.c",
921    "src/f32-vclamp/gen/vclamp-scalar-x4.c",
922    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x1.c",
923    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x2.c",
924    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x3.c",
925    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x4.c",
926    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x5.c",
927    "src/f32-velu/gen/velu-scalar-rr2-lut16-p3-x6.c",
928    "src/f32-velu/gen/velu-scalar-rr2-p6-x1.c",
929    "src/f32-velu/gen/velu-scalar-rr2-p6-x2.c",
930    "src/f32-velu/gen/velu-scalar-rr2-p6-x3.c",
931    "src/f32-velu/gen/velu-scalar-rr2-p6-x4.c",
932    "src/f32-velu/gen/velu-scalar-rr2-p6-x5.c",
933    "src/f32-velu/gen/velu-scalar-rr2-p6-x6.c",
934    "src/f32-vhswish/gen/vhswish-scalar-x1.c",
935    "src/f32-vhswish/gen/vhswish-scalar-x2.c",
936    "src/f32-vhswish/gen/vhswish-scalar-x4.c",
937    "src/f32-vlrelu/gen/vlrelu-scalar-x1.c",
938    "src/f32-vlrelu/gen/vlrelu-scalar-x2.c",
939    "src/f32-vlrelu/gen/vlrelu-scalar-x4.c",
940    "src/f32-vmulcaddc/gen/c1-minmax-scalar-2x.c",
941    "src/f32-vmulcaddc/gen/c2-minmax-scalar-2x.c",
942    "src/f32-vmulcaddc/gen/c4-minmax-scalar-2x.c",
943    "src/f32-vrelu/gen/vrelu-scalar-x1.c",
944    "src/f32-vrelu/gen/vrelu-scalar-x2.c",
945    "src/f32-vrelu/gen/vrelu-scalar-x4.c",
946    "src/f32-vrelu/gen/vrelu-scalar-x8.c",
947    "src/f32-vrnd/gen/vrndd-scalar-libm-x1.c",
948    "src/f32-vrnd/gen/vrndd-scalar-libm-x2.c",
949    "src/f32-vrnd/gen/vrndd-scalar-libm-x4.c",
950    "src/f32-vrnd/gen/vrndne-scalar-libm-x1.c",
951    "src/f32-vrnd/gen/vrndne-scalar-libm-x2.c",
952    "src/f32-vrnd/gen/vrndne-scalar-libm-x4.c",
953    "src/f32-vrnd/gen/vrndu-scalar-libm-x1.c",
954    "src/f32-vrnd/gen/vrndu-scalar-libm-x2.c",
955    "src/f32-vrnd/gen/vrndu-scalar-libm-x4.c",
956    "src/f32-vrnd/gen/vrndz-scalar-libm-x1.c",
957    "src/f32-vrnd/gen/vrndz-scalar-libm-x2.c",
958    "src/f32-vrnd/gen/vrndz-scalar-libm-x4.c",
959    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut64-p2-div-x1.c",
960    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut64-p2-div-x2.c",
961    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut64-p2-div-x4.c",
962    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut2048-p1-div-x1.c",
963    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut2048-p1-div-x2.c",
964    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-lut2048-p1-div-x4.c",
965    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-p5-div-x1.c",
966    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-p5-div-x2.c",
967    "src/f32-vsigmoid/gen/vsigmoid-scalar-rr2-p5-div-x4.c",
968    "src/f32-vsqrt/gen/scalar-sqrt-x1.c",
969    "src/f32-vsqrt/gen/scalar-sqrt-x2.c",
970    "src/f32-vsqrt/gen/scalar-sqrt-x4.c",
971    "src/f32-vunary/gen/vabs-scalar-x1.c",
972    "src/f32-vunary/gen/vabs-scalar-x2.c",
973    "src/f32-vunary/gen/vabs-scalar-x4.c",
974    "src/f32-vunary/gen/vneg-scalar-x1.c",
975    "src/f32-vunary/gen/vneg-scalar-x2.c",
976    "src/f32-vunary/gen/vneg-scalar-x4.c",
977    "src/f32-vunary/gen/vsqr-scalar-x1.c",
978    "src/f32-vunary/gen/vsqr-scalar-x2.c",
979    "src/f32-vunary/gen/vsqr-scalar-x4.c",
980    "src/math/cvt-f32-f16-scalar-bitcast.c",
981    "src/math/cvt-f32-f16-scalar-fabsf.c",
982    "src/math/expminus-f32-scalar-rr2-lut64-p2.c",
983    "src/math/expminus-f32-scalar-rr2-lut2048-p1.c",
984    "src/math/expminus-f32-scalar-rr2-p5.c",
985    "src/math/expm1minus-f32-scalar-rr2-lut4-p4.c",
986    "src/math/expm1minus-f32-scalar-rr2-lut8-p3.c",
987    "src/math/expm1minus-f32-scalar-rr2-lut8-p4.c",
988    "src/math/expm1minus-f32-scalar-rr2-lut16-p3.c",
989    "src/math/expm1minus-f32-scalar-rr2-lut16-p4.c",
990    "src/math/expm1minus-f32-scalar-rr2-p5.c",
991    "src/math/expm1minus-f32-scalar-rr2-p6.c",
992    "src/math/roundd-scalar-addsub.c",
993    "src/math/roundd-scalar-cvt.c",
994    "src/math/roundd-scalar-floor.c",
995    "src/math/roundne-scalar-addsub.c",
996    "src/math/roundne-scalar-nearbyint.c",
997    "src/math/roundne-scalar-rint.c",
998    "src/math/roundu-scalar-addsub.c",
999    "src/math/roundu-scalar-ceil.c",
1000    "src/math/roundu-scalar-cvt.c",
1001    "src/math/roundz-scalar-addsub.c",
1002    "src/math/roundz-scalar-cvt.c",
1003    "src/math/roundz-scalar-trunc.c",
1004    "src/math/sigmoid-f32-scalar-rr2-lut64-p2-div.c",
1005    "src/math/sigmoid-f32-scalar-rr2-lut2048-p1-div.c",
1006    "src/math/sigmoid-f32-scalar-rr2-p5-div.c",
1007    "src/math/sqrt-u32-scalar-bitmanip.c",
1008    "src/math/sqrt-u32-scalar-clz-binsearch.c",
1009    "src/math/sqrt-u32-scalar-clz-newton.c",
1010    "src/math/sqrt-u32-scalar-cvti32-sqrt-lrint.c",
1011    "src/math/sqrt-u32-scalar-cvti64-sqrt-lrint.c",
1012    "src/math/sqrt-u32-scalar-cvti64-sqrtf-lrintf.c",
1013    "src/math/sqrt-u32-scalar-cvtu32-sqrt-lrint.c",
1014    "src/math/sqrt-u32-scalar-cvtu32-sqrtf-lrintf.c",
1015    "src/math/sqrt-u32-scalar-hashemian.c",
1016    "src/math/sqrt-u32-scalar-tflm.c",
1017    "src/math/sqrt-u64-scalar-cvtu32-sqrt-cvtsatu32f64.c",
1018    "src/math/sqrt-u64-scalar-cvtu32-sqrt-llrint.c",
1019    "src/math/sqrt-u64-scalar-cvtu64-sqrt-llrint.c",
1020    "src/qc8-dwconv/gen/up1x3-minmax-fp32-scalar-fmagic.c",
1021    "src/qc8-dwconv/gen/up1x9-minmax-fp32-scalar-fmagic.c",
1022    "src/qc8-dwconv/gen/up1x9-minmax-fp32-scalar-imagic.c",
1023    "src/qc8-dwconv/gen/up1x9-minmax-fp32-scalar-lrintf.c",
1024    "src/qc8-dwconv/gen/up1x25-minmax-fp32-scalar-fmagic.c",
1025    "src/qc8-dwconv/gen/up1x25-minmax-fp32-scalar-imagic.c",
1026    "src/qc8-dwconv/gen/up1x25-minmax-fp32-scalar-lrintf.c",
1027    "src/qc8-dwconv/gen/up2x3-minmax-fp32-scalar-imagic.c",
1028    "src/qc8-dwconv/gen/up2x3-minmax-fp32-scalar-lrintf.c",
1029    "src/qc8-dwconv/gen/up2x9-minmax-fp32-scalar-fmagic.c",
1030    "src/qc8-dwconv/gen/up2x9-minmax-fp32-scalar-imagic.c",
1031    "src/qc8-dwconv/gen/up2x9-minmax-fp32-scalar-lrintf.c",
1032    "src/qc8-dwconv/gen/up2x25-minmax-fp32-scalar-fmagic.c",
1033    "src/qc8-dwconv/gen/up2x25-minmax-fp32-scalar-imagic.c",
1034    "src/qc8-dwconv/gen/up2x25-minmax-fp32-scalar-lrintf.c",
1035    "src/qc8-dwconv/gen/up4x9-minmax-fp32-scalar-fmagic.c",
1036    "src/qc8-dwconv/gen/up4x9-minmax-fp32-scalar-imagic.c",
1037    "src/qc8-dwconv/gen/up4x9-minmax-fp32-scalar-lrintf.c",
1038    "src/qc8-dwconv/gen/up4x25-minmax-fp32-scalar-fmagic.c",
1039    "src/qc8-dwconv/gen/up4x25-minmax-fp32-scalar-imagic.c",
1040    "src/qc8-dwconv/gen/up4x25-minmax-fp32-scalar-lrintf.c",
1041    "src/qc8-gemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
1042    "src/qc8-gemm/gen/1x2-minmax-fp32-scalar-imagic.c",
1043    "src/qc8-gemm/gen/1x2-minmax-fp32-scalar-lrintf.c",
1044    "src/qc8-gemm/gen/1x4-minmax-fp32-scalar-fmagic.c",
1045    "src/qc8-gemm/gen/1x4-minmax-fp32-scalar-imagic.c",
1046    "src/qc8-gemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
1047    "src/qc8-gemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
1048    "src/qc8-gemm/gen/2x2-minmax-fp32-scalar-imagic.c",
1049    "src/qc8-gemm/gen/2x2-minmax-fp32-scalar-lrintf.c",
1050    "src/qc8-gemm/gen/2x4-minmax-fp32-scalar-fmagic.c",
1051    "src/qc8-gemm/gen/2x4-minmax-fp32-scalar-imagic.c",
1052    "src/qc8-gemm/gen/2x4-minmax-fp32-scalar-lrintf.c",
1053    "src/qc8-gemm/gen/3x2-minmax-fp32-scalar-fmagic.c",
1054    "src/qc8-gemm/gen/3x2-minmax-fp32-scalar-imagic.c",
1055    "src/qc8-gemm/gen/3x2-minmax-fp32-scalar-lrintf.c",
1056    "src/qc8-gemm/gen/3x4-minmax-fp32-scalar-fmagic.c",
1057    "src/qc8-gemm/gen/3x4-minmax-fp32-scalar-imagic.c",
1058    "src/qc8-gemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
1059    "src/qc8-gemm/gen/4x2-minmax-fp32-scalar-fmagic.c",
1060    "src/qc8-gemm/gen/4x2-minmax-fp32-scalar-imagic.c",
1061    "src/qc8-gemm/gen/4x2-minmax-fp32-scalar-lrintf.c",
1062    "src/qc8-gemm/gen/4x4-minmax-fp32-scalar-fmagic.c",
1063    "src/qc8-gemm/gen/4x4-minmax-fp32-scalar-imagic.c",
1064    "src/qc8-gemm/gen/4x4-minmax-fp32-scalar-lrintf.c",
1065    "src/qc8-igemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
1066    "src/qc8-igemm/gen/1x2-minmax-fp32-scalar-imagic.c",
1067    "src/qc8-igemm/gen/1x2-minmax-fp32-scalar-lrintf.c",
1068    "src/qc8-igemm/gen/1x4-minmax-fp32-scalar-fmagic.c",
1069    "src/qc8-igemm/gen/1x4-minmax-fp32-scalar-imagic.c",
1070    "src/qc8-igemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
1071    "src/qc8-igemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
1072    "src/qc8-igemm/gen/2x2-minmax-fp32-scalar-imagic.c",
1073    "src/qc8-igemm/gen/2x2-minmax-fp32-scalar-lrintf.c",
1074    "src/qc8-igemm/gen/2x4-minmax-fp32-scalar-fmagic.c",
1075    "src/qc8-igemm/gen/2x4-minmax-fp32-scalar-imagic.c",
1076    "src/qc8-igemm/gen/2x4-minmax-fp32-scalar-lrintf.c",
1077    "src/qc8-igemm/gen/3x2-minmax-fp32-scalar-fmagic.c",
1078    "src/qc8-igemm/gen/3x2-minmax-fp32-scalar-imagic.c",
1079    "src/qc8-igemm/gen/3x2-minmax-fp32-scalar-lrintf.c",
1080    "src/qc8-igemm/gen/3x4-minmax-fp32-scalar-fmagic.c",
1081    "src/qc8-igemm/gen/3x4-minmax-fp32-scalar-imagic.c",
1082    "src/qc8-igemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
1083    "src/qc8-igemm/gen/4x2-minmax-fp32-scalar-fmagic.c",
1084    "src/qc8-igemm/gen/4x2-minmax-fp32-scalar-imagic.c",
1085    "src/qc8-igemm/gen/4x2-minmax-fp32-scalar-lrintf.c",
1086    "src/qc8-igemm/gen/4x4-minmax-fp32-scalar-fmagic.c",
1087    "src/qc8-igemm/gen/4x4-minmax-fp32-scalar-imagic.c",
1088    "src/qc8-igemm/gen/4x4-minmax-fp32-scalar-lrintf.c",
1089    "src/qs8-dwconv/gen/up1x9-minmax-fp32-scalar-fmagic.c",
1090    "src/qs8-dwconv/gen/up1x9-minmax-fp32-scalar-imagic.c",
1091    "src/qs8-dwconv/gen/up1x9-minmax-fp32-scalar-lrintf.c",
1092    "src/qs8-dwconv/gen/up1x25-minmax-fp32-scalar-fmagic.c",
1093    "src/qs8-dwconv/gen/up1x25-minmax-fp32-scalar-imagic.c",
1094    "src/qs8-dwconv/gen/up1x25-minmax-fp32-scalar-lrintf.c",
1095    "src/qs8-dwconv/gen/up2x9-minmax-fp32-scalar-fmagic.c",
1096    "src/qs8-dwconv/gen/up2x9-minmax-fp32-scalar-imagic.c",
1097    "src/qs8-dwconv/gen/up2x9-minmax-fp32-scalar-lrintf.c",
1098    "src/qs8-dwconv/gen/up2x25-minmax-fp32-scalar-fmagic.c",
1099    "src/qs8-dwconv/gen/up2x25-minmax-fp32-scalar-imagic.c",
1100    "src/qs8-dwconv/gen/up2x25-minmax-fp32-scalar-lrintf.c",
1101    "src/qs8-dwconv/gen/up4x9-minmax-fp32-scalar-fmagic.c",
1102    "src/qs8-dwconv/gen/up4x9-minmax-fp32-scalar-imagic.c",
1103    "src/qs8-dwconv/gen/up4x9-minmax-fp32-scalar-lrintf.c",
1104    "src/qs8-dwconv/gen/up4x25-minmax-fp32-scalar-fmagic.c",
1105    "src/qs8-dwconv/gen/up4x25-minmax-fp32-scalar-imagic.c",
1106    "src/qs8-dwconv/gen/up4x25-minmax-fp32-scalar-lrintf.c",
1107    "src/qs8-f32-vcvt/gen/vcvt-scalar-x1.c",
1108    "src/qs8-f32-vcvt/gen/vcvt-scalar-x2.c",
1109    "src/qs8-f32-vcvt/gen/vcvt-scalar-x3.c",
1110    "src/qs8-f32-vcvt/gen/vcvt-scalar-x4.c",
1111    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-fmagic-c1.c",
1112    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-fmagic-c2.c",
1113    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-fmagic-c4.c",
1114    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c1.c",
1115    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c2.c",
1116    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c4.c",
1117    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-lrintf-c1.c",
1118    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-lrintf-c2.c",
1119    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-scalar-lrintf-c4.c",
1120    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-fmagic-c1.c",
1121    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-fmagic-c2.c",
1122    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-fmagic-c4.c",
1123    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c1.c",
1124    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c2.c",
1125    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c4.c",
1126    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-lrintf-c1.c",
1127    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-lrintf-c2.c",
1128    "src/qs8-gavgpool/gen/7x-minmax-fp32-scalar-lrintf-c4.c",
1129    "src/qs8-gemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
1130    "src/qs8-gemm/gen/1x2-minmax-fp32-scalar-imagic.c",
1131    "src/qs8-gemm/gen/1x2-minmax-fp32-scalar-lrintf.c",
1132    "src/qs8-gemm/gen/1x4-minmax-fp32-scalar-fmagic.c",
1133    "src/qs8-gemm/gen/1x4-minmax-fp32-scalar-imagic.c",
1134    "src/qs8-gemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
1135    "src/qs8-gemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
1136    "src/qs8-gemm/gen/2x2-minmax-fp32-scalar-imagic.c",
1137    "src/qs8-gemm/gen/2x2-minmax-fp32-scalar-lrintf.c",
1138    "src/qs8-gemm/gen/2x4-minmax-fp32-scalar-fmagic.c",
1139    "src/qs8-gemm/gen/2x4-minmax-fp32-scalar-imagic.c",
1140    "src/qs8-gemm/gen/2x4-minmax-fp32-scalar-lrintf.c",
1141    "src/qs8-gemm/gen/3x2-minmax-fp32-scalar-fmagic.c",
1142    "src/qs8-gemm/gen/3x2-minmax-fp32-scalar-imagic.c",
1143    "src/qs8-gemm/gen/3x2-minmax-fp32-scalar-lrintf.c",
1144    "src/qs8-gemm/gen/3x4-minmax-fp32-scalar-fmagic.c",
1145    "src/qs8-gemm/gen/3x4-minmax-fp32-scalar-imagic.c",
1146    "src/qs8-gemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
1147    "src/qs8-gemm/gen/4x2-minmax-fp32-scalar-fmagic.c",
1148    "src/qs8-gemm/gen/4x2-minmax-fp32-scalar-imagic.c",
1149    "src/qs8-gemm/gen/4x2-minmax-fp32-scalar-lrintf.c",
1150    "src/qs8-gemm/gen/4x4-minmax-fp32-scalar-fmagic.c",
1151    "src/qs8-gemm/gen/4x4-minmax-fp32-scalar-imagic.c",
1152    "src/qs8-gemm/gen/4x4-minmax-fp32-scalar-lrintf.c",
1153    "src/qs8-igemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
1154    "src/qs8-igemm/gen/1x2-minmax-fp32-scalar-imagic.c",
1155    "src/qs8-igemm/gen/1x2-minmax-fp32-scalar-lrintf.c",
1156    "src/qs8-igemm/gen/1x4-minmax-fp32-scalar-fmagic.c",
1157    "src/qs8-igemm/gen/1x4-minmax-fp32-scalar-imagic.c",
1158    "src/qs8-igemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
1159    "src/qs8-igemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
1160    "src/qs8-igemm/gen/2x2-minmax-fp32-scalar-imagic.c",
1161    "src/qs8-igemm/gen/2x2-minmax-fp32-scalar-lrintf.c",
1162    "src/qs8-igemm/gen/2x4-minmax-fp32-scalar-fmagic.c",
1163    "src/qs8-igemm/gen/2x4-minmax-fp32-scalar-imagic.c",
1164    "src/qs8-igemm/gen/2x4-minmax-fp32-scalar-lrintf.c",
1165    "src/qs8-igemm/gen/3x2-minmax-fp32-scalar-fmagic.c",
1166    "src/qs8-igemm/gen/3x2-minmax-fp32-scalar-imagic.c",
1167    "src/qs8-igemm/gen/3x2-minmax-fp32-scalar-lrintf.c",
1168    "src/qs8-igemm/gen/3x4-minmax-fp32-scalar-fmagic.c",
1169    "src/qs8-igemm/gen/3x4-minmax-fp32-scalar-imagic.c",
1170    "src/qs8-igemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
1171    "src/qs8-igemm/gen/4x2-minmax-fp32-scalar-fmagic.c",
1172    "src/qs8-igemm/gen/4x2-minmax-fp32-scalar-imagic.c",
1173    "src/qs8-igemm/gen/4x2-minmax-fp32-scalar-lrintf.c",
1174    "src/qs8-igemm/gen/4x4-minmax-fp32-scalar-fmagic.c",
1175    "src/qs8-igemm/gen/4x4-minmax-fp32-scalar-imagic.c",
1176    "src/qs8-igemm/gen/4x4-minmax-fp32-scalar-lrintf.c",
1177    "src/qs8-requantization/fp32-scalar-fmagic.c",
1178    "src/qs8-requantization/fp32-scalar-lrintf.c",
1179    "src/qs8-requantization/gemmlowp-scalar.c",
1180    "src/qs8-requantization/rndna-scalar-signed64.c",
1181    "src/qs8-requantization/rndna-scalar-unsigned32.c",
1182    "src/qs8-requantization/rndna-scalar-unsigned64.c",
1183    "src/qs8-requantization/rndnu-scalar.c",
1184    "src/qs8-vadd/gen/minmax-scalar-x1.c",
1185    "src/qs8-vadd/gen/minmax-scalar-x2.c",
1186    "src/qs8-vadd/gen/minmax-scalar-x4.c",
1187    "src/qs8-vaddc/gen/minmax-scalar-x1.c",
1188    "src/qs8-vaddc/gen/minmax-scalar-x2.c",
1189    "src/qs8-vaddc/gen/minmax-scalar-x4.c",
1190    "src/qs8-vcvt/gen/vcvt-scalar-x1.c",
1191    "src/qs8-vcvt/gen/vcvt-scalar-x2.c",
1192    "src/qs8-vcvt/gen/vcvt-scalar-x4.c",
1193    "src/qs8-vlrelu/gen/vlrelu-scalar-andxor-x1.c",
1194    "src/qs8-vlrelu/gen/vlrelu-scalar-andxor-x2.c",
1195    "src/qs8-vlrelu/gen/vlrelu-scalar-andxor-x4.c",
1196    "src/qs8-vlrelu/gen/vlrelu-scalar-select-x1.c",
1197    "src/qs8-vlrelu/gen/vlrelu-scalar-select-x2.c",
1198    "src/qs8-vlrelu/gen/vlrelu-scalar-select-x4.c",
1199    "src/qs8-vmul/gen/minmax-fp32-scalar-x1.c",
1200    "src/qs8-vmul/gen/minmax-fp32-scalar-x2.c",
1201    "src/qs8-vmul/gen/minmax-fp32-scalar-x4.c",
1202    "src/qs8-vmulc/gen/minmax-fp32-scalar-x1.c",
1203    "src/qs8-vmulc/gen/minmax-fp32-scalar-x2.c",
1204    "src/qs8-vmulc/gen/minmax-fp32-scalar-x4.c",
1205    "src/qu8-avgpool/9p8x-minmax-scalar-c1.c",
1206    "src/qu8-avgpool/9x-minmax-scalar-c1.c",
1207    "src/qu8-dwconv/gen/up1x9-minmax-fp32-scalar-fmagic.c",
1208    "src/qu8-dwconv/gen/up1x9-minmax-fp32-scalar-imagic.c",
1209    "src/qu8-dwconv/gen/up1x9-minmax-fp32-scalar-lrintf.c",
1210    "src/qu8-dwconv/gen/up1x25-minmax-fp32-scalar-fmagic.c",
1211    "src/qu8-dwconv/gen/up1x25-minmax-fp32-scalar-imagic.c",
1212    "src/qu8-dwconv/gen/up1x25-minmax-fp32-scalar-lrintf.c",
1213    "src/qu8-dwconv/gen/up2x9-minmax-fp32-scalar-fmagic.c",
1214    "src/qu8-dwconv/gen/up2x9-minmax-fp32-scalar-imagic.c",
1215    "src/qu8-dwconv/gen/up2x9-minmax-fp32-scalar-lrintf.c",
1216    "src/qu8-dwconv/gen/up2x25-minmax-fp32-scalar-fmagic.c",
1217    "src/qu8-dwconv/gen/up2x25-minmax-fp32-scalar-imagic.c",
1218    "src/qu8-dwconv/gen/up2x25-minmax-fp32-scalar-lrintf.c",
1219    "src/qu8-dwconv/gen/up4x9-minmax-fp32-scalar-fmagic.c",
1220    "src/qu8-dwconv/gen/up4x9-minmax-fp32-scalar-imagic.c",
1221    "src/qu8-dwconv/gen/up4x9-minmax-fp32-scalar-lrintf.c",
1222    "src/qu8-dwconv/gen/up4x25-minmax-fp32-scalar-fmagic.c",
1223    "src/qu8-dwconv/gen/up4x25-minmax-fp32-scalar-imagic.c",
1224    "src/qu8-dwconv/gen/up4x25-minmax-fp32-scalar-lrintf.c",
1225    "src/qu8-f32-vcvt/gen/vcvt-scalar-x1.c",
1226    "src/qu8-f32-vcvt/gen/vcvt-scalar-x2.c",
1227    "src/qu8-f32-vcvt/gen/vcvt-scalar-x3.c",
1228    "src/qu8-f32-vcvt/gen/vcvt-scalar-x4.c",
1229    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-fmagic-c1.c",
1230    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-fmagic-c2.c",
1231    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-fmagic-c4.c",
1232    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c1.c",
1233    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c2.c",
1234    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-imagic-c4.c",
1235    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-lrintf-c1.c",
1236    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-lrintf-c2.c",
1237    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-scalar-lrintf-c4.c",
1238    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-fmagic-c1.c",
1239    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-fmagic-c2.c",
1240    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-fmagic-c4.c",
1241    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c1.c",
1242    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c2.c",
1243    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-imagic-c4.c",
1244    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-lrintf-c1.c",
1245    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-lrintf-c2.c",
1246    "src/qu8-gavgpool/gen/7x-minmax-fp32-scalar-lrintf-c4.c",
1247    "src/qu8-gemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
1248    "src/qu8-gemm/gen/1x2-minmax-fp32-scalar-imagic.c",
1249    "src/qu8-gemm/gen/1x2-minmax-fp32-scalar-lrintf.c",
1250    "src/qu8-gemm/gen/1x4-minmax-fp32-scalar-fmagic.c",
1251    "src/qu8-gemm/gen/1x4-minmax-fp32-scalar-imagic.c",
1252    "src/qu8-gemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
1253    "src/qu8-gemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
1254    "src/qu8-gemm/gen/2x2-minmax-fp32-scalar-imagic.c",
1255    "src/qu8-gemm/gen/2x2-minmax-fp32-scalar-lrintf.c",
1256    "src/qu8-gemm/gen/2x4-minmax-fp32-scalar-fmagic.c",
1257    "src/qu8-gemm/gen/2x4-minmax-fp32-scalar-imagic.c",
1258    "src/qu8-gemm/gen/2x4-minmax-fp32-scalar-lrintf.c",
1259    "src/qu8-gemm/gen/3x2-minmax-fp32-scalar-fmagic.c",
1260    "src/qu8-gemm/gen/3x2-minmax-fp32-scalar-imagic.c",
1261    "src/qu8-gemm/gen/3x2-minmax-fp32-scalar-lrintf.c",
1262    "src/qu8-gemm/gen/3x4-minmax-fp32-scalar-fmagic.c",
1263    "src/qu8-gemm/gen/3x4-minmax-fp32-scalar-imagic.c",
1264    "src/qu8-gemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
1265    "src/qu8-gemm/gen/4x2-minmax-fp32-scalar-fmagic.c",
1266    "src/qu8-gemm/gen/4x2-minmax-fp32-scalar-imagic.c",
1267    "src/qu8-gemm/gen/4x2-minmax-fp32-scalar-lrintf.c",
1268    "src/qu8-gemm/gen/4x4-minmax-fp32-scalar-fmagic.c",
1269    "src/qu8-gemm/gen/4x4-minmax-fp32-scalar-imagic.c",
1270    "src/qu8-gemm/gen/4x4-minmax-fp32-scalar-lrintf.c",
1271    "src/qu8-igemm/gen/1x2-minmax-fp32-scalar-fmagic.c",
1272    "src/qu8-igemm/gen/1x2-minmax-fp32-scalar-imagic.c",
1273    "src/qu8-igemm/gen/1x2-minmax-fp32-scalar-lrintf.c",
1274    "src/qu8-igemm/gen/1x4-minmax-fp32-scalar-fmagic.c",
1275    "src/qu8-igemm/gen/1x4-minmax-fp32-scalar-imagic.c",
1276    "src/qu8-igemm/gen/1x4-minmax-fp32-scalar-lrintf.c",
1277    "src/qu8-igemm/gen/2x2-minmax-fp32-scalar-fmagic.c",
1278    "src/qu8-igemm/gen/2x2-minmax-fp32-scalar-imagic.c",
1279    "src/qu8-igemm/gen/2x2-minmax-fp32-scalar-lrintf.c",
1280    "src/qu8-igemm/gen/2x4-minmax-fp32-scalar-fmagic.c",
1281    "src/qu8-igemm/gen/2x4-minmax-fp32-scalar-imagic.c",
1282    "src/qu8-igemm/gen/2x4-minmax-fp32-scalar-lrintf.c",
1283    "src/qu8-igemm/gen/3x2-minmax-fp32-scalar-fmagic.c",
1284    "src/qu8-igemm/gen/3x2-minmax-fp32-scalar-imagic.c",
1285    "src/qu8-igemm/gen/3x2-minmax-fp32-scalar-lrintf.c",
1286    "src/qu8-igemm/gen/3x4-minmax-fp32-scalar-fmagic.c",
1287    "src/qu8-igemm/gen/3x4-minmax-fp32-scalar-imagic.c",
1288    "src/qu8-igemm/gen/3x4-minmax-fp32-scalar-lrintf.c",
1289    "src/qu8-igemm/gen/4x2-minmax-fp32-scalar-fmagic.c",
1290    "src/qu8-igemm/gen/4x2-minmax-fp32-scalar-imagic.c",
1291    "src/qu8-igemm/gen/4x2-minmax-fp32-scalar-lrintf.c",
1292    "src/qu8-igemm/gen/4x4-minmax-fp32-scalar-fmagic.c",
1293    "src/qu8-igemm/gen/4x4-minmax-fp32-scalar-imagic.c",
1294    "src/qu8-igemm/gen/4x4-minmax-fp32-scalar-lrintf.c",
1295    "src/qu8-requantization/fp32-scalar-fmagic.c",
1296    "src/qu8-requantization/fp32-scalar-lrintf.c",
1297    "src/qu8-requantization/gemmlowp-scalar.c",
1298    "src/qu8-requantization/rndna-scalar-signed64.c",
1299    "src/qu8-requantization/rndna-scalar-unsigned32.c",
1300    "src/qu8-requantization/rndna-scalar-unsigned64.c",
1301    "src/qu8-vadd/gen/minmax-scalar-x1.c",
1302    "src/qu8-vadd/gen/minmax-scalar-x2.c",
1303    "src/qu8-vadd/gen/minmax-scalar-x4.c",
1304    "src/qu8-vaddc/gen/minmax-scalar-x1.c",
1305    "src/qu8-vaddc/gen/minmax-scalar-x2.c",
1306    "src/qu8-vaddc/gen/minmax-scalar-x4.c",
1307    "src/qu8-vcvt/gen/vcvt-scalar-x1.c",
1308    "src/qu8-vcvt/gen/vcvt-scalar-x2.c",
1309    "src/qu8-vcvt/gen/vcvt-scalar-x4.c",
1310    "src/qu8-vlrelu/gen/vlrelu-scalar-andxor-x1.c",
1311    "src/qu8-vlrelu/gen/vlrelu-scalar-andxor-x2.c",
1312    "src/qu8-vlrelu/gen/vlrelu-scalar-andxor-x4.c",
1313    "src/qu8-vlrelu/gen/vlrelu-scalar-select-x1.c",
1314    "src/qu8-vlrelu/gen/vlrelu-scalar-select-x2.c",
1315    "src/qu8-vlrelu/gen/vlrelu-scalar-select-x4.c",
1316    "src/qu8-vmul/gen/minmax-fp32-scalar-x1.c",
1317    "src/qu8-vmul/gen/minmax-fp32-scalar-x2.c",
1318    "src/qu8-vmul/gen/minmax-fp32-scalar-x4.c",
1319    "src/qu8-vmulc/gen/minmax-fp32-scalar-x1.c",
1320    "src/qu8-vmulc/gen/minmax-fp32-scalar-x2.c",
1321    "src/qu8-vmulc/gen/minmax-fp32-scalar-x4.c",
1322    "src/s8-ibilinear/gen/scalar-c1.c",
1323    "src/s8-ibilinear/gen/scalar-c2.c",
1324    "src/s8-ibilinear/gen/scalar-c4.c",
1325    "src/s8-maxpool/9p8x-minmax-scalar-c1.c",
1326    "src/s8-vclamp/scalar-x4.c",
1327    "src/s16-rmaxabs/gen/scalar-x1.c",
1328    "src/s16-rmaxabs/gen/scalar-x2.c",
1329    "src/s16-rmaxabs/gen/scalar-x3.c",
1330    "src/s16-rmaxabs/gen/scalar-x4.c",
1331    "src/s16-vlshift/gen/scalar-x1.c",
1332    "src/s16-vlshift/gen/scalar-x2.c",
1333    "src/s16-vlshift/gen/scalar-x3.c",
1334    "src/s16-vlshift/gen/scalar-x4.c",
1335    "src/s16-window/gen/scalar-x1.c",
1336    "src/s16-window/gen/scalar-x2.c",
1337    "src/s16-window/gen/scalar-x3.c",
1338    "src/s16-window/gen/scalar-x4.c",
1339    "src/u8-ibilinear/gen/scalar-c1.c",
1340    "src/u8-ibilinear/gen/scalar-c2.c",
1341    "src/u8-ibilinear/gen/scalar-c4.c",
1342    "src/u8-lut32norm/scalar.c",
1343    "src/u8-maxpool/9p8x-minmax-scalar-c1.c",
1344    "src/u8-rmax/scalar.c",
1345    "src/u8-vclamp/scalar-x4.c",
1346    "src/u32-filterbank-accumulate/gen/scalar-x1.c",
1347    "src/u32-filterbank-subtract/scalar-x2.c",
1348    "src/u32-vlog/gen/scalar-x1.c",
1349    "src/u32-vlog/gen/scalar-x2.c",
1350    "src/u32-vlog/gen/scalar-x3.c",
1351    "src/u32-vlog/gen/scalar-x4.c",
1352    "src/u64-u32-vsqrtshift/scalar-cvtu32-sqrt-cvtu32f64-x1.c",
1353    "src/xx-copy/memcpy.c",
1354    "src/xx-fill/scalar-x16.c",
1355    "src/xx-pad/scalar.c",
1356    "src/xx-transpose/1x1-memcpy.c",
1357    "src/x8-lut/gen/lut-scalar-x1.c",
1358    "src/x8-lut/gen/lut-scalar-x2.c",
1359    "src/x8-lut/gen/lut-scalar-x4.c",
1360    "src/x8-lut/gen/lut-scalar-x8.c",
1361    "src/x8-lut/gen/lut-scalar-x16.c",
1362    "src/x8-transposec/gen/1x2-scalar-int.c",
1363    "src/x8-transposec/gen/1x4-scalar-int.c",
1364    "src/x8-transposec/gen/2x1-scalar-int.c",
1365    "src/x8-transposec/gen/2x2-scalar-int.c",
1366    "src/x8-transposec/gen/2x4-scalar-int.c",
1367    "src/x8-transposec/gen/4x1-scalar-int.c",
1368    "src/x8-transposec/gen/4x2-scalar-int.c",
1369    "src/x8-transposec/gen/4x4-scalar-int.c",
1370    "src/x8-zip/xm-scalar.c",
1371    "src/x8-zip/x2-scalar.c",
1372    "src/x8-zip/x3-scalar.c",
1373    "src/x8-zip/x4-scalar.c",
1374    "src/x16-transposec/gen/1x2-scalar-int.c",
1375    "src/x16-transposec/gen/1x4-scalar-int.c",
1376    "src/x16-transposec/gen/2x1-scalar-int.c",
1377    "src/x16-transposec/gen/2x2-scalar-int.c",
1378    "src/x16-transposec/gen/2x4-scalar-int.c",
1379    "src/x16-transposec/gen/4x1-scalar-int.c",
1380    "src/x16-transposec/gen/4x2-scalar-int.c",
1381    "src/x16-transposec/gen/4x4-scalar-int.c",
1382    "src/x24-transposec/gen/1x2-scalar.c",
1383    "src/x24-transposec/gen/1x4-scalar.c",
1384    "src/x24-transposec/gen/2x1-scalar.c",
1385    "src/x24-transposec/gen/2x2-scalar.c",
1386    "src/x24-transposec/gen/2x4-scalar.c",
1387    "src/x24-transposec/gen/4x1-scalar.c",
1388    "src/x24-transposec/gen/4x2-scalar.c",
1389    "src/x24-transposec/gen/4x4-scalar.c",
1390    "src/x32-packx/x2-scalar.c",
1391    "src/x32-packx/x3-scalar.c",
1392    "src/x32-packx/x4-scalar.c",
1393    "src/x32-transposec/gen/1x2-scalar-float.c",
1394    "src/x32-transposec/gen/1x2-scalar-int.c",
1395    "src/x32-transposec/gen/1x4-scalar-float.c",
1396    "src/x32-transposec/gen/1x4-scalar-int.c",
1397    "src/x32-transposec/gen/2x1-scalar-float.c",
1398    "src/x32-transposec/gen/2x1-scalar-int.c",
1399    "src/x32-transposec/gen/2x2-scalar-float.c",
1400    "src/x32-transposec/gen/2x2-scalar-int.c",
1401    "src/x32-transposec/gen/2x4-scalar-float.c",
1402    "src/x32-transposec/gen/2x4-scalar-int.c",
1403    "src/x32-transposec/gen/4x1-scalar-float.c",
1404    "src/x32-transposec/gen/4x1-scalar-int.c",
1405    "src/x32-transposec/gen/4x2-scalar-float.c",
1406    "src/x32-transposec/gen/4x2-scalar-int.c",
1407    "src/x32-transposec/gen/4x4-scalar-float.c",
1408    "src/x32-transposec/gen/4x4-scalar-int.c",
1409    "src/x32-unpool/scalar.c",
1410    "src/x32-zip/xm-scalar.c",
1411    "src/x32-zip/x2-scalar.c",
1412    "src/x32-zip/x3-scalar.c",
1413    "src/x32-zip/x4-scalar.c",
1414    "src/x64-transposec/gen/1x2-scalar-float.c",
1415    "src/x64-transposec/gen/1x2-scalar-int.c",
1416    "src/x64-transposec/gen/2x1-scalar-float.c",
1417    "src/x64-transposec/gen/2x1-scalar-int.c",
1418    "src/x64-transposec/gen/2x2-scalar-float.c",
1419    "src/x64-transposec/gen/2x2-scalar-int.c",
1420    "src/x64-transposec/gen/4x1-scalar-float.c",
1421    "src/x64-transposec/gen/4x1-scalar-int.c",
1422    "src/x64-transposec/gen/4x2-scalar-float.c",
1423    "src/x64-transposec/gen/4x2-scalar-int.c",
1424]
1425
// ALL_WASM_MICROKERNEL_SRCS: micro-kernel C sources whose file names carry the
// "wasm" tag (the "wasmsimd"-tagged sources are kept in a separate list).
// Entries come from directories under src/ beginning with f32-, qc8-, qs8- and
// qu8-, and are listed contiguously per kernel directory.
// NOTE(review): presumably consumed by a WebAssembly-targeted module elsewhere
// in this file; the consumer is not visible from this section -- confirm.
1426ALL_WASM_MICROKERNEL_SRCS = [
1427    "src/f32-avgpool/9p8x-minmax-wasm-c1.c",
1428    "src/f32-avgpool/9x-minmax-wasm-c1.c",
1429    "src/f32-dwconv/gen/up1x3-minmax-wasm-acc2.c",
1430    "src/f32-dwconv/gen/up1x3-minmax-wasm.c",
1431    "src/f32-dwconv/gen/up1x4-minmax-wasm-acc2.c",
1432    "src/f32-dwconv/gen/up1x4-minmax-wasm.c",
1433    "src/f32-dwconv/gen/up1x9-minmax-wasm-acc2.c",
1434    "src/f32-dwconv/gen/up1x9-minmax-wasm.c",
1435    "src/f32-dwconv/gen/up1x25-minmax-wasm-acc2.c",
1436    "src/f32-dwconv/gen/up1x25-minmax-wasm.c",
1437    "src/f32-dwconv/gen/up2x3-minmax-wasm-acc2.c",
1438    "src/f32-dwconv/gen/up2x3-minmax-wasm.c",
1439    "src/f32-dwconv/gen/up2x4-minmax-wasm-acc2.c",
1440    "src/f32-dwconv/gen/up2x4-minmax-wasm.c",
1441    "src/f32-dwconv/gen/up2x9-minmax-wasm-acc2.c",
1442    "src/f32-dwconv/gen/up2x9-minmax-wasm.c",
1443    "src/f32-dwconv/gen/up2x25-minmax-wasm-acc2.c",
1444    "src/f32-dwconv/gen/up2x25-minmax-wasm.c",
1445    "src/f32-gavgpool/7p7x-minmax-wasm-c1.c",
1446    "src/f32-gavgpool/7x-minmax-wasm-c1.c",
1447    "src/f32-gemm/gen-inc/1x4inc-minmax-wasm.c",
1448    "src/f32-gemm/gen-inc/2x4inc-minmax-wasm.c",
1449    "src/f32-gemm/gen-inc/4x4inc-minmax-wasm.c",
1450    "src/f32-gemm/gen/1x4-minmax-wasm.c",
1451    "src/f32-gemm/gen/1x4-relu-wasm.c",
1452    "src/f32-gemm/gen/2x4-minmax-wasm.c",
1453    "src/f32-gemm/gen/2x4-relu-wasm.c",
1454    "src/f32-gemm/gen/4x2-minmax-wasm.c",
1455    "src/f32-gemm/gen/4x2-relu-wasm.c",
1456    "src/f32-gemm/gen/4x4-minmax-wasm.c",
1457    "src/f32-gemm/gen/4x4-relu-wasm.c",
1458    "src/f32-igemm/gen/1x4-minmax-wasm.c",
1459    "src/f32-igemm/gen/1x4-relu-wasm.c",
1460    "src/f32-igemm/gen/2x4-minmax-wasm.c",
1461    "src/f32-igemm/gen/2x4-relu-wasm.c",
1462    "src/f32-igemm/gen/4x2-minmax-wasm.c",
1463    "src/f32-igemm/gen/4x2-relu-wasm.c",
1464    "src/f32-igemm/gen/4x4-minmax-wasm.c",
1465    "src/f32-igemm/gen/4x4-relu-wasm.c",
1466    "src/f32-maxpool/9p8x-minmax-wasm-c1.c",
1467    "src/f32-pavgpool/9p8x-minmax-wasm-c1.c",
1468    "src/f32-pavgpool/9x-minmax-wasm-c1.c",
1469    "src/f32-prelu/gen/wasm-2x1.c",
1470    "src/f32-prelu/gen/wasm-2x4.c",
1471    "src/f32-qs8-vcvt/gen/vcvt-wasm-fmagic-x1.c",
1472    "src/f32-qs8-vcvt/gen/vcvt-wasm-fmagic-x2.c",
1473    "src/f32-qs8-vcvt/gen/vcvt-wasm-fmagic-x3.c",
1474    "src/f32-qs8-vcvt/gen/vcvt-wasm-fmagic-x4.c",
1475    "src/f32-qu8-vcvt/gen/vcvt-wasm-fmagic-x1.c",
1476    "src/f32-qu8-vcvt/gen/vcvt-wasm-fmagic-x2.c",
1477    "src/f32-qu8-vcvt/gen/vcvt-wasm-fmagic-x3.c",
1478    "src/f32-qu8-vcvt/gen/vcvt-wasm-fmagic-x4.c",
1479    "src/f32-vbinary/gen/vadd-minmax-wasm-x1.c",
1480    "src/f32-vbinary/gen/vadd-minmax-wasm-x2.c",
1481    "src/f32-vbinary/gen/vadd-minmax-wasm-x4.c",
1482    "src/f32-vbinary/gen/vadd-minmax-wasm-x8.c",
1483    "src/f32-vbinary/gen/vadd-relu-wasm-x1.c",
1484    "src/f32-vbinary/gen/vadd-relu-wasm-x2.c",
1485    "src/f32-vbinary/gen/vadd-relu-wasm-x4.c",
1486    "src/f32-vbinary/gen/vadd-relu-wasm-x8.c",
1487    "src/f32-vbinary/gen/vaddc-minmax-wasm-x1.c",
1488    "src/f32-vbinary/gen/vaddc-minmax-wasm-x2.c",
1489    "src/f32-vbinary/gen/vaddc-minmax-wasm-x4.c",
1490    "src/f32-vbinary/gen/vaddc-minmax-wasm-x8.c",
1491    "src/f32-vbinary/gen/vaddc-relu-wasm-x1.c",
1492    "src/f32-vbinary/gen/vaddc-relu-wasm-x2.c",
1493    "src/f32-vbinary/gen/vaddc-relu-wasm-x4.c",
1494    "src/f32-vbinary/gen/vaddc-relu-wasm-x8.c",
1495    "src/f32-vbinary/gen/vdiv-minmax-wasm-x1.c",
1496    "src/f32-vbinary/gen/vdiv-minmax-wasm-x2.c",
1497    "src/f32-vbinary/gen/vdiv-minmax-wasm-x4.c",
1498    "src/f32-vbinary/gen/vdiv-minmax-wasm-x8.c",
1499    "src/f32-vbinary/gen/vdiv-relu-wasm-x1.c",
1500    "src/f32-vbinary/gen/vdiv-relu-wasm-x2.c",
1501    "src/f32-vbinary/gen/vdiv-relu-wasm-x4.c",
1502    "src/f32-vbinary/gen/vdiv-relu-wasm-x8.c",
1503    "src/f32-vbinary/gen/vdivc-minmax-wasm-x1.c",
1504    "src/f32-vbinary/gen/vdivc-minmax-wasm-x2.c",
1505    "src/f32-vbinary/gen/vdivc-minmax-wasm-x4.c",
1506    "src/f32-vbinary/gen/vdivc-minmax-wasm-x8.c",
1507    "src/f32-vbinary/gen/vdivc-relu-wasm-x1.c",
1508    "src/f32-vbinary/gen/vdivc-relu-wasm-x2.c",
1509    "src/f32-vbinary/gen/vdivc-relu-wasm-x4.c",
1510    "src/f32-vbinary/gen/vdivc-relu-wasm-x8.c",
1511    "src/f32-vbinary/gen/vmax-wasm-x1.c",
1512    "src/f32-vbinary/gen/vmax-wasm-x2.c",
1513    "src/f32-vbinary/gen/vmax-wasm-x4.c",
1514    "src/f32-vbinary/gen/vmax-wasm-x8.c",
1515    "src/f32-vbinary/gen/vmaxc-wasm-x1.c",
1516    "src/f32-vbinary/gen/vmaxc-wasm-x2.c",
1517    "src/f32-vbinary/gen/vmaxc-wasm-x4.c",
1518    "src/f32-vbinary/gen/vmaxc-wasm-x8.c",
1519    "src/f32-vbinary/gen/vmin-wasm-x1.c",
1520    "src/f32-vbinary/gen/vmin-wasm-x2.c",
1521    "src/f32-vbinary/gen/vmin-wasm-x4.c",
1522    "src/f32-vbinary/gen/vmin-wasm-x8.c",
1523    "src/f32-vbinary/gen/vminc-wasm-x1.c",
1524    "src/f32-vbinary/gen/vminc-wasm-x2.c",
1525    "src/f32-vbinary/gen/vminc-wasm-x4.c",
1526    "src/f32-vbinary/gen/vminc-wasm-x8.c",
1527    "src/f32-vbinary/gen/vmul-minmax-wasm-x1.c",
1528    "src/f32-vbinary/gen/vmul-minmax-wasm-x2.c",
1529    "src/f32-vbinary/gen/vmul-minmax-wasm-x4.c",
1530    "src/f32-vbinary/gen/vmul-minmax-wasm-x8.c",
1531    "src/f32-vbinary/gen/vmul-relu-wasm-x1.c",
1532    "src/f32-vbinary/gen/vmul-relu-wasm-x2.c",
1533    "src/f32-vbinary/gen/vmul-relu-wasm-x4.c",
1534    "src/f32-vbinary/gen/vmul-relu-wasm-x8.c",
1535    "src/f32-vbinary/gen/vmulc-minmax-wasm-x1.c",
1536    "src/f32-vbinary/gen/vmulc-minmax-wasm-x2.c",
1537    "src/f32-vbinary/gen/vmulc-minmax-wasm-x4.c",
1538    "src/f32-vbinary/gen/vmulc-minmax-wasm-x8.c",
1539    "src/f32-vbinary/gen/vmulc-relu-wasm-x1.c",
1540    "src/f32-vbinary/gen/vmulc-relu-wasm-x2.c",
1541    "src/f32-vbinary/gen/vmulc-relu-wasm-x4.c",
1542    "src/f32-vbinary/gen/vmulc-relu-wasm-x8.c",
1543    "src/f32-vbinary/gen/vrdivc-minmax-wasm-x1.c",
1544    "src/f32-vbinary/gen/vrdivc-minmax-wasm-x2.c",
1545    "src/f32-vbinary/gen/vrdivc-minmax-wasm-x4.c",
1546    "src/f32-vbinary/gen/vrdivc-minmax-wasm-x8.c",
1547    "src/f32-vbinary/gen/vrdivc-relu-wasm-x1.c",
1548    "src/f32-vbinary/gen/vrdivc-relu-wasm-x2.c",
1549    "src/f32-vbinary/gen/vrdivc-relu-wasm-x4.c",
1550    "src/f32-vbinary/gen/vrdivc-relu-wasm-x8.c",
1551    "src/f32-vbinary/gen/vrsubc-minmax-wasm-x1.c",
1552    "src/f32-vbinary/gen/vrsubc-minmax-wasm-x2.c",
1553    "src/f32-vbinary/gen/vrsubc-minmax-wasm-x4.c",
1554    "src/f32-vbinary/gen/vrsubc-minmax-wasm-x8.c",
1555    "src/f32-vbinary/gen/vrsubc-relu-wasm-x1.c",
1556    "src/f32-vbinary/gen/vrsubc-relu-wasm-x2.c",
1557    "src/f32-vbinary/gen/vrsubc-relu-wasm-x4.c",
1558    "src/f32-vbinary/gen/vrsubc-relu-wasm-x8.c",
1559    "src/f32-vbinary/gen/vsub-minmax-wasm-x1.c",
1560    "src/f32-vbinary/gen/vsub-minmax-wasm-x2.c",
1561    "src/f32-vbinary/gen/vsub-minmax-wasm-x4.c",
1562    "src/f32-vbinary/gen/vsub-minmax-wasm-x8.c",
1563    "src/f32-vbinary/gen/vsub-relu-wasm-x1.c",
1564    "src/f32-vbinary/gen/vsub-relu-wasm-x2.c",
1565    "src/f32-vbinary/gen/vsub-relu-wasm-x4.c",
1566    "src/f32-vbinary/gen/vsub-relu-wasm-x8.c",
1567    "src/f32-vbinary/gen/vsubc-minmax-wasm-x1.c",
1568    "src/f32-vbinary/gen/vsubc-minmax-wasm-x2.c",
1569    "src/f32-vbinary/gen/vsubc-minmax-wasm-x4.c",
1570    "src/f32-vbinary/gen/vsubc-minmax-wasm-x8.c",
1571    "src/f32-vbinary/gen/vsubc-relu-wasm-x1.c",
1572    "src/f32-vbinary/gen/vsubc-relu-wasm-x2.c",
1573    "src/f32-vbinary/gen/vsubc-relu-wasm-x4.c",
1574    "src/f32-vbinary/gen/vsubc-relu-wasm-x8.c",
1575    "src/f32-vclamp/gen/vclamp-wasm-x1.c",
1576    "src/f32-vclamp/gen/vclamp-wasm-x2.c",
1577    "src/f32-vclamp/gen/vclamp-wasm-x4.c",
1578    "src/f32-velu/gen/velu-wasm-rr2-lut16-p3-x1.c",
1579    "src/f32-velu/gen/velu-wasm-rr2-lut16-p3-x2.c",
1580    "src/f32-velu/gen/velu-wasm-rr2-lut16-p3-x3.c",
1581    "src/f32-velu/gen/velu-wasm-rr2-lut16-p3-x4.c",
1582    "src/f32-velu/gen/velu-wasm-rr2-lut16-p3-x5.c",
1583    "src/f32-velu/gen/velu-wasm-rr2-lut16-p3-x6.c",
1584    "src/f32-velu/gen/velu-wasm-rr2-p6-x1.c",
1585    "src/f32-velu/gen/velu-wasm-rr2-p6-x2.c",
1586    "src/f32-velu/gen/velu-wasm-rr2-p6-x3.c",
1587    "src/f32-velu/gen/velu-wasm-rr2-p6-x4.c",
1588    "src/f32-velu/gen/velu-wasm-rr2-p6-x5.c",
1589    "src/f32-velu/gen/velu-wasm-rr2-p6-x6.c",
1590    "src/f32-vhswish/gen/vhswish-wasm-x1.c",
1591    "src/f32-vhswish/gen/vhswish-wasm-x2.c",
1592    "src/f32-vhswish/gen/vhswish-wasm-x4.c",
1593    "src/f32-vlrelu/gen/vlrelu-wasm-x1.c",
1594    "src/f32-vlrelu/gen/vlrelu-wasm-x2.c",
1595    "src/f32-vlrelu/gen/vlrelu-wasm-x4.c",
1596    "src/f32-vmulcaddc/gen/c1-minmax-wasm-2x.c",
1597    "src/f32-vmulcaddc/gen/c2-minmax-wasm-2x.c",
1598    "src/f32-vmulcaddc/gen/c4-minmax-wasm-2x.c",
1599    "src/f32-vrelu/gen/vrelu-wasm-x1.c",
1600    "src/f32-vrelu/gen/vrelu-wasm-x2.c",
1601    "src/f32-vrelu/gen/vrelu-wasm-x4.c",
1602    "src/f32-vrelu/gen/vrelu-wasm-x8.c",
1603    "src/qc8-dwconv/gen/up1x9-minmax-fp32-wasm-fmagic.c",
1604    "src/qc8-dwconv/gen/up1x25-minmax-fp32-wasm-fmagic.c",
1605    "src/qc8-dwconv/gen/up2x3-minmax-fp32-wasm-fmagic.c",
1606    "src/qc8-dwconv/gen/up2x9-minmax-fp32-wasm-fmagic.c",
1607    "src/qc8-dwconv/gen/up2x25-minmax-fp32-wasm-fmagic.c",
1608    "src/qc8-dwconv/gen/up4x9-minmax-fp32-wasm-fmagic.c",
1609    "src/qc8-dwconv/gen/up4x25-minmax-fp32-wasm-fmagic.c",
1610    "src/qc8-gemm/gen/1x2-minmax-fp32-wasm-fmagic.c",
1611    "src/qc8-gemm/gen/1x4-minmax-fp32-wasm-fmagic.c",
1612    "src/qc8-gemm/gen/2x2-minmax-fp32-wasm-fmagic.c",
1613    "src/qc8-gemm/gen/2x4-minmax-fp32-wasm-fmagic.c",
1614    "src/qc8-gemm/gen/3x2-minmax-fp32-wasm-fmagic.c",
1615    "src/qc8-gemm/gen/3x4-minmax-fp32-wasm-fmagic.c",
1616    "src/qc8-gemm/gen/4x2-minmax-fp32-wasm-fmagic.c",
1617    "src/qc8-gemm/gen/4x4-minmax-fp32-wasm-fmagic.c",
1618    "src/qc8-igemm/gen/1x2-minmax-fp32-wasm-fmagic.c",
1619    "src/qc8-igemm/gen/1x4-minmax-fp32-wasm-fmagic.c",
1620    "src/qc8-igemm/gen/2x2-minmax-fp32-wasm-fmagic.c",
1621    "src/qc8-igemm/gen/2x4-minmax-fp32-wasm-fmagic.c",
1622    "src/qc8-igemm/gen/3x2-minmax-fp32-wasm-fmagic.c",
1623    "src/qc8-igemm/gen/3x4-minmax-fp32-wasm-fmagic.c",
1624    "src/qc8-igemm/gen/4x2-minmax-fp32-wasm-fmagic.c",
1625    "src/qc8-igemm/gen/4x4-minmax-fp32-wasm-fmagic.c",
1626    "src/qs8-dwconv/gen/up1x9-minmax-fp32-wasm-fmagic.c",
1627    "src/qs8-dwconv/gen/up1x25-minmax-fp32-wasm-fmagic.c",
1628    "src/qs8-dwconv/gen/up2x9-minmax-fp32-wasm-fmagic.c",
1629    "src/qs8-dwconv/gen/up2x25-minmax-fp32-wasm-fmagic.c",
1630    "src/qs8-dwconv/gen/up4x9-minmax-fp32-wasm-fmagic.c",
1631    "src/qs8-dwconv/gen/up4x25-minmax-fp32-wasm-fmagic.c",
1632    "src/qs8-gemm/gen/1x2-minmax-fp32-wasm-fmagic.c",
1633    "src/qs8-gemm/gen/1x4-minmax-fp32-wasm-fmagic.c",
1634    "src/qs8-gemm/gen/2x2-minmax-fp32-wasm-fmagic.c",
1635    "src/qs8-gemm/gen/2x4-minmax-fp32-wasm-fmagic.c",
1636    "src/qs8-gemm/gen/3x2-minmax-fp32-wasm-fmagic.c",
1637    "src/qs8-gemm/gen/3x4-minmax-fp32-wasm-fmagic.c",
1638    "src/qs8-gemm/gen/4x2-minmax-fp32-wasm-fmagic.c",
1639    "src/qs8-gemm/gen/4x4-minmax-fp32-wasm-fmagic.c",
1640    "src/qs8-igemm/gen/1x2-minmax-fp32-wasm-fmagic.c",
1641    "src/qs8-igemm/gen/1x4-minmax-fp32-wasm-fmagic.c",
1642    "src/qs8-igemm/gen/2x2-minmax-fp32-wasm-fmagic.c",
1643    "src/qs8-igemm/gen/2x4-minmax-fp32-wasm-fmagic.c",
1644    "src/qs8-igemm/gen/3x2-minmax-fp32-wasm-fmagic.c",
1645    "src/qs8-igemm/gen/3x4-minmax-fp32-wasm-fmagic.c",
1646    "src/qs8-igemm/gen/4x2-minmax-fp32-wasm-fmagic.c",
1647    "src/qs8-igemm/gen/4x4-minmax-fp32-wasm-fmagic.c",
1648    "src/qu8-dwconv/gen/up1x9-minmax-fp32-wasm-fmagic.c",
1649    "src/qu8-dwconv/gen/up1x25-minmax-fp32-wasm-fmagic.c",
1650    "src/qu8-dwconv/gen/up2x9-minmax-fp32-wasm-fmagic.c",
1651    "src/qu8-dwconv/gen/up2x25-minmax-fp32-wasm-fmagic.c",
1652    "src/qu8-dwconv/gen/up4x9-minmax-fp32-wasm-fmagic.c",
1653    "src/qu8-dwconv/gen/up4x25-minmax-fp32-wasm-fmagic.c",
1654    "src/qu8-gemm/gen/1x2-minmax-fp32-wasm-fmagic.c",
1655    "src/qu8-gemm/gen/1x4-minmax-fp32-wasm-fmagic.c",
1656    "src/qu8-gemm/gen/2x2-minmax-fp32-wasm-fmagic.c",
1657    "src/qu8-gemm/gen/2x4-minmax-fp32-wasm-fmagic.c",
1658    "src/qu8-gemm/gen/3x2-minmax-fp32-wasm-fmagic.c",
1659    "src/qu8-gemm/gen/3x4-minmax-fp32-wasm-fmagic.c",
1660    "src/qu8-gemm/gen/4x2-minmax-fp32-wasm-fmagic.c",
1661    "src/qu8-gemm/gen/4x4-minmax-fp32-wasm-fmagic.c",
1662    "src/qu8-igemm/gen/1x2-minmax-fp32-wasm-fmagic.c",
1663    "src/qu8-igemm/gen/1x4-minmax-fp32-wasm-fmagic.c",
1664    "src/qu8-igemm/gen/2x2-minmax-fp32-wasm-fmagic.c",
1665    "src/qu8-igemm/gen/2x4-minmax-fp32-wasm-fmagic.c",
1666    "src/qu8-igemm/gen/3x2-minmax-fp32-wasm-fmagic.c",
1667    "src/qu8-igemm/gen/3x4-minmax-fp32-wasm-fmagic.c",
1668    "src/qu8-igemm/gen/4x2-minmax-fp32-wasm-fmagic.c",
1669    "src/qu8-igemm/gen/4x4-minmax-fp32-wasm-fmagic.c",
1670]
1671
1672ALL_WASMSIMD_MICROKERNEL_SRCS = [
1673    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int16-x8.c",
1674    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int16-x16.c",
1675    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int16-x24.c",
1676    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int16-x32.c",
1677    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int32-x8.c",
1678    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int32-x16.c",
1679    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int32-x24.c",
1680    "src/f16-f32-vcvt/gen/vcvt-wasmsimd-int32-x32.c",
1681    "src/f32-argmaxpool/4x-wasmsimd-c4.c",
1682    "src/f32-argmaxpool/9p8x-wasmsimd-c4.c",
1683    "src/f32-argmaxpool/9x-wasmsimd-c4.c",
1684    "src/f32-avgpool/9p8x-minmax-wasmsimd-arm-c4.c",
1685    "src/f32-avgpool/9p8x-minmax-wasmsimd-x86-c4.c",
1686    "src/f32-avgpool/9x-minmax-wasmsimd-arm-c4.c",
1687    "src/f32-avgpool/9x-minmax-wasmsimd-x86-c4.c",
1688    "src/f32-conv-hwc2chw/3x3s2p1c3x4-wasmsimd-2x2.c",
1689    "src/f32-dwconv/gen/up4x3-minmax-wasmsimd-arm-acc2.c",
1690    "src/f32-dwconv/gen/up4x3-minmax-wasmsimd-arm.c",
1691    "src/f32-dwconv/gen/up4x3-minmax-wasmsimd-x86-acc2.c",
1692    "src/f32-dwconv/gen/up4x3-minmax-wasmsimd-x86.c",
1693    "src/f32-dwconv/gen/up4x3-wasmsimd.c",
1694    "src/f32-dwconv/gen/up4x4-minmax-wasmsimd-arm-acc2.c",
1695    "src/f32-dwconv/gen/up4x4-minmax-wasmsimd-arm.c",
1696    "src/f32-dwconv/gen/up4x4-minmax-wasmsimd-x86-acc2.c",
1697    "src/f32-dwconv/gen/up4x4-minmax-wasmsimd-x86.c",
1698    "src/f32-dwconv/gen/up4x4-wasmsimd.c",
1699    "src/f32-dwconv/gen/up4x9-minmax-wasmsimd-arm-acc2.c",
1700    "src/f32-dwconv/gen/up4x9-minmax-wasmsimd-arm.c",
1701    "src/f32-dwconv/gen/up4x9-minmax-wasmsimd-x86-acc2.c",
1702    "src/f32-dwconv/gen/up4x9-minmax-wasmsimd-x86.c",
1703    "src/f32-dwconv/gen/up4x9-wasmsimd-acc2.c",
1704    "src/f32-dwconv/gen/up4x9-wasmsimd.c",
1705    "src/f32-dwconv/gen/up4x25-minmax-wasmsimd-arm-acc2.c",
1706    "src/f32-dwconv/gen/up4x25-minmax-wasmsimd-arm.c",
1707    "src/f32-dwconv/gen/up4x25-minmax-wasmsimd-x86-acc2.c",
1708    "src/f32-dwconv/gen/up4x25-minmax-wasmsimd-x86.c",
1709    "src/f32-dwconv/gen/up4x25-wasmsimd.c",
1710    "src/f32-dwconv/gen/up8x3-minmax-wasmsimd-arm-acc2.c",
1711    "src/f32-dwconv/gen/up8x3-minmax-wasmsimd-arm.c",
1712    "src/f32-dwconv/gen/up8x3-minmax-wasmsimd-x86-acc2.c",
1713    "src/f32-dwconv/gen/up8x3-minmax-wasmsimd-x86.c",
1714    "src/f32-dwconv/gen/up8x3-wasmsimd.c",
1715    "src/f32-dwconv/gen/up8x4-minmax-wasmsimd-arm-acc2.c",
1716    "src/f32-dwconv/gen/up8x4-minmax-wasmsimd-arm.c",
1717    "src/f32-dwconv/gen/up8x4-minmax-wasmsimd-x86-acc2.c",
1718    "src/f32-dwconv/gen/up8x4-minmax-wasmsimd-x86.c",
1719    "src/f32-dwconv/gen/up8x4-wasmsimd.c",
1720    "src/f32-dwconv/gen/up8x9-minmax-wasmsimd-arm-acc2.c",
1721    "src/f32-dwconv/gen/up8x9-minmax-wasmsimd-arm.c",
1722    "src/f32-dwconv/gen/up8x9-minmax-wasmsimd-x86-acc2.c",
1723    "src/f32-dwconv/gen/up8x9-minmax-wasmsimd-x86.c",
1724    "src/f32-dwconv/gen/up8x9-wasmsimd-acc2.c",
1725    "src/f32-dwconv/gen/up8x9-wasmsimd.c",
1726    "src/f32-dwconv/gen/up8x25-minmax-wasmsimd-arm-acc2.c",
1727    "src/f32-dwconv/gen/up8x25-minmax-wasmsimd-arm.c",
1728    "src/f32-dwconv/gen/up8x25-minmax-wasmsimd-x86-acc2.c",
1729    "src/f32-dwconv/gen/up8x25-minmax-wasmsimd-x86.c",
1730    "src/f32-dwconv/gen/up8x25-wasmsimd.c",
1731    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-1x4-acc2.c",
1732    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-1x4-acc3.c",
1733    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-1x4-acc4.c",
1734    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-1x4.c",
1735    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-2x4-acc2.c",
1736    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-2x4.c",
1737    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-3x4.c",
1738    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-4x4.c",
1739    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-5x4.c",
1740    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-loadsplat-6x4.c",
1741    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-1x4-acc2.c",
1742    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-1x4-acc3.c",
1743    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-1x4-acc4.c",
1744    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-1x4.c",
1745    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-2x4-acc2.c",
1746    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-2x4.c",
1747    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-3x4.c",
1748    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-4x4.c",
1749    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-5x4.c",
1750    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-arm-splat-6x4.c",
1751    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-1x4-acc2.c",
1752    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-1x4-acc3.c",
1753    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-1x4-acc4.c",
1754    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-1x4.c",
1755    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-2x4-acc2.c",
1756    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-2x4.c",
1757    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-3x4.c",
1758    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-4x4.c",
1759    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-5x4.c",
1760    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-loadsplat-6x4.c",
1761    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-1x4-acc2.c",
1762    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-1x4-acc3.c",
1763    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-1x4-acc4.c",
1764    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-1x4.c",
1765    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-2x4-acc2.c",
1766    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-2x4.c",
1767    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-3x4.c",
1768    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-4x4.c",
1769    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-5x4.c",
1770    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-wasmsimd-x86-splat-6x4.c",
1771    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-1x4-acc2.c",
1772    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-1x4-acc3.c",
1773    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-1x4-acc4.c",
1774    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-1x4.c",
1775    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-2x4-acc2.c",
1776    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-2x4.c",
1777    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-3x4.c",
1778    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-loadsplat-4x4.c",
1779    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-1x4-acc2.c",
1780    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-1x4-acc3.c",
1781    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-1x4-acc4.c",
1782    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-1x4.c",
1783    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-2x4-acc2.c",
1784    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-2x4.c",
1785    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-3x4.c",
1786    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-arm-splat-4x4.c",
1787    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-1x4-acc2.c",
1788    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-1x4-acc3.c",
1789    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-1x4-acc4.c",
1790    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-1x4.c",
1791    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-2x4-acc2.c",
1792    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-2x4.c",
1793    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-3x4.c",
1794    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-loadsplat-4x4.c",
1795    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-1x4-acc2.c",
1796    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-1x4-acc3.c",
1797    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-1x4-acc4.c",
1798    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-1x4.c",
1799    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-2x4-acc2.c",
1800    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-2x4.c",
1801    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-3x4.c",
1802    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-wasmsimd-x86-splat-4x4.c",
1803    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-1x4-acc2.c",
1804    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-1x4-acc3.c",
1805    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-1x4-acc4.c",
1806    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-1x4-acc5.c",
1807    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-1x4.c",
1808    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-2x4-acc2.c",
1809    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-2x4-acc3.c",
1810    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-2x4.c",
1811    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-3x4-acc2.c",
1812    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-3x4.c",
1813    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-4x4-acc2.c",
1814    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-4x4.c",
1815    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-loadsplat-5x4.c",
1816    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-1x4-acc2.c",
1817    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-1x4-acc3.c",
1818    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-1x4-acc4.c",
1819    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-1x4-acc5.c",
1820    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-1x4.c",
1821    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-2x4-acc2.c",
1822    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-2x4-acc3.c",
1823    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-2x4.c",
1824    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-3x4-acc2.c",
1825    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-3x4.c",
1826    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-4x4-acc2.c",
1827    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-4x4.c",
1828    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-arm-splat-5x4.c",
1829    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-1x4-acc2.c",
1830    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-1x4-acc3.c",
1831    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-1x4-acc4.c",
1832    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-1x4-acc5.c",
1833    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-1x4.c",
1834    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-2x4-acc2.c",
1835    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-2x4-acc3.c",
1836    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-2x4.c",
1837    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-3x4-acc2.c",
1838    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-3x4.c",
1839    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-4x4-acc2.c",
1840    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-4x4.c",
1841    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-loadsplat-5x4.c",
1842    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-1x4-acc2.c",
1843    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-1x4-acc3.c",
1844    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-1x4-acc4.c",
1845    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-1x4-acc5.c",
1846    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-1x4.c",
1847    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-2x4-acc2.c",
1848    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-2x4-acc3.c",
1849    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-2x4.c",
1850    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-3x4-acc2.c",
1851    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-3x4.c",
1852    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-4x4-acc2.c",
1853    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-4x4.c",
1854    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-wasmsimd-x86-splat-5x4.c",
1855    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-1x4-acc2.c",
1856    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-1x4-acc3.c",
1857    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-1x4-acc4.c",
1858    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-1x4-acc5.c",
1859    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-1x4.c",
1860    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-2x4-acc2.c",
1861    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-2x4-acc3.c",
1862    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-2x4.c",
1863    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-3x4-acc2.c",
1864    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-loadsplat-3x4.c",
1865    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-1x4-acc2.c",
1866    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-1x4-acc3.c",
1867    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-1x4-acc4.c",
1868    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-1x4-acc5.c",
1869    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-1x4.c",
1870    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-2x4-acc2.c",
1871    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-2x4-acc3.c",
1872    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-2x4.c",
1873    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-3x4-acc2.c",
1874    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-arm-splat-3x4.c",
1875    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-1x4-acc2.c",
1876    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-1x4-acc3.c",
1877    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-1x4-acc4.c",
1878    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-1x4-acc5.c",
1879    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-1x4.c",
1880    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-2x4-acc2.c",
1881    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-2x4-acc3.c",
1882    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-2x4.c",
1883    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-3x4-acc2.c",
1884    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-loadsplat-3x4.c",
1885    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-1x4-acc2.c",
1886    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-1x4-acc3.c",
1887    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-1x4-acc4.c",
1888    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-1x4-acc5.c",
1889    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-1x4.c",
1890    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-2x4-acc2.c",
1891    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-2x4-acc3.c",
1892    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-2x4.c",
1893    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-3x4-acc2.c",
1894    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-wasmsimd-x86-splat-3x4.c",
1895    "src/f32-f16-vcvt/gen/vcvt-wasmsimd-x8.c",
1896    "src/f32-f16-vcvt/gen/vcvt-wasmsimd-x16.c",
1897    "src/f32-f16-vcvt/gen/vcvt-wasmsimd-x24.c",
1898    "src/f32-f16-vcvt/gen/vcvt-wasmsimd-x32.c",
1899    "src/f32-gavgpool-cw/wasmsimd-arm-x4.c",
1900    "src/f32-gavgpool-cw/wasmsimd-x86-x4.c",
1901    "src/f32-gavgpool/7p7x-minmax-wasmsimd-arm-c4.c",
1902    "src/f32-gavgpool/7p7x-minmax-wasmsimd-x86-c4.c",
1903    "src/f32-gavgpool/7x-minmax-wasmsimd-arm-c4.c",
1904    "src/f32-gavgpool/7x-minmax-wasmsimd-x86-c4.c",
1905    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmsimd-arm-loadsplat.c",
1906    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmsimd-arm-splat.c",
1907    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmsimd-x86-loadsplat.c",
1908    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmsimd-x86-splat.c",
1909    "src/f32-gemm/gen-inc/1x8s4inc-minmax-wasmsimd-arm.c",
1910    "src/f32-gemm/gen-inc/1x8s4inc-minmax-wasmsimd-x86.c",
1911    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmsimd-arm-loadsplat.c",
1912    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmsimd-arm-splat.c",
1913    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmsimd-x86-loadsplat.c",
1914    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmsimd-x86-splat.c",
1915    "src/f32-gemm/gen-inc/3x8s4inc-minmax-wasmsimd-arm.c",
1916    "src/f32-gemm/gen-inc/3x8s4inc-minmax-wasmsimd-x86.c",
1917    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmsimd-arm-loadsplat.c",
1918    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmsimd-arm-splat.c",
1919    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmsimd-x86-loadsplat.c",
1920    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmsimd-x86-splat.c",
1921    "src/f32-gemm/gen-inc/4x8s4inc-minmax-wasmsimd-arm.c",
1922    "src/f32-gemm/gen-inc/4x8s4inc-minmax-wasmsimd-x86.c",
1923    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmsimd-arm-loadsplat.c",
1924    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmsimd-arm-splat.c",
1925    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmsimd-x86-loadsplat.c",
1926    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmsimd-x86-splat.c",
1927    "src/f32-gemm/gen-inc/5x8s4inc-minmax-wasmsimd-arm.c",
1928    "src/f32-gemm/gen-inc/5x8s4inc-minmax-wasmsimd-x86.c",
1929    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmsimd-arm-loadsplat.c",
1930    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmsimd-arm-splat.c",
1931    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmsimd-x86-loadsplat.c",
1932    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmsimd-x86-splat.c",
1933    "src/f32-gemm/gen-inc/6x8s4inc-minmax-wasmsimd-arm.c",
1934    "src/f32-gemm/gen-inc/6x8s4inc-minmax-wasmsimd-x86.c",
1935    "src/f32-gemm/gen/1x8-minmax-wasmsimd-arm-loadsplat.c",
1936    "src/f32-gemm/gen/1x8-minmax-wasmsimd-arm-splat.c",
1937    "src/f32-gemm/gen/1x8-minmax-wasmsimd-x86-loadsplat.c",
1938    "src/f32-gemm/gen/1x8-minmax-wasmsimd-x86-splat.c",
1939    "src/f32-gemm/gen/1x8-relu-wasmsimd-loadsplat.c",
1940    "src/f32-gemm/gen/1x8-relu-wasmsimd-splat.c",
1941    "src/f32-gemm/gen/1x8-wasmsimd-loadsplat.c",
1942    "src/f32-gemm/gen/1x8-wasmsimd-splat.c",
1943    "src/f32-gemm/gen/1x8s4-minmax-wasmsimd-arm.c",
1944    "src/f32-gemm/gen/1x8s4-minmax-wasmsimd-x86.c",
1945    "src/f32-gemm/gen/1x8s4-relu-wasmsimd.c",
1946    "src/f32-gemm/gen/1x8s4-wasmsimd.c",
1947    "src/f32-gemm/gen/3x8-minmax-wasmsimd-arm-loadsplat.c",
1948    "src/f32-gemm/gen/3x8-minmax-wasmsimd-arm-splat.c",
1949    "src/f32-gemm/gen/3x8-minmax-wasmsimd-x86-loadsplat.c",
1950    "src/f32-gemm/gen/3x8-minmax-wasmsimd-x86-splat.c",
1951    "src/f32-gemm/gen/3x8-relu-wasmsimd-loadsplat.c",
1952    "src/f32-gemm/gen/3x8-relu-wasmsimd-splat.c",
1953    "src/f32-gemm/gen/3x8-wasmsimd-loadsplat.c",
1954    "src/f32-gemm/gen/3x8-wasmsimd-splat.c",
1955    "src/f32-gemm/gen/3x8s4-minmax-wasmsimd-arm.c",
1956    "src/f32-gemm/gen/3x8s4-minmax-wasmsimd-x86.c",
1957    "src/f32-gemm/gen/3x8s4-relu-wasmsimd.c",
1958    "src/f32-gemm/gen/3x8s4-wasmsimd.c",
1959    "src/f32-gemm/gen/4x2c4-minmax-wasmsimd-arm.c",
1960    "src/f32-gemm/gen/4x2c4-minmax-wasmsimd-x86.c",
1961    "src/f32-gemm/gen/4x2c4-relu-wasmsimd.c",
1962    "src/f32-gemm/gen/4x2c4-wasmsimd.c",
1963    "src/f32-gemm/gen/4x8-minmax-wasmsimd-arm-loadsplat.c",
1964    "src/f32-gemm/gen/4x8-minmax-wasmsimd-arm-splat.c",
1965    "src/f32-gemm/gen/4x8-minmax-wasmsimd-x86-loadsplat.c",
1966    "src/f32-gemm/gen/4x8-minmax-wasmsimd-x86-splat.c",
1967    "src/f32-gemm/gen/4x8-relu-wasmsimd-loadsplat.c",
1968    "src/f32-gemm/gen/4x8-relu-wasmsimd-splat.c",
1969    "src/f32-gemm/gen/4x8-wasmsimd-loadsplat.c",
1970    "src/f32-gemm/gen/4x8-wasmsimd-splat.c",
1971    "src/f32-gemm/gen/4x8s4-minmax-wasmsimd-arm.c",
1972    "src/f32-gemm/gen/4x8s4-minmax-wasmsimd-x86.c",
1973    "src/f32-gemm/gen/4x8s4-relu-wasmsimd.c",
1974    "src/f32-gemm/gen/4x8s4-wasmsimd.c",
1975    "src/f32-gemm/gen/5x8-minmax-wasmsimd-arm-loadsplat.c",
1976    "src/f32-gemm/gen/5x8-minmax-wasmsimd-arm-splat.c",
1977    "src/f32-gemm/gen/5x8-minmax-wasmsimd-x86-loadsplat.c",
1978    "src/f32-gemm/gen/5x8-minmax-wasmsimd-x86-splat.c",
1979    "src/f32-gemm/gen/5x8-relu-wasmsimd-loadsplat.c",
1980    "src/f32-gemm/gen/5x8-relu-wasmsimd-splat.c",
1981    "src/f32-gemm/gen/5x8-wasmsimd-loadsplat.c",
1982    "src/f32-gemm/gen/5x8-wasmsimd-splat.c",
1983    "src/f32-gemm/gen/5x8s4-minmax-wasmsimd-arm.c",
1984    "src/f32-gemm/gen/5x8s4-minmax-wasmsimd-x86.c",
1985    "src/f32-gemm/gen/5x8s4-relu-wasmsimd.c",
1986    "src/f32-gemm/gen/5x8s4-wasmsimd.c",
1987    "src/f32-gemm/gen/6x8-minmax-wasmsimd-arm-loadsplat.c",
1988    "src/f32-gemm/gen/6x8-minmax-wasmsimd-arm-splat.c",
1989    "src/f32-gemm/gen/6x8-minmax-wasmsimd-x86-loadsplat.c",
1990    "src/f32-gemm/gen/6x8-minmax-wasmsimd-x86-splat.c",
1991    "src/f32-gemm/gen/6x8-relu-wasmsimd-loadsplat.c",
1992    "src/f32-gemm/gen/6x8-relu-wasmsimd-splat.c",
1993    "src/f32-gemm/gen/6x8-wasmsimd-loadsplat.c",
1994    "src/f32-gemm/gen/6x8-wasmsimd-splat.c",
1995    "src/f32-gemm/gen/6x8s4-minmax-wasmsimd-arm.c",
1996    "src/f32-gemm/gen/6x8s4-minmax-wasmsimd-x86.c",
1997    "src/f32-gemm/gen/6x8s4-relu-wasmsimd.c",
1998    "src/f32-gemm/gen/6x8s4-wasmsimd.c",
1999    "src/f32-ibilinear-chw/gen/wasmsimd-p4.c",
2000    "src/f32-ibilinear-chw/gen/wasmsimd-p8.c",
2001    "src/f32-ibilinear/gen/wasmsimd-c4.c",
2002    "src/f32-ibilinear/gen/wasmsimd-c8.c",
2003    "src/f32-igemm/gen/1x8-minmax-wasmsimd-arm-loadsplat.c",
2004    "src/f32-igemm/gen/1x8-minmax-wasmsimd-arm-splat.c",
2005    "src/f32-igemm/gen/1x8-minmax-wasmsimd-x86-loadsplat.c",
2006    "src/f32-igemm/gen/1x8-minmax-wasmsimd-x86-splat.c",
2007    "src/f32-igemm/gen/1x8-relu-wasmsimd-loadsplat.c",
2008    "src/f32-igemm/gen/1x8-relu-wasmsimd-splat.c",
2009    "src/f32-igemm/gen/1x8-wasmsimd-loadsplat.c",
2010    "src/f32-igemm/gen/1x8-wasmsimd-splat.c",
2011    "src/f32-igemm/gen/1x8s4-minmax-wasmsimd-arm.c",
2012    "src/f32-igemm/gen/1x8s4-minmax-wasmsimd-x86.c",
2013    "src/f32-igemm/gen/1x8s4-relu-wasmsimd.c",
2014    "src/f32-igemm/gen/1x8s4-wasmsimd.c",
2015    "src/f32-igemm/gen/3x8-minmax-wasmsimd-arm-loadsplat.c",
2016    "src/f32-igemm/gen/3x8-minmax-wasmsimd-arm-splat.c",
2017    "src/f32-igemm/gen/3x8-minmax-wasmsimd-x86-loadsplat.c",
2018    "src/f32-igemm/gen/3x8-minmax-wasmsimd-x86-splat.c",
2019    "src/f32-igemm/gen/3x8-relu-wasmsimd-loadsplat.c",
2020    "src/f32-igemm/gen/3x8-relu-wasmsimd-splat.c",
2021    "src/f32-igemm/gen/3x8-wasmsimd-loadsplat.c",
2022    "src/f32-igemm/gen/3x8-wasmsimd-splat.c",
2023    "src/f32-igemm/gen/3x8s4-minmax-wasmsimd-arm.c",
2024    "src/f32-igemm/gen/3x8s4-minmax-wasmsimd-x86.c",
2025    "src/f32-igemm/gen/3x8s4-relu-wasmsimd.c",
2026    "src/f32-igemm/gen/3x8s4-wasmsimd.c",
2027    "src/f32-igemm/gen/4x2c4-minmax-wasmsimd-arm.c",
2028    "src/f32-igemm/gen/4x2c4-minmax-wasmsimd-x86.c",
2029    "src/f32-igemm/gen/4x2c4-relu-wasmsimd.c",
2030    "src/f32-igemm/gen/4x2c4-wasmsimd.c",
2031    "src/f32-igemm/gen/4x8-minmax-wasmsimd-arm-loadsplat.c",
2032    "src/f32-igemm/gen/4x8-minmax-wasmsimd-arm-splat.c",
2033    "src/f32-igemm/gen/4x8-minmax-wasmsimd-x86-loadsplat.c",
2034    "src/f32-igemm/gen/4x8-minmax-wasmsimd-x86-splat.c",
2035    "src/f32-igemm/gen/4x8-relu-wasmsimd-loadsplat.c",
2036    "src/f32-igemm/gen/4x8-relu-wasmsimd-splat.c",
2037    "src/f32-igemm/gen/4x8-wasmsimd-loadsplat.c",
2038    "src/f32-igemm/gen/4x8-wasmsimd-splat.c",
2039    "src/f32-igemm/gen/4x8s4-minmax-wasmsimd-arm.c",
2040    "src/f32-igemm/gen/4x8s4-minmax-wasmsimd-x86.c",
2041    "src/f32-igemm/gen/4x8s4-relu-wasmsimd.c",
2042    "src/f32-igemm/gen/4x8s4-wasmsimd.c",
2043    "src/f32-igemm/gen/5x8-minmax-wasmsimd-arm-loadsplat.c",
2044    "src/f32-igemm/gen/5x8-minmax-wasmsimd-arm-splat.c",
2045    "src/f32-igemm/gen/5x8-minmax-wasmsimd-x86-loadsplat.c",
2046    "src/f32-igemm/gen/5x8-minmax-wasmsimd-x86-splat.c",
2047    "src/f32-igemm/gen/5x8-relu-wasmsimd-loadsplat.c",
2048    "src/f32-igemm/gen/5x8-relu-wasmsimd-splat.c",
2049    "src/f32-igemm/gen/5x8-wasmsimd-loadsplat.c",
2050    "src/f32-igemm/gen/5x8-wasmsimd-splat.c",
2051    "src/f32-igemm/gen/5x8s4-minmax-wasmsimd-arm.c",
2052    "src/f32-igemm/gen/5x8s4-minmax-wasmsimd-x86.c",
2053    "src/f32-igemm/gen/5x8s4-relu-wasmsimd.c",
2054    "src/f32-igemm/gen/5x8s4-wasmsimd.c",
2055    "src/f32-igemm/gen/6x8-minmax-wasmsimd-arm-loadsplat.c",
2056    "src/f32-igemm/gen/6x8-minmax-wasmsimd-arm-splat.c",
2057    "src/f32-igemm/gen/6x8-minmax-wasmsimd-x86-loadsplat.c",
2058    "src/f32-igemm/gen/6x8-minmax-wasmsimd-x86-splat.c",
2059    "src/f32-igemm/gen/6x8-relu-wasmsimd-loadsplat.c",
2060    "src/f32-igemm/gen/6x8-relu-wasmsimd-splat.c",
2061    "src/f32-igemm/gen/6x8-wasmsimd-loadsplat.c",
2062    "src/f32-igemm/gen/6x8-wasmsimd-splat.c",
2063    "src/f32-igemm/gen/6x8s4-minmax-wasmsimd-arm.c",
2064    "src/f32-igemm/gen/6x8s4-minmax-wasmsimd-x86.c",
2065    "src/f32-igemm/gen/6x8s4-relu-wasmsimd.c",
2066    "src/f32-igemm/gen/6x8s4-wasmsimd.c",
2067    "src/f32-maxpool/9p8x-minmax-wasmsimd-arm-c4.c",
2068    "src/f32-maxpool/9p8x-minmax-wasmsimd-x86-c4.c",
2069    "src/f32-pavgpool/9p8x-minmax-wasmsimd-arm-c4.c",
2070    "src/f32-pavgpool/9p8x-minmax-wasmsimd-x86-c4.c",
2071    "src/f32-pavgpool/9x-minmax-wasmsimd-arm-c4.c",
2072    "src/f32-pavgpool/9x-minmax-wasmsimd-x86-c4.c",
2073    "src/f32-ppmm/gen/4x8-minmax-wasmsimd-arm-splat.c",
2074    "src/f32-ppmm/gen/4x8-minmax-wasmsimd-x86-splat.c",
2075    "src/f32-prelu/gen/wasmsimd-bitselect-1x4.c",
2076    "src/f32-prelu/gen/wasmsimd-bitselect-1x8.c",
2077    "src/f32-prelu/gen/wasmsimd-bitselect-1x16.c",
2078    "src/f32-prelu/gen/wasmsimd-bitselect-2x4.c",
2079    "src/f32-prelu/gen/wasmsimd-bitselect-2x8.c",
2080    "src/f32-prelu/gen/wasmsimd-bitselect-2x16.c",
2081    "src/f32-prelu/gen/wasmsimd-bitselect-4x4.c",
2082    "src/f32-prelu/gen/wasmsimd-bitselect-4x8.c",
2083    "src/f32-prelu/gen/wasmsimd-bitselect-4x16.c",
2084    "src/f32-prelu/gen/wasmsimd-minmax-1x4.c",
2085    "src/f32-prelu/gen/wasmsimd-minmax-1x8.c",
2086    "src/f32-prelu/gen/wasmsimd-minmax-1x16.c",
2087    "src/f32-prelu/gen/wasmsimd-minmax-2x4.c",
2088    "src/f32-prelu/gen/wasmsimd-minmax-2x8.c",
2089    "src/f32-prelu/gen/wasmsimd-minmax-2x16.c",
2090    "src/f32-prelu/gen/wasmsimd-minmax-4x4.c",
2091    "src/f32-prelu/gen/wasmsimd-minmax-4x8.c",
2092    "src/f32-prelu/gen/wasmsimd-minmax-4x16.c",
2093    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-cvt-x8.c",
2094    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-cvt-x16.c",
2095    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-cvt-x24.c",
2096    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-cvt-x32.c",
2097    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-magic-x8.c",
2098    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-magic-x16.c",
2099    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-magic-x24.c",
2100    "src/f32-qs8-vcvt/gen/vcvt-wasmsimd-magic-x32.c",
2101    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-cvt-x8.c",
2102    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-cvt-x16.c",
2103    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-cvt-x24.c",
2104    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-cvt-x32.c",
2105    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-magic-x8.c",
2106    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-magic-x16.c",
2107    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-magic-x24.c",
2108    "src/f32-qu8-vcvt/gen/vcvt-wasmsimd-magic-x32.c",
2109    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x4.c",
2110    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x8-acc2.c",
2111    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x8.c",
2112    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x12-acc2.c",
2113    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x12-acc3.c",
2114    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x12.c",
2115    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x16-acc2.c",
2116    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x16-acc4.c",
2117    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x16.c",
2118    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x20-acc2.c",
2119    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x20-acc5.c",
2120    "src/f32-raddstoreexpminusmax/gen/wasmsimd-rr2-p5-x20.c",
2121    "src/f32-rmax/wasmsimd-arm.c",
2122    "src/f32-rmax/wasmsimd-x86.c",
2123    "src/f32-spmm/gen/4x1-minmax-wasmsimd-arm-pipelined-x2.c",
2124    "src/f32-spmm/gen/4x1-minmax-wasmsimd-arm-pipelined.c",
2125    "src/f32-spmm/gen/4x1-minmax-wasmsimd-arm-x2.c",
2126    "src/f32-spmm/gen/4x1-minmax-wasmsimd-arm-x4.c",
2127    "src/f32-spmm/gen/4x1-minmax-wasmsimd-arm.c",
2128    "src/f32-spmm/gen/4x1-minmax-wasmsimd-x86-pipelined-x2.c",
2129    "src/f32-spmm/gen/4x1-minmax-wasmsimd-x86-pipelined.c",
2130    "src/f32-spmm/gen/4x1-minmax-wasmsimd-x86-x2.c",
2131    "src/f32-spmm/gen/4x1-minmax-wasmsimd-x86-x4.c",
2132    "src/f32-spmm/gen/4x1-minmax-wasmsimd-x86.c",
2133    "src/f32-spmm/gen/8x1-minmax-wasmsimd-arm-pipelined-x2.c",
2134    "src/f32-spmm/gen/8x1-minmax-wasmsimd-arm-pipelined.c",
2135    "src/f32-spmm/gen/8x1-minmax-wasmsimd-arm-x2.c",
2136    "src/f32-spmm/gen/8x1-minmax-wasmsimd-arm-x4.c",
2137    "src/f32-spmm/gen/8x1-minmax-wasmsimd-arm.c",
2138    "src/f32-spmm/gen/8x1-minmax-wasmsimd-x86-pipelined-x2.c",
2139    "src/f32-spmm/gen/8x1-minmax-wasmsimd-x86-pipelined.c",
2140    "src/f32-spmm/gen/8x1-minmax-wasmsimd-x86-x2.c",
2141    "src/f32-spmm/gen/8x1-minmax-wasmsimd-x86-x4.c",
2142    "src/f32-spmm/gen/8x1-minmax-wasmsimd-x86.c",
2143    "src/f32-spmm/gen/16x1-minmax-wasmsimd-arm-pipelined-x2.c",
2144    "src/f32-spmm/gen/16x1-minmax-wasmsimd-arm-pipelined.c",
2145    "src/f32-spmm/gen/16x1-minmax-wasmsimd-arm-x2.c",
2146    "src/f32-spmm/gen/16x1-minmax-wasmsimd-arm-x4.c",
2147    "src/f32-spmm/gen/16x1-minmax-wasmsimd-arm.c",
2148    "src/f32-spmm/gen/16x1-minmax-wasmsimd-x86-pipelined-x2.c",
2149    "src/f32-spmm/gen/16x1-minmax-wasmsimd-x86-pipelined.c",
2150    "src/f32-spmm/gen/16x1-minmax-wasmsimd-x86-x2.c",
2151    "src/f32-spmm/gen/16x1-minmax-wasmsimd-x86-x4.c",
2152    "src/f32-spmm/gen/16x1-minmax-wasmsimd-x86.c",
2153    "src/f32-spmm/gen/32x1-minmax-wasmsimd-arm-pipelined-x2.c",
2154    "src/f32-spmm/gen/32x1-minmax-wasmsimd-arm-pipelined.c",
2155    "src/f32-spmm/gen/32x1-minmax-wasmsimd-arm-x2.c",
2156    "src/f32-spmm/gen/32x1-minmax-wasmsimd-arm-x4.c",
2157    "src/f32-spmm/gen/32x1-minmax-wasmsimd-arm.c",
2158    "src/f32-spmm/gen/32x1-minmax-wasmsimd-x86-pipelined-x2.c",
2159    "src/f32-spmm/gen/32x1-minmax-wasmsimd-x86-pipelined.c",
2160    "src/f32-spmm/gen/32x1-minmax-wasmsimd-x86-x2.c",
2161    "src/f32-spmm/gen/32x1-minmax-wasmsimd-x86-x4.c",
2162    "src/f32-spmm/gen/32x1-minmax-wasmsimd-x86.c",
2163    "src/f32-vbinary/gen/vadd-minmax-wasmsimd-arm-x4.c",
2164    "src/f32-vbinary/gen/vadd-minmax-wasmsimd-arm-x8.c",
2165    "src/f32-vbinary/gen/vadd-minmax-wasmsimd-arm-x16.c",
2166    "src/f32-vbinary/gen/vadd-minmax-wasmsimd-x86-x4.c",
2167    "src/f32-vbinary/gen/vadd-minmax-wasmsimd-x86-x8.c",
2168    "src/f32-vbinary/gen/vadd-minmax-wasmsimd-x86-x16.c",
2169    "src/f32-vbinary/gen/vadd-relu-wasmsimd-x4.c",
2170    "src/f32-vbinary/gen/vadd-relu-wasmsimd-x8.c",
2171    "src/f32-vbinary/gen/vadd-relu-wasmsimd-x16.c",
2172    "src/f32-vbinary/gen/vadd-wasmsimd-x4.c",
2173    "src/f32-vbinary/gen/vadd-wasmsimd-x8.c",
2174    "src/f32-vbinary/gen/vadd-wasmsimd-x16.c",
2175    "src/f32-vbinary/gen/vaddc-minmax-wasmsimd-arm-x4.c",
2176    "src/f32-vbinary/gen/vaddc-minmax-wasmsimd-arm-x8.c",
2177    "src/f32-vbinary/gen/vaddc-minmax-wasmsimd-arm-x16.c",
2178    "src/f32-vbinary/gen/vaddc-minmax-wasmsimd-x86-x4.c",
2179    "src/f32-vbinary/gen/vaddc-minmax-wasmsimd-x86-x8.c",
2180    "src/f32-vbinary/gen/vaddc-minmax-wasmsimd-x86-x16.c",
2181    "src/f32-vbinary/gen/vaddc-relu-wasmsimd-x4.c",
2182    "src/f32-vbinary/gen/vaddc-relu-wasmsimd-x8.c",
2183    "src/f32-vbinary/gen/vaddc-relu-wasmsimd-x16.c",
2184    "src/f32-vbinary/gen/vaddc-wasmsimd-x4.c",
2185    "src/f32-vbinary/gen/vaddc-wasmsimd-x8.c",
2186    "src/f32-vbinary/gen/vaddc-wasmsimd-x16.c",
2187    "src/f32-vbinary/gen/vdiv-minmax-wasmsimd-arm-x4.c",
2188    "src/f32-vbinary/gen/vdiv-minmax-wasmsimd-arm-x8.c",
2189    "src/f32-vbinary/gen/vdiv-minmax-wasmsimd-arm-x16.c",
2190    "src/f32-vbinary/gen/vdiv-minmax-wasmsimd-x86-x4.c",
2191    "src/f32-vbinary/gen/vdiv-minmax-wasmsimd-x86-x8.c",
2192    "src/f32-vbinary/gen/vdiv-minmax-wasmsimd-x86-x16.c",
2193    "src/f32-vbinary/gen/vdiv-relu-wasmsimd-x4.c",
2194    "src/f32-vbinary/gen/vdiv-relu-wasmsimd-x8.c",
2195    "src/f32-vbinary/gen/vdiv-relu-wasmsimd-x16.c",
2196    "src/f32-vbinary/gen/vdiv-wasmsimd-x4.c",
2197    "src/f32-vbinary/gen/vdiv-wasmsimd-x8.c",
2198    "src/f32-vbinary/gen/vdiv-wasmsimd-x16.c",
2199    "src/f32-vbinary/gen/vdivc-minmax-wasmsimd-arm-x4.c",
2200    "src/f32-vbinary/gen/vdivc-minmax-wasmsimd-arm-x8.c",
2201    "src/f32-vbinary/gen/vdivc-minmax-wasmsimd-arm-x16.c",
2202    "src/f32-vbinary/gen/vdivc-minmax-wasmsimd-x86-x4.c",
2203    "src/f32-vbinary/gen/vdivc-minmax-wasmsimd-x86-x8.c",
2204    "src/f32-vbinary/gen/vdivc-minmax-wasmsimd-x86-x16.c",
2205    "src/f32-vbinary/gen/vdivc-relu-wasmsimd-x4.c",
2206    "src/f32-vbinary/gen/vdivc-relu-wasmsimd-x8.c",
2207    "src/f32-vbinary/gen/vdivc-relu-wasmsimd-x16.c",
2208    "src/f32-vbinary/gen/vdivc-wasmsimd-x4.c",
2209    "src/f32-vbinary/gen/vdivc-wasmsimd-x8.c",
2210    "src/f32-vbinary/gen/vdivc-wasmsimd-x16.c",
2211    "src/f32-vbinary/gen/vmax-wasmsimd-arm-x4.c",
2212    "src/f32-vbinary/gen/vmax-wasmsimd-arm-x8.c",
2213    "src/f32-vbinary/gen/vmax-wasmsimd-arm-x16.c",
2214    "src/f32-vbinary/gen/vmax-wasmsimd-x86-x4.c",
2215    "src/f32-vbinary/gen/vmax-wasmsimd-x86-x8.c",
2216    "src/f32-vbinary/gen/vmax-wasmsimd-x86-x16.c",
2217    "src/f32-vbinary/gen/vmaxc-wasmsimd-arm-x4.c",
2218    "src/f32-vbinary/gen/vmaxc-wasmsimd-arm-x8.c",
2219    "src/f32-vbinary/gen/vmaxc-wasmsimd-arm-x16.c",
2220    "src/f32-vbinary/gen/vmaxc-wasmsimd-x86-x4.c",
2221    "src/f32-vbinary/gen/vmaxc-wasmsimd-x86-x8.c",
2222    "src/f32-vbinary/gen/vmaxc-wasmsimd-x86-x16.c",
2223    "src/f32-vbinary/gen/vmin-wasmsimd-arm-x4.c",
2224    "src/f32-vbinary/gen/vmin-wasmsimd-arm-x8.c",
2225    "src/f32-vbinary/gen/vmin-wasmsimd-arm-x16.c",
2226    "src/f32-vbinary/gen/vmin-wasmsimd-x86-x4.c",
2227    "src/f32-vbinary/gen/vmin-wasmsimd-x86-x8.c",
2228    "src/f32-vbinary/gen/vmin-wasmsimd-x86-x16.c",
2229    "src/f32-vbinary/gen/vminc-wasmsimd-arm-x4.c",
2230    "src/f32-vbinary/gen/vminc-wasmsimd-arm-x8.c",
2231    "src/f32-vbinary/gen/vminc-wasmsimd-arm-x16.c",
2232    "src/f32-vbinary/gen/vminc-wasmsimd-x86-x4.c",
2233    "src/f32-vbinary/gen/vminc-wasmsimd-x86-x8.c",
2234    "src/f32-vbinary/gen/vminc-wasmsimd-x86-x16.c",
2235    "src/f32-vbinary/gen/vmul-minmax-wasmsimd-arm-x4.c",
2236    "src/f32-vbinary/gen/vmul-minmax-wasmsimd-arm-x8.c",
2237    "src/f32-vbinary/gen/vmul-minmax-wasmsimd-arm-x16.c",
2238    "src/f32-vbinary/gen/vmul-minmax-wasmsimd-x86-x4.c",
2239    "src/f32-vbinary/gen/vmul-minmax-wasmsimd-x86-x8.c",
2240    "src/f32-vbinary/gen/vmul-minmax-wasmsimd-x86-x16.c",
2241    "src/f32-vbinary/gen/vmul-relu-wasmsimd-x4.c",
2242    "src/f32-vbinary/gen/vmul-relu-wasmsimd-x8.c",
2243    "src/f32-vbinary/gen/vmul-relu-wasmsimd-x16.c",
2244    "src/f32-vbinary/gen/vmul-wasmsimd-x4.c",
2245    "src/f32-vbinary/gen/vmul-wasmsimd-x8.c",
2246    "src/f32-vbinary/gen/vmul-wasmsimd-x16.c",
2247    "src/f32-vbinary/gen/vmulc-minmax-wasmsimd-arm-x4.c",
2248    "src/f32-vbinary/gen/vmulc-minmax-wasmsimd-arm-x8.c",
2249    "src/f32-vbinary/gen/vmulc-minmax-wasmsimd-arm-x16.c",
2250    "src/f32-vbinary/gen/vmulc-minmax-wasmsimd-x86-x4.c",
2251    "src/f32-vbinary/gen/vmulc-minmax-wasmsimd-x86-x8.c",
2252    "src/f32-vbinary/gen/vmulc-minmax-wasmsimd-x86-x16.c",
2253    "src/f32-vbinary/gen/vmulc-relu-wasmsimd-x4.c",
2254    "src/f32-vbinary/gen/vmulc-relu-wasmsimd-x8.c",
2255    "src/f32-vbinary/gen/vmulc-relu-wasmsimd-x16.c",
2256    "src/f32-vbinary/gen/vmulc-wasmsimd-x4.c",
2257    "src/f32-vbinary/gen/vmulc-wasmsimd-x8.c",
2258    "src/f32-vbinary/gen/vmulc-wasmsimd-x16.c",
2259    "src/f32-vbinary/gen/vrdivc-minmax-wasmsimd-arm-x4.c",
2260    "src/f32-vbinary/gen/vrdivc-minmax-wasmsimd-arm-x8.c",
2261    "src/f32-vbinary/gen/vrdivc-minmax-wasmsimd-arm-x16.c",
2262    "src/f32-vbinary/gen/vrdivc-minmax-wasmsimd-x86-x4.c",
2263    "src/f32-vbinary/gen/vrdivc-minmax-wasmsimd-x86-x8.c",
2264    "src/f32-vbinary/gen/vrdivc-minmax-wasmsimd-x86-x16.c",
2265    "src/f32-vbinary/gen/vrdivc-relu-wasmsimd-x4.c",
2266    "src/f32-vbinary/gen/vrdivc-relu-wasmsimd-x8.c",
2267    "src/f32-vbinary/gen/vrdivc-relu-wasmsimd-x16.c",
2268    "src/f32-vbinary/gen/vrdivc-wasmsimd-x4.c",
2269    "src/f32-vbinary/gen/vrdivc-wasmsimd-x8.c",
2270    "src/f32-vbinary/gen/vrdivc-wasmsimd-x16.c",
2271    "src/f32-vbinary/gen/vrsubc-minmax-wasmsimd-arm-x4.c",
2272    "src/f32-vbinary/gen/vrsubc-minmax-wasmsimd-arm-x8.c",
2273    "src/f32-vbinary/gen/vrsubc-minmax-wasmsimd-arm-x16.c",
2274    "src/f32-vbinary/gen/vrsubc-minmax-wasmsimd-x86-x4.c",
2275    "src/f32-vbinary/gen/vrsubc-minmax-wasmsimd-x86-x8.c",
2276    "src/f32-vbinary/gen/vrsubc-minmax-wasmsimd-x86-x16.c",
2277    "src/f32-vbinary/gen/vrsubc-relu-wasmsimd-x4.c",
2278    "src/f32-vbinary/gen/vrsubc-relu-wasmsimd-x8.c",
2279    "src/f32-vbinary/gen/vrsubc-relu-wasmsimd-x16.c",
2280    "src/f32-vbinary/gen/vrsubc-wasmsimd-x4.c",
2281    "src/f32-vbinary/gen/vrsubc-wasmsimd-x8.c",
2282    "src/f32-vbinary/gen/vrsubc-wasmsimd-x16.c",
2283    "src/f32-vbinary/gen/vsqrdiff-wasmsimd-x4.c",
2284    "src/f32-vbinary/gen/vsqrdiff-wasmsimd-x8.c",
2285    "src/f32-vbinary/gen/vsqrdiff-wasmsimd-x16.c",
2286    "src/f32-vbinary/gen/vsqrdiffc-wasmsimd-x4.c",
2287    "src/f32-vbinary/gen/vsqrdiffc-wasmsimd-x8.c",
2288    "src/f32-vbinary/gen/vsqrdiffc-wasmsimd-x16.c",
2289    "src/f32-vbinary/gen/vsub-minmax-wasmsimd-arm-x4.c",
2290    "src/f32-vbinary/gen/vsub-minmax-wasmsimd-arm-x8.c",
2291    "src/f32-vbinary/gen/vsub-minmax-wasmsimd-arm-x16.c",
2292    "src/f32-vbinary/gen/vsub-minmax-wasmsimd-x86-x4.c",
2293    "src/f32-vbinary/gen/vsub-minmax-wasmsimd-x86-x8.c",
2294    "src/f32-vbinary/gen/vsub-minmax-wasmsimd-x86-x16.c",
2295    "src/f32-vbinary/gen/vsub-relu-wasmsimd-x4.c",
2296    "src/f32-vbinary/gen/vsub-relu-wasmsimd-x8.c",
2297    "src/f32-vbinary/gen/vsub-relu-wasmsimd-x16.c",
2298    "src/f32-vbinary/gen/vsub-wasmsimd-x4.c",
2299    "src/f32-vbinary/gen/vsub-wasmsimd-x8.c",
2300    "src/f32-vbinary/gen/vsub-wasmsimd-x16.c",
2301    "src/f32-vbinary/gen/vsubc-minmax-wasmsimd-arm-x4.c",
2302    "src/f32-vbinary/gen/vsubc-minmax-wasmsimd-arm-x8.c",
2303    "src/f32-vbinary/gen/vsubc-minmax-wasmsimd-arm-x16.c",
2304    "src/f32-vbinary/gen/vsubc-minmax-wasmsimd-x86-x4.c",
2305    "src/f32-vbinary/gen/vsubc-minmax-wasmsimd-x86-x8.c",
2306    "src/f32-vbinary/gen/vsubc-minmax-wasmsimd-x86-x16.c",
2307    "src/f32-vbinary/gen/vsubc-relu-wasmsimd-x4.c",
2308    "src/f32-vbinary/gen/vsubc-relu-wasmsimd-x8.c",
2309    "src/f32-vbinary/gen/vsubc-relu-wasmsimd-x16.c",
2310    "src/f32-vbinary/gen/vsubc-wasmsimd-x4.c",
2311    "src/f32-vbinary/gen/vsubc-wasmsimd-x8.c",
2312    "src/f32-vbinary/gen/vsubc-wasmsimd-x16.c",
2313    "src/f32-vclamp/gen/vclamp-wasmsimd-arm-x4.c",
2314    "src/f32-vclamp/gen/vclamp-wasmsimd-arm-x8.c",
2315    "src/f32-vclamp/gen/vclamp-wasmsimd-x86-x4.c",
2316    "src/f32-vclamp/gen/vclamp-wasmsimd-x86-x8.c",
2317    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-lut16-p3-x4.c",
2318    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-lut16-p3-x8.c",
2319    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-lut16-p3-x12.c",
2320    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-lut16-p3-x16.c",
2321    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-lut16-p3-x20.c",
2322    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-lut16-p3-x24.c",
2323    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-p6-x4.c",
2324    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-p6-x8.c",
2325    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-p6-x12.c",
2326    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-p6-x16.c",
2327    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-p6-x20.c",
2328    "src/f32-velu/gen/velu-wasmsimd-arm-rr2-p6-x24.c",
2329    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-lut16-p3-x4.c",
2330    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-lut16-p3-x8.c",
2331    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-lut16-p3-x12.c",
2332    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-lut16-p3-x16.c",
2333    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-lut16-p3-x20.c",
2334    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-lut16-p3-x24.c",
2335    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-p6-x4.c",
2336    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-p6-x8.c",
2337    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-p6-x12.c",
2338    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-p6-x16.c",
2339    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-p6-x20.c",
2340    "src/f32-velu/gen/velu-wasmsimd-x86-rr2-p6-x24.c",
2341    "src/f32-vhswish/gen/vhswish-wasmsimd-x4.c",
2342    "src/f32-vhswish/gen/vhswish-wasmsimd-x8.c",
2343    "src/f32-vhswish/gen/vhswish-wasmsimd-x16.c",
2344    "src/f32-vlrelu/gen/vlrelu-wasmsimd-bitselect-x4.c",
2345    "src/f32-vlrelu/gen/vlrelu-wasmsimd-bitselect-x8.c",
2346    "src/f32-vlrelu/gen/vlrelu-wasmsimd-minmax-x4.c",
2347    "src/f32-vlrelu/gen/vlrelu-wasmsimd-minmax-x8.c",
2348    "src/f32-vmulcaddc/gen/c4-minmax-wasmsimd-arm-2x.c",
2349    "src/f32-vmulcaddc/gen/c4-minmax-wasmsimd-x86-2x.c",
2350    "src/f32-vmulcaddc/gen/c8-minmax-wasmsimd-arm-2x.c",
2351    "src/f32-vmulcaddc/gen/c8-minmax-wasmsimd-x86-2x.c",
2352    "src/f32-vrelu/gen/vrelu-wasmsimd-x4.c",
2353    "src/f32-vrelu/gen/vrelu-wasmsimd-x8.c",
2354    "src/f32-vrelu/gen/vrelu-wasmsimd-x16.c",
2355    "src/f32-vrnd/gen/vrndd-wasmsimd-x4.c",
2356    "src/f32-vrnd/gen/vrndd-wasmsimd-x8.c",
2357    "src/f32-vrnd/gen/vrndne-wasmsimd-x4.c",
2358    "src/f32-vrnd/gen/vrndne-wasmsimd-x8.c",
2359    "src/f32-vrnd/gen/vrndu-wasmsimd-x4.c",
2360    "src/f32-vrnd/gen/vrndu-wasmsimd-x8.c",
2361    "src/f32-vrnd/gen/vrndz-wasmsimd-x4.c",
2362    "src/f32-vrnd/gen/vrndz-wasmsimd-x8.c",
2363    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-lut64-p2-div-x4.c",
2364    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-lut64-p2-div-x8.c",
2365    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-lut64-p2-div-x12.c",
2366    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-lut64-p2-div-x16.c",
2367    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-lut64-p2-div-x20.c",
2368    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-lut64-p2-div-x24.c",
2369    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-p5-div-x4.c",
2370    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-p5-div-x8.c",
2371    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-p5-div-x12.c",
2372    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-p5-div-x16.c",
2373    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-p5-div-x20.c",
2374    "src/f32-vsigmoid/gen/vsigmoid-wasmsimd-rr2-p5-div-x24.c",
2375    "src/f32-vsqrt/gen/wasmsimd-sqrt-x4.c",
2376    "src/f32-vsqrt/gen/wasmsimd-sqrt-x8.c",
2377    "src/f32-vunary/gen/vabs-wasmsimd-x4.c",
2378    "src/f32-vunary/gen/vabs-wasmsimd-x8.c",
2379    "src/f32-vunary/gen/vneg-wasmsimd-x4.c",
2380    "src/f32-vunary/gen/vneg-wasmsimd-x8.c",
2381    "src/f32-vunary/gen/vsqr-wasmsimd-x4.c",
2382    "src/f32-vunary/gen/vsqr-wasmsimd-x8.c",
2383    "src/math/cvt-f16-f32-wasmsimd-int16.c",
2384    "src/math/cvt-f16-f32-wasmsimd-int32.c",
2385    "src/math/cvt-f32-f16-wasmsimd.c",
2386    "src/math/cvt-f32-qs8-wasmsimd.c",
2387    "src/math/cvt-f32-qu8-wasmsimd.c",
2388    "src/math/expm1minus-f32-wasmsimd-rr2-lut16-p3-andnot.c",
2389    "src/math/expm1minus-f32-wasmsimd-rr2-lut16-p3-max.c",
2390    "src/math/expm1minus-f32-wasmsimd-rr2-p6-andnot.c",
2391    "src/math/expm1minus-f32-wasmsimd-rr2-p6-max.c",
2392    "src/math/roundd-wasmsimd-addsub.c",
2393    "src/math/roundd-wasmsimd-cvt.c",
2394    "src/math/roundd-wasmsimd-native.c",
2395    "src/math/roundne-wasmsimd-addsub.c",
2396    "src/math/roundne-wasmsimd-native.c",
2397    "src/math/roundu-wasmsimd-addsub.c",
2398    "src/math/roundu-wasmsimd-cvt.c",
2399    "src/math/roundu-wasmsimd-native.c",
2400    "src/math/roundz-wasmsimd-addsub.c",
2401    "src/math/roundz-wasmsimd-cvt.c",
2402    "src/math/roundz-wasmsimd-native.c",
2403    "src/math/sigmoid-f32-wasmsimd-rr2-lut64-p2-div.c",
2404    "src/math/sigmoid-f32-wasmsimd-rr2-p5-div.c",
2405    "src/qc8-dwconv/gen/up8x9-minmax-fp32-wasmsimd-mul16-add16.c",
2406    "src/qc8-dwconv/gen/up8x9-minmax-fp32-wasmsimd-mul16.c",
2407    "src/qc8-dwconv/gen/up8x25-minmax-fp32-wasmsimd-mul16-add16.c",
2408    "src/qc8-dwconv/gen/up8x25-minmax-fp32-wasmsimd-mul16.c",
2409    "src/qc8-dwconv/gen/up16x3-minmax-fp32-wasmsimd-mul16-add16.c",
2410    "src/qc8-dwconv/gen/up16x9-minmax-fp32-wasmsimd-mul16-add16.c",
2411    "src/qc8-dwconv/gen/up16x9-minmax-fp32-wasmsimd-mul16.c",
2412    "src/qc8-dwconv/gen/up16x25-minmax-fp32-wasmsimd-mul16-add16.c",
2413    "src/qc8-dwconv/gen/up16x25-minmax-fp32-wasmsimd-mul16.c",
2414    "src/qc8-dwconv/gen/up24x9-minmax-fp32-wasmsimd-mul16-add16.c",
2415    "src/qc8-dwconv/gen/up24x9-minmax-fp32-wasmsimd-mul16.c",
2416    "src/qc8-dwconv/gen/up24x25-minmax-fp32-wasmsimd-mul16-add16.c",
2417    "src/qc8-dwconv/gen/up24x25-minmax-fp32-wasmsimd-mul16.c",
2418    "src/qc8-gemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2419    "src/qc8-gemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2420    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2421    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2422    "src/qc8-gemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2423    "src/qc8-gemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2424    "src/qc8-gemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2425    "src/qc8-gemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2426    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2427    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2428    "src/qc8-gemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2429    "src/qc8-gemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2430    "src/qc8-gemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2431    "src/qc8-gemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2432    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2433    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2434    "src/qc8-gemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2435    "src/qc8-gemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2436    "src/qc8-gemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2437    "src/qc8-gemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2438    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2439    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2440    "src/qc8-gemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2441    "src/qc8-gemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2442    "src/qc8-igemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2443    "src/qc8-igemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2444    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2445    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2446    "src/qc8-igemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2447    "src/qc8-igemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2448    "src/qc8-igemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2449    "src/qc8-igemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2450    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2451    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2452    "src/qc8-igemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2453    "src/qc8-igemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2454    "src/qc8-igemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2455    "src/qc8-igemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2456    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2457    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2458    "src/qc8-igemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2459    "src/qc8-igemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2460    "src/qc8-igemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2461    "src/qc8-igemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2462    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2463    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2464    "src/qc8-igemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2465    "src/qc8-igemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2466    "src/qs8-dwconv/gen/up8x9-minmax-fp32-wasmsimd-mul16-add16.c",
2467    "src/qs8-dwconv/gen/up8x9-minmax-fp32-wasmsimd-mul16.c",
2468    "src/qs8-dwconv/gen/up8x25-minmax-fp32-wasmsimd-mul16-add16.c",
2469    "src/qs8-dwconv/gen/up8x25-minmax-fp32-wasmsimd-mul16.c",
2470    "src/qs8-dwconv/gen/up16x9-minmax-fp32-wasmsimd-mul16-add16.c",
2471    "src/qs8-dwconv/gen/up16x9-minmax-fp32-wasmsimd-mul16.c",
2472    "src/qs8-dwconv/gen/up16x25-minmax-fp32-wasmsimd-mul16-add16.c",
2473    "src/qs8-dwconv/gen/up16x25-minmax-fp32-wasmsimd-mul16.c",
2474    "src/qs8-dwconv/gen/up24x9-minmax-fp32-wasmsimd-mul16-add16.c",
2475    "src/qs8-dwconv/gen/up24x9-minmax-fp32-wasmsimd-mul16.c",
2476    "src/qs8-dwconv/gen/up24x25-minmax-fp32-wasmsimd-mul16-add16.c",
2477    "src/qs8-dwconv/gen/up24x25-minmax-fp32-wasmsimd-mul16.c",
2478    "src/qs8-f32-vcvt/gen/vcvt-wasmsimd-x8.c",
2479    "src/qs8-f32-vcvt/gen/vcvt-wasmsimd-x16.c",
2480    "src/qs8-f32-vcvt/gen/vcvt-wasmsimd-x24.c",
2481    "src/qs8-f32-vcvt/gen/vcvt-wasmsimd-x32.c",
2482    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c8.c",
2483    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c16.c",
2484    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c24.c",
2485    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c32.c",
2486    "src/qs8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c8.c",
2487    "src/qs8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c16.c",
2488    "src/qs8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c24.c",
2489    "src/qs8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c32.c",
2490    "src/qs8-gemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2491    "src/qs8-gemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2492    "src/qs8-gemm/gen/1x4c2-xw-minmax-fp32-wasmsimd-dot16x2.c",
2493    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2494    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2495    "src/qs8-gemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2496    "src/qs8-gemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2497    "src/qs8-gemm/gen/1x4c8-xw-minmax-fp32-wasmsimd-dot16x2.c",
2498    "src/qs8-gemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2499    "src/qs8-gemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2500    "src/qs8-gemm/gen/2x4c2-xw-minmax-fp32-wasmsimd-dot16x2.c",
2501    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2502    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2503    "src/qs8-gemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2504    "src/qs8-gemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2505    "src/qs8-gemm/gen/2x4c8-xw-minmax-fp32-wasmsimd-dot16x2.c",
2506    "src/qs8-gemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2507    "src/qs8-gemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2508    "src/qs8-gemm/gen/3x4c2-xw-minmax-fp32-wasmsimd-dot16x2.c",
2509    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2510    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2511    "src/qs8-gemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2512    "src/qs8-gemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2513    "src/qs8-gemm/gen/3x4c8-xw-minmax-fp32-wasmsimd-dot16x2.c",
2514    "src/qs8-gemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2515    "src/qs8-gemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2516    "src/qs8-gemm/gen/4x4c2-xw-minmax-fp32-wasmsimd-dot16x2.c",
2517    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2518    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2519    "src/qs8-gemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2520    "src/qs8-gemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2521    "src/qs8-gemm/gen/4x4c8-xw-minmax-fp32-wasmsimd-dot16x2.c",
2522    "src/qs8-igemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2523    "src/qs8-igemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2524    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2525    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2526    "src/qs8-igemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2527    "src/qs8-igemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2528    "src/qs8-igemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2529    "src/qs8-igemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2530    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2531    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2532    "src/qs8-igemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2533    "src/qs8-igemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2534    "src/qs8-igemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2535    "src/qs8-igemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2536    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2537    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2538    "src/qs8-igemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2539    "src/qs8-igemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2540    "src/qs8-igemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2541    "src/qs8-igemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2542    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2543    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2544    "src/qs8-igemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2545    "src/qs8-igemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2546    "src/qs8-requantization/fp32-wasmsimd.c",
2547    "src/qs8-requantization/gemmlowp-wasmsimd.c",
2548    "src/qs8-vadd/gen/minmax-wasmsimd-x8.c",
2549    "src/qs8-vadd/gen/minmax-wasmsimd-x16.c",
2550    "src/qs8-vadd/gen/minmax-wasmsimd-x24.c",
2551    "src/qs8-vadd/gen/minmax-wasmsimd-x32.c",
2552    "src/qs8-vaddc/gen/minmax-wasmsimd-x8.c",
2553    "src/qs8-vaddc/gen/minmax-wasmsimd-x16.c",
2554    "src/qs8-vaddc/gen/minmax-wasmsimd-x24.c",
2555    "src/qs8-vaddc/gen/minmax-wasmsimd-x32.c",
2556    "src/qs8-vcvt/gen/vcvt-wasmsimd-x8.c",
2557    "src/qs8-vcvt/gen/vcvt-wasmsimd-x16.c",
2558    "src/qs8-vcvt/gen/vcvt-wasmsimd-x32.c",
2559    "src/qs8-vlrelu/gen/vlrelu-wasmsimd-arm-x16.c",
2560    "src/qs8-vlrelu/gen/vlrelu-wasmsimd-arm-x32.c",
2561    "src/qs8-vlrelu/gen/vlrelu-wasmsimd-x86-x8.c",
2562    "src/qs8-vlrelu/gen/vlrelu-wasmsimd-x86-x16.c",
2563    "src/qs8-vlrelu/gen/vlrelu-wasmsimd-x86-x32.c",
2564    "src/qs8-vmul/gen/minmax-fp32-wasmsimd-mul32-ld64-x8.c",
2565    "src/qs8-vmul/gen/minmax-fp32-wasmsimd-mul32-ld64-x16.c",
2566    "src/qs8-vmulc/gen/minmax-fp32-wasmsimd-mul32-ld64-x8.c",
2567    "src/qs8-vmulc/gen/minmax-fp32-wasmsimd-mul32-ld64-x16.c",
2568    "src/qu8-dwconv/gen/up8x9-minmax-fp32-wasmsimd-mul16.c",
2569    "src/qu8-dwconv/gen/up8x25-minmax-fp32-wasmsimd-mul16.c",
2570    "src/qu8-dwconv/gen/up16x9-minmax-fp32-wasmsimd-mul16.c",
2571    "src/qu8-dwconv/gen/up16x25-minmax-fp32-wasmsimd-mul16.c",
2572    "src/qu8-dwconv/gen/up24x9-minmax-fp32-wasmsimd-mul16.c",
2573    "src/qu8-dwconv/gen/up24x25-minmax-fp32-wasmsimd-mul16.c",
2574    "src/qu8-f32-vcvt/gen/vcvt-wasmsimd-x8.c",
2575    "src/qu8-f32-vcvt/gen/vcvt-wasmsimd-x16.c",
2576    "src/qu8-f32-vcvt/gen/vcvt-wasmsimd-x24.c",
2577    "src/qu8-f32-vcvt/gen/vcvt-wasmsimd-x32.c",
2578    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c8.c",
2579    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c16.c",
2580    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c24.c",
2581    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-wasmsimd-c32.c",
2582    "src/qu8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c8.c",
2583    "src/qu8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c16.c",
2584    "src/qu8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c24.c",
2585    "src/qu8-gavgpool/gen/7x-minmax-fp32-wasmsimd-c32.c",
2586    "src/qu8-gemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2587    "src/qu8-gemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2588    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2589    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2590    "src/qu8-gemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2591    "src/qu8-gemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2592    "src/qu8-gemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2593    "src/qu8-gemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2594    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2595    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2596    "src/qu8-gemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2597    "src/qu8-gemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2598    "src/qu8-gemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2599    "src/qu8-gemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2600    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2601    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2602    "src/qu8-gemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2603    "src/qu8-gemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2604    "src/qu8-gemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2605    "src/qu8-gemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2606    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2607    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2608    "src/qu8-gemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2609    "src/qu8-gemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2610    "src/qu8-igemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2611    "src/qu8-igemm/gen/1x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2612    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2613    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2614    "src/qu8-igemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2615    "src/qu8-igemm/gen/1x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2616    "src/qu8-igemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2617    "src/qu8-igemm/gen/2x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2618    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2619    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2620    "src/qu8-igemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2621    "src/qu8-igemm/gen/2x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2622    "src/qu8-igemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2623    "src/qu8-igemm/gen/3x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2624    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2625    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2626    "src/qu8-igemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2627    "src/qu8-igemm/gen/3x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2628    "src/qu8-igemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2629    "src/qu8-igemm/gen/4x4c2-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2630    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2631    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2632    "src/qu8-igemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld64.c",
2633    "src/qu8-igemm/gen/4x4c8-minmax-fp32-wasmsimd-dot16x2-ld128.c",
2634    "src/qu8-requantization/fp32-wasmsimd.c",
2635    "src/qu8-requantization/gemmlowp-wasmsimd.c",
2636    "src/qu8-vadd/gen/minmax-wasmsimd-x8.c",
2637    "src/qu8-vadd/gen/minmax-wasmsimd-x16.c",
2638    "src/qu8-vadd/gen/minmax-wasmsimd-x32.c",
2639    "src/qu8-vaddc/gen/minmax-wasmsimd-x8.c",
2640    "src/qu8-vaddc/gen/minmax-wasmsimd-x16.c",
2641    "src/qu8-vaddc/gen/minmax-wasmsimd-x32.c",
2642    "src/qu8-vcvt/gen/vcvt-wasmsimd-x8.c",
2643    "src/qu8-vcvt/gen/vcvt-wasmsimd-x16.c",
2644    "src/qu8-vcvt/gen/vcvt-wasmsimd-x32.c",
2645    "src/qu8-vlrelu/gen/vlrelu-wasmsimd-arm-x16.c",
2646    "src/qu8-vlrelu/gen/vlrelu-wasmsimd-arm-x32.c",
2647    "src/qu8-vlrelu/gen/vlrelu-wasmsimd-x86-x8.c",
2648    "src/qu8-vlrelu/gen/vlrelu-wasmsimd-x86-x16.c",
2649    "src/qu8-vlrelu/gen/vlrelu-wasmsimd-x86-x32.c",
2650    "src/qu8-vmul/gen/minmax-fp32-wasmsimd-mul32-ld64-x8.c",
2651    "src/qu8-vmul/gen/minmax-fp32-wasmsimd-mul32-ld64-x16.c",
2652    "src/qu8-vmulc/gen/minmax-fp32-wasmsimd-mul32-ld64-x8.c",
2653    "src/qu8-vmulc/gen/minmax-fp32-wasmsimd-mul32-ld64-x16.c",
2654    "src/s8-ibilinear/gen/wasmsimd-dot16x2-c8.c",
2655    "src/s8-ibilinear/gen/wasmsimd-dot16x2-c16.c",
2656    "src/s8-ibilinear/gen/wasmsimd-mul32-c8.c",
2657    "src/s8-ibilinear/gen/wasmsimd-mul32-c16.c",
2658    "src/s8-maxpool/9p8x-minmax-wasmsimd-c16.c",
2659    "src/s8-vclamp/wasmsimd-x64.c",
2660    "src/u8-ibilinear/gen/wasmsimd-dot16x2-c8.c",
2661    "src/u8-ibilinear/gen/wasmsimd-dot16x2-c16.c",
2662    "src/u8-ibilinear/gen/wasmsimd-mul32-c8.c",
2663    "src/u8-ibilinear/gen/wasmsimd-mul32-c16.c",
2664    "src/u8-maxpool/9p8x-minmax-wasmsimd-c16.c",
2665    "src/u8-vclamp/wasmsimd-x64.c",
2666    "src/xx-fill/wasmsimd-x64.c",
2667    "src/xx-pad/wasmsimd.c",
2668    "src/x8-lut/gen/lut-wasmsimd-x16.c",
2669    "src/x8-lut/gen/lut-wasmsimd-x32.c",
2670    "src/x8-lut/gen/lut-wasmsimd-x48.c",
2671    "src/x8-lut/gen/lut-wasmsimd-x64.c",
2672    "src/x8-transposec/gen/16x16-reuse-mov-wasmsimd.c",
2673    "src/x8-transposec/gen/16x16-reuse-switch-wasmsimd.c",
2674    "src/x16-transposec/gen/8x8-multi-mov-wasmsimd.c",
2675    "src/x16-transposec/gen/8x8-multi-switch-wasmsimd.c",
2676    "src/x16-transposec/gen/8x8-reuse-mov-wasmsimd.c",
2677    "src/x16-transposec/gen/8x8-reuse-multi-wasmsimd.c",
2678    "src/x16-transposec/gen/8x8-reuse-switch-wasmsimd.c",
2679    "src/x32-packx/x4-wasmsimd.c",
2680    "src/x32-transposec/gen/4x4-multi-mov-wasmsimd.c",
2681    "src/x32-transposec/gen/4x4-multi-multi-wasmsimd.c",
2682    "src/x32-transposec/gen/4x4-multi-switch-wasmsimd.c",
2683    "src/x32-transposec/gen/4x4-reuse-mov-wasmsimd.c",
2684    "src/x32-transposec/gen/4x4-reuse-multi-wasmsimd.c",
2685    "src/x32-transposec/gen/4x4-reuse-switch-wasmsimd.c",
2686    "src/x32-unpool/wasmsimd.c",
2687    "src/x32-zip/xm-wasmsimd.c",
2688    "src/x32-zip/x2-wasmsimd.c",
2689    "src/x32-zip/x3-wasmsimd.c",
2690    "src/x32-zip/x4-wasmsimd.c",
2691]
2692
2693ALL_WASMRELAXEDSIMD_MICROKERNEL_SRCS = [
2694    "src/f32-dwconv/gen/up4x3-minmax-wasmrelaxedsimd-acc2.c",
2695    "src/f32-dwconv/gen/up4x3-minmax-wasmrelaxedsimd-fma-acc2.c",
2696    "src/f32-dwconv/gen/up4x3-minmax-wasmrelaxedsimd-fma.c",
2697    "src/f32-dwconv/gen/up4x3-minmax-wasmrelaxedsimd.c",
2698    "src/f32-dwconv/gen/up4x3-wasmrelaxedsimd-fma.c",
2699    "src/f32-dwconv/gen/up4x4-minmax-wasmrelaxedsimd-acc2.c",
2700    "src/f32-dwconv/gen/up4x4-minmax-wasmrelaxedsimd-fma-acc2.c",
2701    "src/f32-dwconv/gen/up4x4-minmax-wasmrelaxedsimd-fma.c",
2702    "src/f32-dwconv/gen/up4x4-minmax-wasmrelaxedsimd.c",
2703    "src/f32-dwconv/gen/up4x4-wasmrelaxedsimd-fma.c",
2704    "src/f32-dwconv/gen/up4x9-minmax-wasmrelaxedsimd-acc2.c",
2705    "src/f32-dwconv/gen/up4x9-minmax-wasmrelaxedsimd-fma-acc2.c",
2706    "src/f32-dwconv/gen/up4x9-minmax-wasmrelaxedsimd-fma.c",
2707    "src/f32-dwconv/gen/up4x9-minmax-wasmrelaxedsimd.c",
2708    "src/f32-dwconv/gen/up4x9-wasmrelaxedsimd-fma.c",
2709    "src/f32-dwconv/gen/up4x25-minmax-wasmrelaxedsimd-acc2.c",
2710    "src/f32-dwconv/gen/up4x25-minmax-wasmrelaxedsimd-fma-acc2.c",
2711    "src/f32-dwconv/gen/up4x25-minmax-wasmrelaxedsimd-fma.c",
2712    "src/f32-dwconv/gen/up4x25-minmax-wasmrelaxedsimd.c",
2713    "src/f32-dwconv/gen/up4x25-wasmrelaxedsimd-fma.c",
2714    "src/f32-dwconv/gen/up8x3-minmax-wasmrelaxedsimd-acc2.c",
2715    "src/f32-dwconv/gen/up8x3-minmax-wasmrelaxedsimd-fma-acc2.c",
2716    "src/f32-dwconv/gen/up8x3-minmax-wasmrelaxedsimd-fma.c",
2717    "src/f32-dwconv/gen/up8x3-minmax-wasmrelaxedsimd.c",
2718    "src/f32-dwconv/gen/up8x3-wasmrelaxedsimd-fma.c",
2719    "src/f32-dwconv/gen/up8x4-minmax-wasmrelaxedsimd-acc2.c",
2720    "src/f32-dwconv/gen/up8x4-minmax-wasmrelaxedsimd-fma-acc2.c",
2721    "src/f32-dwconv/gen/up8x4-minmax-wasmrelaxedsimd-fma.c",
2722    "src/f32-dwconv/gen/up8x4-minmax-wasmrelaxedsimd.c",
2723    "src/f32-dwconv/gen/up8x4-wasmrelaxedsimd-fma.c",
2724    "src/f32-dwconv/gen/up8x9-minmax-wasmrelaxedsimd-acc2.c",
2725    "src/f32-dwconv/gen/up8x9-minmax-wasmrelaxedsimd-fma-acc2.c",
2726    "src/f32-dwconv/gen/up8x9-minmax-wasmrelaxedsimd-fma.c",
2727    "src/f32-dwconv/gen/up8x9-minmax-wasmrelaxedsimd.c",
2728    "src/f32-dwconv/gen/up8x9-wasmrelaxedsimd-fma.c",
2729    "src/f32-dwconv/gen/up8x25-minmax-wasmrelaxedsimd-acc2.c",
2730    "src/f32-dwconv/gen/up8x25-minmax-wasmrelaxedsimd-fma-acc2.c",
2731    "src/f32-dwconv/gen/up8x25-minmax-wasmrelaxedsimd-fma.c",
2732    "src/f32-dwconv/gen/up8x25-minmax-wasmrelaxedsimd.c",
2733    "src/f32-dwconv/gen/up8x25-wasmrelaxedsimd-fma.c",
2734    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2735    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmrelaxedsimd-fma-splat.c",
2736    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmrelaxedsimd-loadsplat.c",
2737    "src/f32-gemm/gen-inc/1x8inc-minmax-wasmrelaxedsimd-splat.c",
2738    "src/f32-gemm/gen-inc/1x8s4inc-minmax-wasmrelaxedsimd-fma.c",
2739    "src/f32-gemm/gen-inc/1x8s4inc-minmax-wasmrelaxedsimd.c",
2740    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2741    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmrelaxedsimd-fma-splat.c",
2742    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmrelaxedsimd-loadsplat.c",
2743    "src/f32-gemm/gen-inc/3x8inc-minmax-wasmrelaxedsimd-splat.c",
2744    "src/f32-gemm/gen-inc/3x8s4inc-minmax-wasmrelaxedsimd-fma.c",
2745    "src/f32-gemm/gen-inc/3x8s4inc-minmax-wasmrelaxedsimd.c",
2746    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2747    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmrelaxedsimd-fma-splat.c",
2748    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmrelaxedsimd-loadsplat.c",
2749    "src/f32-gemm/gen-inc/4x8inc-minmax-wasmrelaxedsimd-splat.c",
2750    "src/f32-gemm/gen-inc/4x8s4inc-minmax-wasmrelaxedsimd-fma.c",
2751    "src/f32-gemm/gen-inc/4x8s4inc-minmax-wasmrelaxedsimd.c",
2752    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2753    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmrelaxedsimd-fma-splat.c",
2754    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmrelaxedsimd-loadsplat.c",
2755    "src/f32-gemm/gen-inc/5x8inc-minmax-wasmrelaxedsimd-splat.c",
2756    "src/f32-gemm/gen-inc/5x8s4inc-minmax-wasmrelaxedsimd-fma.c",
2757    "src/f32-gemm/gen-inc/5x8s4inc-minmax-wasmrelaxedsimd.c",
2758    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2759    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmrelaxedsimd-fma-splat.c",
2760    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmrelaxedsimd-loadsplat.c",
2761    "src/f32-gemm/gen-inc/6x8inc-minmax-wasmrelaxedsimd-splat.c",
2762    "src/f32-gemm/gen-inc/6x8s4inc-minmax-wasmrelaxedsimd-fma.c",
2763    "src/f32-gemm/gen-inc/6x8s4inc-minmax-wasmrelaxedsimd.c",
2764    "src/f32-gemm/gen/1x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2765    "src/f32-gemm/gen/1x8-minmax-wasmrelaxedsimd-fma-splat.c",
2766    "src/f32-gemm/gen/1x8-minmax-wasmrelaxedsimd-loadsplat.c",
2767    "src/f32-gemm/gen/1x8-minmax-wasmrelaxedsimd-splat.c",
2768    "src/f32-gemm/gen/1x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2769    "src/f32-gemm/gen/1x8-relu-wasmrelaxedsimd-fma-splat.c",
2770    "src/f32-gemm/gen/1x8-wasmrelaxedsimd-fma-loadsplat.c",
2771    "src/f32-gemm/gen/1x8-wasmrelaxedsimd-fma-splat.c",
2772    "src/f32-gemm/gen/1x8s4-minmax-wasmrelaxedsimd-fma.c",
2773    "src/f32-gemm/gen/1x8s4-minmax-wasmrelaxedsimd.c",
2774    "src/f32-gemm/gen/1x8s4-relu-wasmrelaxedsimd-fma.c",
2775    "src/f32-gemm/gen/1x8s4-wasmrelaxedsimd-fma.c",
2776    "src/f32-gemm/gen/3x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2777    "src/f32-gemm/gen/3x8-minmax-wasmrelaxedsimd-fma-splat.c",
2778    "src/f32-gemm/gen/3x8-minmax-wasmrelaxedsimd-loadsplat.c",
2779    "src/f32-gemm/gen/3x8-minmax-wasmrelaxedsimd-splat.c",
2780    "src/f32-gemm/gen/3x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2781    "src/f32-gemm/gen/3x8-relu-wasmrelaxedsimd-fma-splat.c",
2782    "src/f32-gemm/gen/3x8-wasmrelaxedsimd-fma-loadsplat.c",
2783    "src/f32-gemm/gen/3x8-wasmrelaxedsimd-fma-splat.c",
2784    "src/f32-gemm/gen/3x8s4-minmax-wasmrelaxedsimd-fma.c",
2785    "src/f32-gemm/gen/3x8s4-minmax-wasmrelaxedsimd.c",
2786    "src/f32-gemm/gen/3x8s4-relu-wasmrelaxedsimd-fma.c",
2787    "src/f32-gemm/gen/3x8s4-wasmrelaxedsimd-fma.c",
2788    "src/f32-gemm/gen/4x2c4-minmax-wasmrelaxedsimd-fma.c",
2789    "src/f32-gemm/gen/4x2c4-minmax-wasmrelaxedsimd.c",
2790    "src/f32-gemm/gen/4x2c4-relu-wasmrelaxedsimd-fma.c",
2791    "src/f32-gemm/gen/4x2c4-wasmrelaxedsimd-fma.c",
2792    "src/f32-gemm/gen/4x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2793    "src/f32-gemm/gen/4x8-minmax-wasmrelaxedsimd-fma-splat.c",
2794    "src/f32-gemm/gen/4x8-minmax-wasmrelaxedsimd-loadsplat.c",
2795    "src/f32-gemm/gen/4x8-minmax-wasmrelaxedsimd-splat.c",
2796    "src/f32-gemm/gen/4x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2797    "src/f32-gemm/gen/4x8-relu-wasmrelaxedsimd-fma-splat.c",
2798    "src/f32-gemm/gen/4x8-wasmrelaxedsimd-fma-loadsplat.c",
2799    "src/f32-gemm/gen/4x8-wasmrelaxedsimd-fma-splat.c",
2800    "src/f32-gemm/gen/4x8s4-minmax-wasmrelaxedsimd-fma.c",
2801    "src/f32-gemm/gen/4x8s4-minmax-wasmrelaxedsimd.c",
2802    "src/f32-gemm/gen/4x8s4-relu-wasmrelaxedsimd-fma.c",
2803    "src/f32-gemm/gen/4x8s4-wasmrelaxedsimd-fma.c",
2804    "src/f32-gemm/gen/5x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2805    "src/f32-gemm/gen/5x8-minmax-wasmrelaxedsimd-fma-splat.c",
2806    "src/f32-gemm/gen/5x8-minmax-wasmrelaxedsimd-loadsplat.c",
2807    "src/f32-gemm/gen/5x8-minmax-wasmrelaxedsimd-splat.c",
2808    "src/f32-gemm/gen/5x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2809    "src/f32-gemm/gen/5x8-relu-wasmrelaxedsimd-fma-splat.c",
2810    "src/f32-gemm/gen/5x8-wasmrelaxedsimd-fma-loadsplat.c",
2811    "src/f32-gemm/gen/5x8-wasmrelaxedsimd-fma-splat.c",
2812    "src/f32-gemm/gen/5x8s4-minmax-wasmrelaxedsimd-fma.c",
2813    "src/f32-gemm/gen/5x8s4-minmax-wasmrelaxedsimd.c",
2814    "src/f32-gemm/gen/5x8s4-relu-wasmrelaxedsimd-fma.c",
2815    "src/f32-gemm/gen/5x8s4-wasmrelaxedsimd-fma.c",
2816    "src/f32-gemm/gen/6x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2817    "src/f32-gemm/gen/6x8-minmax-wasmrelaxedsimd-fma-splat.c",
2818    "src/f32-gemm/gen/6x8-minmax-wasmrelaxedsimd-loadsplat.c",
2819    "src/f32-gemm/gen/6x8-minmax-wasmrelaxedsimd-splat.c",
2820    "src/f32-gemm/gen/6x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2821    "src/f32-gemm/gen/6x8-relu-wasmrelaxedsimd-fma-splat.c",
2822    "src/f32-gemm/gen/6x8-wasmrelaxedsimd-fma-loadsplat.c",
2823    "src/f32-gemm/gen/6x8-wasmrelaxedsimd-fma-splat.c",
2824    "src/f32-gemm/gen/6x8s4-minmax-wasmrelaxedsimd-fma.c",
2825    "src/f32-gemm/gen/6x8s4-minmax-wasmrelaxedsimd.c",
2826    "src/f32-gemm/gen/6x8s4-relu-wasmrelaxedsimd-fma.c",
2827    "src/f32-gemm/gen/6x8s4-wasmrelaxedsimd-fma.c",
2828    "src/f32-igemm/gen/1x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2829    "src/f32-igemm/gen/1x8-minmax-wasmrelaxedsimd-fma-splat.c",
2830    "src/f32-igemm/gen/1x8-minmax-wasmrelaxedsimd-loadsplat.c",
2831    "src/f32-igemm/gen/1x8-minmax-wasmrelaxedsimd-splat.c",
2832    "src/f32-igemm/gen/1x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2833    "src/f32-igemm/gen/1x8-relu-wasmrelaxedsimd-fma-splat.c",
2834    "src/f32-igemm/gen/1x8-wasmrelaxedsimd-fma-loadsplat.c",
2835    "src/f32-igemm/gen/1x8-wasmrelaxedsimd-fma-splat.c",
2836    "src/f32-igemm/gen/1x8s4-minmax-wasmrelaxedsimd-fma.c",
2837    "src/f32-igemm/gen/1x8s4-minmax-wasmrelaxedsimd.c",
2838    "src/f32-igemm/gen/1x8s4-relu-wasmrelaxedsimd-fma.c",
2839    "src/f32-igemm/gen/1x8s4-wasmrelaxedsimd-fma.c",
2840    "src/f32-igemm/gen/3x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2841    "src/f32-igemm/gen/3x8-minmax-wasmrelaxedsimd-fma-splat.c",
2842    "src/f32-igemm/gen/3x8-minmax-wasmrelaxedsimd-loadsplat.c",
2843    "src/f32-igemm/gen/3x8-minmax-wasmrelaxedsimd-splat.c",
2844    "src/f32-igemm/gen/3x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2845    "src/f32-igemm/gen/3x8-relu-wasmrelaxedsimd-fma-splat.c",
2846    "src/f32-igemm/gen/3x8-wasmrelaxedsimd-fma-loadsplat.c",
2847    "src/f32-igemm/gen/3x8-wasmrelaxedsimd-fma-splat.c",
2848    "src/f32-igemm/gen/3x8s4-minmax-wasmrelaxedsimd-fma.c",
2849    "src/f32-igemm/gen/3x8s4-minmax-wasmrelaxedsimd.c",
2850    "src/f32-igemm/gen/3x8s4-relu-wasmrelaxedsimd-fma.c",
2851    "src/f32-igemm/gen/3x8s4-wasmrelaxedsimd-fma.c",
2852    "src/f32-igemm/gen/4x2c4-minmax-wasmrelaxedsimd-fma.c",
2853    "src/f32-igemm/gen/4x2c4-minmax-wasmrelaxedsimd.c",
2854    "src/f32-igemm/gen/4x2c4-relu-wasmrelaxedsimd-fma.c",
2855    "src/f32-igemm/gen/4x2c4-wasmrelaxedsimd-fma.c",
2856    "src/f32-igemm/gen/4x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2857    "src/f32-igemm/gen/4x8-minmax-wasmrelaxedsimd-fma-splat.c",
2858    "src/f32-igemm/gen/4x8-minmax-wasmrelaxedsimd-loadsplat.c",
2859    "src/f32-igemm/gen/4x8-minmax-wasmrelaxedsimd-splat.c",
2860    "src/f32-igemm/gen/4x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2861    "src/f32-igemm/gen/4x8-relu-wasmrelaxedsimd-fma-splat.c",
2862    "src/f32-igemm/gen/4x8-wasmrelaxedsimd-fma-loadsplat.c",
2863    "src/f32-igemm/gen/4x8-wasmrelaxedsimd-fma-splat.c",
2864    "src/f32-igemm/gen/4x8s4-minmax-wasmrelaxedsimd-fma.c",
2865    "src/f32-igemm/gen/4x8s4-minmax-wasmrelaxedsimd.c",
2866    "src/f32-igemm/gen/4x8s4-relu-wasmrelaxedsimd-fma.c",
2867    "src/f32-igemm/gen/4x8s4-wasmrelaxedsimd-fma.c",
2868    "src/f32-igemm/gen/5x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2869    "src/f32-igemm/gen/5x8-minmax-wasmrelaxedsimd-fma-splat.c",
2870    "src/f32-igemm/gen/5x8-minmax-wasmrelaxedsimd-loadsplat.c",
2871    "src/f32-igemm/gen/5x8-minmax-wasmrelaxedsimd-splat.c",
2872    "src/f32-igemm/gen/5x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2873    "src/f32-igemm/gen/5x8-relu-wasmrelaxedsimd-fma-splat.c",
2874    "src/f32-igemm/gen/5x8-wasmrelaxedsimd-fma-loadsplat.c",
2875    "src/f32-igemm/gen/5x8-wasmrelaxedsimd-fma-splat.c",
2876    "src/f32-igemm/gen/5x8s4-minmax-wasmrelaxedsimd-fma.c",
2877    "src/f32-igemm/gen/5x8s4-minmax-wasmrelaxedsimd.c",
2878    "src/f32-igemm/gen/5x8s4-relu-wasmrelaxedsimd-fma.c",
2879    "src/f32-igemm/gen/5x8s4-wasmrelaxedsimd-fma.c",
2880    "src/f32-igemm/gen/6x8-minmax-wasmrelaxedsimd-fma-loadsplat.c",
2881    "src/f32-igemm/gen/6x8-minmax-wasmrelaxedsimd-fma-splat.c",
2882    "src/f32-igemm/gen/6x8-minmax-wasmrelaxedsimd-loadsplat.c",
2883    "src/f32-igemm/gen/6x8-minmax-wasmrelaxedsimd-splat.c",
2884    "src/f32-igemm/gen/6x8-relu-wasmrelaxedsimd-fma-loadsplat.c",
2885    "src/f32-igemm/gen/6x8-relu-wasmrelaxedsimd-fma-splat.c",
2886    "src/f32-igemm/gen/6x8-wasmrelaxedsimd-fma-loadsplat.c",
2887    "src/f32-igemm/gen/6x8-wasmrelaxedsimd-fma-splat.c",
2888    "src/f32-igemm/gen/6x8s4-minmax-wasmrelaxedsimd-fma.c",
2889    "src/f32-igemm/gen/6x8s4-minmax-wasmrelaxedsimd.c",
2890    "src/f32-igemm/gen/6x8s4-relu-wasmrelaxedsimd-fma.c",
2891    "src/f32-igemm/gen/6x8s4-wasmrelaxedsimd-fma.c",
2892    "src/f32-vmulcaddc/gen/c4-minmax-wasmrelaxedsimd-fma-2x.c",
2893    "src/f32-vmulcaddc/gen/c4-minmax-wasmrelaxedsimd-2x.c",
2894    "src/f32-vmulcaddc/gen/c8-minmax-wasmrelaxedsimd-fma-2x.c",
2895    "src/f32-vmulcaddc/gen/c8-minmax-wasmrelaxedsimd-2x.c",
2896    "src/qs8-vcvt/gen/vcvt-wasmrelaxedsimd-x8.c",
2897    "src/qs8-vcvt/gen/vcvt-wasmrelaxedsimd-x16.c",
2898    "src/qs8-vcvt/gen/vcvt-wasmrelaxedsimd-x32.c",
2899    "src/qs8-vlrelu/gen/vlrelu-wasmrelaxedsimd-arm-x16.c",
2900    "src/qs8-vlrelu/gen/vlrelu-wasmrelaxedsimd-arm-x32.c",
2901    "src/qs8-vlrelu/gen/vlrelu-wasmrelaxedsimd-x86-x8.c",
2902    "src/qs8-vlrelu/gen/vlrelu-wasmrelaxedsimd-x86-x16.c",
2903    "src/qs8-vlrelu/gen/vlrelu-wasmrelaxedsimd-x86-x32.c",
2904    "src/qu8-vcvt/gen/vcvt-wasmrelaxedsimd-x8.c",
2905    "src/qu8-vcvt/gen/vcvt-wasmrelaxedsimd-x16.c",
2906    "src/qu8-vcvt/gen/vcvt-wasmrelaxedsimd-x32.c",
2907    "src/qu8-vlrelu/gen/vlrelu-wasmrelaxedsimd-arm-x16.c",
2908    "src/qu8-vlrelu/gen/vlrelu-wasmrelaxedsimd-arm-x32.c",
2909    "src/qu8-vlrelu/gen/vlrelu-wasmrelaxedsimd-x86-x8.c",
2910    "src/qu8-vlrelu/gen/vlrelu-wasmrelaxedsimd-x86-x16.c",
2911    "src/qu8-vlrelu/gen/vlrelu-wasmrelaxedsimd-x86-x32.c",
2912]
2913
// "PROD" set of armsimd32 microkernel source paths (relative to this file).
// Contains the 1x2c4 and 2x2c4 minmax-fp32 GEMM and IGEMM files for qc8, qs8
// and qu8, plus the qs8/qu8 vcvt x8 and vlrelu x4 files. Every path listed
// here also appears in ALL_ARMSIMD32_MICROKERNEL_SRCS.
// NOTE(review): presumably the subset compiled into production builds; the
// modules that consume this variable are outside this section -- confirm.
2914PROD_ARMSIMD32_MICROKERNEL_SRCS = [
2915    "src/qc8-gemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2916    "src/qc8-gemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2917    "src/qc8-igemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2918    "src/qc8-igemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2919    "src/qs8-gemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2920    "src/qs8-gemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2921    "src/qs8-igemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2922    "src/qs8-igemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2923    "src/qs8-vcvt/gen/vcvt-armsimd32-x8.c",
2924    "src/qs8-vlrelu/gen/vlrelu-armsimd32-x4.c",
2925    "src/qu8-gemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2926    "src/qu8-gemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2927    "src/qu8-igemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2928    "src/qu8-igemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2929    "src/qu8-vcvt/gen/vcvt-armsimd32-x8.c",
2930    "src/qu8-vlrelu/gen/vlrelu-armsimd32-x4.c",
2931]
2932
// "ALL" set of armsimd32 microkernel source paths (relative to this file).
// For each of qc8, qs8 and qu8 it lists the 1x1c4, 1x2c4, 2x1c4 and 2x2c4
// minmax-fp32 GEMM and IGEMM files; for qs8 and qu8 it also lists the x4 and
// x8 variants of vcvt and vlrelu. It is a superset of
// PROD_ARMSIMD32_MICROKERNEL_SRCS.
// NOTE(review): the modules that consume this variable are outside this
// section -- confirm where the non-PROD entries are actually built.
2933ALL_ARMSIMD32_MICROKERNEL_SRCS = [
2934    "src/qc8-gemm/gen/1x1c4-minmax-fp32-armsimd32.c",
2935    "src/qc8-gemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2936    "src/qc8-gemm/gen/2x1c4-minmax-fp32-armsimd32.c",
2937    "src/qc8-gemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2938    "src/qc8-igemm/gen/1x1c4-minmax-fp32-armsimd32.c",
2939    "src/qc8-igemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2940    "src/qc8-igemm/gen/2x1c4-minmax-fp32-armsimd32.c",
2941    "src/qc8-igemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2942    "src/qs8-gemm/gen/1x1c4-minmax-fp32-armsimd32.c",
2943    "src/qs8-gemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2944    "src/qs8-gemm/gen/2x1c4-minmax-fp32-armsimd32.c",
2945    "src/qs8-gemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2946    "src/qs8-igemm/gen/1x1c4-minmax-fp32-armsimd32.c",
2947    "src/qs8-igemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2948    "src/qs8-igemm/gen/2x1c4-minmax-fp32-armsimd32.c",
2949    "src/qs8-igemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2950    "src/qs8-vcvt/gen/vcvt-armsimd32-x4.c",
2951    "src/qs8-vcvt/gen/vcvt-armsimd32-x8.c",
2952    "src/qs8-vlrelu/gen/vlrelu-armsimd32-x4.c",
2953    "src/qs8-vlrelu/gen/vlrelu-armsimd32-x8.c",
2954    "src/qu8-gemm/gen/1x1c4-minmax-fp32-armsimd32.c",
2955    "src/qu8-gemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2956    "src/qu8-gemm/gen/2x1c4-minmax-fp32-armsimd32.c",
2957    "src/qu8-gemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2958    "src/qu8-igemm/gen/1x1c4-minmax-fp32-armsimd32.c",
2959    "src/qu8-igemm/gen/1x2c4-minmax-fp32-armsimd32.c",
2960    "src/qu8-igemm/gen/2x1c4-minmax-fp32-armsimd32.c",
2961    "src/qu8-igemm/gen/2x2c4-minmax-fp32-armsimd32.c",
2962    "src/qu8-vcvt/gen/vcvt-armsimd32-x4.c",
2963    "src/qu8-vcvt/gen/vcvt-armsimd32-x8.c",
2964    "src/qu8-vlrelu/gen/vlrelu-armsimd32-x4.c",
2965    "src/qu8-vlrelu/gen/vlrelu-armsimd32-x8.c",
2966]
2967
// "PROD" set of NEON microkernel source paths (relative to this file).
// Entries are plain .c files under src/ drawn from the f16-f32, f32, qc8,
// qs8, qu8, s8, u8, x8, x16, x32 and xx kernel directories; each file name
// contains "neon".
// NOTE(review): presumably the production subset of
// ALL_NEON_MICROKERNEL_SRCS; that list and the modules consuming this
// variable are not fully visible from this section -- confirm.
2968PROD_NEON_MICROKERNEL_SRCS = [
2969    "src/f16-f32-vcvt/gen/vcvt-neon-int16-x16.c",
2970    "src/f32-argmaxpool/4x-neon-c4.c",
2971    "src/f32-argmaxpool/9p8x-neon-c4.c",
2972    "src/f32-argmaxpool/9x-neon-c4.c",
2973    "src/f32-avgpool/9p8x-minmax-neon-c4.c",
2974    "src/f32-avgpool/9x-minmax-neon-c4.c",
2975    "src/f32-conv-hwc2chw/3x3s2p1c3x4-neon-2x2.c",
2976    "src/f32-dwconv/gen/up8x3-minmax-neon.c",
2977    "src/f32-dwconv/gen/up8x4-minmax-neon.c",
2978    "src/f32-dwconv/gen/up8x9-minmax-neon.c",
2979    "src/f32-dwconv/gen/up8x25-minmax-neon-acc2.c",
2980    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-2x4.c",
2981    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-1x4.c",
2982    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-1x4.c",
2983    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-1x4.c",
2984    "src/f32-f16-vcvt/gen/vcvt-neon-x8.c",
2985    "src/f32-gavgpool-cw/neon-x4.c",
2986    "src/f32-gavgpool/7p7x-minmax-neon-c4.c",
2987    "src/f32-gavgpool/7x-minmax-neon-c4.c",
2988    "src/f32-gemm/gen/1x8-minmax-neon-lane-ld64.c",
2989    "src/f32-gemm/gen/4x2-minmax-neon-lane-ld64.c",
2990    "src/f32-gemm/gen/4x8-minmax-neon-lane-ld64.c",
2991    "src/f32-gemm/gen/4x8-minmax-neon-lane-ld128.c",
2992    "src/f32-ibilinear-chw/gen/neon-p8.c",
2993    "src/f32-ibilinear/gen/neon-c8.c",
2994    "src/f32-igemm/gen/1x8-minmax-neon-lane-ld64.c",
2995    "src/f32-igemm/gen/4x2-minmax-neon-lane-ld64.c",
2996    "src/f32-igemm/gen/4x8-minmax-neon-lane-ld64.c",
2997    "src/f32-igemm/gen/4x8-minmax-neon-lane-ld128.c",
2998    "src/f32-maxpool/9p8x-minmax-neon-c4.c",
2999    "src/f32-pavgpool/9p8x-minmax-neon-c4.c",
3000    "src/f32-pavgpool/9x-minmax-neon-c4.c",
3001    "src/f32-prelu/gen/neon-2x8.c",
3002    "src/f32-qs8-vcvt/gen/vcvt-neon-x32.c",
3003    "src/f32-qu8-vcvt/gen/vcvt-neon-x32.c",
3004    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x8.c",
3005    "src/f32-rmax/neon.c",
3006    "src/f32-spmm/gen/32x1-minmax-neon.c",
3007    "src/f32-vbinary/gen/vadd-minmax-neon-x8.c",
3008    "src/f32-vbinary/gen/vaddc-minmax-neon-x8.c",
3009    "src/f32-vbinary/gen/vmax-neon-x8.c",
3010    "src/f32-vbinary/gen/vmaxc-neon-x8.c",
3011    "src/f32-vbinary/gen/vmin-neon-x8.c",
3012    "src/f32-vbinary/gen/vminc-neon-x8.c",
3013    "src/f32-vbinary/gen/vmul-minmax-neon-x8.c",
3014    "src/f32-vbinary/gen/vmulc-minmax-neon-x8.c",
3015    "src/f32-vbinary/gen/vrsubc-minmax-neon-x8.c",
3016    "src/f32-vbinary/gen/vsqrdiff-neon-x8.c",
3017    "src/f32-vbinary/gen/vsqrdiffc-neon-x8.c",
3018    "src/f32-vbinary/gen/vsub-minmax-neon-x8.c",
3019    "src/f32-vbinary/gen/vsubc-minmax-neon-x8.c",
3020    "src/f32-vclamp/gen/vclamp-neon-x8.c",
3021    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x8.c",
3022    "src/f32-vhswish/gen/vhswish-neon-x16.c",
3023    "src/f32-vlrelu/gen/vlrelu-neon-x8.c",
3024    "src/f32-vmulcaddc/gen/c4-minmax-neon-2x.c",
3025    "src/f32-vrnd/gen/vrndd-neon-x8.c",
3026    "src/f32-vrnd/gen/vrndne-neon-x8.c",
3027    "src/f32-vrnd/gen/vrndu-neon-x8.c",
3028    "src/f32-vrnd/gen/vrndz-neon-x8.c",
3029    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x8.c",
3030    "src/f32-vunary/gen/vabs-neon-x8.c",
3031    "src/f32-vunary/gen/vneg-neon-x8.c",
3032    "src/f32-vunary/gen/vsqr-neon-x8.c",
3033    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neon-mla8-ld64.c",
3034    "src/qc8-dwconv/gen/up16x3-minmax-fp32-neon-mla8-ld128.c",
3035    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mla8-ld64.c",
3036    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mla8-ld64.c",
3037    "src/qc8-gemm/gen/1x8-minmax-fp32-neon-mlal-lane.c",
3038    "src/qc8-gemm/gen/1x8c2s4-minmax-fp32-neon-mlal.c",
3039    "src/qc8-gemm/gen/2x8c2s4-minmax-fp32-neon-mlal.c",
3040    "src/qc8-igemm/gen/1x8-minmax-fp32-neon-mlal-lane.c",
3041    "src/qc8-igemm/gen/1x8c2s4-minmax-fp32-neon-mlal.c",
3042    "src/qc8-igemm/gen/2x8c2s4-minmax-fp32-neon-mlal.c",
3043    "src/qs8-dwconv/gen/up8x25-minmax-rndnu-neon-mla8-ld64.c",
3044    "src/qs8-dwconv/gen/up16x9-minmax-rndnu-neon-mla8-ld64.c",
3045    "src/qs8-dwconv/gen/up16x25-minmax-rndnu-neon-mla8-ld64.c",
3046    "src/qs8-f32-vcvt/gen/vcvt-neon-x32.c",
3047    "src/qs8-gavgpool/gen/7p7x-minmax-rndnu-neon-c8.c",
3048    "src/qs8-gavgpool/gen/7x-minmax-rndnu-neon-c8.c",
3049    "src/qs8-gemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
3050    "src/qs8-gemm/gen/1x8c2s4-minmax-rndnu-neon-mlal.c",
3051    "src/qs8-gemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
3052    "src/qs8-gemm/gen/2x8c2s4-minmax-rndnu-neon-mlal.c",
3053    "src/qs8-igemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
3054    "src/qs8-igemm/gen/1x8c2s4-minmax-rndnu-neon-mlal.c",
3055    "src/qs8-igemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
3056    "src/qs8-igemm/gen/2x8c2s4-minmax-rndnu-neon-mlal.c",
3057    "src/qs8-vadd/gen/minmax-neon-ld64-x16.c",
3058    "src/qs8-vadd/gen/minmax-neon-ld64-x32.c",
3059    "src/qs8-vaddc/gen/minmax-neon-ld64-x16.c",
3060    "src/qs8-vaddc/gen/minmax-neon-ld64-x32.c",
3061    "src/qs8-vcvt/gen/vcvt-neon-x32.c",
3062    "src/qs8-vlrelu/gen/vlrelu-neon-x32.c",
3063    "src/qs8-vmul/gen/minmax-rndnu-neon-ld64-x16.c",
3064    "src/qs8-vmulc/gen/minmax-rndnu-neon-ld64-x16.c",
3065    "src/qu8-avgpool/9p8x-minmax-neon-c8.c",
3066    "src/qu8-avgpool/9x-minmax-neon-c8.c",
3067    "src/qu8-dwconv/gen/up8x25-minmax-rndnu-neon-mul8.c",
3068    "src/qu8-dwconv/gen/up16x9-minmax-rndnu-neon-mul8.c",
3069    "src/qu8-f32-vcvt/gen/vcvt-neon-x32.c",
3070    "src/qu8-gavgpool/gen/7p7x-minmax-rndnu-neon-c8.c",
3071    "src/qu8-gavgpool/gen/7x-minmax-rndnu-neon-c8.c",
3072    "src/qu8-gemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
3073    "src/qu8-gemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
3074    "src/qu8-gemm/gen/3x8-minmax-rndnu-neon-mlal-lane.c",
3075    "src/qu8-gemm/gen/4x16-minmax-rndnu-neon-mlal-lane.c",
3076    "src/qu8-igemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
3077    "src/qu8-igemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
3078    "src/qu8-igemm/gen/3x8-minmax-rndnu-neon-mlal-lane.c",
3079    "src/qu8-igemm/gen/4x16-minmax-rndnu-neon-mlal-lane.c",
3080    "src/qu8-vadd/gen/minmax-neon-ld64-x16.c",
3081    "src/qu8-vadd/gen/minmax-neon-ld64-x32.c",
3082    "src/qu8-vaddc/gen/minmax-neon-ld64-x16.c",
3083    "src/qu8-vaddc/gen/minmax-neon-ld64-x32.c",
3084    "src/qu8-vcvt/gen/vcvt-neon-x32.c",
3085    "src/qu8-vlrelu/gen/vlrelu-neon-x32.c",
3086    "src/qu8-vmul/gen/minmax-rndnu-neon-ld64-x16.c",
3087    "src/qu8-vmulc/gen/minmax-rndnu-neon-ld64-x16.c",
3088    "src/s8-ibilinear/gen/neon-c8.c",
3089    "src/s8-ibilinear/gen/neon-c16.c",
3090    "src/s8-maxpool/9p8x-minmax-neon-c16.c",
3091    "src/s8-vclamp/neon-x64.c",
3092    "src/u8-ibilinear/gen/neon-c8.c",
3093    "src/u8-ibilinear/gen/neon-c16.c",
3094    "src/u8-maxpool/9p8x-minmax-neon-c16.c",
3095    "src/u8-rmax/neon.c",
3096    "src/u8-vclamp/neon-x64.c",
3097    "src/xx-fill/neon-x64.c",
3098    "src/xx-pad/neon.c",
3099    "src/x8-transposec/gen/16x16-reuse-dec-zip-neon.c",
3100    "src/x8-zip/xm-neon.c",
3101    "src/x8-zip/x2-neon.c",
3102    "src/x8-zip/x3-neon.c",
3103    "src/x8-zip/x4-neon.c",
3104    "src/x16-transposec/gen/8x8-reuse-dec-zip-neon.c",
3105    "src/x32-packx/x4-neon-st4.c",
3106    "src/x32-transposec/gen/4x4-reuse-dec-zip-neon.c",
3107    "src/x32-unpool/neon.c",
3108    "src/x32-zip/xm-neon.c",
3109    "src/x32-zip/x2-neon.c",
3110    "src/x32-zip/x3-neon.c",
3111    "src/x32-zip/x4-neon.c",
3112]
3113
3114ALL_NEON_MICROKERNEL_SRCS = [
3115    "src/cs16-bfly4/samples1-neon.c",
3116    "src/cs16-vsquareabs/gen/neon-mlal-ld128-x4.c",
3117    "src/cs16-vsquareabs/gen/neon-mlal-ld128-x8.c",
3118    "src/cs16-vsquareabs/gen/neon-mlal-ld128-x12.c",
3119    "src/cs16-vsquareabs/gen/neon-mlal-ld128-x16.c",
3120    "src/f16-f32-vcvt/gen/vcvt-neon-int16-x8.c",
3121    "src/f16-f32-vcvt/gen/vcvt-neon-int16-x16.c",
3122    "src/f16-f32-vcvt/gen/vcvt-neon-int16-x24.c",
3123    "src/f16-f32-vcvt/gen/vcvt-neon-int16-x32.c",
3124    "src/f16-f32-vcvt/gen/vcvt-neon-int32-x8.c",
3125    "src/f16-f32-vcvt/gen/vcvt-neon-int32-x16.c",
3126    "src/f16-f32-vcvt/gen/vcvt-neon-int32-x24.c",
3127    "src/f16-f32-vcvt/gen/vcvt-neon-int32-x32.c",
3128    "src/f32-argmaxpool/4x-neon-c4.c",
3129    "src/f32-argmaxpool/9p8x-neon-c4.c",
3130    "src/f32-argmaxpool/9x-neon-c4.c",
3131    "src/f32-avgpool/9p8x-minmax-neon-c4.c",
3132    "src/f32-avgpool/9x-minmax-neon-c4.c",
3133    "src/f32-conv-hwc/gen/3x3s2p0p1c3x4-neon-2x1.c",
3134    "src/f32-conv-hwc/gen/3x3s2p0p1c3x4-neon-2x2.c",
3135    "src/f32-conv-hwc/gen/3x3s2p0p1c3x8-neon-2x1.c",
3136    "src/f32-conv-hwc/gen/3x3s2p0p1c3x8-neon-2x2.c",
3137    "src/f32-conv-hwc/gen/3x3s2p1c3x4-neon-2x1.c",
3138    "src/f32-conv-hwc/gen/3x3s2p1c3x4-neon-2x2.c",
3139    "src/f32-conv-hwc/gen/3x3s2p1c3x8-neon-2x1.c",
3140    "src/f32-conv-hwc/gen/3x3s2p1c3x8-neon-2x2.c",
3141    "src/f32-conv-hwc2chw/3x3s2p1c3x4-neon-2x2.c",
3142    "src/f32-dwconv/gen/up4x3-minmax-neon-acc2.c",
3143    "src/f32-dwconv/gen/up4x3-minmax-neon.c",
3144    "src/f32-dwconv/gen/up4x4-minmax-neon-acc2.c",
3145    "src/f32-dwconv/gen/up4x4-minmax-neon.c",
3146    "src/f32-dwconv/gen/up4x9-minmax-neon-acc2.c",
3147    "src/f32-dwconv/gen/up4x9-minmax-neon.c",
3148    "src/f32-dwconv/gen/up4x25-minmax-neon-acc2.c",
3149    "src/f32-dwconv/gen/up4x25-minmax-neon.c",
3150    "src/f32-dwconv/gen/up8x3-minmax-neon-acc2.c",
3151    "src/f32-dwconv/gen/up8x3-minmax-neon.c",
3152    "src/f32-dwconv/gen/up8x4-minmax-neon-acc2.c",
3153    "src/f32-dwconv/gen/up8x4-minmax-neon.c",
3154    "src/f32-dwconv/gen/up8x9-minmax-neon-acc2.c",
3155    "src/f32-dwconv/gen/up8x9-minmax-neon.c",
3156    "src/f32-dwconv/gen/up8x25-minmax-neon-acc2.c",
3157    "src/f32-dwconv/gen/up8x25-minmax-neon.c",
3158    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-1x4-acc2.c",
3159    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-1x4-acc3.c",
3160    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-1x4-acc4.c",
3161    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-1x4.c",
3162    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-2x4-acc2.c",
3163    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-2x4.c",
3164    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-3x4.c",
3165    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-4x4.c",
3166    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-5x4.c",
3167    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neon-6x4.c",
3168    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-1x4-acc2.c",
3169    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-1x4-acc3.c",
3170    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-1x4-acc4.c",
3171    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-1x4.c",
3172    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-2x4-acc2.c",
3173    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-2x4.c",
3174    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-3x4.c",
3175    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neon-4x4.c",
3176    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-1x4-acc2.c",
3177    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-1x4-acc3.c",
3178    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-1x4-acc4.c",
3179    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-1x4-acc5.c",
3180    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-1x4.c",
3181    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-2x4-acc2.c",
3182    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-2x4-acc3.c",
3183    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-2x4.c",
3184    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-3x4-acc2.c",
3185    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-3x4.c",
3186    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-4x4-acc2.c",
3187    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-4x4.c",
3188    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neon-5x4.c",
3189    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-1x4-acc2.c",
3190    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-1x4-acc3.c",
3191    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-1x4-acc4.c",
3192    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-1x4-acc5.c",
3193    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-1x4.c",
3194    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-2x4-acc2.c",
3195    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-2x4-acc3.c",
3196    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-2x4.c",
3197    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-3x4-acc2.c",
3198    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neon-3x4.c",
3199    "src/f32-f16-vcvt/gen/vcvt-neon-x8.c",
3200    "src/f32-f16-vcvt/gen/vcvt-neon-x16.c",
3201    "src/f32-f16-vcvt/gen/vcvt-neon-x24.c",
3202    "src/f32-f16-vcvt/gen/vcvt-neon-x32.c",
3203    "src/f32-gavgpool-cw/neon-x4.c",
3204    "src/f32-gavgpool/7p7x-minmax-neon-c4.c",
3205    "src/f32-gavgpool/7x-minmax-neon-c4.c",
3206    "src/f32-gemm/gen-inc/1x8inc-minmax-neon-dup-ld64.c",
3207    "src/f32-gemm/gen-inc/1x8inc-minmax-neon-lane-ld64.c",
3208    "src/f32-gemm/gen-inc/1x8s4inc-minmax-neon.c",
3209    "src/f32-gemm/gen-inc/4x8inc-minmax-neon-dup-ld64.c",
3210    "src/f32-gemm/gen-inc/4x8inc-minmax-neon-dup-ld128.c",
3211    "src/f32-gemm/gen-inc/4x8inc-minmax-neon-lane-ld64.c",
3212    "src/f32-gemm/gen-inc/4x8inc-minmax-neon-lane-ld128.c",
3213    "src/f32-gemm/gen-inc/4x8s4inc-minmax-neon.c",
3214    "src/f32-gemm/gen-inc/5x8inc-minmax-neon-lane-ld64.c",
3215    "src/f32-gemm/gen-inc/6x8inc-minmax-neon-dup-ld64.c",
3216    "src/f32-gemm/gen-inc/6x8inc-minmax-neon-dup-ld128.c",
3217    "src/f32-gemm/gen-inc/6x8inc-minmax-neon-lane-ld64.c",
3218    "src/f32-gemm/gen-inc/6x8inc-minmax-neon-lane-ld128.c",
3219    "src/f32-gemm/gen-inc/6x8s4inc-minmax-neon.c",
3220    "src/f32-gemm/gen-inc/8x8s4inc-minmax-neon.c",
3221    "src/f32-gemm/gen/1x8-minmax-neon-dup-ld64.c",
3222    "src/f32-gemm/gen/1x8-minmax-neon-lane-ld64.c",
3223    "src/f32-gemm/gen/1x8s4-minmax-neon.c",
3224    "src/f32-gemm/gen/4x2-minmax-neon-lane-ld64.c",
3225    "src/f32-gemm/gen/4x8-minmax-neon-dup-ld64.c",
3226    "src/f32-gemm/gen/4x8-minmax-neon-dup-ld128.c",
3227    "src/f32-gemm/gen/4x8-minmax-neon-lane-ld64.c",
3228    "src/f32-gemm/gen/4x8-minmax-neon-lane-ld128.c",
3229    "src/f32-gemm/gen/4x8s4-minmax-neon.c",
3230    "src/f32-gemm/gen/5x8-minmax-neon-lane-ld64.c",
3231    "src/f32-gemm/gen/6x2-minmax-neon-lane-ld64.c",
3232    "src/f32-gemm/gen/6x8-minmax-neon-dup-ld64.c",
3233    "src/f32-gemm/gen/6x8-minmax-neon-dup-ld128.c",
3234    "src/f32-gemm/gen/6x8-minmax-neon-lane-ld64.c",
3235    "src/f32-gemm/gen/6x8-minmax-neon-lane-ld128.c",
3236    "src/f32-gemm/gen/6x8s4-minmax-neon.c",
3237    "src/f32-gemm/gen/8x8s4-minmax-neon.c",
3238    "src/f32-ibilinear-chw/gen/neon-p4.c",
3239    "src/f32-ibilinear-chw/gen/neon-p8.c",
3240    "src/f32-ibilinear-chw/gen/neon-p16.c",
3241    "src/f32-ibilinear/gen/neon-c4.c",
3242    "src/f32-ibilinear/gen/neon-c8.c",
3243    "src/f32-igemm/gen/1x8-minmax-neon-dup-ld64.c",
3244    "src/f32-igemm/gen/1x8-minmax-neon-lane-ld64.c",
3245    "src/f32-igemm/gen/1x8s4-minmax-neon.c",
3246    "src/f32-igemm/gen/4x2-minmax-neon-lane-ld64.c",
3247    "src/f32-igemm/gen/4x4-minmax-neon-lane-ld64.c",
3248    "src/f32-igemm/gen/4x8-minmax-neon-dup-ld64.c",
3249    "src/f32-igemm/gen/4x8-minmax-neon-dup-ld128.c",
3250    "src/f32-igemm/gen/4x8-minmax-neon-lane-ld64.c",
3251    "src/f32-igemm/gen/4x8-minmax-neon-lane-ld128.c",
3252    "src/f32-igemm/gen/4x8s4-minmax-neon.c",
3253    "src/f32-igemm/gen/6x2-minmax-neon-lane-ld64.c",
3254    "src/f32-igemm/gen/6x8-minmax-neon-dup-ld64.c",
3255    "src/f32-igemm/gen/6x8-minmax-neon-dup-ld128.c",
3256    "src/f32-igemm/gen/6x8-minmax-neon-lane-ld64.c",
3257    "src/f32-igemm/gen/6x8-minmax-neon-lane-ld128.c",
3258    "src/f32-igemm/gen/6x8s4-minmax-neon.c",
3259    "src/f32-igemm/gen/8x8s4-minmax-neon.c",
3260    "src/f32-maxpool/9p8x-minmax-neon-c4.c",
3261    "src/f32-pavgpool/9p8x-minmax-neon-c4.c",
3262    "src/f32-pavgpool/9x-minmax-neon-c4.c",
3263    "src/f32-ppmm/gen/4x8-minmax-neon.c",
3264    "src/f32-ppmm/gen/8x8-minmax-neon.c",
3265    "src/f32-prelu/gen/neon-1x4.c",
3266    "src/f32-prelu/gen/neon-1x8.c",
3267    "src/f32-prelu/gen/neon-1x16.c",
3268    "src/f32-prelu/gen/neon-2x4.c",
3269    "src/f32-prelu/gen/neon-2x8.c",
3270    "src/f32-prelu/gen/neon-2x16.c",
3271    "src/f32-prelu/gen/neon-4x4.c",
3272    "src/f32-prelu/gen/neon-4x8.c",
3273    "src/f32-prelu/gen/neon-4x16.c",
3274    "src/f32-qs8-vcvt/gen/vcvt-neon-x8.c",
3275    "src/f32-qs8-vcvt/gen/vcvt-neon-x16.c",
3276    "src/f32-qs8-vcvt/gen/vcvt-neon-x24.c",
3277    "src/f32-qs8-vcvt/gen/vcvt-neon-x32.c",
3278    "src/f32-qu8-vcvt/gen/vcvt-neon-x8.c",
3279    "src/f32-qu8-vcvt/gen/vcvt-neon-x16.c",
3280    "src/f32-qu8-vcvt/gen/vcvt-neon-x24.c",
3281    "src/f32-qu8-vcvt/gen/vcvt-neon-x32.c",
3282    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x4.c",
3283    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x8-acc2.c",
3284    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x8.c",
3285    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x12-acc2.c",
3286    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x12-acc3.c",
3287    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x12.c",
3288    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x16-acc2.c",
3289    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x16-acc4.c",
3290    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x16.c",
3291    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x20-acc2.c",
3292    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x20-acc5.c",
3293    "src/f32-raddstoreexpminusmax/gen/neon-rr2-lut64-p2-x20.c",
3294    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x4.c",
3295    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x8-acc2.c",
3296    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x8.c",
3297    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x12-acc2.c",
3298    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x12-acc3.c",
3299    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x12.c",
3300    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x16-acc2.c",
3301    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x16-acc4.c",
3302    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x16.c",
3303    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x20-acc2.c",
3304    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x20-acc5.c",
3305    "src/f32-raddstoreexpminusmax/gen/neon-rr2-p5-x20.c",
3306    "src/f32-rmax/neon.c",
3307    "src/f32-spmm/gen/4x1-minmax-neon-pipelined.c",
3308    "src/f32-spmm/gen/4x1-minmax-neon-x2.c",
3309    "src/f32-spmm/gen/4x1-minmax-neon.c",
3310    "src/f32-spmm/gen/8x1-minmax-neon-pipelined.c",
3311    "src/f32-spmm/gen/8x1-minmax-neon-x2.c",
3312    "src/f32-spmm/gen/8x1-minmax-neon.c",
3313    "src/f32-spmm/gen/12x1-minmax-neon.c",
3314    "src/f32-spmm/gen/16x1-minmax-neon-pipelined.c",
3315    "src/f32-spmm/gen/16x1-minmax-neon-x2.c",
3316    "src/f32-spmm/gen/16x1-minmax-neon.c",
3317    "src/f32-spmm/gen/32x1-minmax-neon-pipelined.c",
3318    "src/f32-spmm/gen/32x1-minmax-neon-x2.c",
3319    "src/f32-spmm/gen/32x1-minmax-neon.c",
3320    "src/f32-vbinary/gen/vadd-minmax-neon-x4.c",
3321    "src/f32-vbinary/gen/vadd-minmax-neon-x8.c",
3322    "src/f32-vbinary/gen/vaddc-minmax-neon-x4.c",
3323    "src/f32-vbinary/gen/vaddc-minmax-neon-x8.c",
3324    "src/f32-vbinary/gen/vmax-neon-x4.c",
3325    "src/f32-vbinary/gen/vmax-neon-x8.c",
3326    "src/f32-vbinary/gen/vmaxc-neon-x4.c",
3327    "src/f32-vbinary/gen/vmaxc-neon-x8.c",
3328    "src/f32-vbinary/gen/vmin-neon-x4.c",
3329    "src/f32-vbinary/gen/vmin-neon-x8.c",
3330    "src/f32-vbinary/gen/vminc-neon-x4.c",
3331    "src/f32-vbinary/gen/vminc-neon-x8.c",
3332    "src/f32-vbinary/gen/vmul-minmax-neon-x4.c",
3333    "src/f32-vbinary/gen/vmul-minmax-neon-x8.c",
3334    "src/f32-vbinary/gen/vmulc-minmax-neon-x4.c",
3335    "src/f32-vbinary/gen/vmulc-minmax-neon-x8.c",
3336    "src/f32-vbinary/gen/vrsubc-minmax-neon-x4.c",
3337    "src/f32-vbinary/gen/vrsubc-minmax-neon-x8.c",
3338    "src/f32-vbinary/gen/vsqrdiff-neon-x4.c",
3339    "src/f32-vbinary/gen/vsqrdiff-neon-x8.c",
3340    "src/f32-vbinary/gen/vsqrdiffc-neon-x4.c",
3341    "src/f32-vbinary/gen/vsqrdiffc-neon-x8.c",
3342    "src/f32-vbinary/gen/vsub-minmax-neon-x4.c",
3343    "src/f32-vbinary/gen/vsub-minmax-neon-x8.c",
3344    "src/f32-vbinary/gen/vsubc-minmax-neon-x4.c",
3345    "src/f32-vbinary/gen/vsubc-minmax-neon-x8.c",
3346    "src/f32-vclamp/gen/vclamp-neon-x4.c",
3347    "src/f32-vclamp/gen/vclamp-neon-x8.c",
3348    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x4.c",
3349    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x8.c",
3350    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x12.c",
3351    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x16.c",
3352    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x20.c",
3353    "src/f32-velu/gen/velu-neon-rr2-lut16-p3-x24.c",
3354    "src/f32-velu/gen/velu-neon-rr2-p6-x4.c",
3355    "src/f32-velu/gen/velu-neon-rr2-p6-x8.c",
3356    "src/f32-velu/gen/velu-neon-rr2-p6-x12.c",
3357    "src/f32-velu/gen/velu-neon-rr2-p6-x16.c",
3358    "src/f32-velu/gen/velu-neon-rr2-p6-x20.c",
3359    "src/f32-velu/gen/velu-neon-rr2-p6-x24.c",
3360    "src/f32-vhswish/gen/vhswish-neon-x4.c",
3361    "src/f32-vhswish/gen/vhswish-neon-x8.c",
3362    "src/f32-vhswish/gen/vhswish-neon-x16.c",
3363    "src/f32-vlrelu/gen/vlrelu-neon-x4.c",
3364    "src/f32-vlrelu/gen/vlrelu-neon-x8.c",
3365    "src/f32-vmulcaddc/gen/c4-minmax-neon-2x.c",
3366    "src/f32-vmulcaddc/gen/c8-minmax-neon-2x.c",
3367    "src/f32-vrelu/gen/vrelu-neon-x4.c",
3368    "src/f32-vrelu/gen/vrelu-neon-x8.c",
3369    "src/f32-vrnd/gen/vrndd-neon-x4.c",
3370    "src/f32-vrnd/gen/vrndd-neon-x8.c",
3371    "src/f32-vrnd/gen/vrndne-neon-x4.c",
3372    "src/f32-vrnd/gen/vrndne-neon-x8.c",
3373    "src/f32-vrnd/gen/vrndu-neon-x4.c",
3374    "src/f32-vrnd/gen/vrndu-neon-x8.c",
3375    "src/f32-vrnd/gen/vrndz-neon-x4.c",
3376    "src/f32-vrnd/gen/vrndz-neon-x8.c",
3377    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x4.c",
3378    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x8.c",
3379    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x12.c",
3380    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x16.c",
3381    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x20.c",
3382    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut64-p2-nr2recps-x24.c",
3383    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut2048-p1-nr2recps-x4.c",
3384    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut2048-p1-nr2recps-x8.c",
3385    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut2048-p1-nr2recps-x12.c",
3386    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut2048-p1-nr2recps-x16.c",
3387    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut2048-p1-nr2recps-x20.c",
3388    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-lut2048-p1-nr2recps-x24.c",
3389    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-p5-nr2recps-x4.c",
3390    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-p5-nr2recps-x8.c",
3391    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-p5-nr2recps-x12.c",
3392    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-p5-nr2recps-x16.c",
3393    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-p5-nr2recps-x20.c",
3394    "src/f32-vsigmoid/gen/vsigmoid-neon-rr2-p5-nr2recps-x24.c",
3395    "src/f32-vunary/gen/vabs-neon-x4.c",
3396    "src/f32-vunary/gen/vabs-neon-x8.c",
3397    "src/f32-vunary/gen/vneg-neon-x4.c",
3398    "src/f32-vunary/gen/vneg-neon-x8.c",
3399    "src/f32-vunary/gen/vsqr-neon-x4.c",
3400    "src/f32-vunary/gen/vsqr-neon-x8.c",
3401    "src/math/cvt-f16-f32-neon-int16.c",
3402    "src/math/cvt-f16-f32-neon-int32.c",
3403    "src/math/cvt-f32-f16-neon.c",
3404    "src/math/cvt-f32-qs8-neon.c",
3405    "src/math/cvt-f32-qu8-neon.c",
3406    "src/math/expm1minus-f32-neon-rr2-lut16-p3.c",
3407    "src/math/expm1minus-f32-neon-rr2-p6.c",
3408    "src/math/roundd-neon-addsub.c",
3409    "src/math/roundd-neon-cvt.c",
3410    "src/math/roundne-neon-addsub.c",
3411    "src/math/roundu-neon-addsub.c",
3412    "src/math/roundu-neon-cvt.c",
3413    "src/math/roundz-neon-addsub.c",
3414    "src/math/roundz-neon-cvt.c",
3415    "src/math/sigmoid-f32-neon-rr2-lut64-p2-nr2recps.c",
3416    "src/math/sigmoid-f32-neon-rr2-lut2048-p1-nr2recps.c",
3417    "src/math/sigmoid-f32-neon-rr2-p5-nr2recps.c",
3418    "src/math/sqrt-neon-nr1rsqrts.c",
3419    "src/math/sqrt-neon-nr2rsqrts.c",
3420    "src/math/sqrt-neon-nr3rsqrts.c",
3421    "src/qc8-dwconv/gen/up8x3-minmax-fp32-neon-mla8-ld64.c",
3422    "src/qc8-dwconv/gen/up8x9-minmax-fp32-neon-mla8-ld64.c",
3423    "src/qc8-dwconv/gen/up8x9-minmax-fp32-neon-mul8-ld64.c",
3424    "src/qc8-dwconv/gen/up8x9-minmax-fp32-neon-mul16.c",
3425    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neon-mla8-ld64.c",
3426    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neon-mul8-ld64.c",
3427    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neon-mul16.c",
3428    "src/qc8-dwconv/gen/up16x3-minmax-fp32-neon-mla8-ld64.c",
3429    "src/qc8-dwconv/gen/up16x3-minmax-fp32-neon-mla8-ld128.c",
3430    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mla8-ld64.c",
3431    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mla8-ld128.c",
3432    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mul8-ld64.c",
3433    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mul8-ld128.c",
3434    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neon-mul16.c",
3435    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mla8-ld64.c",
3436    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mla8-ld128.c",
3437    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mul8-ld64.c",
3438    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mul8-ld128.c",
3439    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neon-mul16.c",
3440    "src/qc8-dwconv/gen/up24x9-minmax-fp32-neon-mul16.c",
3441    "src/qc8-dwconv/gen/up24x25-minmax-fp32-neon-mul16.c",
3442    "src/qc8-dwconv/gen/up32x9-minmax-fp32-neon-mul16.c",
3443    "src/qc8-dwconv/gen/up32x25-minmax-fp32-neon-mul16.c",
3444    "src/qc8-gemm/gen/1x8-minmax-fp32-neon-mlal-lane-prfm.c",
3445    "src/qc8-gemm/gen/1x8-minmax-fp32-neon-mlal-lane.c",
3446    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-dup.c",
3447    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-ld1r.c",
3448    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-ld2r.c",
3449    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-ld4r.c",
3450    "src/qc8-gemm/gen/1x8c2s4-minmax-fp32-neon-mlal.c",
3451    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neon-mlal-dup.c",
3452    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neon-mlal-ld1r.c",
3453    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neon-mlal-ld2r.c",
3454    "src/qc8-gemm/gen/1x8c4s2-minmax-fp32-neon-mlal.c",
3455    "src/qc8-gemm/gen/1x8c8-minmax-fp32-neon-mlal.c",
3456    "src/qc8-gemm/gen/1x16-minmax-fp32-neon-mlal-lane-prfm.c",
3457    "src/qc8-gemm/gen/1x16-minmax-fp32-neon-mlal-lane.c",
3458    "src/qc8-gemm/gen/2x8-minmax-fp32-neon-mlal-lane-prfm.c",
3459    "src/qc8-gemm/gen/2x8-minmax-fp32-neon-mlal-lane.c",
3460    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-dup.c",
3461    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-ld1r.c",
3462    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-ld2r.c",
3463    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-ld4r.c",
3464    "src/qc8-gemm/gen/2x8c2s4-minmax-fp32-neon-mlal.c",
3465    "src/qc8-gemm/gen/2x8c4-minmax-fp32-neon-mlal-dup.c",
3466    "src/qc8-gemm/gen/2x8c4-minmax-fp32-neon-mlal-ld1r.c",
3467    "src/qc8-gemm/gen/2x8c4-minmax-fp32-neon-mlal-ld2r.c",
3468    "src/qc8-gemm/gen/2x8c4s2-minmax-fp32-neon-mlal.c",
3469    "src/qc8-gemm/gen/2x8c8-minmax-fp32-neon-mlal.c",
3470    "src/qc8-gemm/gen/2x16-minmax-fp32-neon-mlal-lane-prfm.c",
3471    "src/qc8-gemm/gen/2x16-minmax-fp32-neon-mlal-lane.c",
3472    "src/qc8-gemm/gen/3x8-minmax-fp32-neon-mlal-lane-prfm.c",
3473    "src/qc8-gemm/gen/3x8-minmax-fp32-neon-mlal-lane.c",
3474    "src/qc8-gemm/gen/3x16-minmax-fp32-neon-mlal-lane-prfm.c",
3475    "src/qc8-gemm/gen/3x16-minmax-fp32-neon-mlal-lane.c",
3476    "src/qc8-gemm/gen/4x8-minmax-fp32-neon-mlal-lane-prfm.c",
3477    "src/qc8-gemm/gen/4x8-minmax-fp32-neon-mlal-lane.c",
3478    "src/qc8-gemm/gen/4x16-minmax-fp32-neon-mlal-lane-prfm.c",
3479    "src/qc8-gemm/gen/4x16-minmax-fp32-neon-mlal-lane.c",
3480    "src/qc8-gemm/gen/6x8-minmax-fp32-neon-mlal-lane-prfm.c",
3481    "src/qc8-gemm/gen/6x8-minmax-fp32-neon-mlal-lane.c",
3482    "src/qc8-gemm/gen/6x16-minmax-fp32-neon-mlal-lane-prfm.c",
3483    "src/qc8-gemm/gen/6x16-minmax-fp32-neon-mlal-lane.c",
3484    "src/qc8-igemm/gen/1x8-minmax-fp32-neon-mlal-lane-prfm.c",
3485    "src/qc8-igemm/gen/1x8-minmax-fp32-neon-mlal-lane.c",
3486    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-dup.c",
3487    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-ld1r.c",
3488    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-ld2r.c",
3489    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-ld4r.c",
3490    "src/qc8-igemm/gen/1x8c2s4-minmax-fp32-neon-mlal.c",
3491    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neon-mlal-dup.c",
3492    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neon-mlal-ld1r.c",
3493    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neon-mlal-ld2r.c",
3494    "src/qc8-igemm/gen/1x8c4s2-minmax-fp32-neon-mlal.c",
3495    "src/qc8-igemm/gen/1x8c8-minmax-fp32-neon-mlal.c",
3496    "src/qc8-igemm/gen/1x16-minmax-fp32-neon-mlal-lane-prfm.c",
3497    "src/qc8-igemm/gen/1x16-minmax-fp32-neon-mlal-lane.c",
3498    "src/qc8-igemm/gen/2x8-minmax-fp32-neon-mlal-lane-prfm.c",
3499    "src/qc8-igemm/gen/2x8-minmax-fp32-neon-mlal-lane.c",
3500    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-dup.c",
3501    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-ld1r.c",
3502    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-ld2r.c",
3503    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-ld4r.c",
3504    "src/qc8-igemm/gen/2x8c2s4-minmax-fp32-neon-mlal.c",
3505    "src/qc8-igemm/gen/2x8c4-minmax-fp32-neon-mlal-dup.c",
3506    "src/qc8-igemm/gen/2x8c4-minmax-fp32-neon-mlal-ld1r.c",
3507    "src/qc8-igemm/gen/2x8c4-minmax-fp32-neon-mlal-ld2r.c",
3508    "src/qc8-igemm/gen/2x8c4s2-minmax-fp32-neon-mlal.c",
3509    "src/qc8-igemm/gen/2x8c8-minmax-fp32-neon-mlal.c",
3510    "src/qc8-igemm/gen/2x16-minmax-fp32-neon-mlal-lane-prfm.c",
3511    "src/qc8-igemm/gen/2x16-minmax-fp32-neon-mlal-lane.c",
3512    "src/qc8-igemm/gen/3x8-minmax-fp32-neon-mlal-lane-prfm.c",
3513    "src/qc8-igemm/gen/3x8-minmax-fp32-neon-mlal-lane.c",
3514    "src/qc8-igemm/gen/3x16-minmax-fp32-neon-mlal-lane-prfm.c",
3515    "src/qc8-igemm/gen/3x16-minmax-fp32-neon-mlal-lane.c",
3516    "src/qc8-igemm/gen/4x8-minmax-fp32-neon-mlal-lane-prfm.c",
3517    "src/qc8-igemm/gen/4x8-minmax-fp32-neon-mlal-lane.c",
3518    "src/qc8-igemm/gen/4x16-minmax-fp32-neon-mlal-lane-prfm.c",
3519    "src/qc8-igemm/gen/4x16-minmax-fp32-neon-mlal-lane.c",
3520    "src/qc8-igemm/gen/6x8-minmax-fp32-neon-mlal-lane-prfm.c",
3521    "src/qc8-igemm/gen/6x8-minmax-fp32-neon-mlal-lane.c",
3522    "src/qc8-igemm/gen/6x16-minmax-fp32-neon-mlal-lane-prfm.c",
3523    "src/qc8-igemm/gen/6x16-minmax-fp32-neon-mlal-lane.c",
3524    "src/qs8-dwconv/gen/up8x9-minmax-fp32-neon-mul16.c",
3525    "src/qs8-dwconv/gen/up8x9-minmax-rndnu-neon-mla8-ld64.c",
3526    "src/qs8-dwconv/gen/up8x9-minmax-rndnu-neon-mul8-ld64.c",
3527    "src/qs8-dwconv/gen/up8x9-minmax-rndnu-neon-mul16.c",
3528    "src/qs8-dwconv/gen/up8x25-minmax-fp32-neon-mul16.c",
3529    "src/qs8-dwconv/gen/up8x25-minmax-rndnu-neon-mla8-ld64.c",
3530    "src/qs8-dwconv/gen/up8x25-minmax-rndnu-neon-mul8-ld64.c",
3531    "src/qs8-dwconv/gen/up8x25-minmax-rndnu-neon-mul16.c",
3532    "src/qs8-dwconv/gen/up16x9-minmax-fp32-neon-mul16.c",
3533    "src/qs8-dwconv/gen/up16x9-minmax-rndnu-neon-mla8-ld64.c",
3534    "src/qs8-dwconv/gen/up16x9-minmax-rndnu-neon-mla8-ld128.c",
3535    "src/qs8-dwconv/gen/up16x9-minmax-rndnu-neon-mul8-ld64.c",
3536    "src/qs8-dwconv/gen/up16x9-minmax-rndnu-neon-mul8-ld128.c",
3537    "src/qs8-dwconv/gen/up16x9-minmax-rndnu-neon-mul16.c",
3538    "src/qs8-dwconv/gen/up16x25-minmax-fp32-neon-mul16.c",
3539    "src/qs8-dwconv/gen/up16x25-minmax-rndnu-neon-mla8-ld64.c",
3540    "src/qs8-dwconv/gen/up16x25-minmax-rndnu-neon-mla8-ld128.c",
3541    "src/qs8-dwconv/gen/up16x25-minmax-rndnu-neon-mul8-ld64.c",
3542    "src/qs8-dwconv/gen/up16x25-minmax-rndnu-neon-mul8-ld128.c",
3543    "src/qs8-dwconv/gen/up16x25-minmax-rndnu-neon-mul16.c",
3544    "src/qs8-dwconv/gen/up24x9-minmax-fp32-neon-mul16.c",
3545    "src/qs8-dwconv/gen/up24x9-minmax-rndnu-neon-mul16.c",
3546    "src/qs8-dwconv/gen/up24x25-minmax-fp32-neon-mul16.c",
3547    "src/qs8-dwconv/gen/up24x25-minmax-rndnu-neon-mul16.c",
3548    "src/qs8-dwconv/gen/up32x9-minmax-fp32-neon-mul16.c",
3549    "src/qs8-dwconv/gen/up32x9-minmax-rndnu-neon-mul16.c",
3550    "src/qs8-dwconv/gen/up32x25-minmax-fp32-neon-mul16.c",
3551    "src/qs8-dwconv/gen/up32x25-minmax-rndnu-neon-mul16.c",
3552    "src/qs8-f32-vcvt/gen/vcvt-neon-x8.c",
3553    "src/qs8-f32-vcvt/gen/vcvt-neon-x16.c",
3554    "src/qs8-f32-vcvt/gen/vcvt-neon-x24.c",
3555    "src/qs8-f32-vcvt/gen/vcvt-neon-x32.c",
3556    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neon-c8.c",
3557    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neon-c16.c",
3558    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neon-c24.c",
3559    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neon-c32.c",
3560    "src/qs8-gavgpool/gen/7p7x-minmax-rndnu-neon-c8.c",
3561    "src/qs8-gavgpool/gen/7p7x-minmax-rndnu-neon-c16.c",
3562    "src/qs8-gavgpool/gen/7p7x-minmax-rndnu-neon-c24.c",
3563    "src/qs8-gavgpool/gen/7p7x-minmax-rndnu-neon-c32.c",
3564    "src/qs8-gavgpool/gen/7x-minmax-fp32-neon-c8.c",
3565    "src/qs8-gavgpool/gen/7x-minmax-fp32-neon-c16.c",
3566    "src/qs8-gavgpool/gen/7x-minmax-fp32-neon-c24.c",
3567    "src/qs8-gavgpool/gen/7x-minmax-fp32-neon-c32.c",
3568    "src/qs8-gavgpool/gen/7x-minmax-rndnu-neon-c8.c",
3569    "src/qs8-gavgpool/gen/7x-minmax-rndnu-neon-c16.c",
3570    "src/qs8-gavgpool/gen/7x-minmax-rndnu-neon-c24.c",
3571    "src/qs8-gavgpool/gen/7x-minmax-rndnu-neon-c32.c",
3572    "src/qs8-gemm/gen/1x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3573    "src/qs8-gemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
3574    "src/qs8-gemm/gen/1x8-minmax-rndnu-neon-mull-addw-dup.c",
3575    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-dup.c",
3576    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-ld1r.c",
3577    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-ld2r.c",
3578    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neon-mlal-ld4r.c",
3579    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mlal-dup.c",
3580    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3581    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3582    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3583    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mull-dup.c",
3584    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mull-ld1r.c",
3585    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mull-ld2r.c",
3586    "src/qs8-gemm/gen/1x8c2-minmax-rndnu-neon-mull-ld4r.c",
3587    "src/qs8-gemm/gen/1x8c2s4-minmax-fp32-neon-mlal.c",
3588    "src/qs8-gemm/gen/1x8c2s4-minmax-rndnu-neon-mlal.c",
3589    "src/qs8-gemm/gen/1x8c2s4-minmax-rndnu-neon-mull.c",
3590    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neon-mlal-dup.c",
3591    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neon-mlal-ld1r.c",
3592    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neon-mlal-ld2r.c",
3593    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neon-mlal-dup.c",
3594    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3595    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3596    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neon-mull-dup.c",
3597    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neon-mull-ld1r.c",
3598    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neon-mull-ld2r.c",
3599    "src/qs8-gemm/gen/1x8c4s2-minmax-fp32-neon-mlal.c",
3600    "src/qs8-gemm/gen/1x8c4s2-minmax-rndnu-neon-mlal.c",
3601    "src/qs8-gemm/gen/1x8c4s2-minmax-rndnu-neon-mull.c",
3602    "src/qs8-gemm/gen/1x8c8-minmax-fp32-neon-mlal.c",
3603    "src/qs8-gemm/gen/1x8c8-minmax-rndnu-neon-mlal.c",
3604    "src/qs8-gemm/gen/1x8c8-minmax-rndnu-neon-mull.c",
3605    "src/qs8-gemm/gen/1x8c16-minmax-rndnu-neon-mlal.c",
3606    "src/qs8-gemm/gen/1x16-minmax-fp32-neon-mlal-lane.c",
3607    "src/qs8-gemm/gen/1x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3608    "src/qs8-gemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
3609    "src/qs8-gemm/gen/1x16-minmax-rndnu-neon-mull-addw-dup.c",
3610    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mlal-dup.c",
3611    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3612    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3613    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3614    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mull-dup.c",
3615    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mull-ld1r.c",
3616    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mull-ld2r.c",
3617    "src/qs8-gemm/gen/1x16c2-minmax-rndnu-neon-mull-ld4r.c",
3618    "src/qs8-gemm/gen/1x16c2s4-minmax-rndnu-neon-mlal.c",
3619    "src/qs8-gemm/gen/1x16c2s4-minmax-rndnu-neon-mull.c",
3620    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neon-mlal-dup.c",
3621    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3622    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3623    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neon-mull-dup.c",
3624    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neon-mull-ld1r.c",
3625    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neon-mull-ld2r.c",
3626    "src/qs8-gemm/gen/1x16c4s2-minmax-rndnu-neon-mlal.c",
3627    "src/qs8-gemm/gen/1x16c4s2-minmax-rndnu-neon-mull.c",
3628    "src/qs8-gemm/gen/1x16c8-minmax-rndnu-neon-mlal.c",
3629    "src/qs8-gemm/gen/1x16c8-minmax-rndnu-neon-mull.c",
3630    "src/qs8-gemm/gen/1x16c16-minmax-rndnu-neon-mlal.c",
3631    "src/qs8-gemm/gen/2x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3632    "src/qs8-gemm/gen/2x8-minmax-rndnu-neon-mlal-lane.c",
3633    "src/qs8-gemm/gen/2x8-minmax-rndnu-neon-mull-addw-dup.c",
3634    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-dup.c",
3635    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-ld1r.c",
3636    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-ld2r.c",
3637    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neon-mlal-ld4r.c",
3638    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mlal-dup.c",
3639    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3640    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3641    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3642    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mull-dup.c",
3643    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mull-ld1r.c",
3644    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mull-ld2r.c",
3645    "src/qs8-gemm/gen/2x8c2-minmax-rndnu-neon-mull-ld4r.c",
3646    "src/qs8-gemm/gen/2x8c2s4-minmax-fp32-neon-mlal.c",
3647    "src/qs8-gemm/gen/2x8c2s4-minmax-rndnu-neon-mlal.c",
3648    "src/qs8-gemm/gen/2x8c2s4-minmax-rndnu-neon-mull.c",
3649    "src/qs8-gemm/gen/2x8c4-minmax-fp32-neon-mlal-dup.c",
3650    "src/qs8-gemm/gen/2x8c4-minmax-fp32-neon-mlal-ld1r.c",
3651    "src/qs8-gemm/gen/2x8c4-minmax-fp32-neon-mlal-ld2r.c",
3652    "src/qs8-gemm/gen/2x8c4-minmax-rndnu-neon-mlal-dup.c",
3653    "src/qs8-gemm/gen/2x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3654    "src/qs8-gemm/gen/2x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3655    "src/qs8-gemm/gen/2x8c4-minmax-rndnu-neon-mull-dup.c",
3656    "src/qs8-gemm/gen/2x8c4-minmax-rndnu-neon-mull-ld1r.c",
3657    "src/qs8-gemm/gen/2x8c4-minmax-rndnu-neon-mull-ld2r.c",
3658    "src/qs8-gemm/gen/2x8c4s2-minmax-fp32-neon-mlal.c",
3659    "src/qs8-gemm/gen/2x8c4s2-minmax-rndnu-neon-mlal.c",
3660    "src/qs8-gemm/gen/2x8c4s2-minmax-rndnu-neon-mull.c",
3661    "src/qs8-gemm/gen/2x8c8-minmax-fp32-neon-mlal.c",
3662    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-neon-mlal.c",
3663    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-neon-mull.c",
3664    "src/qs8-gemm/gen/2x8c16-minmax-rndnu-neon-mlal.c",
3665    "src/qs8-gemm/gen/2x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3666    "src/qs8-gemm/gen/2x16-minmax-rndnu-neon-mlal-lane.c",
3667    "src/qs8-gemm/gen/2x16-minmax-rndnu-neon-mull-addw-dup.c",
3668    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mlal-dup.c",
3669    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3670    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3671    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3672    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mull-dup.c",
3673    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mull-ld1r.c",
3674    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mull-ld2r.c",
3675    "src/qs8-gemm/gen/2x16c2-minmax-rndnu-neon-mull-ld4r.c",
3676    "src/qs8-gemm/gen/2x16c2s4-minmax-rndnu-neon-mlal.c",
3677    "src/qs8-gemm/gen/2x16c2s4-minmax-rndnu-neon-mull.c",
3678    "src/qs8-gemm/gen/2x16c4-minmax-rndnu-neon-mlal-dup.c",
3679    "src/qs8-gemm/gen/2x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3680    "src/qs8-gemm/gen/2x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3681    "src/qs8-gemm/gen/2x16c4-minmax-rndnu-neon-mull-dup.c",
3682    "src/qs8-gemm/gen/2x16c4-minmax-rndnu-neon-mull-ld1r.c",
3683    "src/qs8-gemm/gen/2x16c4-minmax-rndnu-neon-mull-ld2r.c",
3684    "src/qs8-gemm/gen/2x16c4s2-minmax-rndnu-neon-mlal.c",
3685    "src/qs8-gemm/gen/2x16c4s2-minmax-rndnu-neon-mull.c",
3686    "src/qs8-gemm/gen/2x16c8-minmax-rndnu-neon-mlal.c",
3687    "src/qs8-gemm/gen/2x16c8-minmax-rndnu-neon-mull.c",
3688    "src/qs8-gemm/gen/2x16c16-minmax-rndnu-neon-mlal.c",
3689    "src/qs8-gemm/gen/3x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3690    "src/qs8-gemm/gen/3x8-minmax-rndnu-neon-mlal-lane.c",
3691    "src/qs8-gemm/gen/3x8-minmax-rndnu-neon-mull-addw-dup.c",
3692    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mlal-dup.c",
3693    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3694    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3695    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3696    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mull-dup.c",
3697    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mull-ld1r.c",
3698    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mull-ld2r.c",
3699    "src/qs8-gemm/gen/3x8c2-minmax-rndnu-neon-mull-ld4r.c",
3700    "src/qs8-gemm/gen/3x8c2s4-minmax-rndnu-neon-mlal.c",
3701    "src/qs8-gemm/gen/3x8c2s4-minmax-rndnu-neon-mull.c",
3702    "src/qs8-gemm/gen/3x8c4-minmax-rndnu-neon-mlal-dup.c",
3703    "src/qs8-gemm/gen/3x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3704    "src/qs8-gemm/gen/3x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3705    "src/qs8-gemm/gen/3x8c4-minmax-rndnu-neon-mull-dup.c",
3706    "src/qs8-gemm/gen/3x8c4-minmax-rndnu-neon-mull-ld1r.c",
3707    "src/qs8-gemm/gen/3x8c4-minmax-rndnu-neon-mull-ld2r.c",
3708    "src/qs8-gemm/gen/3x8c4s2-minmax-rndnu-neon-mlal.c",
3709    "src/qs8-gemm/gen/3x8c4s2-minmax-rndnu-neon-mull.c",
3710    "src/qs8-gemm/gen/3x8c8-minmax-rndnu-neon-mlal.c",
3711    "src/qs8-gemm/gen/3x8c8-minmax-rndnu-neon-mull.c",
3712    "src/qs8-gemm/gen/3x8c16-minmax-rndnu-neon-mlal.c",
3713    "src/qs8-gemm/gen/3x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3714    "src/qs8-gemm/gen/3x16-minmax-rndnu-neon-mlal-lane.c",
3715    "src/qs8-gemm/gen/3x16-minmax-rndnu-neon-mull-addw-dup.c",
3716    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mlal-dup.c",
3717    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3718    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3719    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3720    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mull-dup.c",
3721    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mull-ld1r.c",
3722    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mull-ld2r.c",
3723    "src/qs8-gemm/gen/3x16c2-minmax-rndnu-neon-mull-ld4r.c",
3724    "src/qs8-gemm/gen/3x16c2s4-minmax-rndnu-neon-mlal.c",
3725    "src/qs8-gemm/gen/3x16c2s4-minmax-rndnu-neon-mull.c",
3726    "src/qs8-gemm/gen/3x16c4-minmax-rndnu-neon-mlal-dup.c",
3727    "src/qs8-gemm/gen/3x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3728    "src/qs8-gemm/gen/3x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3729    "src/qs8-gemm/gen/3x16c4-minmax-rndnu-neon-mull-dup.c",
3730    "src/qs8-gemm/gen/3x16c4-minmax-rndnu-neon-mull-ld1r.c",
3731    "src/qs8-gemm/gen/3x16c4-minmax-rndnu-neon-mull-ld2r.c",
3732    "src/qs8-gemm/gen/3x16c4s2-minmax-rndnu-neon-mlal.c",
3733    "src/qs8-gemm/gen/3x16c4s2-minmax-rndnu-neon-mull.c",
3734    "src/qs8-gemm/gen/3x16c8-minmax-rndnu-neon-mlal.c",
3735    "src/qs8-gemm/gen/3x16c8-minmax-rndnu-neon-mull.c",
3736    "src/qs8-gemm/gen/3x16c16-minmax-rndnu-neon-mlal.c",
3737    "src/qs8-gemm/gen/4x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3738    "src/qs8-gemm/gen/4x8-minmax-rndnu-neon-mlal-lane.c",
3739    "src/qs8-gemm/gen/4x8-minmax-rndnu-neon-mull-addw-dup.c",
3740    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mlal-dup.c",
3741    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3742    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3743    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3744    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mull-dup.c",
3745    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mull-ld1r.c",
3746    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mull-ld2r.c",
3747    "src/qs8-gemm/gen/4x8c2-minmax-rndnu-neon-mull-ld4r.c",
3748    "src/qs8-gemm/gen/4x8c2s4-minmax-rndnu-neon-mlal.c",
3749    "src/qs8-gemm/gen/4x8c2s4-minmax-rndnu-neon-mull.c",
3750    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neon-mlal-dup.c",
3751    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3752    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3753    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neon-mull-dup.c",
3754    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neon-mull-ld1r.c",
3755    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neon-mull-ld2r.c",
3756    "src/qs8-gemm/gen/4x8c4s2-minmax-rndnu-neon-mlal.c",
3757    "src/qs8-gemm/gen/4x8c4s2-minmax-rndnu-neon-mull.c",
3758    "src/qs8-gemm/gen/4x8c8-minmax-rndnu-neon-mlal.c",
3759    "src/qs8-gemm/gen/4x8c8-minmax-rndnu-neon-mull.c",
3760    "src/qs8-gemm/gen/4x8c16-minmax-rndnu-neon-mlal.c",
3761    "src/qs8-gemm/gen/4x16-minmax-fp32-neon-mlal-lane.c",
3762    "src/qs8-gemm/gen/4x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3763    "src/qs8-gemm/gen/4x16-minmax-rndnu-neon-mlal-lane.c",
3764    "src/qs8-gemm/gen/4x16-minmax-rndnu-neon-mull-addw-dup.c",
3765    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mlal-dup.c",
3766    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3767    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3768    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3769    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mull-dup.c",
3770    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mull-ld1r.c",
3771    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mull-ld2r.c",
3772    "src/qs8-gemm/gen/4x16c2-minmax-rndnu-neon-mull-ld4r.c",
3773    "src/qs8-gemm/gen/4x16c2s4-minmax-rndnu-neon-mlal.c",
3774    "src/qs8-gemm/gen/4x16c2s4-minmax-rndnu-neon-mull.c",
3775    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neon-mlal-dup.c",
3776    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3777    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3778    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neon-mull-dup.c",
3779    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neon-mull-ld1r.c",
3780    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neon-mull-ld2r.c",
3781    "src/qs8-gemm/gen/4x16c4s2-minmax-rndnu-neon-mlal.c",
3782    "src/qs8-gemm/gen/4x16c4s2-minmax-rndnu-neon-mull.c",
3783    "src/qs8-gemm/gen/4x16c8-minmax-rndnu-neon-mlal.c",
3784    "src/qs8-gemm/gen/4x16c8-minmax-rndnu-neon-mull.c",
3785    "src/qs8-gemm/gen/4x16c16-minmax-rndnu-neon-mlal.c",
3786    "src/qs8-gemm/gen/6x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3787    "src/qs8-gemm/gen/6x8-minmax-rndnu-neon-mlal-lane.c",
3788    "src/qs8-gemm/gen/6x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3789    "src/qs8-gemm/gen/6x16-minmax-rndnu-neon-mlal-lane.c",
3790    "src/qs8-igemm/gen/1x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3791    "src/qs8-igemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
3792    "src/qs8-igemm/gen/1x8-minmax-rndnu-neon-mull-addw-dup.c",
3793    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-dup.c",
3794    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-ld1r.c",
3795    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-ld2r.c",
3796    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neon-mlal-ld4r.c",
3797    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mlal-dup.c",
3798    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3799    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3800    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3801    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mull-dup.c",
3802    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mull-ld1r.c",
3803    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mull-ld2r.c",
3804    "src/qs8-igemm/gen/1x8c2-minmax-rndnu-neon-mull-ld4r.c",
3805    "src/qs8-igemm/gen/1x8c2s4-minmax-fp32-neon-mlal.c",
3806    "src/qs8-igemm/gen/1x8c2s4-minmax-rndnu-neon-mlal.c",
3807    "src/qs8-igemm/gen/1x8c2s4-minmax-rndnu-neon-mull.c",
3808    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neon-mlal-dup.c",
3809    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neon-mlal-ld1r.c",
3810    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neon-mlal-ld2r.c",
3811    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neon-mlal-dup.c",
3812    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3813    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3814    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neon-mull-dup.c",
3815    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neon-mull-ld1r.c",
3816    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neon-mull-ld2r.c",
3817    "src/qs8-igemm/gen/1x8c4s2-minmax-fp32-neon-mlal.c",
3818    "src/qs8-igemm/gen/1x8c4s2-minmax-rndnu-neon-mlal.c",
3819    "src/qs8-igemm/gen/1x8c4s2-minmax-rndnu-neon-mull.c",
3820    "src/qs8-igemm/gen/1x8c8-minmax-fp32-neon-mlal.c",
3821    "src/qs8-igemm/gen/1x8c8-minmax-rndnu-neon-mlal.c",
3822    "src/qs8-igemm/gen/1x8c8-minmax-rndnu-neon-mull.c",
3823    "src/qs8-igemm/gen/1x8c16-minmax-rndnu-neon-mlal.c",
3824    "src/qs8-igemm/gen/1x16-minmax-fp32-neon-mlal-lane.c",
3825    "src/qs8-igemm/gen/1x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3826    "src/qs8-igemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
3827    "src/qs8-igemm/gen/1x16-minmax-rndnu-neon-mull-addw-dup.c",
3828    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mlal-dup.c",
3829    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3830    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3831    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3832    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mull-dup.c",
3833    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mull-ld1r.c",
3834    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mull-ld2r.c",
3835    "src/qs8-igemm/gen/1x16c2-minmax-rndnu-neon-mull-ld4r.c",
3836    "src/qs8-igemm/gen/1x16c2s4-minmax-rndnu-neon-mlal.c",
3837    "src/qs8-igemm/gen/1x16c2s4-minmax-rndnu-neon-mull.c",
3838    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neon-mlal-dup.c",
3839    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3840    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3841    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neon-mull-dup.c",
3842    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neon-mull-ld1r.c",
3843    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neon-mull-ld2r.c",
3844    "src/qs8-igemm/gen/1x16c4s2-minmax-rndnu-neon-mlal.c",
3845    "src/qs8-igemm/gen/1x16c4s2-minmax-rndnu-neon-mull.c",
3846    "src/qs8-igemm/gen/1x16c8-minmax-rndnu-neon-mlal.c",
3847    "src/qs8-igemm/gen/1x16c8-minmax-rndnu-neon-mull.c",
3848    "src/qs8-igemm/gen/1x16c16-minmax-rndnu-neon-mlal.c",
3849    "src/qs8-igemm/gen/2x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3850    "src/qs8-igemm/gen/2x8-minmax-rndnu-neon-mlal-lane.c",
3851    "src/qs8-igemm/gen/2x8-minmax-rndnu-neon-mull-addw-dup.c",
3852    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-dup.c",
3853    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-ld1r.c",
3854    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-ld2r.c",
3855    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neon-mlal-ld4r.c",
3856    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mlal-dup.c",
3857    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3858    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3859    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3860    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mull-dup.c",
3861    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mull-ld1r.c",
3862    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mull-ld2r.c",
3863    "src/qs8-igemm/gen/2x8c2-minmax-rndnu-neon-mull-ld4r.c",
3864    "src/qs8-igemm/gen/2x8c2s4-minmax-fp32-neon-mlal.c",
3865    "src/qs8-igemm/gen/2x8c2s4-minmax-rndnu-neon-mlal.c",
3866    "src/qs8-igemm/gen/2x8c2s4-minmax-rndnu-neon-mull.c",
3867    "src/qs8-igemm/gen/2x8c4-minmax-fp32-neon-mlal-dup.c",
3868    "src/qs8-igemm/gen/2x8c4-minmax-fp32-neon-mlal-ld1r.c",
3869    "src/qs8-igemm/gen/2x8c4-minmax-fp32-neon-mlal-ld2r.c",
3870    "src/qs8-igemm/gen/2x8c4-minmax-rndnu-neon-mlal-dup.c",
3871    "src/qs8-igemm/gen/2x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3872    "src/qs8-igemm/gen/2x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3873    "src/qs8-igemm/gen/2x8c4-minmax-rndnu-neon-mull-dup.c",
3874    "src/qs8-igemm/gen/2x8c4-minmax-rndnu-neon-mull-ld1r.c",
3875    "src/qs8-igemm/gen/2x8c4-minmax-rndnu-neon-mull-ld2r.c",
3876    "src/qs8-igemm/gen/2x8c4s2-minmax-fp32-neon-mlal.c",
3877    "src/qs8-igemm/gen/2x8c4s2-minmax-rndnu-neon-mlal.c",
3878    "src/qs8-igemm/gen/2x8c4s2-minmax-rndnu-neon-mull.c",
3879    "src/qs8-igemm/gen/2x8c8-minmax-fp32-neon-mlal.c",
3880    "src/qs8-igemm/gen/2x8c8-minmax-rndnu-neon-mlal.c",
3881    "src/qs8-igemm/gen/2x8c8-minmax-rndnu-neon-mull.c",
3882    "src/qs8-igemm/gen/2x8c16-minmax-rndnu-neon-mlal.c",
3883    "src/qs8-igemm/gen/2x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3884    "src/qs8-igemm/gen/2x16-minmax-rndnu-neon-mlal-lane.c",
3885    "src/qs8-igemm/gen/2x16-minmax-rndnu-neon-mull-addw-dup.c",
3886    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mlal-dup.c",
3887    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3888    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3889    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3890    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mull-dup.c",
3891    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mull-ld1r.c",
3892    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mull-ld2r.c",
3893    "src/qs8-igemm/gen/2x16c2-minmax-rndnu-neon-mull-ld4r.c",
3894    "src/qs8-igemm/gen/2x16c2s4-minmax-rndnu-neon-mlal.c",
3895    "src/qs8-igemm/gen/2x16c2s4-minmax-rndnu-neon-mull.c",
3896    "src/qs8-igemm/gen/2x16c4-minmax-rndnu-neon-mlal-dup.c",
3897    "src/qs8-igemm/gen/2x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3898    "src/qs8-igemm/gen/2x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3899    "src/qs8-igemm/gen/2x16c4-minmax-rndnu-neon-mull-dup.c",
3900    "src/qs8-igemm/gen/2x16c4-minmax-rndnu-neon-mull-ld1r.c",
3901    "src/qs8-igemm/gen/2x16c4-minmax-rndnu-neon-mull-ld2r.c",
3902    "src/qs8-igemm/gen/2x16c4s2-minmax-rndnu-neon-mlal.c",
3903    "src/qs8-igemm/gen/2x16c4s2-minmax-rndnu-neon-mull.c",
3904    "src/qs8-igemm/gen/2x16c8-minmax-rndnu-neon-mlal.c",
3905    "src/qs8-igemm/gen/2x16c8-minmax-rndnu-neon-mull.c",
3906    "src/qs8-igemm/gen/2x16c16-minmax-rndnu-neon-mlal.c",
3907    "src/qs8-igemm/gen/3x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3908    "src/qs8-igemm/gen/3x8-minmax-rndnu-neon-mlal-lane.c",
3909    "src/qs8-igemm/gen/3x8-minmax-rndnu-neon-mull-addw-dup.c",
3910    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mlal-dup.c",
3911    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3912    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3913    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3914    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mull-dup.c",
3915    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mull-ld1r.c",
3916    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mull-ld2r.c",
3917    "src/qs8-igemm/gen/3x8c2-minmax-rndnu-neon-mull-ld4r.c",
3918    "src/qs8-igemm/gen/3x8c2s4-minmax-rndnu-neon-mlal.c",
3919    "src/qs8-igemm/gen/3x8c2s4-minmax-rndnu-neon-mull.c",
3920    "src/qs8-igemm/gen/3x8c4-minmax-rndnu-neon-mlal-dup.c",
3921    "src/qs8-igemm/gen/3x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3922    "src/qs8-igemm/gen/3x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3923    "src/qs8-igemm/gen/3x8c4-minmax-rndnu-neon-mull-dup.c",
3924    "src/qs8-igemm/gen/3x8c4-minmax-rndnu-neon-mull-ld1r.c",
3925    "src/qs8-igemm/gen/3x8c4-minmax-rndnu-neon-mull-ld2r.c",
3926    "src/qs8-igemm/gen/3x8c4s2-minmax-rndnu-neon-mlal.c",
3927    "src/qs8-igemm/gen/3x8c4s2-minmax-rndnu-neon-mull.c",
3928    "src/qs8-igemm/gen/3x8c8-minmax-rndnu-neon-mlal.c",
3929    "src/qs8-igemm/gen/3x8c8-minmax-rndnu-neon-mull.c",
3930    "src/qs8-igemm/gen/3x8c16-minmax-rndnu-neon-mlal.c",
3931    "src/qs8-igemm/gen/3x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3932    "src/qs8-igemm/gen/3x16-minmax-rndnu-neon-mlal-lane.c",
3933    "src/qs8-igemm/gen/3x16-minmax-rndnu-neon-mull-addw-dup.c",
3934    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mlal-dup.c",
3935    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3936    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3937    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3938    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mull-dup.c",
3939    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mull-ld1r.c",
3940    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mull-ld2r.c",
3941    "src/qs8-igemm/gen/3x16c2-minmax-rndnu-neon-mull-ld4r.c",
3942    "src/qs8-igemm/gen/3x16c2s4-minmax-rndnu-neon-mlal.c",
3943    "src/qs8-igemm/gen/3x16c2s4-minmax-rndnu-neon-mull.c",
3944    "src/qs8-igemm/gen/3x16c4-minmax-rndnu-neon-mlal-dup.c",
3945    "src/qs8-igemm/gen/3x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3946    "src/qs8-igemm/gen/3x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3947    "src/qs8-igemm/gen/3x16c4-minmax-rndnu-neon-mull-dup.c",
3948    "src/qs8-igemm/gen/3x16c4-minmax-rndnu-neon-mull-ld1r.c",
3949    "src/qs8-igemm/gen/3x16c4-minmax-rndnu-neon-mull-ld2r.c",
3950    "src/qs8-igemm/gen/3x16c4s2-minmax-rndnu-neon-mlal.c",
3951    "src/qs8-igemm/gen/3x16c4s2-minmax-rndnu-neon-mull.c",
3952    "src/qs8-igemm/gen/3x16c8-minmax-rndnu-neon-mlal.c",
3953    "src/qs8-igemm/gen/3x16c8-minmax-rndnu-neon-mull.c",
3954    "src/qs8-igemm/gen/3x16c16-minmax-rndnu-neon-mlal.c",
3955    "src/qs8-igemm/gen/4x8-minmax-rndnu-neon-mlal-lane-prfm.c",
3956    "src/qs8-igemm/gen/4x8-minmax-rndnu-neon-mlal-lane.c",
3957    "src/qs8-igemm/gen/4x8-minmax-rndnu-neon-mull-addw-dup.c",
3958    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mlal-dup.c",
3959    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mlal-ld1r.c",
3960    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mlal-ld2r.c",
3961    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mlal-ld4r.c",
3962    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mull-dup.c",
3963    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mull-ld1r.c",
3964    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mull-ld2r.c",
3965    "src/qs8-igemm/gen/4x8c2-minmax-rndnu-neon-mull-ld4r.c",
3966    "src/qs8-igemm/gen/4x8c2s4-minmax-rndnu-neon-mlal.c",
3967    "src/qs8-igemm/gen/4x8c2s4-minmax-rndnu-neon-mull.c",
3968    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neon-mlal-dup.c",
3969    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neon-mlal-ld1r.c",
3970    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neon-mlal-ld2r.c",
3971    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neon-mull-dup.c",
3972    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neon-mull-ld1r.c",
3973    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neon-mull-ld2r.c",
3974    "src/qs8-igemm/gen/4x8c4s2-minmax-rndnu-neon-mlal.c",
3975    "src/qs8-igemm/gen/4x8c4s2-minmax-rndnu-neon-mull.c",
3976    "src/qs8-igemm/gen/4x8c8-minmax-rndnu-neon-mlal.c",
3977    "src/qs8-igemm/gen/4x8c8-minmax-rndnu-neon-mull.c",
3978    "src/qs8-igemm/gen/4x8c16-minmax-rndnu-neon-mlal.c",
3979    "src/qs8-igemm/gen/4x16-minmax-fp32-neon-mlal-lane.c",
3980    "src/qs8-igemm/gen/4x16-minmax-rndnu-neon-mlal-lane-prfm.c",
3981    "src/qs8-igemm/gen/4x16-minmax-rndnu-neon-mlal-lane.c",
3982    "src/qs8-igemm/gen/4x16-minmax-rndnu-neon-mull-addw-dup.c",
3983    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mlal-dup.c",
3984    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mlal-ld1r.c",
3985    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mlal-ld2r.c",
3986    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mlal-ld4r.c",
3987    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mull-dup.c",
3988    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mull-ld1r.c",
3989    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mull-ld2r.c",
3990    "src/qs8-igemm/gen/4x16c2-minmax-rndnu-neon-mull-ld4r.c",
3991    "src/qs8-igemm/gen/4x16c2s4-minmax-rndnu-neon-mlal.c",
3992    "src/qs8-igemm/gen/4x16c2s4-minmax-rndnu-neon-mull.c",
3993    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neon-mlal-dup.c",
3994    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neon-mlal-ld1r.c",
3995    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neon-mlal-ld2r.c",
3996    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neon-mull-dup.c",
3997    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neon-mull-ld1r.c",
3998    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neon-mull-ld2r.c",
3999    "src/qs8-igemm/gen/4x16c4s2-minmax-rndnu-neon-mlal.c",
4000    "src/qs8-igemm/gen/4x16c4s2-minmax-rndnu-neon-mull.c",
4001    "src/qs8-igemm/gen/4x16c8-minmax-rndnu-neon-mlal.c",
4002    "src/qs8-igemm/gen/4x16c8-minmax-rndnu-neon-mull.c",
4003    "src/qs8-igemm/gen/4x16c16-minmax-rndnu-neon-mlal.c",
4004    "src/qs8-igemm/gen/6x8-minmax-rndnu-neon-mlal-lane-prfm.c",
4005    "src/qs8-igemm/gen/6x8-minmax-rndnu-neon-mlal-lane.c",
4006    "src/qs8-igemm/gen/6x16-minmax-rndnu-neon-mlal-lane-prfm.c",
4007    "src/qs8-igemm/gen/6x16-minmax-rndnu-neon-mlal-lane.c",
4008    "src/qs8-requantization/fp32-neon.c",
4009    "src/qs8-requantization/gemmlowp-neon.c",
4010    "src/qs8-requantization/rndna-neon.c",
4011    "src/qs8-requantization/rndnu-neon-mull.c",
4012    "src/qs8-requantization/rndnu-neon-qdmulh.c",
4013    "src/qs8-vadd/gen/minmax-neon-ld64-x8.c",
4014    "src/qs8-vadd/gen/minmax-neon-ld64-x16.c",
4015    "src/qs8-vadd/gen/minmax-neon-ld64-x24.c",
4016    "src/qs8-vadd/gen/minmax-neon-ld64-x32.c",
4017    "src/qs8-vadd/gen/minmax-neon-ld128-x16.c",
4018    "src/qs8-vadd/gen/minmax-neon-ld128-x32.c",
4019    "src/qs8-vaddc/gen/minmax-neon-ld64-x8.c",
4020    "src/qs8-vaddc/gen/minmax-neon-ld64-x16.c",
4021    "src/qs8-vaddc/gen/minmax-neon-ld64-x24.c",
4022    "src/qs8-vaddc/gen/minmax-neon-ld64-x32.c",
4023    "src/qs8-vaddc/gen/minmax-neon-ld128-x16.c",
4024    "src/qs8-vaddc/gen/minmax-neon-ld128-x32.c",
4025    "src/qs8-vcvt/gen/vcvt-neon-x8.c",
4026    "src/qs8-vcvt/gen/vcvt-neon-x16.c",
4027    "src/qs8-vcvt/gen/vcvt-neon-x32.c",
4028    "src/qs8-vlrelu/gen/vlrelu-neon-x8.c",
4029    "src/qs8-vlrelu/gen/vlrelu-neon-x16.c",
4030    "src/qs8-vlrelu/gen/vlrelu-neon-x32.c",
4031    "src/qs8-vmul/gen/minmax-fp32-neon-ld64-x8.c",
4032    "src/qs8-vmul/gen/minmax-fp32-neon-ld64-x16.c",
4033    "src/qs8-vmul/gen/minmax-fp32-neon-ld128-x16.c",
4034    "src/qs8-vmul/gen/minmax-rndnu-neon-ld64-x8.c",
4035    "src/qs8-vmul/gen/minmax-rndnu-neon-ld64-x16.c",
4036    "src/qs8-vmul/gen/minmax-rndnu-neon-ld128-x16.c",
4037    "src/qs8-vmulc/gen/minmax-fp32-neon-ld64-x8.c",
4038    "src/qs8-vmulc/gen/minmax-fp32-neon-ld64-x16.c",
4039    "src/qs8-vmulc/gen/minmax-fp32-neon-ld128-x16.c",
4040    "src/qs8-vmulc/gen/minmax-rndnu-neon-ld64-x8.c",
4041    "src/qs8-vmulc/gen/minmax-rndnu-neon-ld64-x16.c",
4042    "src/qs8-vmulc/gen/minmax-rndnu-neon-ld128-x16.c",
4043    "src/qu8-avgpool/9p8x-minmax-neon-c8.c",
4044    "src/qu8-avgpool/9x-minmax-neon-c8.c",
4045    "src/qu8-dwconv/gen/up8x9-minmax-fp32-neon-mul16.c",
4046    "src/qu8-dwconv/gen/up8x9-minmax-rndnu-neon-mul8.c",
4047    "src/qu8-dwconv/gen/up8x9-minmax-rndnu-neon-mul16.c",
4048    "src/qu8-dwconv/gen/up8x25-minmax-fp32-neon-mul16.c",
4049    "src/qu8-dwconv/gen/up8x25-minmax-rndnu-neon-mul8.c",
4050    "src/qu8-dwconv/gen/up8x25-minmax-rndnu-neon-mul16.c",
4051    "src/qu8-dwconv/gen/up16x9-minmax-fp32-neon-mul16.c",
4052    "src/qu8-dwconv/gen/up16x9-minmax-rndnu-neon-mul8.c",
4053    "src/qu8-dwconv/gen/up16x9-minmax-rndnu-neon-mul16.c",
4054    "src/qu8-dwconv/gen/up16x25-minmax-fp32-neon-mul16.c",
4055    "src/qu8-dwconv/gen/up16x25-minmax-rndnu-neon-mul8.c",
4056    "src/qu8-dwconv/gen/up16x25-minmax-rndnu-neon-mul16.c",
4057    "src/qu8-dwconv/gen/up24x9-minmax-fp32-neon-mul16.c",
4058    "src/qu8-dwconv/gen/up24x9-minmax-rndnu-neon-mul8.c",
4059    "src/qu8-dwconv/gen/up24x9-minmax-rndnu-neon-mul16.c",
4060    "src/qu8-dwconv/gen/up24x25-minmax-fp32-neon-mul16.c",
4061    "src/qu8-dwconv/gen/up24x25-minmax-rndnu-neon-mul8.c",
4062    "src/qu8-dwconv/gen/up24x25-minmax-rndnu-neon-mul16.c",
4063    "src/qu8-dwconv/gen/up32x9-minmax-fp32-neon-mul16.c",
4064    "src/qu8-dwconv/gen/up32x9-minmax-rndnu-neon-mul8.c",
4065    "src/qu8-dwconv/gen/up32x9-minmax-rndnu-neon-mul16.c",
4066    "src/qu8-dwconv/gen/up32x25-minmax-fp32-neon-mul16.c",
4067    "src/qu8-dwconv/gen/up32x25-minmax-rndnu-neon-mul8.c",
4068    "src/qu8-dwconv/gen/up32x25-minmax-rndnu-neon-mul16.c",
4069    "src/qu8-f32-vcvt/gen/vcvt-neon-x8.c",
4070    "src/qu8-f32-vcvt/gen/vcvt-neon-x16.c",
4071    "src/qu8-f32-vcvt/gen/vcvt-neon-x24.c",
4072    "src/qu8-f32-vcvt/gen/vcvt-neon-x32.c",
4073    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neon-c8.c",
4074    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neon-c16.c",
4075    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neon-c24.c",
4076    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neon-c32.c",
4077    "src/qu8-gavgpool/gen/7p7x-minmax-rndnu-neon-c8.c",
4078    "src/qu8-gavgpool/gen/7p7x-minmax-rndnu-neon-c16.c",
4079    "src/qu8-gavgpool/gen/7p7x-minmax-rndnu-neon-c24.c",
4080    "src/qu8-gavgpool/gen/7p7x-minmax-rndnu-neon-c32.c",
4081    "src/qu8-gavgpool/gen/7x-minmax-fp32-neon-c8.c",
4082    "src/qu8-gavgpool/gen/7x-minmax-fp32-neon-c16.c",
4083    "src/qu8-gavgpool/gen/7x-minmax-fp32-neon-c24.c",
4084    "src/qu8-gavgpool/gen/7x-minmax-fp32-neon-c32.c",
4085    "src/qu8-gavgpool/gen/7x-minmax-rndnu-neon-c8.c",
4086    "src/qu8-gavgpool/gen/7x-minmax-rndnu-neon-c16.c",
4087    "src/qu8-gavgpool/gen/7x-minmax-rndnu-neon-c24.c",
4088    "src/qu8-gavgpool/gen/7x-minmax-rndnu-neon-c32.c",
4089    "src/qu8-gemm/gen/1x8-minmax-fp32-neon-mlal-lane.c",
4090    "src/qu8-gemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
4091    "src/qu8-gemm/gen/1x16-minmax-fp32-neon-mlal-lane.c",
4092    "src/qu8-gemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
4093    "src/qu8-gemm/gen/2x8-minmax-rndnu-neon-mlal-lane.c",
4094    "src/qu8-gemm/gen/2x16-minmax-rndnu-neon-mlal-lane.c",
4095    "src/qu8-gemm/gen/3x8-minmax-rndnu-neon-mlal-lane.c",
4096    "src/qu8-gemm/gen/3x16-minmax-rndnu-neon-mlal-lane.c",
4097    "src/qu8-gemm/gen/4x8-minmax-fp32-neon-mlal-lane.c",
4098    "src/qu8-gemm/gen/4x8-minmax-rndnu-neon-mlal-lane.c",
4099    "src/qu8-gemm/gen/4x16-minmax-fp32-neon-mlal-lane.c",
4100    "src/qu8-gemm/gen/4x16-minmax-rndnu-neon-mlal-lane.c",
4101    "src/qu8-gemm/gen/6x8-minmax-rndnu-neon-mlal-lane.c",
4102    "src/qu8-gemm/gen/6x16-minmax-rndnu-neon-mlal-lane.c",
4103    "src/qu8-igemm/gen/1x8-minmax-fp32-neon-mlal-lane.c",
4104    "src/qu8-igemm/gen/1x8-minmax-rndnu-neon-mlal-lane.c",
4105    "src/qu8-igemm/gen/1x16-minmax-fp32-neon-mlal-lane.c",
4106    "src/qu8-igemm/gen/1x16-minmax-rndnu-neon-mlal-lane.c",
4107    "src/qu8-igemm/gen/2x8-minmax-rndnu-neon-mlal-lane.c",
4108    "src/qu8-igemm/gen/2x16-minmax-rndnu-neon-mlal-lane.c",
4109    "src/qu8-igemm/gen/3x8-minmax-rndnu-neon-mlal-lane.c",
4110    "src/qu8-igemm/gen/3x16-minmax-rndnu-neon-mlal-lane.c",
4111    "src/qu8-igemm/gen/4x8-minmax-fp32-neon-mlal-lane.c",
4112    "src/qu8-igemm/gen/4x8-minmax-rndnu-neon-mlal-lane.c",
4113    "src/qu8-igemm/gen/4x16-minmax-fp32-neon-mlal-lane.c",
4114    "src/qu8-igemm/gen/4x16-minmax-rndnu-neon-mlal-lane.c",
4115    "src/qu8-igemm/gen/6x8-minmax-rndnu-neon-mlal-lane.c",
4116    "src/qu8-igemm/gen/6x16-minmax-rndnu-neon-mlal-lane.c",
4117    "src/qu8-requantization/fp32-neon.c",
4118    "src/qu8-requantization/gemmlowp-neon.c",
4119    "src/qu8-requantization/rndna-neon.c",
4120    "src/qu8-vadd/gen/minmax-neon-ld64-x8.c",
4121    "src/qu8-vadd/gen/minmax-neon-ld64-x16.c",
4122    "src/qu8-vadd/gen/minmax-neon-ld64-x32.c",
4123    "src/qu8-vadd/gen/minmax-neon-ld128-x16.c",
4124    "src/qu8-vaddc/gen/minmax-neon-ld64-x8.c",
4125    "src/qu8-vaddc/gen/minmax-neon-ld64-x16.c",
4126    "src/qu8-vaddc/gen/minmax-neon-ld64-x32.c",
4127    "src/qu8-vaddc/gen/minmax-neon-ld128-x16.c",
4128    "src/qu8-vcvt/gen/vcvt-neon-x8.c",
4129    "src/qu8-vcvt/gen/vcvt-neon-x16.c",
4130    "src/qu8-vcvt/gen/vcvt-neon-x32.c",
4131    "src/qu8-vlrelu/gen/vlrelu-neon-x8.c",
4132    "src/qu8-vlrelu/gen/vlrelu-neon-x16.c",
4133    "src/qu8-vlrelu/gen/vlrelu-neon-x32.c",
4134    "src/qu8-vmul/gen/minmax-fp32-neon-ld64-x8.c",
4135    "src/qu8-vmul/gen/minmax-fp32-neon-ld64-x16.c",
4136    "src/qu8-vmul/gen/minmax-fp32-neon-ld128-x16.c",
4137    "src/qu8-vmul/gen/minmax-rndnu-neon-ld64-x8.c",
4138    "src/qu8-vmul/gen/minmax-rndnu-neon-ld64-x16.c",
4139    "src/qu8-vmul/gen/minmax-rndnu-neon-ld128-x16.c",
4140    "src/qu8-vmulc/gen/minmax-fp32-neon-ld64-x8.c",
4141    "src/qu8-vmulc/gen/minmax-fp32-neon-ld64-x16.c",
4142    "src/qu8-vmulc/gen/minmax-fp32-neon-ld128-x16.c",
4143    "src/qu8-vmulc/gen/minmax-rndnu-neon-ld64-x8.c",
4144    "src/qu8-vmulc/gen/minmax-rndnu-neon-ld64-x16.c",
4145    "src/qu8-vmulc/gen/minmax-rndnu-neon-ld128-x16.c",
4146    "src/s8-ibilinear/gen/neon-c8.c",
4147    "src/s8-ibilinear/gen/neon-c16.c",
4148    "src/s8-maxpool/2p2x-minmax-neon-c16.c",
4149    "src/s8-maxpool/4p3x-minmax-neon-c16.c",
4150    "src/s8-maxpool/9p8x-minmax-neon-c16.c",
4151    "src/s8-vclamp/neon-x64.c",
4152    "src/s16-rmaxabs/gen/neon-x8.c",
4153    "src/s16-rmaxabs/gen/neon-x16.c",
4154    "src/s16-rmaxabs/gen/neon-x24.c",
4155    "src/s16-rmaxabs/gen/neon-x32.c",
4156    "src/s16-vlshift/gen/neon-x8.c",
4157    "src/s16-vlshift/gen/neon-x16.c",
4158    "src/s16-vlshift/gen/neon-x24.c",
4159    "src/s16-vlshift/gen/neon-x32.c",
4160    "src/s16-window/gen/neon-shift12-x8.c",
4161    "src/s16-window/gen/neon-shift12-x16.c",
4162    "src/s16-window/gen/neon-shift12-x24.c",
4163    "src/s16-window/gen/neon-shift12-x32.c",
4164    "src/s16-window/gen/neon-shift15-x8.c",
4165    "src/s16-window/gen/neon-shift15-x16.c",
4166    "src/s16-window/gen/neon-shift15-x24.c",
4167    "src/s16-window/gen/neon-shift15-x32.c",
4168    "src/s16-window/gen/neon-x8.c",
4169    "src/s16-window/gen/neon-x16.c",
4170    "src/s16-window/gen/neon-x24.c",
4171    "src/s16-window/gen/neon-x32.c",
4172    "src/u8-ibilinear/gen/neon-c8.c",
4173    "src/u8-ibilinear/gen/neon-c16.c",
4174    "src/u8-maxpool/9p8x-minmax-neon-c16.c",
4175    "src/u8-rmax/neon.c",
4176    "src/u8-vclamp/neon-x64.c",
4177    "src/u32-filterbank-accumulate/gen/neon-x1.c",
4178    "src/u32-filterbank-accumulate/gen/neon-x2.c",
4179    "src/xx-fill/neon-x64.c",
4180    "src/xx-pad/neon.c",
4181    "src/x8-transposec/gen/8x8-multi-dec-zip-neon.c",
4182    "src/x8-transposec/gen/8x8-multi-mov-zip-neon.c",
4183    "src/x8-transposec/gen/8x8-multi-switch-zip-neon.c",
4184    "src/x8-transposec/gen/8x8-reuse-dec-zip-neon.c",
4185    "src/x8-transposec/gen/8x8-reuse-mov-zip-neon.c",
4186    "src/x8-transposec/gen/8x8-reuse-multi-zip-neon.c",
4187    "src/x8-transposec/gen/8x8-reuse-switch-zip-neon.c",
4188    "src/x8-transposec/gen/16x16-reuse-dec-zip-neon.c",
4189    "src/x8-transposec/gen/16x16-reuse-mov-zip-neon.c",
4190    "src/x8-transposec/gen/16x16-reuse-switch-zip-neon.c",
4191    "src/x8-zip/xm-neon.c",
4192    "src/x8-zip/x2-neon.c",
4193    "src/x8-zip/x3-neon.c",
4194    "src/x8-zip/x4-neon.c",
4195    "src/x16-transposec/gen/4x4-multi-dec-zip-neon.c",
4196    "src/x16-transposec/gen/4x4-multi-mov-zip-neon.c",
4197    "src/x16-transposec/gen/4x4-multi-multi-zip-neon.c",
4198    "src/x16-transposec/gen/4x4-multi-switch-zip-neon.c",
4199    "src/x16-transposec/gen/4x4-reuse-dec-zip-neon.c",
4200    "src/x16-transposec/gen/4x4-reuse-mov-zip-neon.c",
4201    "src/x16-transposec/gen/4x4-reuse-multi-zip-neon.c",
4202    "src/x16-transposec/gen/4x4-reuse-switch-zip-neon.c",
4203    "src/x16-transposec/gen/8x8-multi-dec-zip-neon.c",
4204    "src/x16-transposec/gen/8x8-multi-mov-zip-neon.c",
4205    "src/x16-transposec/gen/8x8-multi-switch-zip-neon.c",
4206    "src/x16-transposec/gen/8x8-reuse-dec-zip-neon.c",
4207    "src/x16-transposec/gen/8x8-reuse-mov-zip-neon.c",
4208    "src/x16-transposec/gen/8x8-reuse-multi-zip-neon.c",
4209    "src/x16-transposec/gen/8x8-reuse-switch-zip-neon.c",
4210    "src/x24-transposec/2x2-neon-tbl.c",
4211    "src/x32-packx/x4-neon-st4.c",
4212    "src/x32-transposec/gen/2x2-multi-dec-zip-neon.c",
4213    "src/x32-transposec/gen/2x2-multi-mov-zip-neon.c",
4214    "src/x32-transposec/gen/2x2-multi-multi-zip-neon.c",
4215    "src/x32-transposec/gen/2x2-multi-switch-zip-neon.c",
4216    "src/x32-transposec/gen/2x2-reuse-dec-zip-neon.c",
4217    "src/x32-transposec/gen/2x2-reuse-mov-zip-neon.c",
4218    "src/x32-transposec/gen/2x2-reuse-multi-zip-neon.c",
4219    "src/x32-transposec/gen/2x2-reuse-switch-zip-neon.c",
4220    "src/x32-transposec/gen/4x4-multi-dec-zip-neon.c",
4221    "src/x32-transposec/gen/4x4-multi-mov-zip-neon.c",
4222    "src/x32-transposec/gen/4x4-multi-multi-zip-neon.c",
4223    "src/x32-transposec/gen/4x4-multi-switch-zip-neon.c",
4224    "src/x32-transposec/gen/4x4-reuse-dec-zip-neon.c",
4225    "src/x32-transposec/gen/4x4-reuse-mov-zip-neon.c",
4226    "src/x32-transposec/gen/4x4-reuse-multi-zip-neon.c",
4227    "src/x32-transposec/gen/4x4-reuse-switch-zip-neon.c",
4228    "src/x32-unpool/neon.c",
4229    "src/x32-zip/xm-neon.c",
4230    "src/x32-zip/x2-neon.c",
4231    "src/x32-zip/x3-neon.c",
4232    "src/x32-zip/x4-neon.c",
4233]
4234
// List of two C source paths: the "vcvt-neonfp16-x16.c" file from each of the
// src/f16-f32-vcvt/gen and src/f32-f16-vcvt/gen directories.
// Both entries also appear in ALL_NEONFP16_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably marks the subset used by production builds;
// the module that consumes this variable is not visible in this section -- confirm.
4235PROD_NEONFP16_MICROKERNEL_SRCS = [
4236    "src/f16-f32-vcvt/gen/vcvt-neonfp16-x16.c",
4237    "src/f32-f16-vcvt/gen/vcvt-neonfp16-x16.c",
4238]
4239
// List of six C source paths whose file names contain "neonfp16": the x8 and
// x16 variants under src/f16-f32-vcvt/gen and src/f32-f16-vcvt/gen, plus two
// cvt-*-neonfp16.c files under src/math.
// Contains every entry of PROD_NEONFP16_MICROKERNEL_SRCS.
// NOTE(review): presumably the full kernel set (e.g. for tests/benchmarks);
// the consuming module is not visible in this section -- confirm.
4240ALL_NEONFP16_MICROKERNEL_SRCS = [
4241    "src/f16-f32-vcvt/gen/vcvt-neonfp16-x8.c",
4242    "src/f16-f32-vcvt/gen/vcvt-neonfp16-x16.c",
4243    "src/f32-f16-vcvt/gen/vcvt-neonfp16-x8.c",
4244    "src/f32-f16-vcvt/gen/vcvt-neonfp16-x16.c",
4245    "src/math/cvt-f16-f32-neonfp16.c",
4246    "src/math/cvt-f32-f16-neonfp16.c",
4247]
4248
// List of sixteen C source paths, all with "neonfma" in the file name, drawn
// from the f32-dwconv, f32-gemm, f32-ibilinear(-chw), f32-igemm,
// f32-raddstoreexpminusmax, f32-spmm, f32-velu, f32-vmulcaddc and f32-vsigmoid
// directories.
// Every entry also appears in ALL_NEONFMA_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably marks the subset used by production builds;
// the module that consumes this variable is not visible in this section -- confirm.
4249PROD_NEONFMA_MICROKERNEL_SRCS = [
4250    "src/f32-dwconv/gen/up8x3-minmax-neonfma.c",
4251    "src/f32-dwconv/gen/up8x4-minmax-neonfma.c",
4252    "src/f32-dwconv/gen/up8x9-minmax-neonfma.c",
4253    "src/f32-dwconv/gen/up8x25-minmax-neonfma-acc2.c",
4254    "src/f32-gemm/gen/1x8s4-minmax-neonfma.c",
4255    "src/f32-gemm/gen/6x8s4-minmax-neonfma.c",
4256    "src/f32-ibilinear-chw/gen/neonfma-p8.c",
4257    "src/f32-ibilinear/gen/neonfma-c8.c",
4258    "src/f32-igemm/gen/1x8s4-minmax-neonfma.c",
4259    "src/f32-igemm/gen/6x8s4-minmax-neonfma.c",
4260    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x16.c",
4261    "src/f32-spmm/gen/32x1-minmax-neonfma-pipelined.c",
4262    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x16.c",
4263    "src/f32-velu/gen/velu-neonfma-rr1-p6-x8.c",
4264    "src/f32-vmulcaddc/gen/c4-minmax-neonfma-2x.c",
4265    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x16.c",
4266]
4267
// List of C source paths for the "neonfma" kernel variants: bf16-gemm,
// f32-dwconv, f32-gemm (gen and gen-inc), f32-ibilinear(-chw), f32-igemm,
// f32-ppmm, f32-raddstoreexpminusmax, f32-spmm, f32-velu, f32-vmulcaddc,
// f32-vsigmoid, f32-vsqrt, and the reference implementations under src/math.
// Contains every entry of PROD_NEONFMA_MICROKERNEL_SRCS.
// NOTE(review): the eight f32-dwconv "up16x{3,4,9,25}-minmax-neon[-acc2].c"
// entries are plain "neon" (not "neonfma") file names sitting in this list;
// verify against the NEON list that this is intentional and that they are not
// compiled twice.
// NOTE(review): the consuming module is not visible in this section -- confirm
// how this variable is used before editing.
4268ALL_NEONFMA_MICROKERNEL_SRCS = [
4269    "src/bf16-gemm/gen/1x4c8-minmax-neonfma-shland.c",
4270    "src/bf16-gemm/gen/2x4c8-minmax-neonfma-shland.c",
4271    "src/bf16-gemm/gen/3x4c8-minmax-neonfma-shland.c",
4272    "src/bf16-gemm/gen/4x4c8-minmax-neonfma-shland.c",
4273    "src/bf16-gemm/gen/5x4c8-minmax-neonfma-shland.c",
4274    "src/f32-dwconv/gen/up4x3-minmax-neonfma-acc2.c",
4275    "src/f32-dwconv/gen/up4x3-minmax-neonfma.c",
4276    "src/f32-dwconv/gen/up4x4-minmax-neonfma-acc2.c",
4277    "src/f32-dwconv/gen/up4x4-minmax-neonfma.c",
4278    "src/f32-dwconv/gen/up4x9-minmax-neonfma-acc2.c",
4279    "src/f32-dwconv/gen/up4x9-minmax-neonfma.c",
4280    "src/f32-dwconv/gen/up4x25-minmax-neonfma-acc2.c",
4281    "src/f32-dwconv/gen/up4x25-minmax-neonfma.c",
4282    "src/f32-dwconv/gen/up8x3-minmax-neonfma-acc2.c",
4283    "src/f32-dwconv/gen/up8x3-minmax-neonfma.c",
4284    "src/f32-dwconv/gen/up8x4-minmax-neonfma-acc2.c",
4285    "src/f32-dwconv/gen/up8x4-minmax-neonfma.c",
4286    "src/f32-dwconv/gen/up8x9-minmax-neonfma-acc2.c",
4287    "src/f32-dwconv/gen/up8x9-minmax-neonfma.c",
4288    "src/f32-dwconv/gen/up8x25-minmax-neonfma-acc2.c",
4289    "src/f32-dwconv/gen/up8x25-minmax-neonfma.c",
4290    "src/f32-dwconv/gen/up16x3-minmax-neon-acc2.c",
4291    "src/f32-dwconv/gen/up16x3-minmax-neon.c",
4292    "src/f32-dwconv/gen/up16x3-minmax-neonfma-acc2.c",
4293    "src/f32-dwconv/gen/up16x3-minmax-neonfma.c",
4294    "src/f32-dwconv/gen/up16x4-minmax-neon-acc2.c",
4295    "src/f32-dwconv/gen/up16x4-minmax-neon.c",
4296    "src/f32-dwconv/gen/up16x4-minmax-neonfma-acc2.c",
4297    "src/f32-dwconv/gen/up16x4-minmax-neonfma.c",
4298    "src/f32-dwconv/gen/up16x9-minmax-neon-acc2.c",
4299    "src/f32-dwconv/gen/up16x9-minmax-neon.c",
4300    "src/f32-dwconv/gen/up16x9-minmax-neonfma-acc2.c",
4301    "src/f32-dwconv/gen/up16x9-minmax-neonfma.c",
4302    "src/f32-dwconv/gen/up16x25-minmax-neon-acc2.c",
4303    "src/f32-dwconv/gen/up16x25-minmax-neon.c",
4304    "src/f32-dwconv/gen/up16x25-minmax-neonfma-acc2.c",
4305    "src/f32-dwconv/gen/up16x25-minmax-neonfma.c",
4306    "src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-dup-ld64.c",
4307    "src/f32-gemm/gen-inc/1x8s4inc-minmax-neonfma.c",
4308    "src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld64.c",
4309    "src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-dup-ld128.c",
4310    "src/f32-gemm/gen-inc/4x8s4inc-minmax-neonfma.c",
4311    "src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-dup-ld64.c",
4312    "src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-dup-ld128.c",
4313    "src/f32-gemm/gen-inc/6x8s4inc-minmax-neonfma.c",
4314    "src/f32-gemm/gen-inc/8x8s4inc-minmax-neonfma.c",
4315    "src/f32-gemm/gen/1x8-minmax-neonfma-dup-ld64.c",
4316    "src/f32-gemm/gen/1x8s4-minmax-neonfma.c",
4317    "src/f32-gemm/gen/4x8-minmax-neonfma-dup-ld64.c",
4318    "src/f32-gemm/gen/4x8-minmax-neonfma-dup-ld128.c",
4319    "src/f32-gemm/gen/4x8s4-minmax-neonfma.c",
4320    "src/f32-gemm/gen/6x8-minmax-neonfma-dup-ld64.c",
4321    "src/f32-gemm/gen/6x8-minmax-neonfma-dup-ld128.c",
4322    "src/f32-gemm/gen/6x8s4-minmax-neonfma.c",
4323    "src/f32-gemm/gen/8x8s4-minmax-neonfma.c",
4324    "src/f32-ibilinear-chw/gen/neonfma-p4.c",
4325    "src/f32-ibilinear-chw/gen/neonfma-p8.c",
4326    "src/f32-ibilinear-chw/gen/neonfma-p16.c",
4327    "src/f32-ibilinear/gen/neonfma-c4.c",
4328    "src/f32-ibilinear/gen/neonfma-c8.c",
4329    "src/f32-igemm/gen/1x8-minmax-neonfma-dup-ld64.c",
4330    "src/f32-igemm/gen/1x8s4-minmax-neonfma.c",
4331    "src/f32-igemm/gen/4x8-minmax-neonfma-dup-ld64.c",
4332    "src/f32-igemm/gen/4x8-minmax-neonfma-dup-ld128.c",
4333    "src/f32-igemm/gen/4x8s4-minmax-neonfma.c",
4334    "src/f32-igemm/gen/6x8-minmax-neonfma-dup-ld64.c",
4335    "src/f32-igemm/gen/6x8-minmax-neonfma-dup-ld128.c",
4336    "src/f32-igemm/gen/6x8s4-minmax-neonfma.c",
4337    "src/f32-igemm/gen/8x8s4-minmax-neonfma.c",
4338    "src/f32-ppmm/gen/4x8-minmax-neonfma.c",
4339    "src/f32-ppmm/gen/8x8-minmax-neonfma.c",
4340    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x4.c",
4341    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x8-acc2.c",
4342    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x8.c",
4343    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x12-acc2.c",
4344    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x12-acc3.c",
4345    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x12.c",
4346    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x16-acc2.c",
4347    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x16-acc4.c",
4348    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x16.c",
4349    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x20-acc2.c",
4350    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x20-acc5.c",
4351    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-lut64-p2-x20.c",
4352    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x4.c",
4353    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x8-acc2.c",
4354    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x8.c",
4355    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x12-acc2.c",
4356    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x12-acc3.c",
4357    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x12.c",
4358    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x16-acc2.c",
4359    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x16-acc4.c",
4360    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x16.c",
4361    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x20-acc2.c",
4362    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x20-acc5.c",
4363    "src/f32-raddstoreexpminusmax/gen/neonfma-rr1-p5-x20.c",
4364    "src/f32-spmm/gen/4x1-minmax-neonfma-pipelined.c",
4365    "src/f32-spmm/gen/4x1-minmax-neonfma-x2.c",
4366    "src/f32-spmm/gen/4x1-minmax-neonfma.c",
4367    "src/f32-spmm/gen/8x1-minmax-neonfma-pipelined.c",
4368    "src/f32-spmm/gen/8x1-minmax-neonfma-x2.c",
4369    "src/f32-spmm/gen/8x1-minmax-neonfma.c",
4370    "src/f32-spmm/gen/12x1-minmax-neonfma.c",
4371    "src/f32-spmm/gen/16x1-minmax-neonfma-pipelined.c",
4372    "src/f32-spmm/gen/16x1-minmax-neonfma-x2.c",
4373    "src/f32-spmm/gen/16x1-minmax-neonfma.c",
4374    "src/f32-spmm/gen/32x1-minmax-neonfma-pipelined.c",
4375    "src/f32-spmm/gen/32x1-minmax-neonfma-x2.c",
4376    "src/f32-spmm/gen/32x1-minmax-neonfma.c",
4377    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x4.c",
4378    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x8.c",
4379    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x12.c",
4380    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x16.c",
4381    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x20.c",
4382    "src/f32-velu/gen/velu-neonfma-rr1-lut16-p3-x24.c",
4383    "src/f32-velu/gen/velu-neonfma-rr1-p6-x4.c",
4384    "src/f32-velu/gen/velu-neonfma-rr1-p6-x8.c",
4385    "src/f32-velu/gen/velu-neonfma-rr1-p6-x12.c",
4386    "src/f32-velu/gen/velu-neonfma-rr1-p6-x16.c",
4387    "src/f32-velu/gen/velu-neonfma-rr1-p6-x20.c",
4388    "src/f32-velu/gen/velu-neonfma-rr1-p6-x24.c",
4389    "src/f32-vmulcaddc/gen/c4-minmax-neonfma-2x.c",
4390    "src/f32-vmulcaddc/gen/c8-minmax-neonfma-2x.c",
4391    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr1recps1fma-x4.c",
4392    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr1recps1fma-x8.c",
4393    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr1recps1fma-x12.c",
4394    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr1recps1fma-x16.c",
4395    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr1recps1fma-x20.c",
4396    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr1recps1fma-x24.c",
4397    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2fma-x4.c",
4398    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2fma-x8.c",
4399    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2fma-x12.c",
4400    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2fma-x16.c",
4401    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2fma-x20.c",
4402    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2fma-x24.c",
4403    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x4.c",
4404    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x8.c",
4405    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x12.c",
4406    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x16.c",
4407    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x20.c",
4408    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-nr2recps-x24.c",
4409    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma-x4.c",
4410    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma-x8.c",
4411    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma-x12.c",
4412    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma-x16.c",
4413    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma-x20.c",
4414    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma-x24.c",
4415    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2fma-x4.c",
4416    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2fma-x8.c",
4417    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2fma-x12.c",
4418    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2fma-x16.c",
4419    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2fma-x20.c",
4420    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2fma-x24.c",
4421    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x4.c",
4422    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x8.c",
4423    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x12.c",
4424    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x16.c",
4425    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x20.c",
4426    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x24.c",
4427    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr1recps1fma-x4.c",
4428    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr1recps1fma-x8.c",
4429    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr1recps1fma-x12.c",
4430    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr1recps1fma-x16.c",
4431    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr1recps1fma-x20.c",
4432    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr1recps1fma-x24.c",
4433    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2fma-x4.c",
4434    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2fma-x8.c",
4435    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2fma-x12.c",
4436    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2fma-x16.c",
4437    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2fma-x20.c",
4438    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2fma-x24.c",
4439    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2recps-x4.c",
4440    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2recps-x8.c",
4441    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2recps-x12.c",
4442    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2recps-x16.c",
4443    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2recps-x20.c",
4444    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-nr2recps-x24.c",
4445    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x4.c",
4446    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x8.c",
4447    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x12.c",
4448    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x16.c",
4449    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x20.c",
4450    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x24.c",
4451    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x28.c",
4452    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x32.c",
4453    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x36.c",
4454    "src/f32-vsqrt/gen/neonfma-nr1rsqrts1fma1adj-x40.c",
4455    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x4.c",
4456    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x8.c",
4457    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x12.c",
4458    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x16.c",
4459    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x20.c",
4460    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x24.c",
4461    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x28.c",
4462    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x32.c",
4463    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x36.c",
4464    "src/f32-vsqrt/gen/neonfma-nr2fma1adj-x40.c",
4465    "src/math/exp-f32-neonfma-rr2-lut64-p2.c",
4466    "src/math/exp-f32-neonfma-rr2-p5.c",
4467    "src/math/expminus-f32-neonfma-rr2-lut64-p2.c",
4468    "src/math/expminus-f32-neonfma-rr2-lut2048-p1.c",
4469    "src/math/expminus-f32-neonfma-rr2-p5.c",
4470    "src/math/expm1minus-f32-neonfma-rr1-lut16-p3.c",
4471    "src/math/expm1minus-f32-neonfma-rr1-p6.c",
4472    "src/math/sigmoid-f32-neonfma-rr1-lut64-p2-nr1recps1fma.c",
4473    "src/math/sigmoid-f32-neonfma-rr1-lut64-p2-nr2fma.c",
4474    "src/math/sigmoid-f32-neonfma-rr1-lut64-p2-nr2recps.c",
4475    "src/math/sigmoid-f32-neonfma-rr1-lut2048-p1-nr1recps1fma.c",
4476    "src/math/sigmoid-f32-neonfma-rr1-lut2048-p1-nr2fma.c",
4477    "src/math/sigmoid-f32-neonfma-rr1-lut2048-p1-nr2recps.c",
4478    "src/math/sigmoid-f32-neonfma-rr1-p5-nr1recps1fma.c",
4479    "src/math/sigmoid-f32-neonfma-rr1-p5-nr2fma.c",
4480    "src/math/sigmoid-f32-neonfma-rr1-p5-nr2recps.c",
4481    "src/math/sigmoid-f32-neonfma-rr2-lut64-p2-nr1recps1fma.c",
4482    "src/math/sigmoid-f32-neonfma-rr2-lut64-p2-nr2fma.c",
4483    "src/math/sigmoid-f32-neonfma-rr2-lut64-p2-nr2recps.c",
4484    "src/math/sigmoid-f32-neonfma-rr2-lut2048-p1-nr1recps1fma.c",
4485    "src/math/sigmoid-f32-neonfma-rr2-lut2048-p1-nr2fma.c",
4486    "src/math/sigmoid-f32-neonfma-rr2-lut2048-p1-nr2recps.c",
4487    "src/math/sigmoid-f32-neonfma-rr2-p5-nr1recps1fma.c",
4488    "src/math/sigmoid-f32-neonfma-rr2-p5-nr2fma.c",
4489    "src/math/sigmoid-f32-neonfma-rr2-p5-nr2recps.c",
4490    "src/math/sqrt-neonfma-nr1fma.c",
4491    "src/math/sqrt-neonfma-nr1rsqrts1fma1adj.c",
4492    "src/math/sqrt-neonfma-nr2fma.c",
4493    "src/math/sqrt-neonfma-nr2fma1adj.c",
4494    "src/math/sqrt-neonfma-nr3fma.c",
4495]
4496
// List of nineteen C source paths grouped under the AArch64 NEON name.
// File names are a mix of "neonfma" variants (conv-hwc2chw, dwconv2d-chw,
// gemm/igemm "lane-ld64", spmm 32x2/32x4), plain "neon" variants
// (vdiv/vdivc/vrdivc, vsqrt "neon-sqrt", x8-lut "tbx128x4") and one
// "aarch64-tbl" transpose file.
// NOTE(review): presumably these are kernels that only build for 64-bit Arm
// and are used by production builds; the consuming module and the full
// ALL_AARCH64_NEON_MICROKERNEL_SRCS list are not visible in this section -- confirm.
4497PROD_AARCH64_NEON_MICROKERNEL_SRCS = [
4498    "src/f32-conv-hwc2chw/3x3s2p1c3x4-neonfma-2x2.c",
4499    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-3x4.c",
4500    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-2x4-acc2.c",
4501    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-4x4.c",
4502    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-1x4-acc2.c",
4503    "src/f32-gemm/gen/1x8-minmax-neonfma-lane-ld64.c",
4504    "src/f32-gemm/gen/6x2-minmax-neonfma-lane-ld64.c",
4505    "src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld64.c",
4506    "src/f32-igemm/gen/1x8-minmax-neonfma-lane-ld64.c",
4507    "src/f32-igemm/gen/6x2-minmax-neonfma-lane-ld64.c",
4508    "src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld64.c",
4509    "src/f32-spmm/gen/32x2-minmax-neonfma.c",
4510    "src/f32-spmm/gen/32x4-minmax-neonfma.c",
4511    "src/f32-vbinary/gen/vdiv-minmax-neon-x8.c",
4512    "src/f32-vbinary/gen/vdivc-minmax-neon-x8.c",
4513    "src/f32-vbinary/gen/vrdivc-minmax-neon-x8.c",
4514    "src/f32-vsqrt/gen/neon-sqrt-x4.c",
4515    "src/x8-lut/gen/lut-neon-tbx128x4-x64.c",
4516    "src/x32-transposec/4x4-aarch64-tbl.c",
4517]
4518
// Full list of microkernel C sources with "neonfma", "neon" or "aarch64" in
// their file names. Entries are grouped by source directory: bf16-gemm,
// f32-conv-hwc, f32-conv-hwc2chw, f32-dwconv2d-chw, f32-gemm (gen-inc and
// gen), f32-igemm, f32-spmm, f32-vbinary, f32-vsigmoid, f32-vsqrt,
// math/sigmoid, x8-lut and x24/x32 transposec.
// It contains every entry of PROD_AARCH64_NEON_MICROKERNEL_SRCS plus further
// tile-size / accumulator / unroll variants of the same kernels.
// NOTE(review): presumably consumed by test or benchmark modules that need
// every variant; the consumer is not visible in this part of the file -- confirm.
4519ALL_AARCH64_NEON_MICROKERNEL_SRCS = [
4520    "src/bf16-gemm/gen/1x4c8-minmax-neonfma-zip.c",
4521    "src/bf16-gemm/gen/2x4c8-minmax-neonfma-zip.c",
4522    "src/bf16-gemm/gen/3x4c8-minmax-neonfma-zip.c",
4523    "src/bf16-gemm/gen/4x4c8-minmax-neonfma-zip.c",
4524    "src/bf16-gemm/gen/5x4c8-minmax-neonfma-zip.c",
4525    "src/f32-conv-hwc/gen/3x3s2p0p1c3x4-neonfma-2x1.c",
4526    "src/f32-conv-hwc/gen/3x3s2p0p1c3x4-neonfma-2x2.c",
4527    "src/f32-conv-hwc/gen/3x3s2p0p1c3x8-neonfma-2x1.c",
4528    "src/f32-conv-hwc/gen/3x3s2p0p1c3x8-neonfma-2x2.c",
4529    "src/f32-conv-hwc/gen/3x3s2p1c3x4-neonfma-2x1.c",
4530    "src/f32-conv-hwc/gen/3x3s2p1c3x4-neonfma-2x2.c",
4531    "src/f32-conv-hwc/gen/3x3s2p1c3x8-neonfma-2x1.c",
4532    "src/f32-conv-hwc/gen/3x3s2p1c3x8-neonfma-2x2.c",
4533    "src/f32-conv-hwc2chw/3x3s2p1c3x4-neonfma-2x2.c",
4534    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-1x4-acc2.c",
4535    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-1x4-acc3.c",
4536    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-1x4-acc4.c",
4537    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-1x4.c",
4538    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-2x4-acc2.c",
4539    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-2x4.c",
4540    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-3x4.c",
4541    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-4x4.c",
4542    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-5x4.c",
4543    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-neonfma-6x4.c",
4544    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-1x4-acc2.c",
4545    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-1x4-acc3.c",
4546    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-1x4-acc4.c",
4547    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-1x4.c",
4548    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-2x4-acc2.c",
4549    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-2x4.c",
4550    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-3x4.c",
4551    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-neonfma-4x4.c",
4552    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-1x4-acc2.c",
4553    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-1x4-acc3.c",
4554    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-1x4-acc4.c",
4555    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-1x4-acc5.c",
4556    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-1x4.c",
4557    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-2x4-acc2.c",
4558    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-2x4-acc3.c",
4559    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-2x4.c",
4560    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-3x4-acc2.c",
4561    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-3x4.c",
4562    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-4x4-acc2.c",
4563    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-4x4.c",
4564    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-neonfma-5x4.c",
4565    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-1x4-acc2.c",
4566    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-1x4-acc3.c",
4567    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-1x4-acc4.c",
4568    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-1x4-acc5.c",
4569    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-1x4.c",
4570    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-2x4-acc2.c",
4571    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-2x4-acc3.c",
4572    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-2x4.c",
4573    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-3x4-acc2.c",
4574    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-neonfma-3x4.c",
4575    "src/f32-gemm/gen-inc/1x8inc-minmax-neonfma-lane-ld64.c",
4576    "src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-lane-ld64.c",
4577    "src/f32-gemm/gen-inc/4x8inc-minmax-neonfma-lane-ld128.c",
4578    "src/f32-gemm/gen-inc/5x8inc-minmax-neonfma-lane-ld64.c",
4579    "src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-lane-ld64.c",
4580    "src/f32-gemm/gen-inc/6x8inc-minmax-neonfma-lane-ld128.c",
4581    "src/f32-gemm/gen/1x8-minmax-neonfma-lane-ld64.c",
4582    "src/f32-gemm/gen/4x2-minmax-neonfma-lane-ld64.c",
4583    "src/f32-gemm/gen/4x8-minmax-neonfma-lane-ld64.c",
4584    "src/f32-gemm/gen/4x8-minmax-neonfma-lane-ld128.c",
4585    "src/f32-gemm/gen/5x8-minmax-neonfma-lane-ld64.c",
4586    "src/f32-gemm/gen/6x2-minmax-neonfma-lane-ld64.c",
4587    "src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld64.c",
4588    "src/f32-gemm/gen/6x8-minmax-neonfma-lane-ld128.c",
4589    "src/f32-igemm/gen/1x8-minmax-neonfma-lane-ld64.c",
4590    "src/f32-igemm/gen/4x2-minmax-neonfma-lane-ld64.c",
4591    "src/f32-igemm/gen/4x4-minmax-neonfma-lane-ld64.c",
4592    "src/f32-igemm/gen/4x8-minmax-neonfma-lane-ld64.c",
4593    "src/f32-igemm/gen/4x8-minmax-neonfma-lane-ld128.c",
4594    "src/f32-igemm/gen/6x2-minmax-neonfma-lane-ld64.c",
4595    "src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld64.c",
4596    "src/f32-igemm/gen/6x8-minmax-neonfma-lane-ld128.c",
4597    "src/f32-spmm/gen/4x2-minmax-neonfma.c",
4598    "src/f32-spmm/gen/4x4-minmax-neonfma.c",
4599    "src/f32-spmm/gen/8x2-minmax-neonfma.c",
4600    "src/f32-spmm/gen/8x4-minmax-neonfma.c",
4601    "src/f32-spmm/gen/12x2-minmax-neonfma.c",
4602    "src/f32-spmm/gen/12x4-minmax-neonfma.c",
4603    "src/f32-spmm/gen/16x2-minmax-neonfma.c",
4604    "src/f32-spmm/gen/16x4-minmax-neonfma.c",
4605    "src/f32-spmm/gen/32x2-minmax-neonfma.c",
4606    "src/f32-spmm/gen/32x4-minmax-neonfma.c",
4607    "src/f32-vbinary/gen/vdiv-minmax-neon-x4.c",
4608    "src/f32-vbinary/gen/vdiv-minmax-neon-x8.c",
4609    "src/f32-vbinary/gen/vdivc-minmax-neon-x4.c",
4610    "src/f32-vbinary/gen/vdivc-minmax-neon-x8.c",
4611    "src/f32-vbinary/gen/vrdivc-minmax-neon-x4.c",
4612    "src/f32-vbinary/gen/vrdivc-minmax-neon-x8.c",
4613    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-div-x4.c",
4614    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-div-x8.c",
4615    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-div-x12.c",
4616    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-div-x16.c",
4617    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-div-x20.c",
4618    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut64-p2-div-x24.c",
4619    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-div-x4.c",
4620    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-div-x8.c",
4621    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-div-x12.c",
4622    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-div-x16.c",
4623    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-div-x20.c",
4624    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-lut2048-p1-div-x24.c",
4625    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-div-x4.c",
4626    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-div-x8.c",
4627    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-div-x12.c",
4628    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-div-x16.c",
4629    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-div-x20.c",
4630    "src/f32-vsigmoid/gen/vsigmoid-neonfma-rr1-p5-div-x24.c",
4631    "src/f32-vsqrt/gen/neon-sqrt-x4.c",
4632    "src/f32-vsqrt/gen/neon-sqrt-x8.c",
4633    "src/math/sigmoid-f32-neonfma-rr1-lut64-p2-div.c",
4634    "src/math/sigmoid-f32-neonfma-rr1-lut2048-p1-div.c",
4635    "src/math/sigmoid-f32-neonfma-rr1-p5-div.c",
4636    "src/math/sigmoid-f32-neonfma-rr2-lut64-p2-div.c",
4637    "src/math/sigmoid-f32-neonfma-rr2-lut2048-p1-div.c",
4638    "src/math/sigmoid-f32-neonfma-rr2-p5-div.c",
4639    "src/x8-lut/gen/lut-neon-tbx128x4-x16.c",
4640    "src/x8-lut/gen/lut-neon-tbx128x4-x32.c",
4641    "src/x8-lut/gen/lut-neon-tbx128x4-x48.c",
4642    "src/x8-lut/gen/lut-neon-tbx128x4-x64.c",
4643    "src/x24-transposec/4x4-aarch64-tbl.c",
4644    "src/x32-transposec/4x4-aarch64-tbl.c",
4645]
4646
// List of microkernel C sources whose file names carry the "neonv8" tag:
// f32->qs8 / f32->qu8 conversion (vcvt), f32 rounding (vrnd), and qc8
// dwconv / gemm / igemm kernels with "fp32" in their names.
// Every path listed here also appears in ALL_NEONV8_MICROKERNEL_SRCS.
// NOTE(review): presumably "PROD" marks the subset compiled into the shipped
// library for targets with ARMv8 NEON; the consuming module is not visible
// here -- confirm.
4647PROD_NEONV8_MICROKERNEL_SRCS = [
4648    "src/f32-qs8-vcvt/gen/vcvt-neonv8-x32.c",
4649    "src/f32-qu8-vcvt/gen/vcvt-neonv8-x32.c",
4650    "src/f32-vrnd/gen/vrndd-neonv8-x8.c",
4651    "src/f32-vrnd/gen/vrndne-neonv8-x8.c",
4652    "src/f32-vrnd/gen/vrndu-neonv8-x8.c",
4653    "src/f32-vrnd/gen/vrndz-neonv8-x8.c",
4654    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neonv8-mla8-ld64.c",
4655    "src/qc8-dwconv/gen/up16x3-minmax-fp32-neonv8-mla8-ld128.c",
4656    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mla8-ld64.c",
4657    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mla8-ld64.c",
4658    "src/qc8-gemm/gen/1x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4659    "src/qc8-gemm/gen/1x8-minmax-fp32-neonv8-mlal-lane.c",
4660    "src/qc8-gemm/gen/1x8c2s4-minmax-fp32-neonv8-mlal.c",
4661    "src/qc8-gemm/gen/1x8c8-minmax-fp32-neonv8-mlal.c",
4662    "src/qc8-gemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4663    "src/qc8-gemm/gen/2x8c2s4-minmax-fp32-neonv8-mlal.c",
4664    "src/qc8-gemm/gen/2x8c8-minmax-fp32-neonv8-mlal.c",
4665    "src/qc8-gemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4666    "src/qc8-igemm/gen/1x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4667    "src/qc8-igemm/gen/1x8-minmax-fp32-neonv8-mlal-lane.c",
4668    "src/qc8-igemm/gen/1x8c2s4-minmax-fp32-neonv8-mlal.c",
4669    "src/qc8-igemm/gen/1x8c8-minmax-fp32-neonv8-mlal.c",
4670    "src/qc8-igemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4671    "src/qc8-igemm/gen/2x8c2s4-minmax-fp32-neonv8-mlal.c",
4672    "src/qc8-igemm/gen/2x8c8-minmax-fp32-neonv8-mlal.c",
4673    "src/qc8-igemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4674]
4675
// Full list of microkernel C sources with the "neonv8" tag in their file
// names. Entries are grouped by source directory: f32-qs8-vcvt, f32-qu8-vcvt,
// f32-vrnd, math (cvt and round helpers), qc8-dwconv, qc8-gemm, qc8-igemm,
// qs8-dwconv, qs8-gavgpool, qs8-gemm, qs8-igemm, qs8-vmul, qs8-vmulc,
// qu8-dwconv, qu8-gavgpool, qu8-gemm, qu8-igemm, qu8-vmul and qu8-vmulc.
// It contains every entry of PROD_NEONV8_MICROKERNEL_SRCS plus further
// tile-size / load-width / unroll variants.
// NOTE(review): presumably consumed by test or benchmark modules that need
// every variant; the consumer is not visible in this part of the file -- confirm.
4676ALL_NEONV8_MICROKERNEL_SRCS = [
4677    "src/f32-qs8-vcvt/gen/vcvt-neonv8-x8.c",
4678    "src/f32-qs8-vcvt/gen/vcvt-neonv8-x16.c",
4679    "src/f32-qs8-vcvt/gen/vcvt-neonv8-x24.c",
4680    "src/f32-qs8-vcvt/gen/vcvt-neonv8-x32.c",
4681    "src/f32-qu8-vcvt/gen/vcvt-neonv8-x8.c",
4682    "src/f32-qu8-vcvt/gen/vcvt-neonv8-x16.c",
4683    "src/f32-qu8-vcvt/gen/vcvt-neonv8-x24.c",
4684    "src/f32-qu8-vcvt/gen/vcvt-neonv8-x32.c",
4685    "src/f32-vrnd/gen/vrndd-neonv8-x4.c",
4686    "src/f32-vrnd/gen/vrndd-neonv8-x8.c",
4687    "src/f32-vrnd/gen/vrndne-neonv8-x4.c",
4688    "src/f32-vrnd/gen/vrndne-neonv8-x8.c",
4689    "src/f32-vrnd/gen/vrndu-neonv8-x4.c",
4690    "src/f32-vrnd/gen/vrndu-neonv8-x8.c",
4691    "src/f32-vrnd/gen/vrndz-neonv8-x4.c",
4692    "src/f32-vrnd/gen/vrndz-neonv8-x8.c",
4693    "src/math/cvt-f32-qs8-neonv8.c",
4694    "src/math/cvt-f32-qu8-neonv8.c",
4695    "src/math/roundd-neonv8.c",
4696    "src/math/roundne-neonv8.c",
4697    "src/math/roundu-neonv8.c",
4698    "src/math/roundz-neonv8.c",
4699    "src/qc8-dwconv/gen/up8x3-minmax-fp32-neonv8-mla8-ld64.c",
4700    "src/qc8-dwconv/gen/up8x9-minmax-fp32-neonv8-mla8-ld64.c",
4701    "src/qc8-dwconv/gen/up8x9-minmax-fp32-neonv8-mul8-ld64.c",
4702    "src/qc8-dwconv/gen/up8x9-minmax-fp32-neonv8-mul16.c",
4703    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neonv8-mla8-ld64.c",
4704    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neonv8-mul8-ld64.c",
4705    "src/qc8-dwconv/gen/up8x25-minmax-fp32-neonv8-mul16.c",
4706    "src/qc8-dwconv/gen/up16x3-minmax-fp32-neonv8-mla8-ld64.c",
4707    "src/qc8-dwconv/gen/up16x3-minmax-fp32-neonv8-mla8-ld128.c",
4708    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mla8-ld64.c",
4709    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mla8-ld128.c",
4710    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mul8-ld64.c",
4711    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mul8-ld128.c",
4712    "src/qc8-dwconv/gen/up16x9-minmax-fp32-neonv8-mul16.c",
4713    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mla8-ld64.c",
4714    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mla8-ld128.c",
4715    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mul8-ld64.c",
4716    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mul8-ld128.c",
4717    "src/qc8-dwconv/gen/up16x25-minmax-fp32-neonv8-mul16.c",
4718    "src/qc8-dwconv/gen/up24x9-minmax-fp32-neonv8-mul16.c",
4719    "src/qc8-dwconv/gen/up24x25-minmax-fp32-neonv8-mul16.c",
4720    "src/qc8-dwconv/gen/up32x9-minmax-fp32-neonv8-mul16.c",
4721    "src/qc8-dwconv/gen/up32x25-minmax-fp32-neonv8-mul16.c",
4722    "src/qc8-gemm/gen/1x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4723    "src/qc8-gemm/gen/1x8-minmax-fp32-neonv8-mlal-lane.c",
4724    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-dup.c",
4725    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4726    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4727    "src/qc8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4728    "src/qc8-gemm/gen/1x8c2s4-minmax-fp32-neonv8-mlal.c",
4729    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neonv8-mlal-dup.c",
4730    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4731    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4732    "src/qc8-gemm/gen/1x8c4s2-minmax-fp32-neonv8-mlal.c",
4733    "src/qc8-gemm/gen/1x8c8-minmax-fp32-neonv8-mlal.c",
4734    "src/qc8-gemm/gen/1x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4735    "src/qc8-gemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4736    "src/qc8-gemm/gen/2x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4737    "src/qc8-gemm/gen/2x8-minmax-fp32-neonv8-mlal-lane.c",
4738    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-dup.c",
4739    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4740    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4741    "src/qc8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4742    "src/qc8-gemm/gen/2x8c2s4-minmax-fp32-neonv8-mlal.c",
4743    "src/qc8-gemm/gen/2x8c4-minmax-fp32-neonv8-mlal-dup.c",
4744    "src/qc8-gemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4745    "src/qc8-gemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4746    "src/qc8-gemm/gen/2x8c4s2-minmax-fp32-neonv8-mlal.c",
4747    "src/qc8-gemm/gen/2x8c8-minmax-fp32-neonv8-mlal.c",
4748    "src/qc8-gemm/gen/2x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4749    "src/qc8-gemm/gen/2x16-minmax-fp32-neonv8-mlal-lane.c",
4750    "src/qc8-gemm/gen/3x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4751    "src/qc8-gemm/gen/3x8-minmax-fp32-neonv8-mlal-lane.c",
4752    "src/qc8-gemm/gen/3x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4753    "src/qc8-gemm/gen/3x16-minmax-fp32-neonv8-mlal-lane.c",
4754    "src/qc8-gemm/gen/4x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4755    "src/qc8-gemm/gen/4x8-minmax-fp32-neonv8-mlal-lane.c",
4756    "src/qc8-gemm/gen/4x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4757    "src/qc8-gemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4758    "src/qc8-gemm/gen/6x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4759    "src/qc8-gemm/gen/6x8-minmax-fp32-neonv8-mlal-lane.c",
4760    "src/qc8-gemm/gen/6x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4761    "src/qc8-gemm/gen/6x16-minmax-fp32-neonv8-mlal-lane.c",
4762    "src/qc8-igemm/gen/1x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4763    "src/qc8-igemm/gen/1x8-minmax-fp32-neonv8-mlal-lane.c",
4764    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-dup.c",
4765    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4766    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4767    "src/qc8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4768    "src/qc8-igemm/gen/1x8c2s4-minmax-fp32-neonv8-mlal.c",
4769    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neonv8-mlal-dup.c",
4770    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4771    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4772    "src/qc8-igemm/gen/1x8c4s2-minmax-fp32-neonv8-mlal.c",
4773    "src/qc8-igemm/gen/1x8c8-minmax-fp32-neonv8-mlal.c",
4774    "src/qc8-igemm/gen/1x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4775    "src/qc8-igemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4776    "src/qc8-igemm/gen/2x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4777    "src/qc8-igemm/gen/2x8-minmax-fp32-neonv8-mlal-lane.c",
4778    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-dup.c",
4779    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4780    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4781    "src/qc8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4782    "src/qc8-igemm/gen/2x8c2s4-minmax-fp32-neonv8-mlal.c",
4783    "src/qc8-igemm/gen/2x8c4-minmax-fp32-neonv8-mlal-dup.c",
4784    "src/qc8-igemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4785    "src/qc8-igemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4786    "src/qc8-igemm/gen/2x8c4s2-minmax-fp32-neonv8-mlal.c",
4787    "src/qc8-igemm/gen/2x8c8-minmax-fp32-neonv8-mlal.c",
4788    "src/qc8-igemm/gen/2x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4789    "src/qc8-igemm/gen/2x16-minmax-fp32-neonv8-mlal-lane.c",
4790    "src/qc8-igemm/gen/3x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4791    "src/qc8-igemm/gen/3x8-minmax-fp32-neonv8-mlal-lane.c",
4792    "src/qc8-igemm/gen/3x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4793    "src/qc8-igemm/gen/3x16-minmax-fp32-neonv8-mlal-lane.c",
4794    "src/qc8-igemm/gen/4x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4795    "src/qc8-igemm/gen/4x8-minmax-fp32-neonv8-mlal-lane.c",
4796    "src/qc8-igemm/gen/4x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4797    "src/qc8-igemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4798    "src/qc8-igemm/gen/6x8-minmax-fp32-neonv8-mlal-lane-prfm.c",
4799    "src/qc8-igemm/gen/6x8-minmax-fp32-neonv8-mlal-lane.c",
4800    "src/qc8-igemm/gen/6x16-minmax-fp32-neonv8-mlal-lane-prfm.c",
4801    "src/qc8-igemm/gen/6x16-minmax-fp32-neonv8-mlal-lane.c",
4802    "src/qs8-dwconv/gen/up8x9-minmax-fp32-neonv8-mul16.c",
4803    "src/qs8-dwconv/gen/up8x25-minmax-fp32-neonv8-mul16.c",
4804    "src/qs8-dwconv/gen/up16x9-minmax-fp32-neonv8-mul16.c",
4805    "src/qs8-dwconv/gen/up16x25-minmax-fp32-neonv8-mul16.c",
4806    "src/qs8-dwconv/gen/up24x9-minmax-fp32-neonv8-mul16.c",
4807    "src/qs8-dwconv/gen/up24x25-minmax-fp32-neonv8-mul16.c",
4808    "src/qs8-dwconv/gen/up32x9-minmax-fp32-neonv8-mul16.c",
4809    "src/qs8-dwconv/gen/up32x25-minmax-fp32-neonv8-mul16.c",
4810    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c8.c",
4811    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c16.c",
4812    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c24.c",
4813    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c32.c",
4814    "src/qs8-gavgpool/gen/7x-minmax-fp32-neonv8-c8.c",
4815    "src/qs8-gavgpool/gen/7x-minmax-fp32-neonv8-c16.c",
4816    "src/qs8-gavgpool/gen/7x-minmax-fp32-neonv8-c24.c",
4817    "src/qs8-gavgpool/gen/7x-minmax-fp32-neonv8-c32.c",
4818    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-dup.c",
4819    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4820    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4821    "src/qs8-gemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4822    "src/qs8-gemm/gen/1x8c2s4-minmax-fp32-neonv8-mlal.c",
4823    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neonv8-mlal-dup.c",
4824    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4825    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4826    "src/qs8-gemm/gen/1x8c4s2-minmax-fp32-neonv8-mlal.c",
4827    "src/qs8-gemm/gen/1x8c8-minmax-fp32-neonv8-mlal.c",
4828    "src/qs8-gemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4829    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-dup.c",
4830    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4831    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4832    "src/qs8-gemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4833    "src/qs8-gemm/gen/2x8c2s4-minmax-fp32-neonv8-mlal.c",
4834    "src/qs8-gemm/gen/2x8c4-minmax-fp32-neonv8-mlal-dup.c",
4835    "src/qs8-gemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4836    "src/qs8-gemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4837    "src/qs8-gemm/gen/2x8c4s2-minmax-fp32-neonv8-mlal.c",
4838    "src/qs8-gemm/gen/2x8c8-minmax-fp32-neonv8-mlal.c",
4839    "src/qs8-gemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4840    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-dup.c",
4841    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4842    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4843    "src/qs8-igemm/gen/1x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4844    "src/qs8-igemm/gen/1x8c2s4-minmax-fp32-neonv8-mlal.c",
4845    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neonv8-mlal-dup.c",
4846    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4847    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4848    "src/qs8-igemm/gen/1x8c4s2-minmax-fp32-neonv8-mlal.c",
4849    "src/qs8-igemm/gen/1x8c8-minmax-fp32-neonv8-mlal.c",
4850    "src/qs8-igemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4851    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-dup.c",
4852    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld1r.c",
4853    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld2r.c",
4854    "src/qs8-igemm/gen/2x8c2-minmax-fp32-neonv8-mlal-ld4r.c",
4855    "src/qs8-igemm/gen/2x8c2s4-minmax-fp32-neonv8-mlal.c",
4856    "src/qs8-igemm/gen/2x8c4-minmax-fp32-neonv8-mlal-dup.c",
4857    "src/qs8-igemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld1r.c",
4858    "src/qs8-igemm/gen/2x8c4-minmax-fp32-neonv8-mlal-ld2r.c",
4859    "src/qs8-igemm/gen/2x8c4s2-minmax-fp32-neonv8-mlal.c",
4860    "src/qs8-igemm/gen/2x8c8-minmax-fp32-neonv8-mlal.c",
4861    "src/qs8-igemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4862    "src/qs8-vmul/gen/minmax-fp32-neonv8-ld64-x8.c",
4863    "src/qs8-vmul/gen/minmax-fp32-neonv8-ld64-x16.c",
4864    "src/qs8-vmul/gen/minmax-fp32-neonv8-ld128-x16.c",
4865    "src/qs8-vmulc/gen/minmax-fp32-neonv8-ld64-x8.c",
4866    "src/qs8-vmulc/gen/minmax-fp32-neonv8-ld64-x16.c",
4867    "src/qs8-vmulc/gen/minmax-fp32-neonv8-ld128-x16.c",
4868    "src/qu8-dwconv/gen/up8x9-minmax-fp32-neonv8-mul16.c",
4869    "src/qu8-dwconv/gen/up8x25-minmax-fp32-neonv8-mul16.c",
4870    "src/qu8-dwconv/gen/up16x9-minmax-fp32-neonv8-mul16.c",
4871    "src/qu8-dwconv/gen/up16x25-minmax-fp32-neonv8-mul16.c",
4872    "src/qu8-dwconv/gen/up24x9-minmax-fp32-neonv8-mul16.c",
4873    "src/qu8-dwconv/gen/up24x25-minmax-fp32-neonv8-mul16.c",
4874    "src/qu8-dwconv/gen/up32x9-minmax-fp32-neonv8-mul16.c",
4875    "src/qu8-dwconv/gen/up32x25-minmax-fp32-neonv8-mul16.c",
4876    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c8.c",
4877    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c16.c",
4878    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c24.c",
4879    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-neonv8-c32.c",
4880    "src/qu8-gavgpool/gen/7x-minmax-fp32-neonv8-c8.c",
4881    "src/qu8-gavgpool/gen/7x-minmax-fp32-neonv8-c16.c",
4882    "src/qu8-gavgpool/gen/7x-minmax-fp32-neonv8-c24.c",
4883    "src/qu8-gavgpool/gen/7x-minmax-fp32-neonv8-c32.c",
4884    "src/qu8-gemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4885    "src/qu8-gemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4886    "src/qu8-igemm/gen/1x16-minmax-fp32-neonv8-mlal-lane.c",
4887    "src/qu8-igemm/gen/4x16-minmax-fp32-neonv8-mlal-lane.c",
4888    "src/qu8-vmul/gen/minmax-fp32-neonv8-ld64-x8.c",
4889    "src/qu8-vmul/gen/minmax-fp32-neonv8-ld64-x16.c",
4890    "src/qu8-vmul/gen/minmax-fp32-neonv8-ld128-x16.c",
4891    "src/qu8-vmulc/gen/minmax-fp32-neonv8-ld64-x8.c",
4892    "src/qu8-vmulc/gen/minmax-fp32-neonv8-ld64-x16.c",
4893    "src/qu8-vmulc/gen/minmax-fp32-neonv8-ld128-x16.c",
4894]
4895
// List of f16 microkernel C sources whose file names carry the
// "neonfp16arith" tag: avgpool, dwconv, gavgpool (nwc and cw), gemm,
// ibilinear (nhwc and chw), igemm, maxpool, pavgpool, prelu,
// raddstoreexpminusmax, rmax, spmm, vbinary, vclamp, velu, vhswish, vlrelu,
// vmulcaddc, vrnd, vsigmoid and vunary kernels.
// NOTE(review): presumably a subset of ALL_NEONFP16ARITH_MICROKERNEL_SRCS that
// is compiled into the shipped library for targets with the ARM FP16
// arithmetic extension; neither the full ALL list nor the consuming module is
// visible here -- confirm.
4896PROD_NEONFP16ARITH_MICROKERNEL_SRCS = [
4897    "src/f16-avgpool/9p8x-minmax-neonfp16arith-c8.c",
4898    "src/f16-avgpool/9x-minmax-neonfp16arith-c8.c",
4899    "src/f16-dwconv/gen/up8x25-minmax-neonfp16arith-acc2.c",
4900    "src/f16-dwconv/gen/up16x3-minmax-neonfp16arith.c",
4901    "src/f16-dwconv/gen/up16x4-minmax-neonfp16arith.c",
4902    "src/f16-dwconv/gen/up16x9-minmax-neonfp16arith.c",
4903    "src/f16-gavgpool-cw/neonfp16arith-x4.c",
4904    "src/f16-gavgpool/gen/7p7x-minmax-neonfp16arith-c8.c",
4905    "src/f16-gavgpool/gen/7x-minmax-neonfp16arith-c8.c",
4906    "src/f16-gemm/gen/1x16-minmax-neonfp16arith-ld64.c",
4907    "src/f16-gemm/gen/6x16-minmax-neonfp16arith-ld64.c",
4908    "src/f16-ibilinear-chw/gen/neonfp16arith-p8.c",
4909    "src/f16-ibilinear/gen/neonfp16arith-c8.c",
4910    "src/f16-igemm/gen/1x16-minmax-neonfp16arith-ld64.c",
4911    "src/f16-igemm/gen/6x16-minmax-neonfp16arith-ld64.c",
4912    "src/f16-maxpool/9p8x-minmax-neonfp16arith-c8.c",
4913    "src/f16-pavgpool/9p8x-minmax-neonfp16arith-c8.c",
4914    "src/f16-pavgpool/9x-minmax-neonfp16arith-c8.c",
4915    "src/f16-prelu/gen/neonfp16arith-2x16.c",
4916    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x40.c",
4917    "src/f16-rmax/neonfp16arith.c",
4918    "src/f16-spmm/gen/32x1-minmax-neonfp16arith.c",
4919    "src/f16-vbinary/gen/vadd-minmax-neonfp16arith-x16.c",
4920    "src/f16-vbinary/gen/vaddc-minmax-neonfp16arith-x16.c",
4921    "src/f16-vbinary/gen/vmax-neonfp16arith-x16.c",
4922    "src/f16-vbinary/gen/vmaxc-neonfp16arith-x16.c",
4923    "src/f16-vbinary/gen/vmin-neonfp16arith-x16.c",
4924    "src/f16-vbinary/gen/vminc-neonfp16arith-x16.c",
4925    "src/f16-vbinary/gen/vmul-minmax-neonfp16arith-x16.c",
4926    "src/f16-vbinary/gen/vmulc-minmax-neonfp16arith-x16.c",
4927    "src/f16-vbinary/gen/vrsubc-minmax-neonfp16arith-x16.c",
4928    "src/f16-vbinary/gen/vsqrdiff-neonfp16arith-x16.c",
4929    "src/f16-vbinary/gen/vsqrdiffc-neonfp16arith-x16.c",
4930    "src/f16-vbinary/gen/vsub-minmax-neonfp16arith-x16.c",
4931    "src/f16-vbinary/gen/vsubc-minmax-neonfp16arith-x16.c",
4932    "src/f16-vclamp/gen/vclamp-neonfp16arith-x16.c",
4933    "src/f16-velu/gen/velu-neonfp16arith-rr1-p3-x16.c",
4934    "src/f16-vhswish/gen/vhswish-neonfp16arith-x16.c",
4935    "src/f16-vlrelu/gen/vlrelu-neonfp16arith-x16.c",
4936    "src/f16-vmulcaddc/gen/c8-minmax-neonfp16arith-2x.c",
4937    "src/f16-vrnd/gen/vrndd-neonfp16arith-x16.c",
4938    "src/f16-vrnd/gen/vrndne-neonfp16arith-x16.c",
4939    "src/f16-vrnd/gen/vrndu-neonfp16arith-x16.c",
4940    "src/f16-vrnd/gen/vrndz-neonfp16arith-x16.c",
4941    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x40.c",
4942    "src/f16-vunary/gen/vabs-neonfp16arith-x16.c",
4943    "src/f16-vunary/gen/vneg-neonfp16arith-x16.c",
4944    "src/f16-vunary/gen/vsqr-neonfp16arith-x16.c",
4945]
4946
4947ALL_NEONFP16ARITH_MICROKERNEL_SRCS = [
4948    "src/f16-avgpool/9p8x-minmax-neonfp16arith-c8.c",
4949    "src/f16-avgpool/9x-minmax-neonfp16arith-c8.c",
4950    "src/f16-dwconv/gen/up8x3-minmax-neonfp16arith-acc2.c",
4951    "src/f16-dwconv/gen/up8x3-minmax-neonfp16arith.c",
4952    "src/f16-dwconv/gen/up8x4-minmax-neonfp16arith-acc2.c",
4953    "src/f16-dwconv/gen/up8x4-minmax-neonfp16arith.c",
4954    "src/f16-dwconv/gen/up8x9-minmax-neonfp16arith-acc2.c",
4955    "src/f16-dwconv/gen/up8x9-minmax-neonfp16arith.c",
4956    "src/f16-dwconv/gen/up8x25-minmax-neonfp16arith-acc2.c",
4957    "src/f16-dwconv/gen/up8x25-minmax-neonfp16arith.c",
4958    "src/f16-dwconv/gen/up16x3-minmax-neonfp16arith-acc2.c",
4959    "src/f16-dwconv/gen/up16x3-minmax-neonfp16arith.c",
4960    "src/f16-dwconv/gen/up16x4-minmax-neonfp16arith-acc2.c",
4961    "src/f16-dwconv/gen/up16x4-minmax-neonfp16arith.c",
4962    "src/f16-dwconv/gen/up16x9-minmax-neonfp16arith-acc2.c",
4963    "src/f16-dwconv/gen/up16x9-minmax-neonfp16arith.c",
4964    "src/f16-dwconv/gen/up16x25-minmax-neonfp16arith-acc2.c",
4965    "src/f16-dwconv/gen/up16x25-minmax-neonfp16arith.c",
4966    "src/f16-dwconv/gen/up32x3-minmax-neonfp16arith-acc2.c",
4967    "src/f16-dwconv/gen/up32x3-minmax-neonfp16arith.c",
4968    "src/f16-dwconv/gen/up32x4-minmax-neonfp16arith-acc2.c",
4969    "src/f16-dwconv/gen/up32x4-minmax-neonfp16arith.c",
4970    "src/f16-dwconv/gen/up32x9-minmax-neonfp16arith-acc2.c",
4971    "src/f16-dwconv/gen/up32x9-minmax-neonfp16arith.c",
4972    "src/f16-dwconv/gen/up32x25-minmax-neonfp16arith-acc2.c",
4973    "src/f16-dwconv/gen/up32x25-minmax-neonfp16arith.c",
4974    "src/f16-gavgpool-cw/neonfp16arith-x4.c",
4975    "src/f16-gavgpool-cw/neonfp16arith-x8.c",
4976    "src/f16-gavgpool/gen/7p7x-minmax-neonfp16arith-c8.c",
4977    "src/f16-gavgpool/gen/7p7x-minmax-neonfp16arith-c16.c",
4978    "src/f16-gavgpool/gen/7p7x-minmax-neonfp16arith-c24.c",
4979    "src/f16-gavgpool/gen/7p7x-minmax-neonfp16arith-c32.c",
4980    "src/f16-gavgpool/gen/7x-minmax-neonfp16arith-c8.c",
4981    "src/f16-gavgpool/gen/7x-minmax-neonfp16arith-c16.c",
4982    "src/f16-gavgpool/gen/7x-minmax-neonfp16arith-c24.c",
4983    "src/f16-gavgpool/gen/7x-minmax-neonfp16arith-c32.c",
4984    "src/f16-gemm/gen-inc/1x8inc-minmax-neonfp16arith-ld64.c",
4985    "src/f16-gemm/gen-inc/1x16inc-minmax-neonfp16arith-ld64.c",
4986    "src/f16-gemm/gen-inc/4x8inc-minmax-neonfp16arith-ld64.c",
4987    "src/f16-gemm/gen-inc/4x16inc-minmax-neonfp16arith-ld64.c",
4988    "src/f16-gemm/gen-inc/6x8inc-minmax-neonfp16arith-ld64.c",
4989    "src/f16-gemm/gen-inc/6x16inc-minmax-neonfp16arith-ld64.c",
4990    "src/f16-gemm/gen-inc/8x8inc-minmax-neonfp16arith-ld64.c",
4991    "src/f16-gemm/gen-inc/8x16inc-minmax-neonfp16arith-ld64.c",
4992    "src/f16-gemm/gen/1x8-minmax-neonfp16arith-ld64.c",
4993    "src/f16-gemm/gen/1x16-minmax-neonfp16arith-ld64.c",
4994    "src/f16-gemm/gen/4x8-minmax-neonfp16arith-ld64.c",
4995    "src/f16-gemm/gen/4x16-minmax-neonfp16arith-ld64.c",
4996    "src/f16-gemm/gen/6x8-minmax-neonfp16arith-ld64.c",
4997    "src/f16-gemm/gen/6x16-minmax-neonfp16arith-ld64.c",
4998    "src/f16-gemm/gen/8x8-minmax-neonfp16arith-ld64.c",
4999    "src/f16-gemm/gen/8x16-minmax-neonfp16arith-ld64.c",
5000    "src/f16-ibilinear-chw/gen/neonfp16arith-p4.c",
5001    "src/f16-ibilinear-chw/gen/neonfp16arith-p8.c",
5002    "src/f16-ibilinear-chw/gen/neonfp16arith-p16.c",
5003    "src/f16-ibilinear/gen/neonfp16arith-c8.c",
5004    "src/f16-ibilinear/gen/neonfp16arith-c16.c",
5005    "src/f16-igemm/gen/1x8-minmax-neonfp16arith-ld64.c",
5006    "src/f16-igemm/gen/1x16-minmax-neonfp16arith-ld64.c",
5007    "src/f16-igemm/gen/4x8-minmax-neonfp16arith-ld64.c",
5008    "src/f16-igemm/gen/4x16-minmax-neonfp16arith-ld64.c",
5009    "src/f16-igemm/gen/6x8-minmax-neonfp16arith-ld64.c",
5010    "src/f16-igemm/gen/6x16-minmax-neonfp16arith-ld64.c",
5011    "src/f16-igemm/gen/8x8-minmax-neonfp16arith-ld64.c",
5012    "src/f16-igemm/gen/8x16-minmax-neonfp16arith-ld64.c",
5013    "src/f16-maxpool/9p8x-minmax-neonfp16arith-c8.c",
5014    "src/f16-pavgpool/9p8x-minmax-neonfp16arith-c8.c",
5015    "src/f16-pavgpool/9x-minmax-neonfp16arith-c8.c",
5016    "src/f16-prelu/gen/neonfp16arith-2x8.c",
5017    "src/f16-prelu/gen/neonfp16arith-2x16.c",
5018    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x32-acc2.c",
5019    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x32-acc4.c",
5020    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x32.c",
5021    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x40-acc2.c",
5022    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x40-acc5.c",
5023    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x40.c",
5024    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x48-acc2.c",
5025    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x48-acc3.c",
5026    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x48.c",
5027    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x64-acc2.c",
5028    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x64-acc4.c",
5029    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x64.c",
5030    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x72-acc3.c",
5031    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x72.c",
5032    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x80-acc2.c",
5033    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x80-acc5.c",
5034    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x80.c",
5035    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x96-acc2.c",
5036    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x96-acc3.c",
5037    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x96-acc6.c",
5038    "src/f16-raddstoreexpminusmax/gen/neonfp16arith-rr2-p2-x96.c",
5039    "src/f16-rmax/neonfp16arith.c",
5040    "src/f16-spmm/gen/8x1-minmax-neonfp16arith-x2.c",
5041    "src/f16-spmm/gen/8x1-minmax-neonfp16arith.c",
5042    "src/f16-spmm/gen/16x1-minmax-neonfp16arith-x2.c",
5043    "src/f16-spmm/gen/16x1-minmax-neonfp16arith.c",
5044    "src/f16-spmm/gen/24x1-minmax-neonfp16arith-x2.c",
5045    "src/f16-spmm/gen/24x1-minmax-neonfp16arith.c",
5046    "src/f16-spmm/gen/32x1-minmax-neonfp16arith-x2.c",
5047    "src/f16-spmm/gen/32x1-minmax-neonfp16arith.c",
5048    "src/f16-vbinary/gen/vadd-minmax-neonfp16arith-x8.c",
5049    "src/f16-vbinary/gen/vadd-minmax-neonfp16arith-x16.c",
5050    "src/f16-vbinary/gen/vaddc-minmax-neonfp16arith-x8.c",
5051    "src/f16-vbinary/gen/vaddc-minmax-neonfp16arith-x16.c",
5052    "src/f16-vbinary/gen/vmax-neonfp16arith-x8.c",
5053    "src/f16-vbinary/gen/vmax-neonfp16arith-x16.c",
5054    "src/f16-vbinary/gen/vmaxc-neonfp16arith-x8.c",
5055    "src/f16-vbinary/gen/vmaxc-neonfp16arith-x16.c",
5056    "src/f16-vbinary/gen/vmin-neonfp16arith-x8.c",
5057    "src/f16-vbinary/gen/vmin-neonfp16arith-x16.c",
5058    "src/f16-vbinary/gen/vminc-neonfp16arith-x8.c",
5059    "src/f16-vbinary/gen/vminc-neonfp16arith-x16.c",
5060    "src/f16-vbinary/gen/vmul-minmax-neonfp16arith-x8.c",
5061    "src/f16-vbinary/gen/vmul-minmax-neonfp16arith-x16.c",
5062    "src/f16-vbinary/gen/vmulc-minmax-neonfp16arith-x8.c",
5063    "src/f16-vbinary/gen/vmulc-minmax-neonfp16arith-x16.c",
5064    "src/f16-vbinary/gen/vrsubc-minmax-neonfp16arith-x8.c",
5065    "src/f16-vbinary/gen/vrsubc-minmax-neonfp16arith-x16.c",
5066    "src/f16-vbinary/gen/vsqrdiff-neonfp16arith-x8.c",
5067    "src/f16-vbinary/gen/vsqrdiff-neonfp16arith-x16.c",
5068    "src/f16-vbinary/gen/vsqrdiffc-neonfp16arith-x8.c",
5069    "src/f16-vbinary/gen/vsqrdiffc-neonfp16arith-x16.c",
5070    "src/f16-vbinary/gen/vsub-minmax-neonfp16arith-x8.c",
5071    "src/f16-vbinary/gen/vsub-minmax-neonfp16arith-x16.c",
5072    "src/f16-vbinary/gen/vsubc-minmax-neonfp16arith-x8.c",
5073    "src/f16-vbinary/gen/vsubc-minmax-neonfp16arith-x16.c",
5074    "src/f16-vclamp/gen/vclamp-neonfp16arith-x8.c",
5075    "src/f16-vclamp/gen/vclamp-neonfp16arith-x16.c",
5076    "src/f16-velu/gen/velu-neonfp16arith-rr1-p3-x8.c",
5077    "src/f16-velu/gen/velu-neonfp16arith-rr1-p3-x16.c",
5078    "src/f16-vhswish/gen/vhswish-neonfp16arith-x8.c",
5079    "src/f16-vhswish/gen/vhswish-neonfp16arith-x16.c",
5080    "src/f16-vlrelu/gen/vlrelu-neonfp16arith-x8.c",
5081    "src/f16-vlrelu/gen/vlrelu-neonfp16arith-x16.c",
5082    "src/f16-vmulcaddc/gen/c8-minmax-neonfp16arith-2x.c",
5083    "src/f16-vmulcaddc/gen/c16-minmax-neonfp16arith-2x.c",
5084    "src/f16-vrnd/gen/vrndd-neonfp16arith-x8.c",
5085    "src/f16-vrnd/gen/vrndd-neonfp16arith-x16.c",
5086    "src/f16-vrnd/gen/vrndne-neonfp16arith-x8.c",
5087    "src/f16-vrnd/gen/vrndne-neonfp16arith-x16.c",
5088    "src/f16-vrnd/gen/vrndu-neonfp16arith-x8.c",
5089    "src/f16-vrnd/gen/vrndu-neonfp16arith-x16.c",
5090    "src/f16-vrnd/gen/vrndz-neonfp16arith-x8.c",
5091    "src/f16-vrnd/gen/vrndz-neonfp16arith-x16.c",
5092    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x8.c",
5093    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x16.c",
5094    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x24.c",
5095    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x32.c",
5096    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x40.c",
5097    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x48.c",
5098    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x56.c",
5099    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1fma-x64.c",
5100    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x8.c",
5101    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x16.c",
5102    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x24.c",
5103    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x32.c",
5104    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x40.c",
5105    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x48.c",
5106    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x56.c",
5107    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-nr1recps-x64.c",
5108    "src/f16-vunary/gen/vabs-neonfp16arith-x8.c",
5109    "src/f16-vunary/gen/vabs-neonfp16arith-x16.c",
5110    "src/f16-vunary/gen/vneg-neonfp16arith-x8.c",
5111    "src/f16-vunary/gen/vneg-neonfp16arith-x16.c",
5112    "src/f16-vunary/gen/vsqr-neonfp16arith-x8.c",
5113    "src/f16-vunary/gen/vsqr-neonfp16arith-x16.c",
5114    "src/math/exp-f16-neonfp16arith-rr2-p3.c",
5115    "src/math/expminus-f16-neonfp16arith-rr1-p2.c",
5116    "src/math/expminus-f16-neonfp16arith-rr1-p3.c",
5117    "src/math/expminus-f16-neonfp16arith-rr2-p2.c",
5118    "src/math/expminus-f16-neonfp16arith-rr2-p3.c",
5119    "src/math/expm1minus-f16-neonfp16arith-rr1-p3.c",
5120    "src/math/expm1minus-f16-neonfp16arith-rr2-p3.c",
5121    "src/math/sigmoid-f16-neonfp16arith-rr2-p2-nr1fma.c",
5122    "src/math/sigmoid-f16-neonfp16arith-rr2-p2-nr1recps.c",
5123    "src/math/sigmoid-f16-neonfp16arith-rr2-p2-recpe.c",
5124    "src/math/sigmoid-f16-neonfp16arith-rr2-p3-nr1fma.c",
5125    "src/math/sigmoid-f16-neonfp16arith-rr2-p3-nr1recps.c",
5126    "src/math/sigmoid-f16-neonfp16arith-rr2-p3-recpe.c",
5127]
5128
// f16 micro-kernel sources tagged "neonfp16arith": conv-hwc2chw, dwconv2d-chw,
// the vector divide family (vdiv/vdivc/vrdivc) and vsqrt.
// Every path in this list also appears in
// ALL_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS.
// NOTE(review): the PROD_/AARCH64 prefixes suggest this is the production
// subset built only for arm64 targets -- confirm against the module that
// consumes this variable.
5129PROD_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS = [
5130    "src/f16-conv-hwc2chw/3x3s2p1c3x4-neonfp16arith-2x2.c",
5131    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-2x8.c",
5132    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-1x4.c",
5133    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-1x4.c",
5134    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-1x4.c",
5135    "src/f16-vbinary/gen/vdiv-minmax-neonfp16arith-x8.c",
5136    "src/f16-vbinary/gen/vdivc-minmax-neonfp16arith-x8.c",
5137    "src/f16-vbinary/gen/vrdivc-minmax-neonfp16arith-x8.c",
5138    "src/f16-vsqrt/gen/neonfp16arith-sqrt-x8.c",
5139]
5140
// Complete list of f16 "neonfp16arith" micro-kernel sources in this group.
// It contains every entry of PROD_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS plus
// further dwconv2d-chw tile/"-accN" variants, the x16 vdiv/vdivc/vrdivc and
// vsqrt kernels, the "-div" vsigmoid kernels and the matching
// src/math/sigmoid-f16-*-div.c files.
// NOTE(review): presumably restricted to arm64 builds (AARCH64 in the name) --
// confirm against the module that consumes this variable.
5141ALL_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS = [
5142    "src/f16-conv-hwc2chw/3x3s2p1c3x4-neonfp16arith-2x2.c",
5143    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-1x8-acc2.c",
5144    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-1x8-acc3.c",
5145    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-1x8-acc4.c",
5146    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-1x8.c",
5147    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-2x8-acc2.c",
5148    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-2x8.c",
5149    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-3x8.c",
5150    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-4x8.c",
5151    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-5x8.c",
5152    "src/f16-dwconv2d-chw/gen/3x3p1-minmax-neonfp16arith-6x8.c",
5153    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-1x4-acc2.c",
5154    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-1x4-acc3.c",
5155    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-1x4-acc4.c",
5156    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-1x4.c",
5157    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-2x4-acc2.c",
5158    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-2x4.c",
5159    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-3x4.c",
5160    "src/f16-dwconv2d-chw/gen/3x3s2p1-minmax-neonfp16arith-4x4.c",
5161    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-1x4-acc2.c",
5162    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-1x4-acc3.c",
5163    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-1x4-acc4.c",
5164    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-1x4-acc5.c",
5165    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-1x4.c",
5166    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-2x4-acc2.c",
5167    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-2x4-acc3.c",
5168    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-2x4.c",
5169    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-3x4-acc2.c",
5170    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-3x4.c",
5171    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-4x4-acc2.c",
5172    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-4x4.c",
5173    "src/f16-dwconv2d-chw/gen/5x5p2-minmax-neonfp16arith-5x4.c",
5174    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-1x4-acc2.c",
5175    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-1x4-acc3.c",
5176    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-1x4-acc4.c",
5177    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-1x4-acc5.c",
5178    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-1x4.c",
5179    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-2x4-acc2.c",
5180    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-2x4-acc3.c",
5181    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-2x4.c",
5182    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-3x4-acc2.c",
5183    "src/f16-dwconv2d-chw/gen/5x5s2p2-minmax-neonfp16arith-3x4.c",
5184    "src/f16-vbinary/gen/vdiv-minmax-neonfp16arith-x8.c",
5185    "src/f16-vbinary/gen/vdiv-minmax-neonfp16arith-x16.c",
5186    "src/f16-vbinary/gen/vdivc-minmax-neonfp16arith-x8.c",
5187    "src/f16-vbinary/gen/vdivc-minmax-neonfp16arith-x16.c",
5188    "src/f16-vbinary/gen/vrdivc-minmax-neonfp16arith-x8.c",
5189    "src/f16-vbinary/gen/vrdivc-minmax-neonfp16arith-x16.c",
5190    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x8.c",
5191    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x16.c",
5192    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x24.c",
5193    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x32.c",
5194    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x40.c",
5195    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x48.c",
5196    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x56.c",
5197    "src/f16-vsigmoid/gen/vsigmoid-neonfp16arith-rr2-p2-div-x64.c",
5198    "src/f16-vsqrt/gen/neonfp16arith-sqrt-x8.c",
5199    "src/f16-vsqrt/gen/neonfp16arith-sqrt-x16.c",
5200    "src/math/sigmoid-f16-neonfp16arith-rr1-p2-div.c",
5201    "src/math/sigmoid-f16-neonfp16arith-rr1-p3-div.c",
5202    "src/math/sigmoid-f16-neonfp16arith-rr2-p2-div.c",
5203    "src/math/sigmoid-f16-neonfp16arith-rr2-p3-div.c",
5204]
5205
// Empty list: no "neonbf16" sources are selected under the PROD_ name, while
// ALL_NEONBF16_MICROKERNEL_SRCS below is populated.
// NOTE(review): presumably defined so every kernel group exposes both a PROD_
// and an ALL_ variable -- confirm against the modules that reference it.
5206PROD_NEONBF16_MICROKERNEL_SRCS = [
5207]
5208
// Complete list of "neonbf16" micro-kernel sources. All entries are generated
// bf16-gemm kernels in three flavours visible in the file names: "bfdot",
// "bfmlal" and "bfdot-lane-ld128".
// NOTE(review): the flavour names look like the Arm BF16 instructions the
// kernels are built on -- confirm in the kernel sources.
5209ALL_NEONBF16_MICROKERNEL_SRCS = [
5210    "src/bf16-gemm/gen/1x4c8-minmax-neonbf16-bfdot.c",
5211    "src/bf16-gemm/gen/1x4c8-minmax-neonbf16-bfmlal.c",
5212    "src/bf16-gemm/gen/1x8c2-minmax-neonbf16-bfdot-lane-ld128.c",
5213    "src/bf16-gemm/gen/2x4c8-minmax-neonbf16-bfdot.c",
5214    "src/bf16-gemm/gen/2x4c8-minmax-neonbf16-bfmlal.c",
5215    "src/bf16-gemm/gen/3x4c8-minmax-neonbf16-bfdot.c",
5216    "src/bf16-gemm/gen/3x4c8-minmax-neonbf16-bfmlal.c",
5217    "src/bf16-gemm/gen/4x4c8-minmax-neonbf16-bfdot.c",
5218    "src/bf16-gemm/gen/4x4c8-minmax-neonbf16-bfmlal.c",
5219    "src/bf16-gemm/gen/4x8c2-minmax-neonbf16-bfdot-lane-ld128.c",
5220    "src/bf16-gemm/gen/5x4c8-minmax-neonbf16-bfdot.c",
5221    "src/bf16-gemm/gen/5x4c8-minmax-neonbf16-bfmlal.c",
5222    "src/bf16-gemm/gen/5x8c2-minmax-neonbf16-bfdot-lane-ld128.c",
5223    "src/bf16-gemm/gen/6x8c2-minmax-neonbf16-bfdot-lane-ld128.c",
5224]
5225
// Empty list: no AArch64-specific "neonbf16" sources are selected under the
// PROD_ name.
// NOTE(review): presumably a placeholder kept for symmetry with the other
// PROD_/ALL_ variable pairs -- confirm against the modules that reference it.
5226PROD_AARCH64_NEONBF16_MICROKERNEL_SRCS = [
5227]
5228
// Empty list: there are currently no AArch64-specific "neonbf16" sources in
// the ALL_ set either.
// NOTE(review): presumably a placeholder kept for symmetry with the other
// PROD_/ALL_ variable pairs -- confirm against the modules that reference it.
5229ALL_AARCH64_NEONBF16_MICROKERNEL_SRCS = [
5230]
5231
// "neondot" GEMM and IGEMM micro-kernel sources for the qc8, qs8 and qu8
// kernel families. Each family lists the same four tile shapes (1x8c4, 1x16c4,
// 4x8c4, 4x16c4); the qc8 entries are the "fp32" variants and the qs8/qu8
// entries are the "rndnu" variants.
// Every path in this list also appears in ALL_NEONDOT_MICROKERNEL_SRCS.
// NOTE(review): the PROD_ prefix suggests this is the subset shipped in
// production builds -- confirm against the module that consumes this variable.
5232PROD_NEONDOT_MICROKERNEL_SRCS = [
5233    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neondot.c",
5234    "src/qc8-gemm/gen/1x16c4-minmax-fp32-neondot.c",
5235    "src/qc8-gemm/gen/4x8c4-minmax-fp32-neondot.c",
5236    "src/qc8-gemm/gen/4x16c4-minmax-fp32-neondot.c",
5237    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neondot.c",
5238    "src/qc8-igemm/gen/1x16c4-minmax-fp32-neondot.c",
5239    "src/qc8-igemm/gen/4x8c4-minmax-fp32-neondot.c",
5240    "src/qc8-igemm/gen/4x16c4-minmax-fp32-neondot.c",
5241    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neondot.c",
5242    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neondot.c",
5243    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neondot.c",
5244    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neondot.c",
5245    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neondot.c",
5246    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neondot.c",
5247    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neondot.c",
5248    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neondot.c",
5249    "src/qu8-gemm/gen/1x8c4-minmax-rndnu-neondot.c",
5250    "src/qu8-gemm/gen/1x16c4-minmax-rndnu-neondot.c",
5251    "src/qu8-gemm/gen/4x8c4-minmax-rndnu-neondot.c",
5252    "src/qu8-gemm/gen/4x16c4-minmax-rndnu-neondot.c",
5253    "src/qu8-igemm/gen/1x8c4-minmax-rndnu-neondot.c",
5254    "src/qu8-igemm/gen/1x16c4-minmax-rndnu-neondot.c",
5255    "src/qu8-igemm/gen/4x8c4-minmax-rndnu-neondot.c",
5256    "src/qu8-igemm/gen/4x16c4-minmax-rndnu-neondot.c",
5257]
5258
// Complete list of "neondot" GEMM and IGEMM micro-kernel sources for the qc8,
// qs8 and qu8 kernel families. It contains every entry of
// PROD_NEONDOT_MICROKERNEL_SRCS plus additional tile shapes (for example the
// 6x and 8x row counts, and the qu8 2x/3x/5x and x32c4 tiles) and a few extra
// "fp32" variants for qs8 and qu8.
5259ALL_NEONDOT_MICROKERNEL_SRCS = [
5260    "src/qc8-gemm/gen/1x8c4-minmax-fp32-neondot.c",
5261    "src/qc8-gemm/gen/1x16c4-minmax-fp32-neondot.c",
5262    "src/qc8-gemm/gen/4x8c4-minmax-fp32-neondot.c",
5263    "src/qc8-gemm/gen/4x16c4-minmax-fp32-neondot.c",
5264    "src/qc8-gemm/gen/6x8c4-minmax-fp32-neondot.c",
5265    "src/qc8-gemm/gen/6x16c4-minmax-fp32-neondot.c",
5266    "src/qc8-gemm/gen/8x8c4-minmax-fp32-neondot.c",
5267    "src/qc8-gemm/gen/8x16c4-minmax-fp32-neondot.c",
5268    "src/qc8-igemm/gen/1x8c4-minmax-fp32-neondot.c",
5269    "src/qc8-igemm/gen/1x16c4-minmax-fp32-neondot.c",
5270    "src/qc8-igemm/gen/4x8c4-minmax-fp32-neondot.c",
5271    "src/qc8-igemm/gen/4x16c4-minmax-fp32-neondot.c",
5272    "src/qc8-igemm/gen/6x8c4-minmax-fp32-neondot.c",
5273    "src/qc8-igemm/gen/6x16c4-minmax-fp32-neondot.c",
5274    "src/qc8-igemm/gen/8x8c4-minmax-fp32-neondot.c",
5275    "src/qc8-igemm/gen/8x16c4-minmax-fp32-neondot.c",
5276    "src/qs8-gemm/gen/1x8c4-minmax-fp32-neondot.c",
5277    "src/qs8-gemm/gen/1x8c4-minmax-rndnu-neondot.c",
5278    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-neondot.c",
5279    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-neondot.c",
5280    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-neondot.c",
5281    "src/qs8-gemm/gen/6x8c4-minmax-rndnu-neondot.c",
5282    "src/qs8-gemm/gen/6x16c4-minmax-rndnu-neondot.c",
5283    "src/qs8-gemm/gen/8x8c4-minmax-rndnu-neondot.c",
5284    "src/qs8-gemm/gen/8x16c4-minmax-rndnu-neondot.c",
5285    "src/qs8-igemm/gen/1x8c4-minmax-fp32-neondot.c",
5286    "src/qs8-igemm/gen/1x8c4-minmax-rndnu-neondot.c",
5287    "src/qs8-igemm/gen/1x16c4-minmax-rndnu-neondot.c",
5288    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-neondot.c",
5289    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-neondot.c",
5290    "src/qs8-igemm/gen/6x8c4-minmax-rndnu-neondot.c",
5291    "src/qs8-igemm/gen/6x16c4-minmax-rndnu-neondot.c",
5292    "src/qs8-igemm/gen/8x8c4-minmax-rndnu-neondot.c",
5293    "src/qs8-igemm/gen/8x16c4-minmax-rndnu-neondot.c",
5294    "src/qu8-gemm/gen/1x8c4-minmax-rndnu-neondot.c",
5295    "src/qu8-gemm/gen/1x16c4-minmax-fp32-neondot.c",
5296    "src/qu8-gemm/gen/1x16c4-minmax-rndnu-neondot.c",
5297    "src/qu8-gemm/gen/1x32c4-minmax-rndnu-neondot.c",
5298    "src/qu8-gemm/gen/2x8c4-minmax-rndnu-neondot.c",
5299    "src/qu8-gemm/gen/2x16c4-minmax-fp32-neondot.c",
5300    "src/qu8-gemm/gen/2x16c4-minmax-rndnu-neondot.c",
5301    "src/qu8-gemm/gen/2x32c4-minmax-rndnu-neondot.c",
5302    "src/qu8-gemm/gen/3x8c4-minmax-rndnu-neondot.c",
5303    "src/qu8-gemm/gen/3x16c4-minmax-rndnu-neondot.c",
5304    "src/qu8-gemm/gen/3x32c4-minmax-rndnu-neondot.c",
5305    "src/qu8-gemm/gen/4x8c4-minmax-rndnu-neondot.c",
5306    "src/qu8-gemm/gen/4x16c4-minmax-fp32-neondot.c",
5307    "src/qu8-gemm/gen/4x16c4-minmax-rndnu-neondot.c",
5308    "src/qu8-gemm/gen/5x8c4-minmax-rndnu-neondot.c",
5309    "src/qu8-gemm/gen/5x16c4-minmax-rndnu-neondot.c",
5310    "src/qu8-gemm/gen/6x8c4-minmax-rndnu-neondot.c",
5311    "src/qu8-gemm/gen/6x16c4-minmax-rndnu-neondot.c",
5312    "src/qu8-gemm/gen/8x8c4-minmax-rndnu-neondot.c",
5313    "src/qu8-gemm/gen/8x16c4-minmax-rndnu-neondot.c",
5314    "src/qu8-igemm/gen/1x8c4-minmax-rndnu-neondot.c",
5315    "src/qu8-igemm/gen/1x16c4-minmax-fp32-neondot.c",
5316    "src/qu8-igemm/gen/1x16c4-minmax-rndnu-neondot.c",
5317    "src/qu8-igemm/gen/1x32c4-minmax-rndnu-neondot.c",
5318    "src/qu8-igemm/gen/2x8c4-minmax-rndnu-neondot.c",
5319    "src/qu8-igemm/gen/2x16c4-minmax-fp32-neondot.c",
5320    "src/qu8-igemm/gen/2x16c4-minmax-rndnu-neondot.c",
5321    "src/qu8-igemm/gen/2x32c4-minmax-rndnu-neondot.c",
5322    "src/qu8-igemm/gen/3x8c4-minmax-rndnu-neondot.c",
5323    "src/qu8-igemm/gen/3x16c4-minmax-rndnu-neondot.c",
5324    "src/qu8-igemm/gen/3x32c4-minmax-rndnu-neondot.c",
5325    "src/qu8-igemm/gen/4x8c4-minmax-rndnu-neondot.c",
5326    "src/qu8-igemm/gen/4x16c4-minmax-fp32-neondot.c",
5327    "src/qu8-igemm/gen/4x16c4-minmax-rndnu-neondot.c",
5328    "src/qu8-igemm/gen/5x8c4-minmax-rndnu-neondot.c",
5329    "src/qu8-igemm/gen/5x16c4-minmax-rndnu-neondot.c",
5330    "src/qu8-igemm/gen/6x8c4-minmax-rndnu-neondot.c",
5331    "src/qu8-igemm/gen/6x16c4-minmax-rndnu-neondot.c",
5332    "src/qu8-igemm/gen/8x8c4-minmax-rndnu-neondot.c",
5333    "src/qu8-igemm/gen/8x16c4-minmax-rndnu-neondot.c",
5334]
5335
// "sse" micro-kernel sources: one selected variant per f32 kernel family
// (pooling, dwconv, gemm/igemm, ibilinear, spmm, vbinary, vunary, ...) plus the
// x32 packx and transposec kernels.
// Every path in this list also appears in ALL_SSE_MICROKERNEL_SRCS.
// NOTE(review): the PROD_ prefix suggests this is the subset shipped in
// production builds -- confirm against the module that consumes this variable.
5336PROD_SSE_MICROKERNEL_SRCS = [
5337    "src/f32-avgpool/9p8x-minmax-sse-c4.c",
5338    "src/f32-avgpool/9x-minmax-sse-c4.c",
5339    "src/f32-conv-hwc2chw/3x3s2p1c3x4-sse-2x2.c",
5340    "src/f32-dwconv/gen/up8x3-minmax-sse.c",
5341    "src/f32-dwconv/gen/up8x4-minmax-sse.c",
5342    "src/f32-dwconv/gen/up8x9-minmax-sse.c",
5343    "src/f32-dwconv/gen/up8x25-minmax-sse.c",
5344    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-2x4-acc2.c",
5345    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-1x4-acc3.c",
5346    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-4x4.c",
5347    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-2x4.c",
5348    "src/f32-gavgpool-cw/sse-x4.c",
5349    "src/f32-gavgpool/7p7x-minmax-sse-c4.c",
5350    "src/f32-gavgpool/7x-minmax-sse-c4.c",
5351    "src/f32-gemm/gen/1x8-minmax-sse-load1.c",
5352    "src/f32-gemm/gen/4x2c4-minmax-sse.c",
5353    "src/f32-gemm/gen/4x8-minmax-sse-load1.c",
5354    "src/f32-ibilinear-chw/gen/sse-p8.c",
5355    "src/f32-ibilinear/gen/sse-c8.c",
5356    "src/f32-igemm/gen/1x8-minmax-sse-load1.c",
5357    "src/f32-igemm/gen/4x2c4-minmax-sse.c",
5358    "src/f32-igemm/gen/4x8-minmax-sse-load1.c",
5359    "src/f32-maxpool/9p8x-minmax-sse-c4.c",
5360    "src/f32-pavgpool/9p8x-minmax-sse-c4.c",
5361    "src/f32-pavgpool/9x-minmax-sse-c4.c",
5362    "src/f32-rmax/sse.c",
5363    "src/f32-spmm/gen/32x1-minmax-sse.c",
5364    "src/f32-vbinary/gen/vadd-minmax-sse-x8.c",
5365    "src/f32-vbinary/gen/vaddc-minmax-sse-x8.c",
5366    "src/f32-vbinary/gen/vdiv-minmax-sse-x8.c",
5367    "src/f32-vbinary/gen/vdivc-minmax-sse-x8.c",
5368    "src/f32-vbinary/gen/vmax-sse-x8.c",
5369    "src/f32-vbinary/gen/vmaxc-sse-x8.c",
5370    "src/f32-vbinary/gen/vmin-sse-x8.c",
5371    "src/f32-vbinary/gen/vminc-sse-x8.c",
5372    "src/f32-vbinary/gen/vmul-minmax-sse-x8.c",
5373    "src/f32-vbinary/gen/vmulc-minmax-sse-x8.c",
5374    "src/f32-vbinary/gen/vrdivc-minmax-sse-x8.c",
5375    "src/f32-vbinary/gen/vrsubc-minmax-sse-x8.c",
5376    "src/f32-vbinary/gen/vsqrdiff-sse-x8.c",
5377    "src/f32-vbinary/gen/vsqrdiffc-sse-x8.c",
5378    "src/f32-vbinary/gen/vsub-minmax-sse-x8.c",
5379    "src/f32-vbinary/gen/vsubc-minmax-sse-x8.c",
5380    "src/f32-vclamp/gen/vclamp-sse-x8.c",
5381    "src/f32-vhswish/gen/vhswish-sse-x8.c",
5382    "src/f32-vlrelu/gen/vlrelu-sse-x8.c",
5383    "src/f32-vmulcaddc/gen/c4-minmax-sse-2x.c",
5384    "src/f32-vsqrt/gen/sse-sqrt-x4.c",
5385    "src/f32-vunary/gen/vabs-sse-x8.c",
5386    "src/f32-vunary/gen/vneg-sse-x8.c",
5387    "src/f32-vunary/gen/vsqr-sse-x8.c",
5388    "src/x32-packx/x4-sse.c",
5389    "src/x32-transposec/4x4-sse.c",
5390]
5391
// Complete list of "sse" micro-kernel sources. It contains every entry of
// PROD_SSE_MICROKERNEL_SRCS plus the remaining tile sizes and "-accN"/"-dup"/
// "s4" variants of the same f32 kernel families, the gen-inc GEMM kernels, the
// f32-ppmm, f32-prelu and f32-vrelu kernels, and the src/math round*/sqrt
// reference files.
5392ALL_SSE_MICROKERNEL_SRCS = [
5393    "src/f32-avgpool/9p8x-minmax-sse-c4.c",
5394    "src/f32-avgpool/9x-minmax-sse-c4.c",
5395    "src/f32-conv-hwc2chw/3x3s2p1c3x4-sse-1x1.c",
5396    "src/f32-conv-hwc2chw/3x3s2p1c3x4-sse-2x2.c",
5397    "src/f32-dwconv/gen/up4x3-minmax-sse-acc2.c",
5398    "src/f32-dwconv/gen/up4x3-minmax-sse.c",
5399    "src/f32-dwconv/gen/up4x4-minmax-sse-acc2.c",
5400    "src/f32-dwconv/gen/up4x4-minmax-sse.c",
5401    "src/f32-dwconv/gen/up4x9-minmax-sse-acc2.c",
5402    "src/f32-dwconv/gen/up4x9-minmax-sse.c",
5403    "src/f32-dwconv/gen/up4x25-minmax-sse-acc2.c",
5404    "src/f32-dwconv/gen/up4x25-minmax-sse.c",
5405    "src/f32-dwconv/gen/up8x3-minmax-sse-acc2.c",
5406    "src/f32-dwconv/gen/up8x3-minmax-sse.c",
5407    "src/f32-dwconv/gen/up8x4-minmax-sse-acc2.c",
5408    "src/f32-dwconv/gen/up8x4-minmax-sse.c",
5409    "src/f32-dwconv/gen/up8x9-minmax-sse-acc2.c",
5410    "src/f32-dwconv/gen/up8x9-minmax-sse.c",
5411    "src/f32-dwconv/gen/up8x25-minmax-sse-acc2.c",
5412    "src/f32-dwconv/gen/up8x25-minmax-sse.c",
5413    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-1x4-acc2.c",
5414    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-1x4-acc3.c",
5415    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-1x4-acc4.c",
5416    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-1x4.c",
5417    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-2x4-acc2.c",
5418    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-2x4.c",
5419    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-3x4.c",
5420    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-4x4.c",
5421    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-5x4.c",
5422    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-sse-6x4.c",
5423    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-1x4-acc2.c",
5424    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-1x4-acc3.c",
5425    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-1x4-acc4.c",
5426    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-1x4.c",
5427    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-2x4-acc2.c",
5428    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-2x4.c",
5429    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-3x4.c",
5430    "src/f32-dwconv2d-chw/gen/3x3s2p1-minmax-sse-4x4.c",
5431    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-1x4-acc2.c",
5432    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-1x4-acc3.c",
5433    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-1x4-acc4.c",
5434    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-1x4-acc5.c",
5435    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-1x4.c",
5436    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-2x4-acc2.c",
5437    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-2x4-acc3.c",
5438    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-2x4.c",
5439    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-3x4-acc2.c",
5440    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-3x4.c",
5441    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-4x4-acc2.c",
5442    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-4x4.c",
5443    "src/f32-dwconv2d-chw/gen/5x5p2-minmax-sse-5x4.c",
5444    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-1x4-acc2.c",
5445    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-1x4-acc3.c",
5446    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-1x4-acc4.c",
5447    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-1x4-acc5.c",
5448    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-1x4.c",
5449    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-2x4-acc2.c",
5450    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-2x4-acc3.c",
5451    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-2x4.c",
5452    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-3x4-acc2.c",
5453    "src/f32-dwconv2d-chw/gen/5x5s2p2-minmax-sse-3x4.c",
5454    "src/f32-gavgpool-cw/sse-x4.c",
5455    "src/f32-gavgpool/7p7x-minmax-sse-c4.c",
5456    "src/f32-gavgpool/7x-minmax-sse-c4.c",
5457    "src/f32-gemm/gen-inc/1x8inc-minmax-sse-dup.c",
5458    "src/f32-gemm/gen-inc/1x8inc-minmax-sse-load1.c",
5459    "src/f32-gemm/gen-inc/1x8s4inc-minmax-sse.c",
5460    "src/f32-gemm/gen-inc/3x8inc-minmax-sse-dup.c",
5461    "src/f32-gemm/gen-inc/3x8inc-minmax-sse-load1.c",
5462    "src/f32-gemm/gen-inc/3x8s4inc-minmax-sse.c",
5463    "src/f32-gemm/gen-inc/4x8inc-minmax-sse-dup.c",
5464    "src/f32-gemm/gen-inc/4x8inc-minmax-sse-load1.c",
5465    "src/f32-gemm/gen-inc/4x8s4inc-minmax-sse.c",
5466    "src/f32-gemm/gen-inc/5x8inc-minmax-sse-dup.c",
5467    "src/f32-gemm/gen-inc/5x8inc-minmax-sse-load1.c",
5468    "src/f32-gemm/gen-inc/5x8s4inc-minmax-sse.c",
5469    "src/f32-gemm/gen/1x8-minmax-sse-dup.c",
5470    "src/f32-gemm/gen/1x8-minmax-sse-load1.c",
5471    "src/f32-gemm/gen/1x8s4-minmax-sse.c",
5472    "src/f32-gemm/gen/3x8-minmax-sse-dup.c",
5473    "src/f32-gemm/gen/3x8-minmax-sse-load1.c",
5474    "src/f32-gemm/gen/3x8s4-minmax-sse.c",
5475    "src/f32-gemm/gen/4x2c4-minmax-sse.c",
5476    "src/f32-gemm/gen/4x8-minmax-sse-dup.c",
5477    "src/f32-gemm/gen/4x8-minmax-sse-load1.c",
5478    "src/f32-gemm/gen/4x8s4-minmax-sse.c",
5479    "src/f32-gemm/gen/5x8-minmax-sse-dup.c",
5480    "src/f32-gemm/gen/5x8-minmax-sse-load1.c",
5481    "src/f32-gemm/gen/5x8s4-minmax-sse.c",
5482    "src/f32-ibilinear-chw/gen/sse-p4.c",
5483    "src/f32-ibilinear-chw/gen/sse-p8.c",
5484    "src/f32-ibilinear/gen/sse-c4.c",
5485    "src/f32-ibilinear/gen/sse-c8.c",
5486    "src/f32-igemm/gen/1x8-minmax-sse-dup.c",
5487    "src/f32-igemm/gen/1x8-minmax-sse-load1.c",
5488    "src/f32-igemm/gen/1x8s4-minmax-sse.c",
5489    "src/f32-igemm/gen/3x8-minmax-sse-dup.c",
5490    "src/f32-igemm/gen/3x8-minmax-sse-load1.c",
5491    "src/f32-igemm/gen/3x8s4-minmax-sse.c",
5492    "src/f32-igemm/gen/4x2c4-minmax-sse.c",
5493    "src/f32-igemm/gen/4x8-minmax-sse-dup.c",
5494    "src/f32-igemm/gen/4x8-minmax-sse-load1.c",
5495    "src/f32-igemm/gen/4x8s4-minmax-sse.c",
5496    "src/f32-igemm/gen/5x8-minmax-sse-dup.c",
5497    "src/f32-igemm/gen/5x8-minmax-sse-load1.c",
5498    "src/f32-igemm/gen/5x8s4-minmax-sse.c",
5499    "src/f32-maxpool/9p8x-minmax-sse-c4.c",
5500    "src/f32-pavgpool/9p8x-minmax-sse-c4.c",
5501    "src/f32-pavgpool/9x-minmax-sse-c4.c",
5502    "src/f32-ppmm/gen/4x8-minmax-sse.c",
5503    "src/f32-prelu/gen/sse-2x4.c",
5504    "src/f32-prelu/gen/sse-2x8.c",
5505    "src/f32-rmax/sse.c",
5506    "src/f32-spmm/gen/4x1-minmax-sse.c",
5507    "src/f32-spmm/gen/8x1-minmax-sse.c",
5508    "src/f32-spmm/gen/16x1-minmax-sse.c",
5509    "src/f32-spmm/gen/32x1-minmax-sse.c",
5510    "src/f32-vbinary/gen/vadd-minmax-sse-x4.c",
5511    "src/f32-vbinary/gen/vadd-minmax-sse-x8.c",
5512    "src/f32-vbinary/gen/vaddc-minmax-sse-x4.c",
5513    "src/f32-vbinary/gen/vaddc-minmax-sse-x8.c",
5514    "src/f32-vbinary/gen/vdiv-minmax-sse-x4.c",
5515    "src/f32-vbinary/gen/vdiv-minmax-sse-x8.c",
5516    "src/f32-vbinary/gen/vdivc-minmax-sse-x4.c",
5517    "src/f32-vbinary/gen/vdivc-minmax-sse-x8.c",
5518    "src/f32-vbinary/gen/vmax-sse-x4.c",
5519    "src/f32-vbinary/gen/vmax-sse-x8.c",
5520    "src/f32-vbinary/gen/vmaxc-sse-x4.c",
5521    "src/f32-vbinary/gen/vmaxc-sse-x8.c",
5522    "src/f32-vbinary/gen/vmin-sse-x4.c",
5523    "src/f32-vbinary/gen/vmin-sse-x8.c",
5524    "src/f32-vbinary/gen/vminc-sse-x4.c",
5525    "src/f32-vbinary/gen/vminc-sse-x8.c",
5526    "src/f32-vbinary/gen/vmul-minmax-sse-x4.c",
5527    "src/f32-vbinary/gen/vmul-minmax-sse-x8.c",
5528    "src/f32-vbinary/gen/vmulc-minmax-sse-x4.c",
5529    "src/f32-vbinary/gen/vmulc-minmax-sse-x8.c",
5530    "src/f32-vbinary/gen/vrdivc-minmax-sse-x4.c",
5531    "src/f32-vbinary/gen/vrdivc-minmax-sse-x8.c",
5532    "src/f32-vbinary/gen/vrsubc-minmax-sse-x4.c",
5533    "src/f32-vbinary/gen/vrsubc-minmax-sse-x8.c",
5534    "src/f32-vbinary/gen/vsqrdiff-sse-x4.c",
5535    "src/f32-vbinary/gen/vsqrdiff-sse-x8.c",
5536    "src/f32-vbinary/gen/vsqrdiffc-sse-x4.c",
5537    "src/f32-vbinary/gen/vsqrdiffc-sse-x8.c",
5538    "src/f32-vbinary/gen/vsub-minmax-sse-x4.c",
5539    "src/f32-vbinary/gen/vsub-minmax-sse-x8.c",
5540    "src/f32-vbinary/gen/vsubc-minmax-sse-x4.c",
5541    "src/f32-vbinary/gen/vsubc-minmax-sse-x8.c",
5542    "src/f32-vclamp/gen/vclamp-sse-x4.c",
5543    "src/f32-vclamp/gen/vclamp-sse-x8.c",
5544    "src/f32-vhswish/gen/vhswish-sse-x4.c",
5545    "src/f32-vhswish/gen/vhswish-sse-x8.c",
5546    "src/f32-vlrelu/gen/vlrelu-sse-x4.c",
5547    "src/f32-vlrelu/gen/vlrelu-sse-x8.c",
5548    "src/f32-vmulcaddc/gen/c4-minmax-sse-2x.c",
5549    "src/f32-vmulcaddc/gen/c8-minmax-sse-2x.c",
5550    "src/f32-vrelu/gen/vrelu-sse-x4.c",
5551    "src/f32-vrelu/gen/vrelu-sse-x8.c",
5552    "src/f32-vsqrt/gen/sse-sqrt-x4.c",
5553    "src/f32-vsqrt/gen/sse-sqrt-x8.c",
5554    "src/f32-vunary/gen/vabs-sse-x4.c",
5555    "src/f32-vunary/gen/vabs-sse-x8.c",
5556    "src/f32-vunary/gen/vneg-sse-x4.c",
5557    "src/f32-vunary/gen/vneg-sse-x8.c",
5558    "src/f32-vunary/gen/vsqr-sse-x4.c",
5559    "src/f32-vunary/gen/vsqr-sse-x8.c",
5560    "src/math/roundd-sse-addsub.c",
5561    "src/math/roundne-sse-addsub.c",
5562    "src/math/roundu-sse-addsub.c",
5563    "src/math/roundz-sse-addsub.c",
5564    "src/math/sqrt-sse-hh1mac.c",
5565    "src/math/sqrt-sse-nr1mac.c",
5566    "src/math/sqrt-sse-nr2mac.c",
5567    "src/x32-packx/x4-sse.c",
5568    "src/x32-transposec/4x4-sse.c",
5569]
5570
// "sse2" micro-kernel sources spanning the f16, f32, qc8, qs8, qu8, s8, u8,
// xx, x8, x16 and x32 kernel families (conversions, quantized gemm/igemm and
// dwconv, pooling, element-wise ops, fill/pad, transpose and zip).
// NOTE(review): the PROD_ prefix suggests this is the subset shipped in
// production builds, with ALL_SSE2_MICROKERNEL_SRCS as the presumed superset
// -- confirm against the module that consumes this variable.
5571PROD_SSE2_MICROKERNEL_SRCS = [
5572    "src/f16-f32-vcvt/gen/vcvt-sse2-int16-x32.c",
5573    "src/f16-vunary/gen/vabs-sse2-x16.c",
5574    "src/f16-vunary/gen/vneg-sse2-x16.c",
5575    "src/f32-argmaxpool/4x-sse2-c4.c",
5576    "src/f32-argmaxpool/9p8x-sse2-c4.c",
5577    "src/f32-argmaxpool/9x-sse2-c4.c",
5578    "src/f32-f16-vcvt/gen/vcvt-sse2-x16.c",
5579    "src/f32-prelu/gen/sse2-2x8.c",
5580    "src/f32-qs8-vcvt/gen/vcvt-sse2-x32.c",
5581    "src/f32-qu8-vcvt/gen/vcvt-sse2-x32.c",
5582    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x20-acc2.c",
5583    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x12.c",
5584    "src/f32-vlrelu/gen/vlrelu-sse2-x8.c",
5585    "src/f32-vrnd/gen/vrndd-sse2-x8.c",
5586    "src/f32-vrnd/gen/vrndne-sse2-x8.c",
5587    "src/f32-vrnd/gen/vrndu-sse2-x8.c",
5588    "src/f32-vrnd/gen/vrndz-sse2-x8.c",
5589    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x8.c",
5590    "src/qc8-dwconv/gen/up8x3-minmax-fp32-sse2-mul16.c",
5591    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c",
5592    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c",
5593    "src/qc8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5594    "src/qc8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5595    "src/qc8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5596    "src/qc8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5597    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16-add16.c",
5598    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16-add16.c",
5599    "src/qs8-f32-vcvt/gen/vcvt-sse2-x32.c",
5600    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse2-c8.c",
5601    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse2-c8.c",
5602    "src/qs8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5603    "src/qs8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5604    "src/qs8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5605    "src/qs8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5606    "src/qs8-vadd/gen/minmax-sse2-mul16-ld64-x8.c",
5607    "src/qs8-vaddc/gen/minmax-sse2-mul16-ld64-x8.c",
5608    "src/qs8-vcvt/gen/vcvt-sse2-x32.c",
5609    "src/qs8-vlrelu/gen/vlrelu-sse2-x32.c",
5610    "src/qs8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5611    "src/qs8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5612    "src/qu8-avgpool/9p8x-minmax-sse2-c8.c",
5613    "src/qu8-avgpool/9x-minmax-sse2-c8.c",
5614    "src/qu8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c",
5615    "src/qu8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c",
5616    "src/qu8-f32-vcvt/gen/vcvt-sse2-x32.c",
5617    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse2-c8.c",
5618    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse2-c8.c",
5619    "src/qu8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5620    "src/qu8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5621    "src/qu8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5622    "src/qu8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5623    "src/qu8-vadd/gen/minmax-sse2-mul16-ld64-x8.c",
5624    "src/qu8-vaddc/gen/minmax-sse2-mul16-ld64-x8.c",
5625    "src/qu8-vcvt/gen/vcvt-sse2-x32.c",
5626    "src/qu8-vlrelu/gen/vlrelu-sse2-x32.c",
5627    "src/qu8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5628    "src/qu8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5629    "src/s8-ibilinear/gen/sse2-c8.c",
5630    "src/s8-maxpool/9p8x-minmax-sse2-c16.c",
5631    "src/s8-vclamp/sse2-x64.c",
5632    "src/u8-ibilinear/gen/sse2-c8.c",
5633    "src/u8-maxpool/9p8x-minmax-sse2-c16.c",
5634    "src/u8-rmax/sse2.c",
5635    "src/u8-vclamp/sse2-x64.c",
5636    "src/xx-fill/sse2-x64.c",
5637    "src/xx-pad/sse2.c",
5638    "src/x8-transposec/gen/16x16-reuse-mov-sse2.c",
5639    "src/x8-zip/xm-sse2.c",
5640    "src/x8-zip/x2-sse2.c",
5641    "src/x8-zip/x3-sse2.c",
5642    "src/x8-zip/x4-sse2.c",
5643    "src/x16-transposec/gen/8x8-reuse-multi-sse2.c",
5644    "src/x32-unpool/sse2.c",
5645    "src/x32-zip/xm-sse2.c",
5646    "src/x32-zip/x2-sse2.c",
5647    "src/x32-zip/x3-sse2.c",
5648    "src/x32-zip/x4-sse2.c",
5649]
5650
// SSE2 microkernel source files, listed by kernel-family directory under src/
// (f16-f32-vcvt, f32-gemm, f32-velu, qc8-*, qs8-*, qu8-*, x8-zip, x32-zip,
// *-transposec, ...). Besides the per-family kernel files, the list also
// carries the src/math/*-sse2* files and the qs8/qu8 requantization files.
// NOTE(review): the "ALL" prefix presumably marks the complete SSE2 set, as
// opposed to the smaller PROD_* lists in this file (e.g.
// PROD_SSSE3_MICROKERNEL_SRCS) - confirm against the modules that consume
// this variable.
5651ALL_SSE2_MICROKERNEL_SRCS = [
5652    "src/f16-f32-vcvt/gen/vcvt-sse2-int16-x8.c",
5653    "src/f16-f32-vcvt/gen/vcvt-sse2-int16-x16.c",
5654    "src/f16-f32-vcvt/gen/vcvt-sse2-int16-x24.c",
5655    "src/f16-f32-vcvt/gen/vcvt-sse2-int16-x32.c",
5656    "src/f16-f32-vcvt/gen/vcvt-sse2-int32-x8.c",
5657    "src/f16-f32-vcvt/gen/vcvt-sse2-int32-x16.c",
5658    "src/f16-f32-vcvt/gen/vcvt-sse2-int32-x24.c",
5659    "src/f16-f32-vcvt/gen/vcvt-sse2-int32-x32.c",
5660    "src/f16-vunary/gen/vabs-sse2-x8.c",
5661    "src/f16-vunary/gen/vabs-sse2-x16.c",
5662    "src/f16-vunary/gen/vneg-sse2-x8.c",
5663    "src/f16-vunary/gen/vneg-sse2-x16.c",
5664    "src/f32-argmaxpool/4x-sse2-c4.c",
5665    "src/f32-argmaxpool/9p8x-sse2-c4.c",
5666    "src/f32-argmaxpool/9x-sse2-c4.c",
5667    "src/f32-f16-vcvt/gen/vcvt-sse2-x8.c",
5668    "src/f32-f16-vcvt/gen/vcvt-sse2-x16.c",
5669    "src/f32-f16-vcvt/gen/vcvt-sse2-x24.c",
5670    "src/f32-f16-vcvt/gen/vcvt-sse2-x32.c",
5671    "src/f32-gemm/gen-inc/1x8inc-minmax-sse2-dup.c",
5672    "src/f32-gemm/gen-inc/3x8inc-minmax-sse2-dup.c",
5673    "src/f32-gemm/gen-inc/4x8inc-minmax-sse2-dup.c",
5674    "src/f32-gemm/gen-inc/5x8inc-minmax-sse2-dup.c",
5675    "src/f32-gemm/gen/1x8-minmax-sse2-dup.c",
5676    "src/f32-gemm/gen/3x8-minmax-sse2-dup.c",
5677    "src/f32-gemm/gen/4x8-minmax-sse2-dup.c",
5678    "src/f32-gemm/gen/5x8-minmax-sse2-dup.c",
5679    "src/f32-igemm/gen/1x8-minmax-sse2-dup.c",
5680    "src/f32-igemm/gen/3x8-minmax-sse2-dup.c",
5681    "src/f32-igemm/gen/4x8-minmax-sse2-dup.c",
5682    "src/f32-igemm/gen/5x8-minmax-sse2-dup.c",
5683    "src/f32-prelu/gen/sse2-2x4.c",
5684    "src/f32-prelu/gen/sse2-2x8.c",
5685    "src/f32-qs8-vcvt/gen/vcvt-sse2-x8.c",
5686    "src/f32-qs8-vcvt/gen/vcvt-sse2-x16.c",
5687    "src/f32-qs8-vcvt/gen/vcvt-sse2-x24.c",
5688    "src/f32-qs8-vcvt/gen/vcvt-sse2-x32.c",
5689    "src/f32-qu8-vcvt/gen/vcvt-sse2-x8.c",
5690    "src/f32-qu8-vcvt/gen/vcvt-sse2-x16.c",
5691    "src/f32-qu8-vcvt/gen/vcvt-sse2-x24.c",
5692    "src/f32-qu8-vcvt/gen/vcvt-sse2-x32.c",
5693    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x4.c",
5694    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x8-acc2.c",
5695    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x8.c",
5696    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x12-acc2.c",
5697    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x12-acc3.c",
5698    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x12.c",
5699    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x16-acc2.c",
5700    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x16-acc4.c",
5701    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x16.c",
5702    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x20-acc2.c",
5703    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x20-acc5.c",
5704    "src/f32-raddstoreexpminusmax/gen/sse2-rr2-p5-x20.c",
5705    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x4.c",
5706    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x8.c",
5707    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x12.c",
5708    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x16.c",
5709    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x20.c",
5710    "src/f32-velu/gen/velu-sse2-rr2-lut16-p3-x24.c",
5711    "src/f32-velu/gen/velu-sse2-rr2-p6-x4.c",
5712    "src/f32-velu/gen/velu-sse2-rr2-p6-x8.c",
5713    "src/f32-velu/gen/velu-sse2-rr2-p6-x12.c",
5714    "src/f32-velu/gen/velu-sse2-rr2-p6-x16.c",
5715    "src/f32-velu/gen/velu-sse2-rr2-p6-x20.c",
5716    "src/f32-velu/gen/velu-sse2-rr2-p6-x24.c",
5717    "src/f32-vlrelu/gen/vlrelu-sse2-x4.c",
5718    "src/f32-vlrelu/gen/vlrelu-sse2-x8.c",
5719    "src/f32-vrnd/gen/vrndd-sse2-x4.c",
5720    "src/f32-vrnd/gen/vrndd-sse2-x8.c",
5721    "src/f32-vrnd/gen/vrndne-sse2-x4.c",
5722    "src/f32-vrnd/gen/vrndne-sse2-x8.c",
5723    "src/f32-vrnd/gen/vrndu-sse2-x4.c",
5724    "src/f32-vrnd/gen/vrndu-sse2-x8.c",
5725    "src/f32-vrnd/gen/vrndz-sse2-x4.c",
5726    "src/f32-vrnd/gen/vrndz-sse2-x8.c",
5727    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x4.c",
5728    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x8.c",
5729    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x12.c",
5730    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x16.c",
5731    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x20.c",
5732    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-lut64-p2-div-x24.c",
5733    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-p5-div-x4.c",
5734    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-p5-div-x8.c",
5735    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-p5-div-x12.c",
5736    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-p5-div-x16.c",
5737    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-p5-div-x20.c",
5738    "src/f32-vsigmoid/gen/vsigmoid-sse2-rr2-p5-div-x24.c",
5739    "src/math/cvt-f16-f32-sse2-int16.c",
5740    "src/math/cvt-f16-f32-sse2-int32.c",
5741    "src/math/cvt-f32-f16-sse2.c",
5742    "src/math/exp-f32-sse2-rr2-lut64-p2.c",
5743    "src/math/exp-f32-sse2-rr2-p5.c",
5744    "src/math/expminus-f32-sse2-rr2-p5.c",
5745    "src/math/expm1minus-f32-sse2-rr2-lut16-p3.c",
5746    "src/math/expm1minus-f32-sse2-rr2-p6.c",
5747    "src/math/roundd-sse2-cvt.c",
5748    "src/math/roundne-sse2-cvt.c",
5749    "src/math/roundu-sse2-cvt.c",
5750    "src/math/roundz-sse2-cvt.c",
5751    "src/math/sigmoid-f32-sse2-rr2-lut64-p2-div.c",
5752    "src/math/sigmoid-f32-sse2-rr2-lut64-p2-nr1.c",
5753    "src/math/sigmoid-f32-sse2-rr2-lut64-p2-nr2.c",
5754    "src/math/sigmoid-f32-sse2-rr2-p5-div.c",
5755    "src/math/sigmoid-f32-sse2-rr2-p5-nr1.c",
5756    "src/math/sigmoid-f32-sse2-rr2-p5-nr2.c",
5757    "src/qc8-dwconv/gen/up8x3-minmax-fp32-sse2-mul16.c",
5758    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16-add16.c",
5759    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c",
5760    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16-add16.c",
5761    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c",
5762    "src/qc8-dwconv/gen/up16x9-minmax-fp32-sse2-mul16-add16.c",
5763    "src/qc8-dwconv/gen/up16x9-minmax-fp32-sse2-mul16.c",
5764    "src/qc8-dwconv/gen/up16x25-minmax-fp32-sse2-mul16-add16.c",
5765    "src/qc8-dwconv/gen/up16x25-minmax-fp32-sse2-mul16.c",
5766    "src/qc8-dwconv/gen/up24x9-minmax-fp32-sse2-mul16.c",
5767    "src/qc8-dwconv/gen/up24x25-minmax-fp32-sse2-mul16.c",
5768    "src/qc8-gemm/gen/1x4c2-minmax-fp32-sse2-ld64.c",
5769    "src/qc8-gemm/gen/1x4c2-minmax-fp32-sse2-ld128.c",
5770    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-sse2-ld64.c",
5771    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-sse2-ld128.c",
5772    "src/qc8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5773    "src/qc8-gemm/gen/1x4c8-minmax-fp32-sse2-ld128.c",
5774    "src/qc8-gemm/gen/2x4c2-minmax-fp32-sse2-ld64.c",
5775    "src/qc8-gemm/gen/2x4c2-minmax-fp32-sse2-ld128.c",
5776    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-sse2-ld64.c",
5777    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-sse2-ld128.c",
5778    "src/qc8-gemm/gen/2x4c8-minmax-fp32-sse2-ld64.c",
5779    "src/qc8-gemm/gen/2x4c8-minmax-fp32-sse2-ld128.c",
5780    "src/qc8-gemm/gen/3x4c2-minmax-fp32-sse2-ld64.c",
5781    "src/qc8-gemm/gen/3x4c2-minmax-fp32-sse2-ld128.c",
5782    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-sse2-ld64.c",
5783    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-sse2-ld128.c",
5784    "src/qc8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5785    "src/qc8-gemm/gen/3x4c8-minmax-fp32-sse2-ld128.c",
5786    "src/qc8-gemm/gen/4x4c2-minmax-fp32-sse2-ld64.c",
5787    "src/qc8-gemm/gen/4x4c2-minmax-fp32-sse2-ld128.c",
5788    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-sse2-ld64.c",
5789    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-sse2-ld128.c",
5790    "src/qc8-igemm/gen/1x4c2-minmax-fp32-sse2-ld64.c",
5791    "src/qc8-igemm/gen/1x4c2-minmax-fp32-sse2-ld128.c",
5792    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-sse2-ld64.c",
5793    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-sse2-ld128.c",
5794    "src/qc8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5795    "src/qc8-igemm/gen/1x4c8-minmax-fp32-sse2-ld128.c",
5796    "src/qc8-igemm/gen/2x4c2-minmax-fp32-sse2-ld64.c",
5797    "src/qc8-igemm/gen/2x4c2-minmax-fp32-sse2-ld128.c",
5798    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-sse2-ld64.c",
5799    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-sse2-ld128.c",
5800    "src/qc8-igemm/gen/2x4c8-minmax-fp32-sse2-ld64.c",
5801    "src/qc8-igemm/gen/2x4c8-minmax-fp32-sse2-ld128.c",
5802    "src/qc8-igemm/gen/3x4c2-minmax-fp32-sse2-ld64.c",
5803    "src/qc8-igemm/gen/3x4c2-minmax-fp32-sse2-ld128.c",
5804    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-sse2-ld64.c",
5805    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-sse2-ld128.c",
5806    "src/qc8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5807    "src/qc8-igemm/gen/3x4c8-minmax-fp32-sse2-ld128.c",
5808    "src/qc8-igemm/gen/4x4c2-minmax-fp32-sse2-ld64.c",
5809    "src/qc8-igemm/gen/4x4c2-minmax-fp32-sse2-ld128.c",
5810    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-sse2-ld64.c",
5811    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-sse2-ld128.c",
5812    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16-add16.c",
5813    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c",
5814    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16-add16.c",
5815    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c",
5816    "src/qs8-dwconv/gen/up16x9-minmax-fp32-sse2-mul16-add16.c",
5817    "src/qs8-dwconv/gen/up16x9-minmax-fp32-sse2-mul16.c",
5818    "src/qs8-dwconv/gen/up16x25-minmax-fp32-sse2-mul16-add16.c",
5819    "src/qs8-dwconv/gen/up16x25-minmax-fp32-sse2-mul16.c",
5820    "src/qs8-dwconv/gen/up24x9-minmax-fp32-sse2-mul16.c",
5821    "src/qs8-dwconv/gen/up24x25-minmax-fp32-sse2-mul16.c",
5822    "src/qs8-f32-vcvt/gen/vcvt-sse2-x8.c",
5823    "src/qs8-f32-vcvt/gen/vcvt-sse2-x16.c",
5824    "src/qs8-f32-vcvt/gen/vcvt-sse2-x24.c",
5825    "src/qs8-f32-vcvt/gen/vcvt-sse2-x32.c",
5826    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse2-c8.c",
5827    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse2-c16.c",
5828    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse2-c24.c",
5829    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse2-c8.c",
5830    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse2-c16.c",
5831    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse2-c24.c",
5832    "src/qs8-gemm/gen/1x4c2-minmax-fp32-sse2-ld64.c",
5833    "src/qs8-gemm/gen/1x4c2-minmax-fp32-sse2-ld128.c",
5834    "src/qs8-gemm/gen/1x4c2-xw-minmax-fp32-sse2.c",
5835    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-sse2-ld64.c",
5836    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-sse2-ld128.c",
5837    "src/qs8-gemm/gen/1x4c2s4-xw-minmax-fp32-sse2.c",
5838    "src/qs8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5839    "src/qs8-gemm/gen/1x4c8-minmax-fp32-sse2-ld128.c",
5840    "src/qs8-gemm/gen/1x4c8-xw-minmax-fp32-sse2.c",
5841    "src/qs8-gemm/gen/2x4c2-minmax-fp32-sse2-ld64.c",
5842    "src/qs8-gemm/gen/2x4c2-minmax-fp32-sse2-ld128.c",
5843    "src/qs8-gemm/gen/2x4c2-xw-minmax-fp32-sse2.c",
5844    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-sse2-ld64.c",
5845    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-sse2-ld128.c",
5846    "src/qs8-gemm/gen/2x4c2s4-xw-minmax-fp32-sse2.c",
5847    "src/qs8-gemm/gen/2x4c8-minmax-fp32-sse2-ld64.c",
5848    "src/qs8-gemm/gen/2x4c8-minmax-fp32-sse2-ld128.c",
5849    "src/qs8-gemm/gen/2x4c8-xw-minmax-fp32-sse2.c",
5850    "src/qs8-gemm/gen/3x4c2-minmax-fp32-sse2-ld64.c",
5851    "src/qs8-gemm/gen/3x4c2-minmax-fp32-sse2-ld128.c",
5852    "src/qs8-gemm/gen/3x4c2-xw-minmax-fp32-sse2.c",
5853    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-sse2-ld64.c",
5854    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-sse2-ld128.c",
5855    "src/qs8-gemm/gen/3x4c2s4-xw-minmax-fp32-sse2.c",
5856    "src/qs8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5857    "src/qs8-gemm/gen/3x4c8-minmax-fp32-sse2-ld128.c",
5858    "src/qs8-gemm/gen/3x4c8-xw-minmax-fp32-sse2.c",
5859    "src/qs8-gemm/gen/4x4c2-minmax-fp32-sse2-ld64.c",
5860    "src/qs8-gemm/gen/4x4c2-minmax-fp32-sse2-ld128.c",
5861    "src/qs8-gemm/gen/4x4c2-xw-minmax-fp32-sse2.c",
5862    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-sse2-ld64.c",
5863    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-sse2-ld128.c",
5864    "src/qs8-gemm/gen/4x4c2s4-xw-minmax-fp32-sse2.c",
5865    "src/qs8-igemm/gen/1x4c2-minmax-fp32-sse2-ld64.c",
5866    "src/qs8-igemm/gen/1x4c2-minmax-fp32-sse2-ld128.c",
5867    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-sse2-ld64.c",
5868    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-sse2-ld128.c",
5869    "src/qs8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5870    "src/qs8-igemm/gen/1x4c8-minmax-fp32-sse2-ld128.c",
5871    "src/qs8-igemm/gen/2x4c2-minmax-fp32-sse2-ld64.c",
5872    "src/qs8-igemm/gen/2x4c2-minmax-fp32-sse2-ld128.c",
5873    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-sse2-ld64.c",
5874    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-sse2-ld128.c",
5875    "src/qs8-igemm/gen/2x4c8-minmax-fp32-sse2-ld64.c",
5876    "src/qs8-igemm/gen/2x4c8-minmax-fp32-sse2-ld128.c",
5877    "src/qs8-igemm/gen/3x4c2-minmax-fp32-sse2-ld64.c",
5878    "src/qs8-igemm/gen/3x4c2-minmax-fp32-sse2-ld128.c",
5879    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-sse2-ld64.c",
5880    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-sse2-ld128.c",
5881    "src/qs8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5882    "src/qs8-igemm/gen/3x4c8-minmax-fp32-sse2-ld128.c",
5883    "src/qs8-igemm/gen/4x4c2-minmax-fp32-sse2-ld64.c",
5884    "src/qs8-igemm/gen/4x4c2-minmax-fp32-sse2-ld128.c",
5885    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-sse2-ld64.c",
5886    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-sse2-ld128.c",
5887    "src/qs8-requantization/fp32-sse2.c",
5888    "src/qs8-requantization/gemmlowp-sse2.c",
5889    "src/qs8-requantization/rndna-sse2.c",
5890    "src/qs8-vadd/gen/minmax-sse2-mul16-ld64-x8.c",
5891    "src/qs8-vadd/gen/minmax-sse2-mul16-ld64-x16.c",
5892    "src/qs8-vadd/gen/minmax-sse2-mul16-ld64-x24.c",
5893    "src/qs8-vadd/gen/minmax-sse2-mul16-ld64-x32.c",
5894    "src/qs8-vaddc/gen/minmax-sse2-mul16-ld64-x8.c",
5895    "src/qs8-vaddc/gen/minmax-sse2-mul16-ld64-x16.c",
5896    "src/qs8-vaddc/gen/minmax-sse2-mul16-ld64-x24.c",
5897    "src/qs8-vaddc/gen/minmax-sse2-mul16-ld64-x32.c",
5898    "src/qs8-vcvt/gen/vcvt-sse2-x16.c",
5899    "src/qs8-vcvt/gen/vcvt-sse2-x32.c",
5900    "src/qs8-vlrelu/gen/vlrelu-sse2-x16.c",
5901    "src/qs8-vlrelu/gen/vlrelu-sse2-x32.c",
5902    "src/qs8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5903    "src/qs8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x16.c",
5904    "src/qs8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5905    "src/qs8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x16.c",
5906    "src/qu8-avgpool/9p8x-minmax-sse2-c8.c",
5907    "src/qu8-avgpool/9x-minmax-sse2-c8.c",
5908    "src/qu8-dwconv/gen/up8x9-minmax-fp32-sse2-mul16.c",
5909    "src/qu8-dwconv/gen/up8x25-minmax-fp32-sse2-mul16.c",
5910    "src/qu8-dwconv/gen/up16x9-minmax-fp32-sse2-mul16.c",
5911    "src/qu8-dwconv/gen/up16x25-minmax-fp32-sse2-mul16.c",
5912    "src/qu8-f32-vcvt/gen/vcvt-sse2-x8.c",
5913    "src/qu8-f32-vcvt/gen/vcvt-sse2-x16.c",
5914    "src/qu8-f32-vcvt/gen/vcvt-sse2-x24.c",
5915    "src/qu8-f32-vcvt/gen/vcvt-sse2-x32.c",
5916    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse2-c8.c",
5917    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse2-c16.c",
5918    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse2-c24.c",
5919    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse2-c8.c",
5920    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse2-c16.c",
5921    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse2-c24.c",
5922    "src/qu8-gemm/gen/1x4c2-minmax-fp32-sse2-ld64.c",
5923    "src/qu8-gemm/gen/1x4c2-minmax-fp32-sse2-ld128.c",
5924    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-sse2-ld64.c",
5925    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-sse2-ld128.c",
5926    "src/qu8-gemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5927    "src/qu8-gemm/gen/1x4c8-minmax-fp32-sse2-ld128.c",
5928    "src/qu8-gemm/gen/2x4c2-minmax-fp32-sse2-ld64.c",
5929    "src/qu8-gemm/gen/2x4c2-minmax-fp32-sse2-ld128.c",
5930    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-sse2-ld64.c",
5931    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-sse2-ld128.c",
5932    "src/qu8-gemm/gen/2x4c8-minmax-fp32-sse2-ld64.c",
5933    "src/qu8-gemm/gen/2x4c8-minmax-fp32-sse2-ld128.c",
5934    "src/qu8-gemm/gen/3x4c2-minmax-fp32-sse2-ld64.c",
5935    "src/qu8-gemm/gen/3x4c2-minmax-fp32-sse2-ld128.c",
5936    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-sse2-ld64.c",
5937    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-sse2-ld128.c",
5938    "src/qu8-gemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5939    "src/qu8-gemm/gen/3x4c8-minmax-fp32-sse2-ld128.c",
5940    "src/qu8-gemm/gen/4x4c2-minmax-fp32-sse2-ld64.c",
5941    "src/qu8-gemm/gen/4x4c2-minmax-fp32-sse2-ld128.c",
5942    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-sse2-ld64.c",
5943    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-sse2-ld128.c",
5944    "src/qu8-igemm/gen/1x4c2-minmax-fp32-sse2-ld64.c",
5945    "src/qu8-igemm/gen/1x4c2-minmax-fp32-sse2-ld128.c",
5946    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-sse2-ld64.c",
5947    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-sse2-ld128.c",
5948    "src/qu8-igemm/gen/1x4c8-minmax-fp32-sse2-ld64.c",
5949    "src/qu8-igemm/gen/1x4c8-minmax-fp32-sse2-ld128.c",
5950    "src/qu8-igemm/gen/2x4c2-minmax-fp32-sse2-ld64.c",
5951    "src/qu8-igemm/gen/2x4c2-minmax-fp32-sse2-ld128.c",
5952    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-sse2-ld64.c",
5953    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-sse2-ld128.c",
5954    "src/qu8-igemm/gen/2x4c8-minmax-fp32-sse2-ld64.c",
5955    "src/qu8-igemm/gen/2x4c8-minmax-fp32-sse2-ld128.c",
5956    "src/qu8-igemm/gen/3x4c2-minmax-fp32-sse2-ld64.c",
5957    "src/qu8-igemm/gen/3x4c2-minmax-fp32-sse2-ld128.c",
5958    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-sse2-ld64.c",
5959    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-sse2-ld128.c",
5960    "src/qu8-igemm/gen/3x4c8-minmax-fp32-sse2-ld64.c",
5961    "src/qu8-igemm/gen/3x4c8-minmax-fp32-sse2-ld128.c",
5962    "src/qu8-igemm/gen/4x4c2-minmax-fp32-sse2-ld64.c",
5963    "src/qu8-igemm/gen/4x4c2-minmax-fp32-sse2-ld128.c",
5964    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-sse2-ld64.c",
5965    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-sse2-ld128.c",
5966    "src/qu8-requantization/fp32-sse2.c",
5967    "src/qu8-requantization/gemmlowp-sse2.c",
5968    "src/qu8-requantization/rndna-sse2.c",
5969    "src/qu8-vadd/gen/minmax-sse2-mul16-ld64-x8.c",
5970    "src/qu8-vadd/gen/minmax-sse2-mul16-ld64-x16.c",
5971    "src/qu8-vaddc/gen/minmax-sse2-mul16-ld64-x8.c",
5972    "src/qu8-vaddc/gen/minmax-sse2-mul16-ld64-x16.c",
5973    "src/qu8-vcvt/gen/vcvt-sse2-x16.c",
5974    "src/qu8-vcvt/gen/vcvt-sse2-x32.c",
5975    "src/qu8-vlrelu/gen/vlrelu-sse2-x16.c",
5976    "src/qu8-vlrelu/gen/vlrelu-sse2-x32.c",
5977    "src/qu8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5978    "src/qu8-vmul/gen/minmax-fp32-sse2-mul16-ld64-x16.c",
5979    "src/qu8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x8.c",
5980    "src/qu8-vmulc/gen/minmax-fp32-sse2-mul16-ld64-x16.c",
5981    "src/s8-ibilinear/gen/sse2-c8.c",
5982    "src/s8-ibilinear/gen/sse2-c16.c",
5983    "src/s8-maxpool/9p8x-minmax-sse2-c16.c",
5984    "src/s8-vclamp/sse2-x64.c",
5985    "src/u8-ibilinear/gen/sse2-c8.c",
5986    "src/u8-ibilinear/gen/sse2-c16.c",
5987    "src/u8-maxpool/9p8x-minmax-sse2-c16.c",
5988    "src/u8-rmax/sse2.c",
5989    "src/u8-vclamp/sse2-x64.c",
5990    "src/xx-fill/sse2-x64.c",
5991    "src/xx-pad/sse2.c",
5992    "src/x8-transposec/gen/16x16-reuse-mov-sse2.c",
5993    "src/x8-transposec/gen/16x16-reuse-switch-sse2.c",
5994    "src/x8-zip/xm-sse2.c",
5995    "src/x8-zip/x2-sse2.c",
5996    "src/x8-zip/x3-sse2.c",
5997    "src/x8-zip/x4-sse2.c",
5998    "src/x16-transposec/gen/8x8-multi-mov-sse2.c",
5999    "src/x16-transposec/gen/8x8-multi-switch-sse2.c",
6000    "src/x16-transposec/gen/8x8-reuse-mov-sse2.c",
6001    "src/x16-transposec/gen/8x8-reuse-multi-sse2.c",
6002    "src/x16-transposec/gen/8x8-reuse-switch-sse2.c",
6003    "src/x16-transposec/4x8-sse2.c",
6004    "src/x32-transposec/gen/4x4-multi-mov-sse2.c",
6005    "src/x32-transposec/gen/4x4-multi-multi-sse2.c",
6006    "src/x32-transposec/gen/4x4-multi-switch-sse2.c",
6007    "src/x32-transposec/gen/4x4-reuse-mov-sse2.c",
6008    "src/x32-transposec/gen/4x4-reuse-multi-sse2.c",
6009    "src/x32-transposec/gen/4x4-reuse-switch-sse2.c",
6010    "src/x32-unpool/sse2.c",
6011    "src/x32-zip/xm-sse2.c",
6012    "src/x32-zip/x2-sse2.c",
6013    "src/x32-zip/x3-sse2.c",
6014    "src/x32-zip/x4-sse2.c",
6015    "src/x64-transposec/gen/2x2-multi-mov-sse2.c",
6016    "src/x64-transposec/gen/2x2-multi-multi-sse2.c",
6017    "src/x64-transposec/gen/2x2-multi-switch-sse2.c",
6018    "src/x64-transposec/gen/2x2-reuse-mov-sse2.c",
6019    "src/x64-transposec/gen/2x2-reuse-multi-sse2.c",
6020    "src/x64-transposec/gen/2x2-reuse-switch-sse2.c",
6021]
6022
// SSSE3 microkernel sources in the PROD set: one f32-dwconv2d-chw kernel plus
// the x32 variants of the qs8/qu8 vcvt and vlrelu kernels. Every entry here is
// also listed in ALL_SSSE3_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably means the kernels selected for production
// builds - confirm against the module that consumes this variable.
6023PROD_SSSE3_MICROKERNEL_SRCS = [
6024    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-2x4-acc2.c",
6025    "src/qs8-vcvt/gen/vcvt-ssse3-x32.c",
6026    "src/qs8-vlrelu/gen/vlrelu-ssse3-x32.c",
6027    "src/qu8-vcvt/gen/vcvt-ssse3-x32.c",
6028    "src/qu8-vlrelu/gen/vlrelu-ssse3-x32.c",
6029]
6030
// SSSE3 microkernel source files: the f32-dwconv2d-chw 3x3p1 variants, the
// qs8 gemm/igemm 1x4c8..3x4c8 kernels, qs8/qu8 requantization, vcvt and vlrelu
// kernels, the x8-lut kernels and the x24-transposec kernel.
// Contains every entry of PROD_SSSE3_MICROKERNEL_SRCS.
// NOTE(review): the "ALL" prefix presumably marks the complete SSSE3 set -
// confirm against the module that consumes this variable.
6031ALL_SSSE3_MICROKERNEL_SRCS = [
6032    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-1x4-acc2.c",
6033    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-1x4-acc3.c",
6034    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-1x4-acc4.c",
6035    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-1x4.c",
6036    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-2x4-acc2.c",
6037    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-2x4.c",
6038    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-3x4.c",
6039    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-4x4.c",
6040    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-5x4.c",
6041    "src/f32-dwconv2d-chw/gen/3x3p1-minmax-ssse3-6x4.c",
6042    "src/qs8-gemm/gen/1x4c8-minmax-fp32-ssse3-ld64.c",
6043    "src/qs8-gemm/gen/1x4c8-minmax-fp32-ssse3-ld128.c",
6044    "src/qs8-gemm/gen/1x4c8-xw-minmax-fp32-ssse3.c",
6045    "src/qs8-gemm/gen/2x4c8-minmax-fp32-ssse3-ld64.c",
6046    "src/qs8-gemm/gen/2x4c8-minmax-fp32-ssse3-ld128.c",
6047    "src/qs8-gemm/gen/2x4c8-xw-minmax-fp32-ssse3.c",
6048    "src/qs8-gemm/gen/3x4c8-minmax-fp32-ssse3-ld64.c",
6049    "src/qs8-gemm/gen/3x4c8-minmax-fp32-ssse3-ld128.c",
6050    "src/qs8-gemm/gen/3x4c8-xw-minmax-fp32-ssse3.c",
6051    "src/qs8-igemm/gen/1x4c8-minmax-fp32-ssse3-ld64.c",
6052    "src/qs8-igemm/gen/1x4c8-minmax-fp32-ssse3-ld128.c",
6053    "src/qs8-igemm/gen/2x4c8-minmax-fp32-ssse3-ld64.c",
6054    "src/qs8-igemm/gen/2x4c8-minmax-fp32-ssse3-ld128.c",
6055    "src/qs8-igemm/gen/3x4c8-minmax-fp32-ssse3-ld64.c",
6056    "src/qs8-igemm/gen/3x4c8-minmax-fp32-ssse3-ld128.c",
6057    "src/qs8-requantization/gemmlowp-ssse3.c",
6058    "src/qs8-requantization/rndna-ssse3.c",
6059    "src/qs8-vcvt/gen/vcvt-ssse3-x16.c",
6060    "src/qs8-vcvt/gen/vcvt-ssse3-x32.c",
6061    "src/qs8-vlrelu/gen/vlrelu-ssse3-x16.c",
6062    "src/qs8-vlrelu/gen/vlrelu-ssse3-x32.c",
6063    "src/qu8-requantization/gemmlowp-ssse3.c",
6064    "src/qu8-requantization/rndna-ssse3.c",
6065    "src/qu8-vcvt/gen/vcvt-ssse3-x16.c",
6066    "src/qu8-vcvt/gen/vcvt-ssse3-x32.c",
6067    "src/qu8-vlrelu/gen/vlrelu-ssse3-x16.c",
6068    "src/qu8-vlrelu/gen/vlrelu-ssse3-x32.c",
6069    "src/x8-lut/gen/lut-ssse3-x16.c",
6070    "src/x8-lut/gen/lut-ssse3-x32.c",
6071    "src/x24-transposec/4x4-ssse3.c",
6072]
6073
// SSE4.1 microkernel sources in the PROD set: f16<->f32 and f32->qs8
// conversion, f32 prelu/vlrelu/vrnd/vsigmoid, and the quantized
// (qc8/qs8/qu8/s8/u8) dwconv, gemm, igemm, gavgpool, vadd, vmul, vcvt, vlrelu,
// ibilinear, maxpool and vclamp kernels listed below.
// NOTE(review): presumably a subset of ALL_SSE41_MICROKERNEL_SRCS, with "PROD"
// meaning the kernels selected for production builds - confirm against that
// list and the module that consumes this variable.
6074PROD_SSE41_MICROKERNEL_SRCS = [
6075    "src/f16-f32-vcvt/gen/vcvt-sse41-int16-x16.c",
6076    "src/f32-f16-vcvt/gen/vcvt-sse41-x8.c",
6077    "src/f32-prelu/gen/sse41-2x8.c",
6078    "src/f32-qs8-vcvt/gen/vcvt-sse41-x32.c",
6079    "src/f32-vlrelu/gen/vlrelu-sse41-x8.c",
6080    "src/f32-vrnd/gen/vrndd-sse41-x8.c",
6081    "src/f32-vrnd/gen/vrndne-sse41-x8.c",
6082    "src/f32-vrnd/gen/vrndu-sse41-x8.c",
6083    "src/f32-vrnd/gen/vrndz-sse41-x8.c",
6084    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x8.c",
6085    "src/qc8-dwconv/gen/up8x3-minmax-fp32-sse41-mul16.c",
6086    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c",
6087    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c",
6088    "src/qc8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6089    "src/qc8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6090    "src/qc8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6091    "src/qc8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6092    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16-add16.c",
6093    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16-add16.c",
6094    "src/qs8-f32-vcvt/gen/vcvt-sse41-x16.c",
6095    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse41-c8.c",
6096    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse41-c8.c",
6097    "src/qs8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6098    "src/qs8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6099    "src/qs8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6100    "src/qs8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6101    "src/qs8-vadd/gen/minmax-sse41-mul16-ld64-x8.c",
6102    "src/qs8-vaddc/gen/minmax-sse41-mul16-ld64-x8.c",
6103    "src/qs8-vcvt/gen/vcvt-sse41-x32.c",
6104    "src/qs8-vlrelu/gen/vlrelu-sse41-x32.c",
6105    "src/qs8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6106    "src/qs8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6107    "src/qu8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c",
6108    "src/qu8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c",
6109    "src/qu8-f32-vcvt/gen/vcvt-sse41-x16.c",
6110    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse41-c8.c",
6111    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse41-c8.c",
6112    "src/qu8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6113    "src/qu8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6114    "src/qu8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6115    "src/qu8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6116    "src/qu8-vadd/gen/minmax-sse41-mul16-ld64-x8.c",
6117    "src/qu8-vaddc/gen/minmax-sse41-mul16-ld64-x8.c",
6118    "src/qu8-vcvt/gen/vcvt-sse41-x32.c",
6119    "src/qu8-vlrelu/gen/vlrelu-sse41-x32.c",
6120    "src/qu8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6121    "src/qu8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6122    "src/s8-ibilinear/gen/sse41-c16.c",
6123    "src/s8-maxpool/9p8x-minmax-sse41-c16.c",
6124    "src/s8-vclamp/sse41-x64.c",
6125    "src/u8-ibilinear/gen/sse41-c16.c",
6126]
6127
6128ALL_SSE41_MICROKERNEL_SRCS = [
6129    "src/f16-f32-vcvt/gen/vcvt-sse41-int16-x8.c",
6130    "src/f16-f32-vcvt/gen/vcvt-sse41-int16-x16.c",
6131    "src/f16-f32-vcvt/gen/vcvt-sse41-int16-x24.c",
6132    "src/f16-f32-vcvt/gen/vcvt-sse41-int16-x32.c",
6133    "src/f16-f32-vcvt/gen/vcvt-sse41-int32-x8.c",
6134    "src/f16-f32-vcvt/gen/vcvt-sse41-int32-x16.c",
6135    "src/f16-f32-vcvt/gen/vcvt-sse41-int32-x24.c",
6136    "src/f16-f32-vcvt/gen/vcvt-sse41-int32-x32.c",
6137    "src/f32-f16-vcvt/gen/vcvt-sse41-x8.c",
6138    "src/f32-f16-vcvt/gen/vcvt-sse41-x16.c",
6139    "src/f32-f16-vcvt/gen/vcvt-sse41-x24.c",
6140    "src/f32-f16-vcvt/gen/vcvt-sse41-x32.c",
6141    "src/f32-prelu/gen/sse41-2x4.c",
6142    "src/f32-prelu/gen/sse41-2x8.c",
6143    "src/f32-qs8-vcvt/gen/vcvt-sse41-x8.c",
6144    "src/f32-qs8-vcvt/gen/vcvt-sse41-x16.c",
6145    "src/f32-qs8-vcvt/gen/vcvt-sse41-x24.c",
6146    "src/f32-qs8-vcvt/gen/vcvt-sse41-x32.c",
6147    "src/f32-velu/gen/velu-sse41-rr2-lut16-p3-x4.c",
6148    "src/f32-velu/gen/velu-sse41-rr2-lut16-p3-x8.c",
6149    "src/f32-velu/gen/velu-sse41-rr2-lut16-p3-x12.c",
6150    "src/f32-velu/gen/velu-sse41-rr2-lut16-p3-x16.c",
6151    "src/f32-velu/gen/velu-sse41-rr2-lut16-p3-x20.c",
6152    "src/f32-velu/gen/velu-sse41-rr2-lut16-p3-x24.c",
6153    "src/f32-velu/gen/velu-sse41-rr2-p6-x4.c",
6154    "src/f32-velu/gen/velu-sse41-rr2-p6-x8.c",
6155    "src/f32-velu/gen/velu-sse41-rr2-p6-x12.c",
6156    "src/f32-velu/gen/velu-sse41-rr2-p6-x16.c",
6157    "src/f32-velu/gen/velu-sse41-rr2-p6-x20.c",
6158    "src/f32-velu/gen/velu-sse41-rr2-p6-x24.c",
6159    "src/f32-vlrelu/gen/vlrelu-sse41-x4.c",
6160    "src/f32-vlrelu/gen/vlrelu-sse41-x8.c",
6161    "src/f32-vrnd/gen/vrndd-sse41-x4.c",
6162    "src/f32-vrnd/gen/vrndd-sse41-x8.c",
6163    "src/f32-vrnd/gen/vrndne-sse41-x4.c",
6164    "src/f32-vrnd/gen/vrndne-sse41-x8.c",
6165    "src/f32-vrnd/gen/vrndu-sse41-x4.c",
6166    "src/f32-vrnd/gen/vrndu-sse41-x8.c",
6167    "src/f32-vrnd/gen/vrndz-sse41-x4.c",
6168    "src/f32-vrnd/gen/vrndz-sse41-x8.c",
6169    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x4.c",
6170    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x8.c",
6171    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x12.c",
6172    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x16.c",
6173    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x20.c",
6174    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-lut64-p2-div-x24.c",
6175    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-p5-div-x4.c",
6176    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-p5-div-x8.c",
6177    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-p5-div-x12.c",
6178    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-p5-div-x16.c",
6179    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-p5-div-x20.c",
6180    "src/f32-vsigmoid/gen/vsigmoid-sse41-rr2-p5-div-x24.c",
6181    "src/math/cvt-f16-f32-sse41-int16.c",
6182    "src/math/cvt-f16-f32-sse41-int32.c",
6183    "src/math/cvt-f32-f16-sse41.c",
6184    "src/math/roundd-sse41.c",
6185    "src/math/roundne-sse41.c",
6186    "src/math/roundu-sse41.c",
6187    "src/math/roundz-sse41.c",
6188    "src/qc8-dwconv/gen/up8x3-minmax-fp32-sse41-mul16.c",
6189    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16-add16.c",
6190    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c",
6191    "src/qc8-dwconv/gen/up8x9-minmax-fp32-sse41-mul32.c",
6192    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16-add16.c",
6193    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c",
6194    "src/qc8-dwconv/gen/up8x25-minmax-fp32-sse41-mul32.c",
6195    "src/qc8-dwconv/gen/up16x9-minmax-fp32-sse41-mul16-add16.c",
6196    "src/qc8-dwconv/gen/up16x9-minmax-fp32-sse41-mul16.c",
6197    "src/qc8-dwconv/gen/up16x9-minmax-fp32-sse41-mul32.c",
6198    "src/qc8-dwconv/gen/up16x25-minmax-fp32-sse41-mul16-add16.c",
6199    "src/qc8-dwconv/gen/up16x25-minmax-fp32-sse41-mul16.c",
6200    "src/qc8-dwconv/gen/up16x25-minmax-fp32-sse41-mul32.c",
6201    "src/qc8-dwconv/gen/up24x9-minmax-fp32-sse41-mul16.c",
6202    "src/qc8-dwconv/gen/up24x9-minmax-fp32-sse41-mul32.c",
6203    "src/qc8-dwconv/gen/up24x25-minmax-fp32-sse41-mul16.c",
6204    "src/qc8-dwconv/gen/up24x25-minmax-fp32-sse41-mul32.c",
6205    "src/qc8-gemm/gen/1x4c2-minmax-fp32-sse41-ld64.c",
6206    "src/qc8-gemm/gen/1x4c2-minmax-fp32-sse41-ld128.c",
6207    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-sse41-ld64.c",
6208    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-sse41-ld128.c",
6209    "src/qc8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6210    "src/qc8-gemm/gen/1x4c8-minmax-fp32-sse41-ld128.c",
6211    "src/qc8-gemm/gen/2x4c2-minmax-fp32-sse41-ld64.c",
6212    "src/qc8-gemm/gen/2x4c2-minmax-fp32-sse41-ld128.c",
6213    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-sse41-ld64.c",
6214    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-sse41-ld128.c",
6215    "src/qc8-gemm/gen/2x4c8-minmax-fp32-sse41-ld64.c",
6216    "src/qc8-gemm/gen/2x4c8-minmax-fp32-sse41-ld128.c",
6217    "src/qc8-gemm/gen/3x4c2-minmax-fp32-sse41-ld64.c",
6218    "src/qc8-gemm/gen/3x4c2-minmax-fp32-sse41-ld128.c",
6219    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-sse41-ld64.c",
6220    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-sse41-ld128.c",
6221    "src/qc8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6222    "src/qc8-gemm/gen/3x4c8-minmax-fp32-sse41-ld128.c",
6223    "src/qc8-gemm/gen/4x4c2-minmax-fp32-sse41-ld64.c",
6224    "src/qc8-gemm/gen/4x4c2-minmax-fp32-sse41-ld128.c",
6225    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-sse41-ld64.c",
6226    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-sse41-ld128.c",
6227    "src/qc8-igemm/gen/1x4c2-minmax-fp32-sse41-ld64.c",
6228    "src/qc8-igemm/gen/1x4c2-minmax-fp32-sse41-ld128.c",
6229    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-sse41-ld64.c",
6230    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-sse41-ld128.c",
6231    "src/qc8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6232    "src/qc8-igemm/gen/1x4c8-minmax-fp32-sse41-ld128.c",
6233    "src/qc8-igemm/gen/2x4c2-minmax-fp32-sse41-ld64.c",
6234    "src/qc8-igemm/gen/2x4c2-minmax-fp32-sse41-ld128.c",
6235    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-sse41-ld64.c",
6236    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-sse41-ld128.c",
6237    "src/qc8-igemm/gen/2x4c8-minmax-fp32-sse41-ld64.c",
6238    "src/qc8-igemm/gen/2x4c8-minmax-fp32-sse41-ld128.c",
6239    "src/qc8-igemm/gen/3x4c2-minmax-fp32-sse41-ld64.c",
6240    "src/qc8-igemm/gen/3x4c2-minmax-fp32-sse41-ld128.c",
6241    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-sse41-ld64.c",
6242    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-sse41-ld128.c",
6243    "src/qc8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6244    "src/qc8-igemm/gen/3x4c8-minmax-fp32-sse41-ld128.c",
6245    "src/qc8-igemm/gen/4x4c2-minmax-fp32-sse41-ld64.c",
6246    "src/qc8-igemm/gen/4x4c2-minmax-fp32-sse41-ld128.c",
6247    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-sse41-ld64.c",
6248    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-sse41-ld128.c",
6249    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16-add16.c",
6250    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c",
6251    "src/qs8-dwconv/gen/up8x9-minmax-fp32-sse41-mul32.c",
6252    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16-add16.c",
6253    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c",
6254    "src/qs8-dwconv/gen/up8x25-minmax-fp32-sse41-mul32.c",
6255    "src/qs8-dwconv/gen/up16x9-minmax-fp32-sse41-mul16-add16.c",
6256    "src/qs8-dwconv/gen/up16x9-minmax-fp32-sse41-mul16.c",
6257    "src/qs8-dwconv/gen/up16x9-minmax-fp32-sse41-mul32.c",
6258    "src/qs8-dwconv/gen/up16x25-minmax-fp32-sse41-mul16-add16.c",
6259    "src/qs8-dwconv/gen/up16x25-minmax-fp32-sse41-mul16.c",
6260    "src/qs8-dwconv/gen/up16x25-minmax-fp32-sse41-mul32.c",
6261    "src/qs8-dwconv/gen/up24x9-minmax-fp32-sse41-mul16.c",
6262    "src/qs8-dwconv/gen/up24x9-minmax-fp32-sse41-mul32.c",
6263    "src/qs8-dwconv/gen/up24x25-minmax-fp32-sse41-mul16.c",
6264    "src/qs8-dwconv/gen/up24x25-minmax-fp32-sse41-mul32.c",
6265    "src/qs8-f32-vcvt/gen/vcvt-sse41-x8.c",
6266    "src/qs8-f32-vcvt/gen/vcvt-sse41-x16.c",
6267    "src/qs8-f32-vcvt/gen/vcvt-sse41-x24.c",
6268    "src/qs8-f32-vcvt/gen/vcvt-sse41-x32.c",
6269    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse41-c8.c",
6270    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse41-c16.c",
6271    "src/qs8-gavgpool/gen/7p7x-minmax-fp32-sse41-c24.c",
6272    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse41-c8.c",
6273    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse41-c16.c",
6274    "src/qs8-gavgpool/gen/7x-minmax-fp32-sse41-c24.c",
6275    "src/qs8-gemm/gen/1x4c2-minmax-fp32-sse41-ld64.c",
6276    "src/qs8-gemm/gen/1x4c2-minmax-fp32-sse41-ld128.c",
6277    "src/qs8-gemm/gen/1x4c2-xw-minmax-fp32-sse41.c",
6278    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-sse41-ld64.c",
6279    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-sse41-ld128.c",
6280    "src/qs8-gemm/gen/1x4c2s4-xw-minmax-fp32-sse41.c",
6281    "src/qs8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6282    "src/qs8-gemm/gen/1x4c8-minmax-fp32-sse41-ld128.c",
6283    "src/qs8-gemm/gen/1x4c8-xw-minmax-fp32-sse41.c",
6284    "src/qs8-gemm/gen/2x4c2-minmax-fp32-sse41-ld64.c",
6285    "src/qs8-gemm/gen/2x4c2-minmax-fp32-sse41-ld128.c",
6286    "src/qs8-gemm/gen/2x4c2-xw-minmax-fp32-sse41.c",
6287    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-sse41-ld64.c",
6288    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-sse41-ld128.c",
6289    "src/qs8-gemm/gen/2x4c2s4-xw-minmax-fp32-sse41.c",
6290    "src/qs8-gemm/gen/2x4c8-minmax-fp32-sse41-ld64.c",
6291    "src/qs8-gemm/gen/2x4c8-minmax-fp32-sse41-ld128.c",
6292    "src/qs8-gemm/gen/2x4c8-xw-minmax-fp32-sse41.c",
6293    "src/qs8-gemm/gen/3x4c2-minmax-fp32-sse41-ld64.c",
6294    "src/qs8-gemm/gen/3x4c2-minmax-fp32-sse41-ld128.c",
6295    "src/qs8-gemm/gen/3x4c2-xw-minmax-fp32-sse41.c",
6296    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-sse41-ld64.c",
6297    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-sse41-ld128.c",
6298    "src/qs8-gemm/gen/3x4c2s4-xw-minmax-fp32-sse41.c",
6299    "src/qs8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6300    "src/qs8-gemm/gen/3x4c8-minmax-fp32-sse41-ld128.c",
6301    "src/qs8-gemm/gen/3x4c8-xw-minmax-fp32-sse41.c",
6302    "src/qs8-gemm/gen/4x4c2-minmax-fp32-sse41-ld64.c",
6303    "src/qs8-gemm/gen/4x4c2-minmax-fp32-sse41-ld128.c",
6304    "src/qs8-gemm/gen/4x4c2-xw-minmax-fp32-sse41.c",
6305    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-sse41-ld64.c",
6306    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-sse41-ld128.c",
6307    "src/qs8-gemm/gen/4x4c2s4-xw-minmax-fp32-sse41.c",
6308    "src/qs8-igemm/gen/1x4c2-minmax-fp32-sse41-ld64.c",
6309    "src/qs8-igemm/gen/1x4c2-minmax-fp32-sse41-ld128.c",
6310    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-sse41-ld64.c",
6311    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-sse41-ld128.c",
6312    "src/qs8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6313    "src/qs8-igemm/gen/1x4c8-minmax-fp32-sse41-ld128.c",
6314    "src/qs8-igemm/gen/2x4c2-minmax-fp32-sse41-ld64.c",
6315    "src/qs8-igemm/gen/2x4c2-minmax-fp32-sse41-ld128.c",
6316    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-sse41-ld64.c",
6317    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-sse41-ld128.c",
6318    "src/qs8-igemm/gen/2x4c8-minmax-fp32-sse41-ld64.c",
6319    "src/qs8-igemm/gen/2x4c8-minmax-fp32-sse41-ld128.c",
6320    "src/qs8-igemm/gen/3x4c2-minmax-fp32-sse41-ld64.c",
6321    "src/qs8-igemm/gen/3x4c2-minmax-fp32-sse41-ld128.c",
6322    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-sse41-ld64.c",
6323    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-sse41-ld128.c",
6324    "src/qs8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6325    "src/qs8-igemm/gen/3x4c8-minmax-fp32-sse41-ld128.c",
6326    "src/qs8-igemm/gen/4x4c2-minmax-fp32-sse41-ld64.c",
6327    "src/qs8-igemm/gen/4x4c2-minmax-fp32-sse41-ld128.c",
6328    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-sse41-ld64.c",
6329    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-sse41-ld128.c",
6330    "src/qs8-requantization/fp32-sse4.c",
6331    "src/qs8-requantization/gemmlowp-sse4.c",
6332    "src/qs8-requantization/rndna-sse4.c",
6333    "src/qs8-requantization/rndnu-sse4-sra.c",
6334    "src/qs8-requantization/rndnu-sse4-srl.c",
6335    "src/qs8-vadd/gen/minmax-sse41-mul16-ld64-x8.c",
6336    "src/qs8-vadd/gen/minmax-sse41-mul16-ld64-x16.c",
6337    "src/qs8-vadd/gen/minmax-sse41-mul16-ld64-x24.c",
6338    "src/qs8-vadd/gen/minmax-sse41-mul16-ld64-x32.c",
6339    "src/qs8-vadd/gen/minmax-sse41-mul32-ld32-x8.c",
6340    "src/qs8-vadd/gen/minmax-sse41-mul32-ld32-x16.c",
6341    "src/qs8-vadd/gen/minmax-sse41-mul32-ld32-x24.c",
6342    "src/qs8-vadd/gen/minmax-sse41-mul32-ld32-x32.c",
6343    "src/qs8-vaddc/gen/minmax-sse41-mul16-ld64-x8.c",
6344    "src/qs8-vaddc/gen/minmax-sse41-mul16-ld64-x16.c",
6345    "src/qs8-vaddc/gen/minmax-sse41-mul16-ld64-x24.c",
6346    "src/qs8-vaddc/gen/minmax-sse41-mul16-ld64-x32.c",
6347    "src/qs8-vaddc/gen/minmax-sse41-mul32-ld32-x8.c",
6348    "src/qs8-vaddc/gen/minmax-sse41-mul32-ld32-x16.c",
6349    "src/qs8-vaddc/gen/minmax-sse41-mul32-ld32-x24.c",
6350    "src/qs8-vaddc/gen/minmax-sse41-mul32-ld32-x32.c",
6351    "src/qs8-vcvt/gen/vcvt-sse41-x8.c",
6352    "src/qs8-vcvt/gen/vcvt-sse41-x16.c",
6353    "src/qs8-vcvt/gen/vcvt-sse41-x32.c",
6354    "src/qs8-vlrelu/gen/vlrelu-sse41-x8.c",
6355    "src/qs8-vlrelu/gen/vlrelu-sse41-x16.c",
6356    "src/qs8-vlrelu/gen/vlrelu-sse41-x32.c",
6357    "src/qs8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x8.c",
6358    "src/qs8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6359    "src/qs8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x8.c",
6360    "src/qs8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6361    "src/qu8-dwconv/gen/up8x9-minmax-fp32-sse41-mul16.c",
6362    "src/qu8-dwconv/gen/up8x9-minmax-fp32-sse41-mul32.c",
6363    "src/qu8-dwconv/gen/up8x25-minmax-fp32-sse41-mul16.c",
6364    "src/qu8-dwconv/gen/up8x25-minmax-fp32-sse41-mul32.c",
6365    "src/qu8-dwconv/gen/up16x9-minmax-fp32-sse41-mul16.c",
6366    "src/qu8-dwconv/gen/up16x9-minmax-fp32-sse41-mul32.c",
6367    "src/qu8-dwconv/gen/up16x25-minmax-fp32-sse41-mul16.c",
6368    "src/qu8-dwconv/gen/up16x25-minmax-fp32-sse41-mul32.c",
6369    "src/qu8-f32-vcvt/gen/vcvt-sse41-x8.c",
6370    "src/qu8-f32-vcvt/gen/vcvt-sse41-x16.c",
6371    "src/qu8-f32-vcvt/gen/vcvt-sse41-x24.c",
6372    "src/qu8-f32-vcvt/gen/vcvt-sse41-x32.c",
6373    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse41-c8.c",
6374    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse41-c16.c",
6375    "src/qu8-gavgpool/gen/7p7x-minmax-fp32-sse41-c24.c",
6376    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse41-c8.c",
6377    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse41-c16.c",
6378    "src/qu8-gavgpool/gen/7x-minmax-fp32-sse41-c24.c",
6379    "src/qu8-gemm/gen/1x4c2-minmax-fp32-sse41-ld64.c",
6380    "src/qu8-gemm/gen/1x4c2-minmax-fp32-sse41-ld128.c",
6381    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-sse41-ld64.c",
6382    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-sse41-ld128.c",
6383    "src/qu8-gemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6384    "src/qu8-gemm/gen/1x4c8-minmax-fp32-sse41-ld128.c",
6385    "src/qu8-gemm/gen/2x4c2-minmax-fp32-sse41-ld64.c",
6386    "src/qu8-gemm/gen/2x4c2-minmax-fp32-sse41-ld128.c",
6387    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-sse41-ld64.c",
6388    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-sse41-ld128.c",
6389    "src/qu8-gemm/gen/2x4c8-minmax-fp32-sse41-ld64.c",
6390    "src/qu8-gemm/gen/2x4c8-minmax-fp32-sse41-ld128.c",
6391    "src/qu8-gemm/gen/3x4c2-minmax-fp32-sse41-ld64.c",
6392    "src/qu8-gemm/gen/3x4c2-minmax-fp32-sse41-ld128.c",
6393    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-sse41-ld64.c",
6394    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-sse41-ld128.c",
6395    "src/qu8-gemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6396    "src/qu8-gemm/gen/3x4c8-minmax-fp32-sse41-ld128.c",
6397    "src/qu8-gemm/gen/4x4c2-minmax-fp32-sse41-ld64.c",
6398    "src/qu8-gemm/gen/4x4c2-minmax-fp32-sse41-ld128.c",
6399    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-sse41-ld64.c",
6400    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-sse41-ld128.c",
6401    "src/qu8-igemm/gen/1x4c2-minmax-fp32-sse41-ld64.c",
6402    "src/qu8-igemm/gen/1x4c2-minmax-fp32-sse41-ld128.c",
6403    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-sse41-ld64.c",
6404    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-sse41-ld128.c",
6405    "src/qu8-igemm/gen/1x4c8-minmax-fp32-sse41-ld64.c",
6406    "src/qu8-igemm/gen/1x4c8-minmax-fp32-sse41-ld128.c",
6407    "src/qu8-igemm/gen/2x4c2-minmax-fp32-sse41-ld64.c",
6408    "src/qu8-igemm/gen/2x4c2-minmax-fp32-sse41-ld128.c",
6409    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-sse41-ld64.c",
6410    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-sse41-ld128.c",
6411    "src/qu8-igemm/gen/2x4c8-minmax-fp32-sse41-ld64.c",
6412    "src/qu8-igemm/gen/2x4c8-minmax-fp32-sse41-ld128.c",
6413    "src/qu8-igemm/gen/3x4c2-minmax-fp32-sse41-ld64.c",
6414    "src/qu8-igemm/gen/3x4c2-minmax-fp32-sse41-ld128.c",
6415    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-sse41-ld64.c",
6416    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-sse41-ld128.c",
6417    "src/qu8-igemm/gen/3x4c8-minmax-fp32-sse41-ld64.c",
6418    "src/qu8-igemm/gen/3x4c8-minmax-fp32-sse41-ld128.c",
6419    "src/qu8-igemm/gen/4x4c2-minmax-fp32-sse41-ld64.c",
6420    "src/qu8-igemm/gen/4x4c2-minmax-fp32-sse41-ld128.c",
6421    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-sse41-ld64.c",
6422    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-sse41-ld128.c",
6423    "src/qu8-requantization/gemmlowp-sse4.c",
6424    "src/qu8-requantization/rndna-sse4.c",
6425    "src/qu8-vadd/gen/minmax-sse41-mul16-ld64-x8.c",
6426    "src/qu8-vadd/gen/minmax-sse41-mul16-ld64-x16.c",
6427    "src/qu8-vadd/gen/minmax-sse41-mul32-ld32-x8.c",
6428    "src/qu8-vadd/gen/minmax-sse41-mul32-ld32-x16.c",
6429    "src/qu8-vaddc/gen/minmax-sse41-mul16-ld64-x8.c",
6430    "src/qu8-vaddc/gen/minmax-sse41-mul16-ld64-x16.c",
6431    "src/qu8-vaddc/gen/minmax-sse41-mul32-ld32-x8.c",
6432    "src/qu8-vaddc/gen/minmax-sse41-mul32-ld32-x16.c",
6433    "src/qu8-vcvt/gen/vcvt-sse41-x8.c",
6434    "src/qu8-vcvt/gen/vcvt-sse41-x16.c",
6435    "src/qu8-vcvt/gen/vcvt-sse41-x32.c",
6436    "src/qu8-vlrelu/gen/vlrelu-sse41-x8.c",
6437    "src/qu8-vlrelu/gen/vlrelu-sse41-x16.c",
6438    "src/qu8-vlrelu/gen/vlrelu-sse41-x32.c",
6439    "src/qu8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x8.c",
6440    "src/qu8-vmul/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6441    "src/qu8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x8.c",
6442    "src/qu8-vmulc/gen/minmax-fp32-sse41-mul16-ld64-x16.c",
6443    "src/s8-ibilinear/gen/sse41-c8.c",
6444    "src/s8-ibilinear/gen/sse41-c16.c",
6445    "src/s8-maxpool/9p8x-minmax-sse41-c16.c",
6446    "src/s8-vclamp/sse41-x64.c",
6447    "src/u8-ibilinear/gen/sse41-c8.c",
6448    "src/u8-ibilinear/gen/sse41-c16.c",
6449]
6450
// PROD_AVX_MICROKERNEL_SRCS: list of microkernel source files whose paths all
// carry an "avx" tag, covering the f16/f32, qc8, qs8, qu8 and x8 directories.
// NOTE(review): the PROD_ prefix suggests this is the subset picked for
// production builds, in contrast to ALL_AVX_MICROKERNEL_SRCS defined right
// after it -- confirm against the modules that consume this variable.
// Entries are ordered by path using numeric-aware ordering (for example
// "up8x25" sorts before "up16x3"); keep that ordering when adding files.
6451PROD_AVX_MICROKERNEL_SRCS = [
6452    "src/f16-f32-vcvt/gen/vcvt-avx-int16-x16.c",
6453    "src/f32-dwconv/gen/up8x25-minmax-avx.c",
6454    "src/f32-dwconv/gen/up16x3-minmax-avx.c",
6455    "src/f32-dwconv/gen/up16x4-minmax-avx.c",
6456    "src/f32-dwconv/gen/up16x9-minmax-avx.c",
6457    "src/f32-f16-vcvt/gen/vcvt-avx-x24.c",
6458    "src/f32-gemm/gen/1x16-minmax-avx-broadcast.c",
6459    "src/f32-gemm/gen/5x16-minmax-avx-broadcast.c",
6460    "src/f32-igemm/gen/1x16-minmax-avx-broadcast.c",
6461    "src/f32-igemm/gen/5x16-minmax-avx-broadcast.c",
6462    "src/f32-prelu/gen/avx-2x16.c",
6463    "src/f32-qs8-vcvt/gen/vcvt-avx-x32.c",
6464    "src/f32-qu8-vcvt/gen/vcvt-avx-x32.c",
6465    "src/f32-vbinary/gen/vadd-minmax-avx-x16.c",
6466    "src/f32-vbinary/gen/vaddc-minmax-avx-x16.c",
6467    "src/f32-vbinary/gen/vdiv-minmax-avx-x16.c",
6468    "src/f32-vbinary/gen/vdivc-minmax-avx-x16.c",
6469    "src/f32-vbinary/gen/vmax-avx-x16.c",
6470    "src/f32-vbinary/gen/vmaxc-avx-x16.c",
6471    "src/f32-vbinary/gen/vmin-avx-x16.c",
6472    "src/f32-vbinary/gen/vminc-avx-x16.c",
6473    "src/f32-vbinary/gen/vmul-minmax-avx-x16.c",
6474    "src/f32-vbinary/gen/vmulc-minmax-avx-x16.c",
6475    "src/f32-vbinary/gen/vrdivc-minmax-avx-x16.c",
6476    "src/f32-vbinary/gen/vrsubc-minmax-avx-x16.c",
6477    "src/f32-vbinary/gen/vsqrdiff-avx-x16.c",
6478    "src/f32-vbinary/gen/vsqrdiffc-avx-x16.c",
6479    "src/f32-vbinary/gen/vsub-minmax-avx-x16.c",
6480    "src/f32-vbinary/gen/vsubc-minmax-avx-x16.c",
6481    "src/f32-vclamp/gen/vclamp-avx-x16.c",
6482    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x32.c",
6483    "src/f32-vhswish/gen/vhswish-avx-x16.c",
6484    "src/f32-vlrelu/gen/vlrelu-avx-x16.c",
6485    "src/f32-vrnd/gen/vrndd-avx-x16.c",
6486    "src/f32-vrnd/gen/vrndne-avx-x16.c",
6487    "src/f32-vrnd/gen/vrndu-avx-x16.c",
6488    "src/f32-vrnd/gen/vrndz-avx-x16.c",
6489    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x40.c",
6490    "src/f32-vsqrt/gen/avx-sqrt-x8.c",
6491    "src/f32-vunary/gen/vabs-avx-x16.c",
6492    "src/f32-vunary/gen/vneg-avx-x16.c",
6493    "src/f32-vunary/gen/vsqr-avx-x16.c",
6494    "src/qc8-dwconv/gen/up16x3-minmax-fp32-avx-mul16-add16.c",
6495    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx-mul16-add16.c",
6496    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx-mul16-add16.c",
6497    "src/qc8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6498    "src/qc8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6499    "src/qc8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6500    "src/qc8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6501    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx-mul16-add16.c",
6502    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx-mul16-add16.c",
6503    "src/qs8-f32-vcvt/gen/vcvt-avx-x32.c",
6504    "src/qs8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6505    "src/qs8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6506    "src/qs8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6507    "src/qs8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6508    "src/qs8-vadd/gen/minmax-avx-mul32-ld32-x8.c",
6509    "src/qs8-vaddc/gen/minmax-avx-mul32-ld32-x8.c",
6510    "src/qs8-vcvt/gen/vcvt-avx-x32.c",
6511    "src/qs8-vlrelu/gen/vlrelu-avx-x32.c",
6512    "src/qs8-vmul/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6513    "src/qs8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6514    "src/qu8-dwconv/gen/up16x9-minmax-fp32-avx-mul16.c",
6515    "src/qu8-dwconv/gen/up16x25-minmax-fp32-avx-mul16.c",
6516    "src/qu8-f32-vcvt/gen/vcvt-avx-x32.c",
6517    "src/qu8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6518    "src/qu8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6519    "src/qu8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6520    "src/qu8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6521    "src/qu8-vadd/gen/minmax-avx-mul32-ld32-x8.c",
6522    "src/qu8-vaddc/gen/minmax-avx-mul32-ld32-x8.c",
6523    "src/qu8-vcvt/gen/vcvt-avx-x32.c",
6524    "src/qu8-vlrelu/gen/vlrelu-avx-x32.c",
6525    "src/qu8-vmul/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6526    "src/qu8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6527    "src/x8-lut/gen/lut-avx-x64.c",
6528]
6529
6530ALL_AVX_MICROKERNEL_SRCS = [
6531    "src/f16-f32-vcvt/gen/vcvt-avx-int16-x8.c",
6532    "src/f16-f32-vcvt/gen/vcvt-avx-int16-x16.c",
6533    "src/f16-f32-vcvt/gen/vcvt-avx-int16-x24.c",
6534    "src/f16-f32-vcvt/gen/vcvt-avx-int16-x32.c",
6535    "src/f16-f32-vcvt/gen/vcvt-avx-int32-x8.c",
6536    "src/f16-f32-vcvt/gen/vcvt-avx-int32-x16.c",
6537    "src/f16-f32-vcvt/gen/vcvt-avx-int32-x24.c",
6538    "src/f16-f32-vcvt/gen/vcvt-avx-int32-x32.c",
6539    "src/f32-dwconv/gen/up8x3-minmax-avx-acc2.c",
6540    "src/f32-dwconv/gen/up8x3-minmax-avx.c",
6541    "src/f32-dwconv/gen/up8x4-minmax-avx-acc2.c",
6542    "src/f32-dwconv/gen/up8x4-minmax-avx.c",
6543    "src/f32-dwconv/gen/up8x9-minmax-avx-acc2.c",
6544    "src/f32-dwconv/gen/up8x9-minmax-avx.c",
6545    "src/f32-dwconv/gen/up8x25-minmax-avx-acc2.c",
6546    "src/f32-dwconv/gen/up8x25-minmax-avx.c",
6547    "src/f32-dwconv/gen/up16x3-minmax-avx-acc2.c",
6548    "src/f32-dwconv/gen/up16x3-minmax-avx.c",
6549    "src/f32-dwconv/gen/up16x4-minmax-avx-acc2.c",
6550    "src/f32-dwconv/gen/up16x4-minmax-avx.c",
6551    "src/f32-dwconv/gen/up16x9-minmax-avx-acc2.c",
6552    "src/f32-dwconv/gen/up16x9-minmax-avx.c",
6553    "src/f32-dwconv/gen/up16x25-minmax-avx-acc2.c",
6554    "src/f32-dwconv/gen/up16x25-minmax-avx.c",
6555    "src/f32-f16-vcvt/gen/vcvt-avx-x8.c",
6556    "src/f32-f16-vcvt/gen/vcvt-avx-x16.c",
6557    "src/f32-f16-vcvt/gen/vcvt-avx-x24.c",
6558    "src/f32-f16-vcvt/gen/vcvt-avx-x32.c",
6559    "src/f32-gemm/gen-inc/1x8inc-minmax-avx-broadcast.c",
6560    "src/f32-gemm/gen-inc/1x16inc-minmax-avx-broadcast.c",
6561    "src/f32-gemm/gen-inc/3x16inc-minmax-avx-broadcast.c",
6562    "src/f32-gemm/gen-inc/4x8inc-minmax-avx-broadcast.c",
6563    "src/f32-gemm/gen-inc/4x16inc-minmax-avx-broadcast.c",
6564    "src/f32-gemm/gen-inc/5x8inc-minmax-avx-broadcast.c",
6565    "src/f32-gemm/gen-inc/5x16inc-minmax-avx-broadcast.c",
6566    "src/f32-gemm/gen-inc/6x8inc-minmax-avx-broadcast.c",
6567    "src/f32-gemm/gen-inc/7x8inc-minmax-avx-broadcast.c",
6568    "src/f32-gemm/gen/1x8-minmax-avx-broadcast.c",
6569    "src/f32-gemm/gen/1x16-minmax-avx-broadcast.c",
6570    "src/f32-gemm/gen/3x16-minmax-avx-broadcast.c",
6571    "src/f32-gemm/gen/4x8-minmax-avx-broadcast.c",
6572    "src/f32-gemm/gen/4x16-minmax-avx-broadcast.c",
6573    "src/f32-gemm/gen/5x8-minmax-avx-broadcast.c",
6574    "src/f32-gemm/gen/5x16-minmax-avx-broadcast.c",
6575    "src/f32-gemm/gen/6x8-minmax-avx-broadcast.c",
6576    "src/f32-gemm/gen/7x8-minmax-avx-broadcast.c",
6577    "src/f32-igemm/gen/1x8-minmax-avx-broadcast.c",
6578    "src/f32-igemm/gen/1x16-minmax-avx-broadcast.c",
6579    "src/f32-igemm/gen/3x16-minmax-avx-broadcast.c",
6580    "src/f32-igemm/gen/4x8-minmax-avx-broadcast.c",
6581    "src/f32-igemm/gen/4x16-minmax-avx-broadcast.c",
6582    "src/f32-igemm/gen/5x8-minmax-avx-broadcast.c",
6583    "src/f32-igemm/gen/5x16-minmax-avx-broadcast.c",
6584    "src/f32-igemm/gen/6x8-minmax-avx-broadcast.c",
6585    "src/f32-igemm/gen/7x8-minmax-avx-broadcast.c",
6586    "src/f32-prelu/gen/avx-2x8.c",
6587    "src/f32-prelu/gen/avx-2x16.c",
6588    "src/f32-qs8-vcvt/gen/vcvt-avx-x8.c",
6589    "src/f32-qs8-vcvt/gen/vcvt-avx-x16.c",
6590    "src/f32-qs8-vcvt/gen/vcvt-avx-x24.c",
6591    "src/f32-qs8-vcvt/gen/vcvt-avx-x32.c",
6592    "src/f32-qu8-vcvt/gen/vcvt-avx-x8.c",
6593    "src/f32-qu8-vcvt/gen/vcvt-avx-x16.c",
6594    "src/f32-qu8-vcvt/gen/vcvt-avx-x24.c",
6595    "src/f32-qu8-vcvt/gen/vcvt-avx-x32.c",
6596    "src/f32-rmax/avx.c",
6597    "src/f32-vbinary/gen/vadd-minmax-avx-x8.c",
6598    "src/f32-vbinary/gen/vadd-minmax-avx-x16.c",
6599    "src/f32-vbinary/gen/vaddc-minmax-avx-x8.c",
6600    "src/f32-vbinary/gen/vaddc-minmax-avx-x16.c",
6601    "src/f32-vbinary/gen/vdiv-minmax-avx-x8.c",
6602    "src/f32-vbinary/gen/vdiv-minmax-avx-x16.c",
6603    "src/f32-vbinary/gen/vdivc-minmax-avx-x8.c",
6604    "src/f32-vbinary/gen/vdivc-minmax-avx-x16.c",
6605    "src/f32-vbinary/gen/vmax-avx-x8.c",
6606    "src/f32-vbinary/gen/vmax-avx-x16.c",
6607    "src/f32-vbinary/gen/vmaxc-avx-x8.c",
6608    "src/f32-vbinary/gen/vmaxc-avx-x16.c",
6609    "src/f32-vbinary/gen/vmin-avx-x8.c",
6610    "src/f32-vbinary/gen/vmin-avx-x16.c",
6611    "src/f32-vbinary/gen/vminc-avx-x8.c",
6612    "src/f32-vbinary/gen/vminc-avx-x16.c",
6613    "src/f32-vbinary/gen/vmul-minmax-avx-x8.c",
6614    "src/f32-vbinary/gen/vmul-minmax-avx-x16.c",
6615    "src/f32-vbinary/gen/vmulc-minmax-avx-x8.c",
6616    "src/f32-vbinary/gen/vmulc-minmax-avx-x16.c",
6617    "src/f32-vbinary/gen/vrdivc-minmax-avx-x8.c",
6618    "src/f32-vbinary/gen/vrdivc-minmax-avx-x16.c",
6619    "src/f32-vbinary/gen/vrsubc-minmax-avx-x8.c",
6620    "src/f32-vbinary/gen/vrsubc-minmax-avx-x16.c",
6621    "src/f32-vbinary/gen/vsqrdiff-avx-x8.c",
6622    "src/f32-vbinary/gen/vsqrdiff-avx-x16.c",
6623    "src/f32-vbinary/gen/vsqrdiffc-avx-x8.c",
6624    "src/f32-vbinary/gen/vsqrdiffc-avx-x16.c",
6625    "src/f32-vbinary/gen/vsub-minmax-avx-x8.c",
6626    "src/f32-vbinary/gen/vsub-minmax-avx-x16.c",
6627    "src/f32-vbinary/gen/vsubc-minmax-avx-x8.c",
6628    "src/f32-vbinary/gen/vsubc-minmax-avx-x16.c",
6629    "src/f32-vclamp/gen/vclamp-avx-x8.c",
6630    "src/f32-vclamp/gen/vclamp-avx-x16.c",
6631    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x8.c",
6632    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x16.c",
6633    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x24.c",
6634    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x32.c",
6635    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x40.c",
6636    "src/f32-velu/gen/velu-avx-rr2-lut4-p4-perm-x48.c",
6637    "src/f32-velu/gen/velu-avx-rr2-lut16-p3-x8.c",
6638    "src/f32-velu/gen/velu-avx-rr2-lut16-p3-x16.c",
6639    "src/f32-velu/gen/velu-avx-rr2-lut16-p3-x24.c",
6640    "src/f32-velu/gen/velu-avx-rr2-lut16-p3-x32.c",
6641    "src/f32-velu/gen/velu-avx-rr2-lut16-p3-x40.c",
6642    "src/f32-velu/gen/velu-avx-rr2-lut16-p3-x48.c",
6643    "src/f32-velu/gen/velu-avx-rr2-p6-x8.c",
6644    "src/f32-velu/gen/velu-avx-rr2-p6-x16.c",
6645    "src/f32-velu/gen/velu-avx-rr2-p6-x24.c",
6646    "src/f32-velu/gen/velu-avx-rr2-p6-x32.c",
6647    "src/f32-velu/gen/velu-avx-rr2-p6-x40.c",
6648    "src/f32-velu/gen/velu-avx-rr2-p6-x48.c",
6649    "src/f32-vhswish/gen/vhswish-avx-x8.c",
6650    "src/f32-vhswish/gen/vhswish-avx-x16.c",
6651    "src/f32-vlrelu/gen/vlrelu-avx-x8.c",
6652    "src/f32-vlrelu/gen/vlrelu-avx-x16.c",
6653    "src/f32-vrelu/gen/vrelu-avx-x8.c",
6654    "src/f32-vrelu/gen/vrelu-avx-x16.c",
6655    "src/f32-vrnd/gen/vrndd-avx-x8.c",
6656    "src/f32-vrnd/gen/vrndd-avx-x16.c",
6657    "src/f32-vrnd/gen/vrndne-avx-x8.c",
6658    "src/f32-vrnd/gen/vrndne-avx-x16.c",
6659    "src/f32-vrnd/gen/vrndu-avx-x8.c",
6660    "src/f32-vrnd/gen/vrndu-avx-x16.c",
6661    "src/f32-vrnd/gen/vrndz-avx-x8.c",
6662    "src/f32-vrnd/gen/vrndz-avx-x16.c",
6663    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x8.c",
6664    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x16.c",
6665    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x24.c",
6666    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x32.c",
6667    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x40.c",
6668    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x48.c",
6669    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x56.c",
6670    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x64.c",
6671    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x72.c",
6672    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-div-x80.c",
6673    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x8.c",
6674    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x16.c",
6675    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x24.c",
6676    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x32.c",
6677    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x40.c",
6678    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x48.c",
6679    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x56.c",
6680    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x64.c",
6681    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x72.c",
6682    "src/f32-vsigmoid/gen/vsigmoid-avx-rr2-p5-nr2-x80.c",
6683    "src/f32-vsqrt/gen/avx-sqrt-x8.c",
6684    "src/f32-vsqrt/gen/avx-sqrt-x16.c",
6685    "src/f32-vunary/gen/vabs-avx-x8.c",
6686    "src/f32-vunary/gen/vabs-avx-x16.c",
6687    "src/f32-vunary/gen/vneg-avx-x8.c",
6688    "src/f32-vunary/gen/vneg-avx-x16.c",
6689    "src/f32-vunary/gen/vsqr-avx-x8.c",
6690    "src/f32-vunary/gen/vsqr-avx-x16.c",
6691    "src/math/exp-f32-avx-rr2-p5.c",
6692    "src/math/expm1minus-f32-avx-rr2-lut4-p4-perm.c",
6693    "src/math/expm1minus-f32-avx-rr2-lut16-p3.c",
6694    "src/math/expm1minus-f32-avx-rr2-p6.c",
6695    "src/math/sigmoid-f32-avx-rr2-lut64-p2-div.c",
6696    "src/math/sigmoid-f32-avx-rr2-p5-div.c",
6697    "src/math/sigmoid-f32-avx-rr2-p5-nr1.c",
6698    "src/math/sigmoid-f32-avx-rr2-p5-nr2.c",
6699    "src/qc8-dwconv/gen/up8x9-minmax-fp32-avx-mul16-add16.c",
6700    "src/qc8-dwconv/gen/up8x9-minmax-fp32-avx-mul16.c",
6701    "src/qc8-dwconv/gen/up8x9-minmax-fp32-avx-mul32.c",
6702    "src/qc8-dwconv/gen/up8x25-minmax-fp32-avx-mul16-add16.c",
6703    "src/qc8-dwconv/gen/up8x25-minmax-fp32-avx-mul16.c",
6704    "src/qc8-dwconv/gen/up8x25-minmax-fp32-avx-mul32.c",
6705    "src/qc8-dwconv/gen/up16x3-minmax-fp32-avx-mul16-add16.c",
6706    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx-mul16-add16.c",
6707    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx-mul16.c",
6708    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx-mul32.c",
6709    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx-mul16-add16.c",
6710    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx-mul16.c",
6711    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx-mul32.c",
6712    "src/qc8-dwconv/gen/up24x9-minmax-fp32-avx-mul16.c",
6713    "src/qc8-dwconv/gen/up24x9-minmax-fp32-avx-mul32.c",
6714    "src/qc8-dwconv/gen/up24x25-minmax-fp32-avx-mul16.c",
6715    "src/qc8-dwconv/gen/up24x25-minmax-fp32-avx-mul32.c",
6716    "src/qc8-gemm/gen/1x4c2-minmax-fp32-avx-ld64.c",
6717    "src/qc8-gemm/gen/1x4c2-minmax-fp32-avx-ld128.c",
6718    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-avx-ld64.c",
6719    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-avx-ld128.c",
6720    "src/qc8-gemm/gen/1x4c8-minmax-fp32-avx-ld64.c",
6721    "src/qc8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6722    "src/qc8-gemm/gen/2x4c2-minmax-fp32-avx-ld64.c",
6723    "src/qc8-gemm/gen/2x4c2-minmax-fp32-avx-ld128.c",
6724    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-avx-ld64.c",
6725    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-avx-ld128.c",
6726    "src/qc8-gemm/gen/2x4c8-minmax-fp32-avx-ld64.c",
6727    "src/qc8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6728    "src/qc8-gemm/gen/3x4c2-minmax-fp32-avx-ld64.c",
6729    "src/qc8-gemm/gen/3x4c2-minmax-fp32-avx-ld128.c",
6730    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-avx-ld64.c",
6731    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-avx-ld128.c",
6732    "src/qc8-gemm/gen/3x4c8-minmax-fp32-avx-ld64.c",
6733    "src/qc8-gemm/gen/3x4c8-minmax-fp32-avx-ld128.c",
6734    "src/qc8-gemm/gen/4x4c2-minmax-fp32-avx-ld64.c",
6735    "src/qc8-gemm/gen/4x4c2-minmax-fp32-avx-ld128.c",
6736    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-avx-ld64.c",
6737    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-avx-ld128.c",
6738    "src/qc8-igemm/gen/1x4c2-minmax-fp32-avx-ld64.c",
6739    "src/qc8-igemm/gen/1x4c2-minmax-fp32-avx-ld128.c",
6740    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-avx-ld64.c",
6741    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-avx-ld128.c",
6742    "src/qc8-igemm/gen/1x4c8-minmax-fp32-avx-ld64.c",
6743    "src/qc8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6744    "src/qc8-igemm/gen/2x4c2-minmax-fp32-avx-ld64.c",
6745    "src/qc8-igemm/gen/2x4c2-minmax-fp32-avx-ld128.c",
6746    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-avx-ld64.c",
6747    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-avx-ld128.c",
6748    "src/qc8-igemm/gen/2x4c8-minmax-fp32-avx-ld64.c",
6749    "src/qc8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6750    "src/qc8-igemm/gen/3x4c2-minmax-fp32-avx-ld64.c",
6751    "src/qc8-igemm/gen/3x4c2-minmax-fp32-avx-ld128.c",
6752    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-avx-ld64.c",
6753    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-avx-ld128.c",
6754    "src/qc8-igemm/gen/3x4c8-minmax-fp32-avx-ld64.c",
6755    "src/qc8-igemm/gen/3x4c8-minmax-fp32-avx-ld128.c",
6756    "src/qc8-igemm/gen/4x4c2-minmax-fp32-avx-ld64.c",
6757    "src/qc8-igemm/gen/4x4c2-minmax-fp32-avx-ld128.c",
6758    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-avx-ld64.c",
6759    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-avx-ld128.c",
6760    "src/qs8-dwconv/gen/up8x9-minmax-fp32-avx-mul16-add16.c",
6761    "src/qs8-dwconv/gen/up8x9-minmax-fp32-avx-mul16.c",
6762    "src/qs8-dwconv/gen/up8x9-minmax-fp32-avx-mul32.c",
6763    "src/qs8-dwconv/gen/up8x25-minmax-fp32-avx-mul16-add16.c",
6764    "src/qs8-dwconv/gen/up8x25-minmax-fp32-avx-mul16.c",
6765    "src/qs8-dwconv/gen/up8x25-minmax-fp32-avx-mul32.c",
6766    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx-mul16-add16.c",
6767    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx-mul16.c",
6768    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx-mul32.c",
6769    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx-mul16-add16.c",
6770    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx-mul16.c",
6771    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx-mul32.c",
6772    "src/qs8-dwconv/gen/up24x9-minmax-fp32-avx-mul16.c",
6773    "src/qs8-dwconv/gen/up24x9-minmax-fp32-avx-mul32.c",
6774    "src/qs8-dwconv/gen/up24x25-minmax-fp32-avx-mul16.c",
6775    "src/qs8-dwconv/gen/up24x25-minmax-fp32-avx-mul32.c",
6776    "src/qs8-f32-vcvt/gen/vcvt-avx-x8.c",
6777    "src/qs8-f32-vcvt/gen/vcvt-avx-x16.c",
6778    "src/qs8-f32-vcvt/gen/vcvt-avx-x24.c",
6779    "src/qs8-f32-vcvt/gen/vcvt-avx-x32.c",
6780    "src/qs8-gemm/gen/1x4c2-minmax-fp32-avx-ld64.c",
6781    "src/qs8-gemm/gen/1x4c2-minmax-fp32-avx-ld128.c",
6782    "src/qs8-gemm/gen/1x4c2-xw-minmax-fp32-avx.c",
6783    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-avx-ld64.c",
6784    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-avx-ld128.c",
6785    "src/qs8-gemm/gen/1x4c2s4-xw-minmax-fp32-avx.c",
6786    "src/qs8-gemm/gen/1x4c8-minmax-fp32-avx-ld64.c",
6787    "src/qs8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6788    "src/qs8-gemm/gen/1x4c8-xw-minmax-fp32-avx.c",
6789    "src/qs8-gemm/gen/2x4c2-minmax-fp32-avx-ld64.c",
6790    "src/qs8-gemm/gen/2x4c2-minmax-fp32-avx-ld128.c",
6791    "src/qs8-gemm/gen/2x4c2-xw-minmax-fp32-avx.c",
6792    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-avx-ld64.c",
6793    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-avx-ld128.c",
6794    "src/qs8-gemm/gen/2x4c2s4-xw-minmax-fp32-avx.c",
6795    "src/qs8-gemm/gen/2x4c8-minmax-fp32-avx-ld64.c",
6796    "src/qs8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6797    "src/qs8-gemm/gen/2x4c8-xw-minmax-fp32-avx.c",
6798    "src/qs8-gemm/gen/3x4c2-minmax-fp32-avx-ld64.c",
6799    "src/qs8-gemm/gen/3x4c2-minmax-fp32-avx-ld128.c",
6800    "src/qs8-gemm/gen/3x4c2-xw-minmax-fp32-avx.c",
6801    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-avx-ld64.c",
6802    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-avx-ld128.c",
6803    "src/qs8-gemm/gen/3x4c2s4-xw-minmax-fp32-avx.c",
6804    "src/qs8-gemm/gen/3x4c8-minmax-fp32-avx-ld64.c",
6805    "src/qs8-gemm/gen/3x4c8-minmax-fp32-avx-ld128.c",
6806    "src/qs8-gemm/gen/3x4c8-xw-minmax-fp32-avx.c",
6807    "src/qs8-gemm/gen/4x4c2-minmax-fp32-avx-ld64.c",
6808    "src/qs8-gemm/gen/4x4c2-minmax-fp32-avx-ld128.c",
6809    "src/qs8-gemm/gen/4x4c2-xw-minmax-fp32-avx.c",
6810    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-avx-ld64.c",
6811    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-avx-ld128.c",
6812    "src/qs8-gemm/gen/4x4c2s4-xw-minmax-fp32-avx.c",
6813    "src/qs8-igemm/gen/1x4c2-minmax-fp32-avx-ld64.c",
6814    "src/qs8-igemm/gen/1x4c2-minmax-fp32-avx-ld128.c",
6815    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-avx-ld64.c",
6816    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-avx-ld128.c",
6817    "src/qs8-igemm/gen/1x4c8-minmax-fp32-avx-ld64.c",
6818    "src/qs8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6819    "src/qs8-igemm/gen/2x4c2-minmax-fp32-avx-ld64.c",
6820    "src/qs8-igemm/gen/2x4c2-minmax-fp32-avx-ld128.c",
6821    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-avx-ld64.c",
6822    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-avx-ld128.c",
6823    "src/qs8-igemm/gen/2x4c8-minmax-fp32-avx-ld64.c",
6824    "src/qs8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6825    "src/qs8-igemm/gen/3x4c2-minmax-fp32-avx-ld64.c",
6826    "src/qs8-igemm/gen/3x4c2-minmax-fp32-avx-ld128.c",
6827    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-avx-ld64.c",
6828    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-avx-ld128.c",
6829    "src/qs8-igemm/gen/3x4c8-minmax-fp32-avx-ld64.c",
6830    "src/qs8-igemm/gen/3x4c8-minmax-fp32-avx-ld128.c",
6831    "src/qs8-igemm/gen/4x4c2-minmax-fp32-avx-ld64.c",
6832    "src/qs8-igemm/gen/4x4c2-minmax-fp32-avx-ld128.c",
6833    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-avx-ld64.c",
6834    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-avx-ld128.c",
6835    "src/qs8-vadd/gen/minmax-avx-mul16-ld64-x8.c",
6836    "src/qs8-vadd/gen/minmax-avx-mul16-ld64-x16.c",
6837    "src/qs8-vadd/gen/minmax-avx-mul16-ld64-x24.c",
6838    "src/qs8-vadd/gen/minmax-avx-mul16-ld64-x32.c",
6839    "src/qs8-vadd/gen/minmax-avx-mul32-ld32-x8.c",
6840    "src/qs8-vadd/gen/minmax-avx-mul32-ld32-x16.c",
6841    "src/qs8-vadd/gen/minmax-avx-mul32-ld32-x24.c",
6842    "src/qs8-vadd/gen/minmax-avx-mul32-ld32-x32.c",
6843    "src/qs8-vaddc/gen/minmax-avx-mul16-ld64-x8.c",
6844    "src/qs8-vaddc/gen/minmax-avx-mul16-ld64-x16.c",
6845    "src/qs8-vaddc/gen/minmax-avx-mul16-ld64-x24.c",
6846    "src/qs8-vaddc/gen/minmax-avx-mul16-ld64-x32.c",
6847    "src/qs8-vaddc/gen/minmax-avx-mul32-ld32-x8.c",
6848    "src/qs8-vaddc/gen/minmax-avx-mul32-ld32-x16.c",
6849    "src/qs8-vaddc/gen/minmax-avx-mul32-ld32-x24.c",
6850    "src/qs8-vaddc/gen/minmax-avx-mul32-ld32-x32.c",
6851    "src/qs8-vcvt/gen/vcvt-avx-x8.c",
6852    "src/qs8-vcvt/gen/vcvt-avx-x16.c",
6853    "src/qs8-vcvt/gen/vcvt-avx-x32.c",
6854    "src/qs8-vlrelu/gen/vlrelu-avx-x8.c",
6855    "src/qs8-vlrelu/gen/vlrelu-avx-x16.c",
6856    "src/qs8-vlrelu/gen/vlrelu-avx-x32.c",
6857    "src/qs8-vmul/gen/minmax-fp32-avx-mul16-ld64-x8.c",
6858    "src/qs8-vmul/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6859    "src/qs8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x8.c",
6860    "src/qs8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6861    "src/qu8-dwconv/gen/up8x9-minmax-fp32-avx-mul16.c",
6862    "src/qu8-dwconv/gen/up8x9-minmax-fp32-avx-mul32.c",
6863    "src/qu8-dwconv/gen/up8x25-minmax-fp32-avx-mul16.c",
6864    "src/qu8-dwconv/gen/up8x25-minmax-fp32-avx-mul32.c",
6865    "src/qu8-dwconv/gen/up16x9-minmax-fp32-avx-mul16.c",
6866    "src/qu8-dwconv/gen/up16x9-minmax-fp32-avx-mul32.c",
6867    "src/qu8-dwconv/gen/up16x25-minmax-fp32-avx-mul16.c",
6868    "src/qu8-dwconv/gen/up16x25-minmax-fp32-avx-mul32.c",
6869    "src/qu8-f32-vcvt/gen/vcvt-avx-x8.c",
6870    "src/qu8-f32-vcvt/gen/vcvt-avx-x16.c",
6871    "src/qu8-f32-vcvt/gen/vcvt-avx-x24.c",
6872    "src/qu8-f32-vcvt/gen/vcvt-avx-x32.c",
6873    "src/qu8-gemm/gen/1x4c2-minmax-fp32-avx-ld64.c",
6874    "src/qu8-gemm/gen/1x4c2-minmax-fp32-avx-ld128.c",
6875    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-avx-ld64.c",
6876    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-avx-ld128.c",
6877    "src/qu8-gemm/gen/1x4c8-minmax-fp32-avx-ld64.c",
6878    "src/qu8-gemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6879    "src/qu8-gemm/gen/2x4c2-minmax-fp32-avx-ld64.c",
6880    "src/qu8-gemm/gen/2x4c2-minmax-fp32-avx-ld128.c",
6881    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-avx-ld64.c",
6882    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-avx-ld128.c",
6883    "src/qu8-gemm/gen/2x4c8-minmax-fp32-avx-ld64.c",
6884    "src/qu8-gemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6885    "src/qu8-gemm/gen/3x4c2-minmax-fp32-avx-ld64.c",
6886    "src/qu8-gemm/gen/3x4c2-minmax-fp32-avx-ld128.c",
6887    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-avx-ld64.c",
6888    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-avx-ld128.c",
6889    "src/qu8-gemm/gen/3x4c8-minmax-fp32-avx-ld64.c",
6890    "src/qu8-gemm/gen/3x4c8-minmax-fp32-avx-ld128.c",
6891    "src/qu8-gemm/gen/4x4c2-minmax-fp32-avx-ld64.c",
6892    "src/qu8-gemm/gen/4x4c2-minmax-fp32-avx-ld128.c",
6893    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-avx-ld64.c",
6894    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-avx-ld128.c",
6895    "src/qu8-igemm/gen/1x4c2-minmax-fp32-avx-ld64.c",
6896    "src/qu8-igemm/gen/1x4c2-minmax-fp32-avx-ld128.c",
6897    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-avx-ld64.c",
6898    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-avx-ld128.c",
6899    "src/qu8-igemm/gen/1x4c8-minmax-fp32-avx-ld64.c",
6900    "src/qu8-igemm/gen/1x4c8-minmax-fp32-avx-ld128.c",
6901    "src/qu8-igemm/gen/2x4c2-minmax-fp32-avx-ld64.c",
6902    "src/qu8-igemm/gen/2x4c2-minmax-fp32-avx-ld128.c",
6903    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-avx-ld64.c",
6904    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-avx-ld128.c",
6905    "src/qu8-igemm/gen/2x4c8-minmax-fp32-avx-ld64.c",
6906    "src/qu8-igemm/gen/2x4c8-minmax-fp32-avx-ld128.c",
6907    "src/qu8-igemm/gen/3x4c2-minmax-fp32-avx-ld64.c",
6908    "src/qu8-igemm/gen/3x4c2-minmax-fp32-avx-ld128.c",
6909    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-avx-ld64.c",
6910    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-avx-ld128.c",
6911    "src/qu8-igemm/gen/3x4c8-minmax-fp32-avx-ld64.c",
6912    "src/qu8-igemm/gen/3x4c8-minmax-fp32-avx-ld128.c",
6913    "src/qu8-igemm/gen/4x4c2-minmax-fp32-avx-ld64.c",
6914    "src/qu8-igemm/gen/4x4c2-minmax-fp32-avx-ld128.c",
6915    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-avx-ld64.c",
6916    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-avx-ld128.c",
6917    "src/qu8-vadd/gen/minmax-avx-mul16-ld64-x8.c",
6918    "src/qu8-vadd/gen/minmax-avx-mul16-ld64-x16.c",
6919    "src/qu8-vadd/gen/minmax-avx-mul32-ld32-x8.c",
6920    "src/qu8-vadd/gen/minmax-avx-mul32-ld32-x16.c",
6921    "src/qu8-vaddc/gen/minmax-avx-mul16-ld64-x8.c",
6922    "src/qu8-vaddc/gen/minmax-avx-mul16-ld64-x16.c",
6923    "src/qu8-vaddc/gen/minmax-avx-mul32-ld32-x8.c",
6924    "src/qu8-vaddc/gen/minmax-avx-mul32-ld32-x16.c",
6925    "src/qu8-vcvt/gen/vcvt-avx-x8.c",
6926    "src/qu8-vcvt/gen/vcvt-avx-x16.c",
6927    "src/qu8-vcvt/gen/vcvt-avx-x32.c",
6928    "src/qu8-vlrelu/gen/vlrelu-avx-x8.c",
6929    "src/qu8-vlrelu/gen/vlrelu-avx-x16.c",
6930    "src/qu8-vlrelu/gen/vlrelu-avx-x32.c",
6931    "src/qu8-vmul/gen/minmax-fp32-avx-mul16-ld64-x8.c",
6932    "src/qu8-vmul/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6933    "src/qu8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x8.c",
6934    "src/qu8-vmulc/gen/minmax-fp32-avx-mul16-ld64-x16.c",
6935    "src/x8-lut/gen/lut-avx-x16.c",
6936    "src/x8-lut/gen/lut-avx-x32.c",
6937    "src/x8-lut/gen/lut-avx-x48.c",
6938    "src/x8-lut/gen/lut-avx-x64.c",
6939]
6940
// F16C microkernel sources in the "PROD" set: f16 pooling, prelu, rmax,
// vbinary, vclamp, vhswish, vlrelu, vrnd, vsqrt and vunary kernels, plus the
// f16<->f32 vcvt kernels. Every path listed here also appears in
// ALL_F16C_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably denotes the subset used by production
// builds -- confirm where this variable is consumed.
// NOTE(review): the list appears to be machine-generated; confirm the
// generator before editing it by hand.
6941PROD_F16C_MICROKERNEL_SRCS = [
6942    "src/f16-avgpool/9p8x-minmax-f16c-c8.c",
6943    "src/f16-avgpool/9x-minmax-f16c-c8.c",
6944    "src/f16-f32-vcvt/gen/vcvt-f16c-x16.c",
6945    "src/f16-gavgpool/gen/7p7x-minmax-f16c-c8.c",
6946    "src/f16-gavgpool/gen/7x-minmax-f16c-c8.c",
6947    "src/f16-maxpool/9p8x-minmax-f16c-c8.c",
6948    "src/f16-prelu/gen/f16c-2x16.c",
6949    "src/f16-rmax/f16c.c",
6950    "src/f16-vbinary/gen/vadd-minmax-f16c-x16.c",
6951    "src/f16-vbinary/gen/vaddc-minmax-f16c-x16.c",
6952    "src/f16-vbinary/gen/vdiv-minmax-f16c-x8.c",
6953    "src/f16-vbinary/gen/vdivc-minmax-f16c-x8.c",
6954    "src/f16-vbinary/gen/vmax-f16c-x16.c",
6955    "src/f16-vbinary/gen/vmaxc-f16c-x16.c",
6956    "src/f16-vbinary/gen/vmin-f16c-x16.c",
6957    "src/f16-vbinary/gen/vminc-f16c-x16.c",
6958    "src/f16-vbinary/gen/vmul-minmax-f16c-x16.c",
6959    "src/f16-vbinary/gen/vmulc-minmax-f16c-x16.c",
6960    "src/f16-vbinary/gen/vrdivc-minmax-f16c-x8.c",
6961    "src/f16-vbinary/gen/vrsubc-minmax-f16c-x16.c",
6962    "src/f16-vbinary/gen/vsqrdiff-f16c-x16.c",
6963    "src/f16-vbinary/gen/vsqrdiffc-f16c-x16.c",
6964    "src/f16-vbinary/gen/vsub-minmax-f16c-x16.c",
6965    "src/f16-vbinary/gen/vsubc-minmax-f16c-x16.c",
6966    "src/f16-vclamp/gen/vclamp-f16c-x16.c",
6967    "src/f16-vhswish/gen/vhswish-f16c-x16.c",
6968    "src/f16-vlrelu/gen/vlrelu-f16c-x16.c",
6969    "src/f16-vrnd/gen/vrndd-f16c-x16.c",
6970    "src/f16-vrnd/gen/vrndne-f16c-x16.c",
6971    "src/f16-vrnd/gen/vrndu-f16c-x16.c",
6972    "src/f16-vrnd/gen/vrndz-f16c-x16.c",
6973    "src/f16-vsqrt/gen/f16c-sqrt-x8.c",
6974    "src/f16-vunary/gen/vsqr-f16c-x16.c",
6975    "src/f32-f16-vcvt/gen/vcvt-f16c-x16.c",
6976]
6977
// Full set of F16C microkernel sources. It contains every entry of
// PROD_F16C_MICROKERNEL_SRCS plus further variants of the same kernels
// (for example the -x8 counterparts of -x16 files and the -c16/-c24/-c32
// gavgpool files), and the two src/math/cvt-*-f16c.c files.
// NOTE(review): the list appears to be machine-generated; confirm the
// generator before editing it by hand.
6978ALL_F16C_MICROKERNEL_SRCS = [
6979    "src/f16-avgpool/9p8x-minmax-f16c-c8.c",
6980    "src/f16-avgpool/9x-minmax-f16c-c8.c",
6981    "src/f16-f32-vcvt/gen/vcvt-f16c-x8.c",
6982    "src/f16-f32-vcvt/gen/vcvt-f16c-x16.c",
6983    "src/f16-gavgpool/gen/7p7x-minmax-f16c-c8.c",
6984    "src/f16-gavgpool/gen/7p7x-minmax-f16c-c16.c",
6985    "src/f16-gavgpool/gen/7p7x-minmax-f16c-c24.c",
6986    "src/f16-gavgpool/gen/7p7x-minmax-f16c-c32.c",
6987    "src/f16-gavgpool/gen/7x-minmax-f16c-c8.c",
6988    "src/f16-gavgpool/gen/7x-minmax-f16c-c16.c",
6989    "src/f16-gavgpool/gen/7x-minmax-f16c-c24.c",
6990    "src/f16-gavgpool/gen/7x-minmax-f16c-c32.c",
6991    "src/f16-maxpool/9p8x-minmax-f16c-c8.c",
6992    "src/f16-prelu/gen/f16c-2x8.c",
6993    "src/f16-prelu/gen/f16c-2x16.c",
6994    "src/f16-rmax/f16c.c",
6995    "src/f16-vbinary/gen/vadd-minmax-f16c-x8.c",
6996    "src/f16-vbinary/gen/vadd-minmax-f16c-x16.c",
6997    "src/f16-vbinary/gen/vaddc-minmax-f16c-x8.c",
6998    "src/f16-vbinary/gen/vaddc-minmax-f16c-x16.c",
6999    "src/f16-vbinary/gen/vdiv-minmax-f16c-x8.c",
7000    "src/f16-vbinary/gen/vdiv-minmax-f16c-x16.c",
7001    "src/f16-vbinary/gen/vdivc-minmax-f16c-x8.c",
7002    "src/f16-vbinary/gen/vdivc-minmax-f16c-x16.c",
7003    "src/f16-vbinary/gen/vmax-f16c-x8.c",
7004    "src/f16-vbinary/gen/vmax-f16c-x16.c",
7005    "src/f16-vbinary/gen/vmaxc-f16c-x8.c",
7006    "src/f16-vbinary/gen/vmaxc-f16c-x16.c",
7007    "src/f16-vbinary/gen/vmin-f16c-x8.c",
7008    "src/f16-vbinary/gen/vmin-f16c-x16.c",
7009    "src/f16-vbinary/gen/vminc-f16c-x8.c",
7010    "src/f16-vbinary/gen/vminc-f16c-x16.c",
7011    "src/f16-vbinary/gen/vmul-minmax-f16c-x8.c",
7012    "src/f16-vbinary/gen/vmul-minmax-f16c-x16.c",
7013    "src/f16-vbinary/gen/vmulc-minmax-f16c-x8.c",
7014    "src/f16-vbinary/gen/vmulc-minmax-f16c-x16.c",
7015    "src/f16-vbinary/gen/vrdivc-minmax-f16c-x8.c",
7016    "src/f16-vbinary/gen/vrdivc-minmax-f16c-x16.c",
7017    "src/f16-vbinary/gen/vrsubc-minmax-f16c-x8.c",
7018    "src/f16-vbinary/gen/vrsubc-minmax-f16c-x16.c",
7019    "src/f16-vbinary/gen/vsqrdiff-f16c-x8.c",
7020    "src/f16-vbinary/gen/vsqrdiff-f16c-x16.c",
7021    "src/f16-vbinary/gen/vsqrdiffc-f16c-x8.c",
7022    "src/f16-vbinary/gen/vsqrdiffc-f16c-x16.c",
7023    "src/f16-vbinary/gen/vsub-minmax-f16c-x8.c",
7024    "src/f16-vbinary/gen/vsub-minmax-f16c-x16.c",
7025    "src/f16-vbinary/gen/vsubc-minmax-f16c-x8.c",
7026    "src/f16-vbinary/gen/vsubc-minmax-f16c-x16.c",
7027    "src/f16-vclamp/gen/vclamp-f16c-x8.c",
7028    "src/f16-vclamp/gen/vclamp-f16c-x16.c",
7029    "src/f16-vhswish/gen/vhswish-f16c-x8.c",
7030    "src/f16-vhswish/gen/vhswish-f16c-x16.c",
7031    "src/f16-vlrelu/gen/vlrelu-f16c-x8.c",
7032    "src/f16-vlrelu/gen/vlrelu-f16c-x16.c",
7033    "src/f16-vrnd/gen/vrndd-f16c-x8.c",
7034    "src/f16-vrnd/gen/vrndd-f16c-x16.c",
7035    "src/f16-vrnd/gen/vrndne-f16c-x8.c",
7036    "src/f16-vrnd/gen/vrndne-f16c-x16.c",
7037    "src/f16-vrnd/gen/vrndu-f16c-x8.c",
7038    "src/f16-vrnd/gen/vrndu-f16c-x16.c",
7039    "src/f16-vrnd/gen/vrndz-f16c-x8.c",
7040    "src/f16-vrnd/gen/vrndz-f16c-x16.c",
7041    "src/f16-vsqrt/gen/f16c-sqrt-x8.c",
7042    "src/f16-vsqrt/gen/f16c-sqrt-x16.c",
7043    "src/f16-vunary/gen/vsqr-f16c-x8.c",
7044    "src/f16-vunary/gen/vsqr-f16c-x16.c",
7045    "src/f32-f16-vcvt/gen/vcvt-f16c-x8.c",
7046    "src/f32-f16-vcvt/gen/vcvt-f16c-x16.c",
7047    "src/math/cvt-f16-f32-f16c.c",
7048    "src/math/cvt-f32-f16-f16c.c",
7049]
7050
// XOP microkernel sources in the "PROD" set: qc8/qs8/qu8 dwconv, gemm and
// igemm kernels, plus qs8/qu8 vadd and vaddc kernels. Every path listed here
// also appears in ALL_XOP_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably denotes the subset used by production
// builds -- confirm where this variable is consumed.
// NOTE(review): the list appears to be machine-generated; confirm the
// generator before editing it by hand.
7051PROD_XOP_MICROKERNEL_SRCS = [
7052    "src/qc8-dwconv/gen/up16x3-minmax-fp32-xop-mul16-add16.c",
7053    "src/qc8-dwconv/gen/up16x9-minmax-fp32-xop-mul16-add16.c",
7054    "src/qc8-dwconv/gen/up16x25-minmax-fp32-xop-mul16-add16.c",
7055    "src/qc8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7056    "src/qc8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7057    "src/qc8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7058    "src/qc8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7059    "src/qs8-dwconv/gen/up16x9-minmax-fp32-xop-mul16-add16.c",
7060    "src/qs8-dwconv/gen/up16x25-minmax-fp32-xop-mul16-add16.c",
7061    "src/qs8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7062    "src/qs8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7063    "src/qs8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7064    "src/qs8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7065    "src/qs8-vadd/gen/minmax-xop-mul32-ld32-x8.c",
7066    "src/qs8-vaddc/gen/minmax-xop-mul32-ld32-x8.c",
7067    "src/qu8-dwconv/gen/up16x9-minmax-fp32-xop-mul32.c",
7068    "src/qu8-dwconv/gen/up16x25-minmax-fp32-xop-mul32.c",
7069    "src/qu8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7070    "src/qu8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7071    "src/qu8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7072    "src/qu8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7073    "src/qu8-vadd/gen/minmax-xop-mul32-ld32-x8.c",
7074    "src/qu8-vaddc/gen/minmax-xop-mul32-ld32-x8.c",
7075]
7076
// Full set of XOP microkernel sources. All entries are qc8, qs8 or qu8
// kernels located under src/<kernel>/gen/ (dwconv, gemm, igemm, vadd, vaddc).
// It contains every entry of PROD_XOP_MICROKERNEL_SRCS plus further tile and
// load-width variants of the same kernel families.
// NOTE(review): the list appears to be machine-generated; confirm the
// generator before editing it by hand.
7077ALL_XOP_MICROKERNEL_SRCS = [
7078    "src/qc8-dwconv/gen/up8x9-minmax-fp32-xop-mul16-add16.c",
7079    "src/qc8-dwconv/gen/up8x9-minmax-fp32-xop-mul32.c",
7080    "src/qc8-dwconv/gen/up8x25-minmax-fp32-xop-mul16-add16.c",
7081    "src/qc8-dwconv/gen/up8x25-minmax-fp32-xop-mul32.c",
7082    "src/qc8-dwconv/gen/up16x3-minmax-fp32-xop-mul16-add16.c",
7083    "src/qc8-dwconv/gen/up16x9-minmax-fp32-xop-mul16-add16.c",
7084    "src/qc8-dwconv/gen/up16x9-minmax-fp32-xop-mul32.c",
7085    "src/qc8-dwconv/gen/up16x25-minmax-fp32-xop-mul16-add16.c",
7086    "src/qc8-dwconv/gen/up16x25-minmax-fp32-xop-mul32.c",
7087    "src/qc8-dwconv/gen/up24x9-minmax-fp32-xop-mul32.c",
7088    "src/qc8-dwconv/gen/up24x25-minmax-fp32-xop-mul32.c",
7089    "src/qc8-gemm/gen/1x4c2-minmax-fp32-xop-ld64.c",
7090    "src/qc8-gemm/gen/1x4c2-minmax-fp32-xop-ld128.c",
7091    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-xop-ld64.c",
7092    "src/qc8-gemm/gen/1x4c2s4-minmax-fp32-xop-ld128.c",
7093    "src/qc8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7094    "src/qc8-gemm/gen/1x4c8-minmax-fp32-xop-ld128.c",
7095    "src/qc8-gemm/gen/2x4c2-minmax-fp32-xop-ld64.c",
7096    "src/qc8-gemm/gen/2x4c2-minmax-fp32-xop-ld128.c",
7097    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-xop-ld64.c",
7098    "src/qc8-gemm/gen/2x4c2s4-minmax-fp32-xop-ld128.c",
7099    "src/qc8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7100    "src/qc8-gemm/gen/2x4c8-minmax-fp32-xop-ld128.c",
7101    "src/qc8-gemm/gen/3x4c2-minmax-fp32-xop-ld64.c",
7102    "src/qc8-gemm/gen/3x4c2-minmax-fp32-xop-ld128.c",
7103    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-xop-ld64.c",
7104    "src/qc8-gemm/gen/3x4c2s4-minmax-fp32-xop-ld128.c",
7105    "src/qc8-gemm/gen/3x4c8-minmax-fp32-xop-ld64.c",
7106    "src/qc8-gemm/gen/3x4c8-minmax-fp32-xop-ld128.c",
7107    "src/qc8-gemm/gen/4x4c2-minmax-fp32-xop-ld64.c",
7108    "src/qc8-gemm/gen/4x4c2-minmax-fp32-xop-ld128.c",
7109    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-xop-ld64.c",
7110    "src/qc8-gemm/gen/4x4c2s4-minmax-fp32-xop-ld128.c",
7111    "src/qc8-igemm/gen/1x4c2-minmax-fp32-xop-ld64.c",
7112    "src/qc8-igemm/gen/1x4c2-minmax-fp32-xop-ld128.c",
7113    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-xop-ld64.c",
7114    "src/qc8-igemm/gen/1x4c2s4-minmax-fp32-xop-ld128.c",
7115    "src/qc8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7116    "src/qc8-igemm/gen/1x4c8-minmax-fp32-xop-ld128.c",
7117    "src/qc8-igemm/gen/2x4c2-minmax-fp32-xop-ld64.c",
7118    "src/qc8-igemm/gen/2x4c2-minmax-fp32-xop-ld128.c",
7119    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-xop-ld64.c",
7120    "src/qc8-igemm/gen/2x4c2s4-minmax-fp32-xop-ld128.c",
7121    "src/qc8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7122    "src/qc8-igemm/gen/2x4c8-minmax-fp32-xop-ld128.c",
7123    "src/qc8-igemm/gen/3x4c2-minmax-fp32-xop-ld64.c",
7124    "src/qc8-igemm/gen/3x4c2-minmax-fp32-xop-ld128.c",
7125    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-xop-ld64.c",
7126    "src/qc8-igemm/gen/3x4c2s4-minmax-fp32-xop-ld128.c",
7127    "src/qc8-igemm/gen/3x4c8-minmax-fp32-xop-ld64.c",
7128    "src/qc8-igemm/gen/3x4c8-minmax-fp32-xop-ld128.c",
7129    "src/qc8-igemm/gen/4x4c2-minmax-fp32-xop-ld64.c",
7130    "src/qc8-igemm/gen/4x4c2-minmax-fp32-xop-ld128.c",
7131    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-xop-ld64.c",
7132    "src/qc8-igemm/gen/4x4c2s4-minmax-fp32-xop-ld128.c",
7133    "src/qs8-dwconv/gen/up8x9-minmax-fp32-xop-mul16-add16.c",
7134    "src/qs8-dwconv/gen/up8x9-minmax-fp32-xop-mul32.c",
7135    "src/qs8-dwconv/gen/up8x25-minmax-fp32-xop-mul16-add16.c",
7136    "src/qs8-dwconv/gen/up8x25-minmax-fp32-xop-mul32.c",
7137    "src/qs8-dwconv/gen/up16x9-minmax-fp32-xop-mul16-add16.c",
7138    "src/qs8-dwconv/gen/up16x9-minmax-fp32-xop-mul32.c",
7139    "src/qs8-dwconv/gen/up16x25-minmax-fp32-xop-mul16-add16.c",
7140    "src/qs8-dwconv/gen/up16x25-minmax-fp32-xop-mul32.c",
7141    "src/qs8-dwconv/gen/up24x9-minmax-fp32-xop-mul32.c",
7142    "src/qs8-dwconv/gen/up24x25-minmax-fp32-xop-mul32.c",
7143    "src/qs8-gemm/gen/1x4c2-minmax-fp32-xop-ld64.c",
7144    "src/qs8-gemm/gen/1x4c2-minmax-fp32-xop-ld128.c",
7145    "src/qs8-gemm/gen/1x4c2-xw-minmax-fp32-xop.c",
7146    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-xop-ld64.c",
7147    "src/qs8-gemm/gen/1x4c2s4-minmax-fp32-xop-ld128.c",
7148    "src/qs8-gemm/gen/1x4c2s4-xw-minmax-fp32-xop.c",
7149    "src/qs8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7150    "src/qs8-gemm/gen/1x4c8-minmax-fp32-xop-ld128.c",
7151    "src/qs8-gemm/gen/1x4c8-xw-minmax-fp32-xop.c",
7152    "src/qs8-gemm/gen/2x4c2-minmax-fp32-xop-ld64.c",
7153    "src/qs8-gemm/gen/2x4c2-minmax-fp32-xop-ld128.c",
7154    "src/qs8-gemm/gen/2x4c2-xw-minmax-fp32-xop.c",
7155    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-xop-ld64.c",
7156    "src/qs8-gemm/gen/2x4c2s4-minmax-fp32-xop-ld128.c",
7157    "src/qs8-gemm/gen/2x4c2s4-xw-minmax-fp32-xop.c",
7158    "src/qs8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7159    "src/qs8-gemm/gen/2x4c8-minmax-fp32-xop-ld128.c",
7160    "src/qs8-gemm/gen/2x4c8-xw-minmax-fp32-xop.c",
7161    "src/qs8-gemm/gen/3x4c2-minmax-fp32-xop-ld64.c",
7162    "src/qs8-gemm/gen/3x4c2-minmax-fp32-xop-ld128.c",
7163    "src/qs8-gemm/gen/3x4c2-xw-minmax-fp32-xop.c",
7164    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-xop-ld64.c",
7165    "src/qs8-gemm/gen/3x4c2s4-minmax-fp32-xop-ld128.c",
7166    "src/qs8-gemm/gen/3x4c2s4-xw-minmax-fp32-xop.c",
7167    "src/qs8-gemm/gen/3x4c8-minmax-fp32-xop-ld64.c",
7168    "src/qs8-gemm/gen/3x4c8-minmax-fp32-xop-ld128.c",
7169    "src/qs8-gemm/gen/3x4c8-xw-minmax-fp32-xop.c",
7170    "src/qs8-gemm/gen/4x4c2-minmax-fp32-xop-ld64.c",
7171    "src/qs8-gemm/gen/4x4c2-minmax-fp32-xop-ld128.c",
7172    "src/qs8-gemm/gen/4x4c2-xw-minmax-fp32-xop.c",
7173    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-xop-ld64.c",
7174    "src/qs8-gemm/gen/4x4c2s4-minmax-fp32-xop-ld128.c",
7175    "src/qs8-gemm/gen/4x4c2s4-xw-minmax-fp32-xop.c",
7176    "src/qs8-igemm/gen/1x4c2-minmax-fp32-xop-ld64.c",
7177    "src/qs8-igemm/gen/1x4c2-minmax-fp32-xop-ld128.c",
7178    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-xop-ld64.c",
7179    "src/qs8-igemm/gen/1x4c2s4-minmax-fp32-xop-ld128.c",
7180    "src/qs8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7181    "src/qs8-igemm/gen/1x4c8-minmax-fp32-xop-ld128.c",
7182    "src/qs8-igemm/gen/2x4c2-minmax-fp32-xop-ld64.c",
7183    "src/qs8-igemm/gen/2x4c2-minmax-fp32-xop-ld128.c",
7184    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-xop-ld64.c",
7185    "src/qs8-igemm/gen/2x4c2s4-minmax-fp32-xop-ld128.c",
7186    "src/qs8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7187    "src/qs8-igemm/gen/2x4c8-minmax-fp32-xop-ld128.c",
7188    "src/qs8-igemm/gen/3x4c2-minmax-fp32-xop-ld64.c",
7189    "src/qs8-igemm/gen/3x4c2-minmax-fp32-xop-ld128.c",
7190    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-xop-ld64.c",
7191    "src/qs8-igemm/gen/3x4c2s4-minmax-fp32-xop-ld128.c",
7192    "src/qs8-igemm/gen/3x4c8-minmax-fp32-xop-ld64.c",
7193    "src/qs8-igemm/gen/3x4c8-minmax-fp32-xop-ld128.c",
7194    "src/qs8-igemm/gen/4x4c2-minmax-fp32-xop-ld64.c",
7195    "src/qs8-igemm/gen/4x4c2-minmax-fp32-xop-ld128.c",
7196    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-xop-ld64.c",
7197    "src/qs8-igemm/gen/4x4c2s4-minmax-fp32-xop-ld128.c",
7198    "src/qs8-vadd/gen/minmax-xop-mul32-ld32-x8.c",
7199    "src/qs8-vadd/gen/minmax-xop-mul32-ld32-x16.c",
7200    "src/qs8-vadd/gen/minmax-xop-mul32-ld32-x24.c",
7201    "src/qs8-vadd/gen/minmax-xop-mul32-ld32-x32.c",
7202    "src/qs8-vaddc/gen/minmax-xop-mul32-ld32-x8.c",
7203    "src/qs8-vaddc/gen/minmax-xop-mul32-ld32-x16.c",
7204    "src/qs8-vaddc/gen/minmax-xop-mul32-ld32-x24.c",
7205    "src/qs8-vaddc/gen/minmax-xop-mul32-ld32-x32.c",
7206    "src/qu8-dwconv/gen/up8x9-minmax-fp32-xop-mul32.c",
7207    "src/qu8-dwconv/gen/up8x25-minmax-fp32-xop-mul32.c",
7208    "src/qu8-dwconv/gen/up16x9-minmax-fp32-xop-mul32.c",
7209    "src/qu8-dwconv/gen/up16x25-minmax-fp32-xop-mul32.c",
7210    "src/qu8-gemm/gen/1x4c2-minmax-fp32-xop-ld64.c",
7211    "src/qu8-gemm/gen/1x4c2-minmax-fp32-xop-ld128.c",
7212    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-xop-ld64.c",
7213    "src/qu8-gemm/gen/1x4c2s4-minmax-fp32-xop-ld128.c",
7214    "src/qu8-gemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7215    "src/qu8-gemm/gen/1x4c8-minmax-fp32-xop-ld128.c",
7216    "src/qu8-gemm/gen/2x4c2-minmax-fp32-xop-ld64.c",
7217    "src/qu8-gemm/gen/2x4c2-minmax-fp32-xop-ld128.c",
7218    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-xop-ld64.c",
7219    "src/qu8-gemm/gen/2x4c2s4-minmax-fp32-xop-ld128.c",
7220    "src/qu8-gemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7221    "src/qu8-gemm/gen/2x4c8-minmax-fp32-xop-ld128.c",
7222    "src/qu8-gemm/gen/3x4c2-minmax-fp32-xop-ld64.c",
7223    "src/qu8-gemm/gen/3x4c2-minmax-fp32-xop-ld128.c",
7224    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-xop-ld64.c",
7225    "src/qu8-gemm/gen/3x4c2s4-minmax-fp32-xop-ld128.c",
7226    "src/qu8-gemm/gen/3x4c8-minmax-fp32-xop-ld64.c",
7227    "src/qu8-gemm/gen/3x4c8-minmax-fp32-xop-ld128.c",
7228    "src/qu8-gemm/gen/4x4c2-minmax-fp32-xop-ld64.c",
7229    "src/qu8-gemm/gen/4x4c2-minmax-fp32-xop-ld128.c",
7230    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-xop-ld64.c",
7231    "src/qu8-gemm/gen/4x4c2s4-minmax-fp32-xop-ld128.c",
7232    "src/qu8-igemm/gen/1x4c2-minmax-fp32-xop-ld64.c",
7233    "src/qu8-igemm/gen/1x4c2-minmax-fp32-xop-ld128.c",
7234    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-xop-ld64.c",
7235    "src/qu8-igemm/gen/1x4c2s4-minmax-fp32-xop-ld128.c",
7236    "src/qu8-igemm/gen/1x4c8-minmax-fp32-xop-ld64.c",
7237    "src/qu8-igemm/gen/1x4c8-minmax-fp32-xop-ld128.c",
7238    "src/qu8-igemm/gen/2x4c2-minmax-fp32-xop-ld64.c",
7239    "src/qu8-igemm/gen/2x4c2-minmax-fp32-xop-ld128.c",
7240    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-xop-ld64.c",
7241    "src/qu8-igemm/gen/2x4c2s4-minmax-fp32-xop-ld128.c",
7242    "src/qu8-igemm/gen/2x4c8-minmax-fp32-xop-ld64.c",
7243    "src/qu8-igemm/gen/2x4c8-minmax-fp32-xop-ld128.c",
7244    "src/qu8-igemm/gen/3x4c2-minmax-fp32-xop-ld64.c",
7245    "src/qu8-igemm/gen/3x4c2-minmax-fp32-xop-ld128.c",
7246    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-xop-ld64.c",
7247    "src/qu8-igemm/gen/3x4c2s4-minmax-fp32-xop-ld128.c",
7248    "src/qu8-igemm/gen/3x4c8-minmax-fp32-xop-ld64.c",
7249    "src/qu8-igemm/gen/3x4c8-minmax-fp32-xop-ld128.c",
7250    "src/qu8-igemm/gen/4x4c2-minmax-fp32-xop-ld64.c",
7251    "src/qu8-igemm/gen/4x4c2-minmax-fp32-xop-ld128.c",
7252    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-xop-ld64.c",
7253    "src/qu8-igemm/gen/4x4c2s4-minmax-fp32-xop-ld128.c",
7254    "src/qu8-vadd/gen/minmax-xop-mul32-ld32-x8.c",
7255    "src/qu8-vadd/gen/minmax-xop-mul32-ld32-x16.c",
7256    "src/qu8-vaddc/gen/minmax-xop-mul32-ld32-x8.c",
7257    "src/qu8-vaddc/gen/minmax-xop-mul32-ld32-x16.c",
7258]
7259
// FMA3 microkernel sources in the "PROD" set: f16 dwconv, ibilinear and
// vmulcaddc kernels, plus f32 dwconv, gemm, igemm and vhswish kernels. Every
// path listed here also appears in ALL_FMA3_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably denotes the subset used by production
// builds -- confirm where this variable is consumed.
// NOTE(review): the list appears to be machine-generated; confirm the
// generator before editing it by hand.
7260PROD_FMA3_MICROKERNEL_SRCS = [
7261    "src/f16-dwconv/gen/up8x25-minmax-fma3-acc2.c",
7262    "src/f16-dwconv/gen/up16x3-minmax-fma3.c",
7263    "src/f16-dwconv/gen/up16x4-minmax-fma3.c",
7264    "src/f16-dwconv/gen/up16x9-minmax-fma3.c",
7265    "src/f16-ibilinear/gen/fma3-c8.c",
7266    "src/f16-vmulcaddc/gen/c8-minmax-fma3-2x.c",
7267    "src/f32-dwconv/gen/up8x25-minmax-fma3.c",
7268    "src/f32-dwconv/gen/up16x3-minmax-fma3.c",
7269    "src/f32-dwconv/gen/up16x4-minmax-fma3.c",
7270    "src/f32-dwconv/gen/up16x9-minmax-fma3.c",
7271    "src/f32-gemm/gen/1x16-minmax-fma3-broadcast.c",
7272    "src/f32-gemm/gen/1x16s4-minmax-fma3-broadcast.c",
7273    "src/f32-gemm/gen/4x16s4-minmax-fma3-broadcast.c",
7274    "src/f32-gemm/gen/5x16-minmax-fma3-broadcast.c",
7275    "src/f32-igemm/gen/1x16-minmax-fma3-broadcast.c",
7276    "src/f32-igemm/gen/1x16s4-minmax-fma3-broadcast.c",
7277    "src/f32-igemm/gen/4x16s4-minmax-fma3-broadcast.c",
7278    "src/f32-igemm/gen/5x16-minmax-fma3-broadcast.c",
7279    "src/f32-vhswish/gen/vhswish-fma3-x16.c",
7280]
7281
// Full set of FMA3 microkernel sources. It contains every entry of
// PROD_FMA3_MICROKERNEL_SRCS plus further variants of the same kernel
// families, the f32-gemm/gen-inc/ kernels, the f32-vsqrt kernels and the
// src/math/sqrt-fma3-*.c files.
// NOTE(review): the list appears to be machine-generated; confirm the
// generator before editing it by hand.
7282ALL_FMA3_MICROKERNEL_SRCS = [
7283    "src/f16-dwconv/gen/up8x3-minmax-fma3-acc2.c",
7284    "src/f16-dwconv/gen/up8x3-minmax-fma3.c",
7285    "src/f16-dwconv/gen/up8x4-minmax-fma3-acc2.c",
7286    "src/f16-dwconv/gen/up8x4-minmax-fma3.c",
7287    "src/f16-dwconv/gen/up8x9-minmax-fma3-acc2.c",
7288    "src/f16-dwconv/gen/up8x9-minmax-fma3.c",
7289    "src/f16-dwconv/gen/up8x25-minmax-fma3-acc2.c",
7290    "src/f16-dwconv/gen/up8x25-minmax-fma3.c",
7291    "src/f16-dwconv/gen/up16x3-minmax-fma3-acc2.c",
7292    "src/f16-dwconv/gen/up16x3-minmax-fma3.c",
7293    "src/f16-dwconv/gen/up16x4-minmax-fma3-acc2.c",
7294    "src/f16-dwconv/gen/up16x4-minmax-fma3.c",
7295    "src/f16-dwconv/gen/up16x9-minmax-fma3-acc2.c",
7296    "src/f16-dwconv/gen/up16x9-minmax-fma3.c",
7297    "src/f16-dwconv/gen/up16x25-minmax-fma3-acc2.c",
7298    "src/f16-dwconv/gen/up16x25-minmax-fma3.c",
7299    "src/f16-dwconv/gen/up32x3-minmax-fma3-acc2.c",
7300    "src/f16-dwconv/gen/up32x3-minmax-fma3.c",
7301    "src/f16-dwconv/gen/up32x4-minmax-fma3-acc2.c",
7302    "src/f16-dwconv/gen/up32x4-minmax-fma3.c",
7303    "src/f16-dwconv/gen/up32x9-minmax-fma3-acc2.c",
7304    "src/f16-dwconv/gen/up32x9-minmax-fma3.c",
7305    "src/f16-dwconv/gen/up32x25-minmax-fma3-acc2.c",
7306    "src/f16-dwconv/gen/up32x25-minmax-fma3.c",
7307    "src/f16-ibilinear/gen/fma3-c8.c",
7308    "src/f16-ibilinear/gen/fma3-c16.c",
7309    "src/f16-vmulcaddc/gen/c8-minmax-fma3-2x.c",
7310    "src/f16-vmulcaddc/gen/c16-minmax-fma3-2x.c",
7311    "src/f32-dwconv/gen/up8x3-minmax-fma3-acc2.c",
7312    "src/f32-dwconv/gen/up8x3-minmax-fma3.c",
7313    "src/f32-dwconv/gen/up8x4-minmax-fma3-acc2.c",
7314    "src/f32-dwconv/gen/up8x4-minmax-fma3.c",
7315    "src/f32-dwconv/gen/up8x9-minmax-fma3-acc2.c",
7316    "src/f32-dwconv/gen/up8x9-minmax-fma3.c",
7317    "src/f32-dwconv/gen/up8x25-minmax-fma3-acc2.c",
7318    "src/f32-dwconv/gen/up8x25-minmax-fma3.c",
7319    "src/f32-dwconv/gen/up16x3-minmax-fma3-acc2.c",
7320    "src/f32-dwconv/gen/up16x3-minmax-fma3.c",
7321    "src/f32-dwconv/gen/up16x4-minmax-fma3-acc2.c",
7322    "src/f32-dwconv/gen/up16x4-minmax-fma3.c",
7323    "src/f32-dwconv/gen/up16x9-minmax-fma3-acc2.c",
7324    "src/f32-dwconv/gen/up16x9-minmax-fma3.c",
7325    "src/f32-dwconv/gen/up16x25-minmax-fma3-acc2.c",
7326    "src/f32-dwconv/gen/up16x25-minmax-fma3.c",
7327    "src/f32-gemm/gen-inc/1x8inc-minmax-fma3-broadcast.c",
7328    "src/f32-gemm/gen-inc/1x16inc-minmax-fma3-broadcast.c",
7329    "src/f32-gemm/gen-inc/1x16s4inc-minmax-fma3-broadcast.c",
7330    "src/f32-gemm/gen-inc/3x16inc-minmax-fma3-broadcast.c",
7331    "src/f32-gemm/gen-inc/3x16s4inc-minmax-fma3-broadcast.c",
7332    "src/f32-gemm/gen-inc/4x8inc-minmax-fma3-broadcast.c",
7333    "src/f32-gemm/gen-inc/4x16inc-minmax-fma3-broadcast.c",
7334    "src/f32-gemm/gen-inc/4x16s4inc-minmax-fma3-broadcast.c",
7335    "src/f32-gemm/gen-inc/5x8inc-minmax-fma3-broadcast.c",
7336    "src/f32-gemm/gen-inc/5x16inc-minmax-fma3-broadcast.c",
7337    "src/f32-gemm/gen-inc/5x16s4inc-minmax-fma3-broadcast.c",
7338    "src/f32-gemm/gen-inc/6x8inc-minmax-fma3-broadcast.c",
7339    "src/f32-gemm/gen-inc/7x8inc-minmax-fma3-broadcast.c",
7340    "src/f32-gemm/gen-inc/8x8inc-minmax-fma3-broadcast.c",
7341    "src/f32-gemm/gen/1x8-minmax-fma3-broadcast.c",
7342    "src/f32-gemm/gen/1x16-minmax-fma3-broadcast.c",
7343    "src/f32-gemm/gen/1x16s4-minmax-fma3-broadcast.c",
7344    "src/f32-gemm/gen/3x16-minmax-fma3-broadcast.c",
7345    "src/f32-gemm/gen/3x16s4-minmax-fma3-broadcast.c",
7346    "src/f32-gemm/gen/4x8-minmax-fma3-broadcast.c",
7347    "src/f32-gemm/gen/4x16-minmax-fma3-broadcast.c",
7348    "src/f32-gemm/gen/4x16s4-minmax-fma3-broadcast.c",
7349    "src/f32-gemm/gen/5x8-minmax-fma3-broadcast.c",
7350    "src/f32-gemm/gen/5x16-minmax-fma3-broadcast.c",
7351    "src/f32-gemm/gen/5x16s4-minmax-fma3-broadcast.c",
7352    "src/f32-gemm/gen/6x8-minmax-fma3-broadcast.c",
7353    "src/f32-gemm/gen/7x8-minmax-fma3-broadcast.c",
7354    "src/f32-gemm/gen/8x8-minmax-fma3-broadcast.c",
7355    "src/f32-igemm/gen/1x8-minmax-fma3-broadcast.c",
7356    "src/f32-igemm/gen/1x16-minmax-fma3-broadcast.c",
7357    "src/f32-igemm/gen/1x16s4-minmax-fma3-broadcast.c",
7358    "src/f32-igemm/gen/3x16-minmax-fma3-broadcast.c",
7359    "src/f32-igemm/gen/3x16s4-minmax-fma3-broadcast.c",
7360    "src/f32-igemm/gen/4x8-minmax-fma3-broadcast.c",
7361    "src/f32-igemm/gen/4x16-minmax-fma3-broadcast.c",
7362    "src/f32-igemm/gen/4x16s4-minmax-fma3-broadcast.c",
7363    "src/f32-igemm/gen/5x8-minmax-fma3-broadcast.c",
7364    "src/f32-igemm/gen/5x16-minmax-fma3-broadcast.c",
7365    "src/f32-igemm/gen/5x16s4-minmax-fma3-broadcast.c",
7366    "src/f32-igemm/gen/6x8-minmax-fma3-broadcast.c",
7367    "src/f32-igemm/gen/7x8-minmax-fma3-broadcast.c",
7368    "src/f32-igemm/gen/8x8-minmax-fma3-broadcast.c",
7369    "src/f32-vhswish/gen/vhswish-fma3-x8.c",
7370    "src/f32-vhswish/gen/vhswish-fma3-x16.c",
7371    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x8.c",
7372    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x16.c",
7373    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x24.c",
7374    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x32.c",
7375    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x40.c",
7376    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x48.c",
7377    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x56.c",
7378    "src/f32-vsqrt/gen/fma3-nr1fma1adj-x64.c",
7379    "src/math/sqrt-fma3-nr1fma.c",
7380    "src/math/sqrt-fma3-nr1fma1adj.c",
7381    "src/math/sqrt-fma3-nr2fma.c",
7382]
7383
// AVX2 microkernel C sources (every path contains "avx2"), grouped by source
// directory. Each entry in this list also appears in ALL_AVX2_MICROKERNEL_SRCS.
// NOTE(review): "PROD" presumably marks the subset of kernels selected for
// production builds; the modules consuming this variable are not visible in
// this part of the file -- confirm before adding or removing entries.
7384PROD_AVX2_MICROKERNEL_SRCS = [
7385    "src/f16-gemm/gen/1x16-minmax-avx2-broadcast.c",
7386    "src/f16-gemm/gen/4x16-minmax-avx2-broadcast.c",
7387    "src/f16-igemm/gen/1x16-minmax-avx2-broadcast.c",
7388    "src/f16-igemm/gen/4x16-minmax-avx2-broadcast.c",
7389    "src/f16-pavgpool/9p8x-minmax-avx2-c8.c",
7390    "src/f16-pavgpool/9x-minmax-avx2-c8.c",
7391    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x40.c",
7392    "src/f16-velu/gen/velu-avx2-rr1-p3-x16.c",
7393    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x32.c",
7394    "src/f32-qs8-vcvt/gen/vcvt-avx2-x64.c",
7395    "src/f32-qu8-vcvt/gen/vcvt-avx2-x64.c",
7396    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x56.c",
7397    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x40.c",
7398    "src/qc8-dwconv/gen/up16x3-minmax-fp32-avx2-mul32.c",
7399    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c",
7400    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c",
7401    "src/qc8-gemm/gen/1x8c8-minmax-fp32-avx2.c",
7402    "src/qc8-gemm/gen/3x8c8-minmax-fp32-avx2.c",
7403    "src/qc8-igemm/gen/1x8c8-minmax-fp32-avx2.c",
7404    "src/qc8-igemm/gen/3x8c8-minmax-fp32-avx2.c",
7405    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c",
7406    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c",
7407    "src/qs8-f32-vcvt/gen/vcvt-avx2-x16.c",
7408    "src/qs8-gemm/gen/1x8c8-minmax-fp32-avx2.c",
7409    "src/qs8-gemm/gen/3x8c8-minmax-fp32-avx2.c",
7410    "src/qs8-igemm/gen/1x8c8-minmax-fp32-avx2.c",
7411    "src/qs8-igemm/gen/3x8c8-minmax-fp32-avx2.c",
7412    "src/qs8-vadd/gen/minmax-avx2-mul32-ld64-x16.c",
7413    "src/qs8-vaddc/gen/minmax-avx2-mul32-ld64-x16.c",
7414    "src/qs8-vcvt/gen/vcvt-avx2-x32.c",
7415    "src/qs8-vlrelu/gen/vlrelu-avx2-x32.c",
7416    "src/qu8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c",
7417    "src/qu8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c",
7418    "src/qu8-f32-vcvt/gen/vcvt-avx2-x16.c",
7419    "src/qu8-gemm/gen/1x8c8-minmax-fp32-avx2.c",
7420    "src/qu8-gemm/gen/3x8c8-minmax-fp32-avx2.c",
7421    "src/qu8-igemm/gen/1x8c8-minmax-fp32-avx2.c",
7422    "src/qu8-igemm/gen/3x8c8-minmax-fp32-avx2.c",
7423    "src/qu8-vadd/gen/minmax-avx2-mul32-ld64-x16.c",
7424    "src/qu8-vaddc/gen/minmax-avx2-mul32-ld64-x16.c",
7425    "src/qu8-vcvt/gen/vcvt-avx2-x32.c",
7426    "src/qu8-vlrelu/gen/vlrelu-avx2-x32.c",
7427    "src/x8-lut/gen/lut-avx2-x128.c",
7428]
7429
// Full list of AVX2 microkernel C sources (every path contains "avx2"),
// grouped by source directory: f16-*, f32-*, math, qc8-*, qs8-*, qu8-*, x8-lut.
// Contains every entry of PROD_AVX2_MICROKERNEL_SRCS plus further files,
// including the src/math/ sources that the PROD list does not reference.
// NOTE(review): the list looks machine-generated; presumably it should be
// regenerated rather than hand-edited -- confirm with the import tooling.
7430ALL_AVX2_MICROKERNEL_SRCS = [
7431    "src/f16-gemm/gen/1x8-minmax-avx2-broadcast.c",
7432    "src/f16-gemm/gen/1x16-minmax-avx2-broadcast.c",
7433    "src/f16-gemm/gen/3x16-minmax-avx2-broadcast.c",
7434    "src/f16-gemm/gen/4x8-minmax-avx2-broadcast.c",
7435    "src/f16-gemm/gen/4x16-minmax-avx2-broadcast.c",
7436    "src/f16-gemm/gen/5x8-minmax-avx2-broadcast.c",
7437    "src/f16-gemm/gen/5x16-minmax-avx2-broadcast.c",
7438    "src/f16-gemm/gen/6x8-minmax-avx2-broadcast.c",
7439    "src/f16-gemm/gen/7x8-minmax-avx2-broadcast.c",
7440    "src/f16-igemm/gen/1x8-minmax-avx2-broadcast.c",
7441    "src/f16-igemm/gen/1x16-minmax-avx2-broadcast.c",
7442    "src/f16-igemm/gen/3x16-minmax-avx2-broadcast.c",
7443    "src/f16-igemm/gen/4x8-minmax-avx2-broadcast.c",
7444    "src/f16-igemm/gen/4x16-minmax-avx2-broadcast.c",
7445    "src/f16-igemm/gen/5x8-minmax-avx2-broadcast.c",
7446    "src/f16-igemm/gen/5x16-minmax-avx2-broadcast.c",
7447    "src/f16-igemm/gen/6x8-minmax-avx2-broadcast.c",
7448    "src/f16-igemm/gen/7x8-minmax-avx2-broadcast.c",
7449    "src/f16-pavgpool/9p8x-minmax-avx2-c8.c",
7450    "src/f16-pavgpool/9x-minmax-avx2-c8.c",
7451    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x32-acc2.c",
7452    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x32-acc4.c",
7453    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x32.c",
7454    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x40-acc2.c",
7455    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x40-acc5.c",
7456    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x40.c",
7457    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x48-acc2.c",
7458    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x48-acc3.c",
7459    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x48.c",
7460    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x64-acc2.c",
7461    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x64-acc4.c",
7462    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x64.c",
7463    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x72-acc3.c",
7464    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x72.c",
7465    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x80-acc2.c",
7466    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x80-acc5.c",
7467    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x80.c",
7468    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x96-acc2.c",
7469    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x96-acc3.c",
7470    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x96-acc6.c",
7471    "src/f16-raddstoreexpminusmax/gen/avx2-rr1-p2-x96.c",
7472    "src/f16-velu/gen/velu-avx2-rr1-p3-x8.c",
7473    "src/f16-velu/gen/velu-avx2-rr1-p3-x16.c",
7474    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x8.c",
7475    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x16.c",
7476    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x24.c",
7477    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x32.c",
7478    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x40.c",
7479    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x48.c",
7480    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x56.c",
7481    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-div-x64.c",
7482    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x8.c",
7483    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x16.c",
7484    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x24.c",
7485    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x32.c",
7486    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x40.c",
7487    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x48.c",
7488    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x56.c",
7489    "src/f16-vsigmoid/gen/vsigmoid-avx2-rr1-p2-rcp-x64.c",
7490    "src/f32-qs8-vcvt/gen/vcvt-avx2-x16.c",
7491    "src/f32-qs8-vcvt/gen/vcvt-avx2-x32.c",
7492    "src/f32-qs8-vcvt/gen/vcvt-avx2-x48.c",
7493    "src/f32-qs8-vcvt/gen/vcvt-avx2-x64.c",
7494    "src/f32-qu8-vcvt/gen/vcvt-avx2-x16.c",
7495    "src/f32-qu8-vcvt/gen/vcvt-avx2-x32.c",
7496    "src/f32-qu8-vcvt/gen/vcvt-avx2-x48.c",
7497    "src/f32-qu8-vcvt/gen/vcvt-avx2-x64.c",
7498    "src/f32-raddexpminusmax/gen/avx2-p5-x64-acc2.c",
7499    "src/f32-raddexpminusmax/gen/avx2-p5-x64-acc4.c",
7500    "src/f32-raddexpminusmax/gen/avx2-p5-x64.c",
7501    "src/f32-raddexpminusmax/gen/avx2-p5-x72-acc3.c",
7502    "src/f32-raddexpminusmax/gen/avx2-p5-x72.c",
7503    "src/f32-raddexpminusmax/gen/avx2-p5-x80-acc2.c",
7504    "src/f32-raddexpminusmax/gen/avx2-p5-x80-acc5.c",
7505    "src/f32-raddexpminusmax/gen/avx2-p5-x80.c",
7506    "src/f32-raddexpminusmax/gen/avx2-p5-x96-acc2.c",
7507    "src/f32-raddexpminusmax/gen/avx2-p5-x96-acc3.c",
7508    "src/f32-raddexpminusmax/gen/avx2-p5-x96-acc6.c",
7509    "src/f32-raddexpminusmax/gen/avx2-p5-x96.c",
7510    "src/f32-raddextexp/gen/avx2-p5-x64-acc2.c",
7511    "src/f32-raddextexp/gen/avx2-p5-x64-acc4.c",
7512    "src/f32-raddextexp/gen/avx2-p5-x64.c",
7513    "src/f32-raddextexp/gen/avx2-p5-x72-acc3.c",
7514    "src/f32-raddextexp/gen/avx2-p5-x72.c",
7515    "src/f32-raddextexp/gen/avx2-p5-x80-acc2.c",
7516    "src/f32-raddextexp/gen/avx2-p5-x80-acc5.c",
7517    "src/f32-raddextexp/gen/avx2-p5-x80.c",
7518    "src/f32-raddextexp/gen/avx2-p5-x96-acc2.c",
7519    "src/f32-raddextexp/gen/avx2-p5-x96-acc3.c",
7520    "src/f32-raddextexp/gen/avx2-p5-x96-acc6.c",
7521    "src/f32-raddextexp/gen/avx2-p5-x96.c",
7522    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x64-acc2.c",
7523    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x64-acc4.c",
7524    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x64.c",
7525    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x72-acc3.c",
7526    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x72.c",
7527    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x80-acc2.c",
7528    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x80-acc5.c",
7529    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x80.c",
7530    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x96-acc2.c",
7531    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x96-acc3.c",
7532    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x96-acc6.c",
7533    "src/f32-raddstoreexpminusmax/gen/avx2-rr1-p5-x96.c",
7534    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x8.c",
7535    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x16.c",
7536    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x24.c",
7537    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x32.c",
7538    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x40.c",
7539    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x48.c",
7540    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x56.c",
7541    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x64.c",
7542    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x72.c",
7543    "src/f32-velu/gen/velu-avx2-rr1-lut4-p4-perm-x80.c",
7544    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x8.c",
7545    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x16.c",
7546    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x24.c",
7547    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x32.c",
7548    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x40.c",
7549    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x48.c",
7550    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x56.c",
7551    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x64.c",
7552    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x72.c",
7553    "src/f32-velu/gen/velu-avx2-rr1-lut8-p4-perm-x80.c",
7554    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x8.c",
7555    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x16.c",
7556    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x24.c",
7557    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x32.c",
7558    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x40.c",
7559    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x48.c",
7560    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x56.c",
7561    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x64.c",
7562    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x72.c",
7563    "src/f32-velu/gen/velu-avx2-rr1-lut16-p3-gather-x80.c",
7564    "src/f32-velu/gen/velu-avx2-rr1-p6-x8.c",
7565    "src/f32-velu/gen/velu-avx2-rr1-p6-x16.c",
7566    "src/f32-velu/gen/velu-avx2-rr1-p6-x24.c",
7567    "src/f32-velu/gen/velu-avx2-rr1-p6-x32.c",
7568    "src/f32-velu/gen/velu-avx2-rr1-p6-x40.c",
7569    "src/f32-velu/gen/velu-avx2-rr1-p6-x48.c",
7570    "src/f32-velu/gen/velu-avx2-rr1-p6-x56.c",
7571    "src/f32-velu/gen/velu-avx2-rr1-p6-x64.c",
7572    "src/f32-velu/gen/velu-avx2-rr1-p6-x72.c",
7573    "src/f32-velu/gen/velu-avx2-rr1-p6-x80.c",
7574    "src/f32-vscaleexpminusmax/gen/avx2-p5-x8.c",
7575    "src/f32-vscaleexpminusmax/gen/avx2-p5-x16.c",
7576    "src/f32-vscaleexpminusmax/gen/avx2-p5-x24.c",
7577    "src/f32-vscaleexpminusmax/gen/avx2-p5-x32.c",
7578    "src/f32-vscaleexpminusmax/gen/avx2-p5-x40.c",
7579    "src/f32-vscaleexpminusmax/gen/avx2-p5-x48.c",
7580    "src/f32-vscaleexpminusmax/gen/avx2-p5-x56.c",
7581    "src/f32-vscaleexpminusmax/gen/avx2-p5-x64.c",
7582    "src/f32-vscaleexpminusmax/gen/avx2-p5-x72.c",
7583    "src/f32-vscaleexpminusmax/gen/avx2-p5-x80.c",
7584    "src/f32-vscaleexpminusmax/gen/avx2-p5-x88.c",
7585    "src/f32-vscaleexpminusmax/gen/avx2-p5-x96.c",
7586    "src/f32-vscaleextexp/gen/avx2-p5-x8.c",
7587    "src/f32-vscaleextexp/gen/avx2-p5-x16.c",
7588    "src/f32-vscaleextexp/gen/avx2-p5-x24.c",
7589    "src/f32-vscaleextexp/gen/avx2-p5-x32.c",
7590    "src/f32-vscaleextexp/gen/avx2-p5-x40.c",
7591    "src/f32-vscaleextexp/gen/avx2-p5-x48.c",
7592    "src/f32-vscaleextexp/gen/avx2-p5-x56.c",
7593    "src/f32-vscaleextexp/gen/avx2-p5-x64.c",
7594    "src/f32-vscaleextexp/gen/avx2-p5-x72.c",
7595    "src/f32-vscaleextexp/gen/avx2-p5-x80.c",
7596    "src/f32-vscaleextexp/gen/avx2-p5-x88.c",
7597    "src/f32-vscaleextexp/gen/avx2-p5-x96.c",
7598    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x8.c",
7599    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x16.c",
7600    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x24.c",
7601    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x32.c",
7602    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x40.c",
7603    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x48.c",
7604    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x56.c",
7605    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x64.c",
7606    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x72.c",
7607    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-div-x80.c",
7608    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x8.c",
7609    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x16.c",
7610    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x24.c",
7611    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x32.c",
7612    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x40.c",
7613    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x48.c",
7614    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x56.c",
7615    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x64.c",
7616    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x72.c",
7617    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr1fma-x80.c",
7618    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x8.c",
7619    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x16.c",
7620    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x24.c",
7621    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x32.c",
7622    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x40.c",
7623    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x48.c",
7624    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x56.c",
7625    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x64.c",
7626    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x72.c",
7627    "src/f32-vsigmoid/gen/vsigmoid-avx2-rr1-p5-nr2fma-x80.c",
7628    "src/math/exp-f32-avx2-rr2-lut8-p3-perm.c",
7629    "src/math/exp-f32-avx2-rr2-lut8-p4-perm.c",
7630    "src/math/exp-f32-avx2-rr2-p5.c",
7631    "src/math/expminus-f16-avx2-rr1-p2.c",
7632    "src/math/expminus-f16-avx2-rr1-p3.c",
7633    "src/math/expminus-f32-avx2-rr1-p5.c",
7634    "src/math/expminus-f32-avx2-rr2-p5.c",
7635    "src/math/expm1minus-f16-avx2-rr1-p3.c",
7636    "src/math/expm1minus-f32-avx2-rr1-lut4-p4-perm.c",
7637    "src/math/expm1minus-f32-avx2-rr1-lut8-p4-perm.c",
7638    "src/math/expm1minus-f32-avx2-rr1-lut16-p3-gather.c",
7639    "src/math/expm1minus-f32-avx2-rr1-p6.c",
7640    "src/math/extexp-avx2-p5.c",
7641    "src/math/sigmoid-f16-avx2-rr1-p2-div.c",
7642    "src/math/sigmoid-f16-avx2-rr1-p2-rcp.c",
7643    "src/math/sigmoid-f16-avx2-rr1-p3-div.c",
7644    "src/math/sigmoid-f16-avx2-rr1-p3-rcp.c",
7645    "src/math/sigmoid-f32-avx2-rr1-lut64-p2-gather-div.c",
7646    "src/math/sigmoid-f32-avx2-rr1-lut64-p2-gather-nr1fma.c",
7647    "src/math/sigmoid-f32-avx2-rr1-lut64-p2-gather-nr2fma.c",
7648    "src/math/sigmoid-f32-avx2-rr1-lut64-p2-gather-nr2fma1adj.c",
7649    "src/math/sigmoid-f32-avx2-rr1-p5-div.c",
7650    "src/math/sigmoid-f32-avx2-rr1-p5-nr1fma.c",
7651    "src/math/sigmoid-f32-avx2-rr1-p5-nr2fma.c",
7652    "src/math/sigmoid-f32-avx2-rr2-lut64-p2-gather-div.c",
7653    "src/math/sigmoid-f32-avx2-rr2-lut64-p2-gather-nr1fma.c",
7654    "src/math/sigmoid-f32-avx2-rr2-lut64-p2-gather-nr2fma.c",
7655    "src/math/sigmoid-f32-avx2-rr2-lut64-p2-gather-nr2fma1adj.c",
7656    "src/math/sigmoid-f32-avx2-rr2-p5-div.c",
7657    "src/math/sigmoid-f32-avx2-rr2-p5-nr1fma.c",
7658    "src/math/sigmoid-f32-avx2-rr2-p5-nr2fma.c",
7659    "src/qc8-dwconv/gen/up8x9-minmax-fp32-avx2-mul32.c",
7660    "src/qc8-dwconv/gen/up8x25-minmax-fp32-avx2-mul32.c",
7661    "src/qc8-dwconv/gen/up16x3-minmax-fp32-avx2-mul32.c",
7662    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7663    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx2-mul16-vpmovsx.c",
7664    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx2-mul16-vpunpck.c",
7665    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c",
7666    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7667    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx2-mul16-vpmovsx.c",
7668    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx2-mul16-vpunpck.c",
7669    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c",
7670    "src/qc8-dwconv/gen/up24x9-minmax-fp32-avx2-mul32.c",
7671    "src/qc8-dwconv/gen/up24x25-minmax-fp32-avx2-mul32.c",
7672    "src/qc8-dwconv/gen/up32x9-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7673    "src/qc8-dwconv/gen/up32x9-minmax-fp32-avx2-mul16-vpmovsx.c",
7674    "src/qc8-dwconv/gen/up32x9-minmax-fp32-avx2-mul16-vpunpck.c",
7675    "src/qc8-dwconv/gen/up32x9-minmax-fp32-avx2-mul32.c",
7676    "src/qc8-dwconv/gen/up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7677    "src/qc8-dwconv/gen/up32x25-minmax-fp32-avx2-mul16-vpmovsx.c",
7678    "src/qc8-dwconv/gen/up32x25-minmax-fp32-avx2-mul16-vpunpck.c",
7679    "src/qc8-dwconv/gen/up32x25-minmax-fp32-avx2-mul32.c",
7680    "src/qc8-gemm/gen/1x8c8-minmax-fp32-avx2.c",
7681    "src/qc8-gemm/gen/1x8c8-xw-minmax-fp32-avx2.c",
7682    "src/qc8-gemm/gen/2x8c8-minmax-fp32-avx2.c",
7683    "src/qc8-gemm/gen/2x8c8-xw-minmax-fp32-avx2.c",
7684    "src/qc8-gemm/gen/3x8c8-minmax-fp32-avx2.c",
7685    "src/qc8-gemm/gen/3x8c8-xw-minmax-fp32-avx2.c",
7686    "src/qc8-igemm/gen/1x8c8-minmax-fp32-avx2.c",
7687    "src/qc8-igemm/gen/2x8c8-minmax-fp32-avx2.c",
7688    "src/qc8-igemm/gen/3x8c8-minmax-fp32-avx2.c",
7689    "src/qs8-dwconv/gen/up8x9-minmax-fp32-avx2-mul32.c",
7690    "src/qs8-dwconv/gen/up8x25-minmax-fp32-avx2-mul32.c",
7691    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7692    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx2-mul16-vpmovsx.c",
7693    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx2-mul16-vpunpck.c",
7694    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c",
7695    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7696    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx2-mul16-vpmovsx.c",
7697    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx2-mul16-vpunpck.c",
7698    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c",
7699    "src/qs8-dwconv/gen/up24x9-minmax-fp32-avx2-mul32.c",
7700    "src/qs8-dwconv/gen/up24x25-minmax-fp32-avx2-mul32.c",
7701    "src/qs8-dwconv/gen/up32x9-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7702    "src/qs8-dwconv/gen/up32x9-minmax-fp32-avx2-mul16-vpmovsx.c",
7703    "src/qs8-dwconv/gen/up32x9-minmax-fp32-avx2-mul16-vpunpck.c",
7704    "src/qs8-dwconv/gen/up32x9-minmax-fp32-avx2-mul32.c",
7705    "src/qs8-dwconv/gen/up32x25-minmax-fp32-avx2-mul16-add16-vpunpck.c",
7706    "src/qs8-dwconv/gen/up32x25-minmax-fp32-avx2-mul16-vpmovsx.c",
7707    "src/qs8-dwconv/gen/up32x25-minmax-fp32-avx2-mul16-vpunpck.c",
7708    "src/qs8-dwconv/gen/up32x25-minmax-fp32-avx2-mul32.c",
7709    "src/qs8-f32-vcvt/gen/vcvt-avx2-x8.c",
7710    "src/qs8-f32-vcvt/gen/vcvt-avx2-x16.c",
7711    "src/qs8-f32-vcvt/gen/vcvt-avx2-x24.c",
7712    "src/qs8-f32-vcvt/gen/vcvt-avx2-x32.c",
7713    "src/qs8-gemm/gen/1x8c8-minmax-fp32-avx2.c",
7714    "src/qs8-gemm/gen/1x8c8-xw-minmax-fp32-avx2.c",
7715    "src/qs8-gemm/gen/2x8c8-minmax-fp32-avx2.c",
7716    "src/qs8-gemm/gen/2x8c8-xw-minmax-fp32-avx2.c",
7717    "src/qs8-gemm/gen/3x8c8-minmax-fp32-avx2.c",
7718    "src/qs8-gemm/gen/3x8c8-xw-minmax-fp32-avx2.c",
7719    "src/qs8-igemm/gen/1x8c8-minmax-fp32-avx2.c",
7720    "src/qs8-igemm/gen/2x8c8-minmax-fp32-avx2.c",
7721    "src/qs8-igemm/gen/3x8c8-minmax-fp32-avx2.c",
7722    "src/qs8-vadd/gen/minmax-avx2-mul32-ld64-x8.c",
7723    "src/qs8-vadd/gen/minmax-avx2-mul32-ld64-x16.c",
7724    "src/qs8-vadd/gen/minmax-avx2-mul32-ld64-x24.c",
7725    "src/qs8-vadd/gen/minmax-avx2-mul32-ld64-x32.c",
7726    "src/qs8-vaddc/gen/minmax-avx2-mul32-ld64-x8.c",
7727    "src/qs8-vaddc/gen/minmax-avx2-mul32-ld64-x16.c",
7728    "src/qs8-vaddc/gen/minmax-avx2-mul32-ld64-x24.c",
7729    "src/qs8-vaddc/gen/minmax-avx2-mul32-ld64-x32.c",
7730    "src/qs8-vcvt/gen/vcvt-avx2-x16.c",
7731    "src/qs8-vcvt/gen/vcvt-avx2-x32.c",
7732    "src/qs8-vcvt/gen/vcvt-avx2-x64.c",
7733    "src/qs8-vlrelu/gen/vlrelu-avx2-x16.c",
7734    "src/qs8-vlrelu/gen/vlrelu-avx2-x32.c",
7735    "src/qs8-vlrelu/gen/vlrelu-avx2-x64.c",
7736    "src/qu8-dwconv/gen/up8x9-minmax-fp32-avx2-mul32.c",
7737    "src/qu8-dwconv/gen/up8x25-minmax-fp32-avx2-mul32.c",
7738    "src/qu8-dwconv/gen/up16x9-minmax-fp32-avx2-mul32.c",
7739    "src/qu8-dwconv/gen/up16x25-minmax-fp32-avx2-mul32.c",
7740    "src/qu8-dwconv/gen/up32x9-minmax-fp32-avx2-mul32.c",
7741    "src/qu8-dwconv/gen/up32x25-minmax-fp32-avx2-mul32.c",
7742    "src/qu8-f32-vcvt/gen/vcvt-avx2-x8.c",
7743    "src/qu8-f32-vcvt/gen/vcvt-avx2-x16.c",
7744    "src/qu8-f32-vcvt/gen/vcvt-avx2-x24.c",
7745    "src/qu8-f32-vcvt/gen/vcvt-avx2-x32.c",
7746    "src/qu8-gemm/gen/1x8c8-minmax-fp32-avx2.c",
7747    "src/qu8-gemm/gen/2x8c8-minmax-fp32-avx2.c",
7748    "src/qu8-gemm/gen/3x8c8-minmax-fp32-avx2.c",
7749    "src/qu8-igemm/gen/1x8c8-minmax-fp32-avx2.c",
7750    "src/qu8-igemm/gen/2x8c8-minmax-fp32-avx2.c",
7751    "src/qu8-igemm/gen/3x8c8-minmax-fp32-avx2.c",
7752    "src/qu8-vadd/gen/minmax-avx2-mul32-ld64-x8.c",
7753    "src/qu8-vadd/gen/minmax-avx2-mul32-ld64-x16.c",
7754    "src/qu8-vaddc/gen/minmax-avx2-mul32-ld64-x8.c",
7755    "src/qu8-vaddc/gen/minmax-avx2-mul32-ld64-x16.c",
7756    "src/qu8-vcvt/gen/vcvt-avx2-x16.c",
7757    "src/qu8-vcvt/gen/vcvt-avx2-x32.c",
7758    "src/qu8-vcvt/gen/vcvt-avx2-x64.c",
7759    "src/qu8-vlrelu/gen/vlrelu-avx2-x16.c",
7760    "src/qu8-vlrelu/gen/vlrelu-avx2-x32.c",
7761    "src/qu8-vlrelu/gen/vlrelu-avx2-x64.c",
7762    "src/x8-lut/gen/lut-avx2-x32.c",
7763    "src/x8-lut/gen/lut-avx2-x64.c",
7764    "src/x8-lut/gen/lut-avx2-x96.c",
7765    "src/x8-lut/gen/lut-avx2-x128.c",
7766]
7767
// AVX512F microkernel C sources: every path is under an src/f32-* directory
// and contains "avx512f". Entries are grouped by source directory.
// NOTE(review): presumably a subset of ALL_AVX512F_MICROKERNEL_SRCS, mirroring
// the PROD/ALL pairing used for the AVX2 lists -- confirm when editing, and
// keep any file added here listed in the ALL_ variable as well.
7768PROD_AVX512F_MICROKERNEL_SRCS = [
7769    "src/f32-dwconv/gen/up16x3-minmax-avx512f.c",
7770    "src/f32-dwconv/gen/up16x4-minmax-avx512f.c",
7771    "src/f32-dwconv/gen/up16x9-minmax-avx512f.c",
7772    "src/f32-dwconv/gen/up16x25-minmax-avx512f.c",
7773    "src/f32-gemm/gen/1x16-minmax-avx512f-broadcast.c",
7774    "src/f32-gemm/gen/7x16-minmax-avx512f-broadcast.c",
7775    "src/f32-igemm/gen/1x16-minmax-avx512f-broadcast.c",
7776    "src/f32-igemm/gen/7x16-minmax-avx512f-broadcast.c",
7777    "src/f32-prelu/gen/avx512f-2x16.c",
7778    "src/f32-vbinary/gen/vadd-minmax-avx512f-x32.c",
7779    "src/f32-vbinary/gen/vaddc-minmax-avx512f-x32.c",
7780    "src/f32-vbinary/gen/vdiv-minmax-avx512f-x32.c",
7781    "src/f32-vbinary/gen/vdivc-minmax-avx512f-x32.c",
7782    "src/f32-vbinary/gen/vmax-avx512f-x32.c",
7783    "src/f32-vbinary/gen/vmaxc-avx512f-x32.c",
7784    "src/f32-vbinary/gen/vmin-avx512f-x32.c",
7785    "src/f32-vbinary/gen/vminc-avx512f-x32.c",
7786    "src/f32-vbinary/gen/vmul-minmax-avx512f-x32.c",
7787    "src/f32-vbinary/gen/vmulc-minmax-avx512f-x32.c",
7788    "src/f32-vbinary/gen/vrdivc-minmax-avx512f-x32.c",
7789    "src/f32-vbinary/gen/vrsubc-minmax-avx512f-x32.c",
7790    "src/f32-vbinary/gen/vsqrdiff-avx512f-x32.c",
7791    "src/f32-vbinary/gen/vsqrdiffc-avx512f-x32.c",
7792    "src/f32-vbinary/gen/vsub-minmax-avx512f-x32.c",
7793    "src/f32-vbinary/gen/vsubc-minmax-avx512f-x32.c",
7794    "src/f32-vclamp/gen/vclamp-avx512f-x16.c",
7795    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x64.c",
7796    "src/f32-vhswish/gen/vhswish-avx512f-x16.c",
7797    "src/f32-vlrelu/gen/vlrelu-avx512f-x16.c",
7798    "src/f32-vrnd/gen/vrndd-avx512f-x16.c",
7799    "src/f32-vrnd/gen/vrndne-avx512f-x16.c",
7800    "src/f32-vrnd/gen/vrndu-avx512f-x16.c",
7801    "src/f32-vrnd/gen/vrndz-avx512f-x16.c",
7802    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x64.c",
7803    "src/f32-vunary/gen/vabs-avx512f-x16.c",
7804    "src/f32-vunary/gen/vneg-avx512f-x16.c",
7805    "src/f32-vunary/gen/vsqr-avx512f-x16.c",
7806]
7807
7808ALL_AVX512F_MICROKERNEL_SRCS = [
7809    "src/f32-dwconv/gen/up16x3-minmax-avx512f-acc2.c",
7810    "src/f32-dwconv/gen/up16x3-minmax-avx512f.c",
7811    "src/f32-dwconv/gen/up16x4-minmax-avx512f-acc2.c",
7812    "src/f32-dwconv/gen/up16x4-minmax-avx512f.c",
7813    "src/f32-dwconv/gen/up16x9-minmax-avx512f-acc2.c",
7814    "src/f32-dwconv/gen/up16x9-minmax-avx512f.c",
7815    "src/f32-dwconv/gen/up16x25-minmax-avx512f-acc2.c",
7816    "src/f32-dwconv/gen/up16x25-minmax-avx512f.c",
7817    "src/f32-dwconv/gen/up32x3-minmax-avx512f-acc2.c",
7818    "src/f32-dwconv/gen/up32x3-minmax-avx512f.c",
7819    "src/f32-dwconv/gen/up32x4-minmax-avx512f-acc2.c",
7820    "src/f32-dwconv/gen/up32x4-minmax-avx512f.c",
7821    "src/f32-dwconv/gen/up32x9-minmax-avx512f-acc2.c",
7822    "src/f32-dwconv/gen/up32x9-minmax-avx512f.c",
7823    "src/f32-dwconv/gen/up32x25-minmax-avx512f-acc2.c",
7824    "src/f32-dwconv/gen/up32x25-minmax-avx512f.c",
7825    "src/f32-gemm/gen-inc/1x16inc-minmax-avx512f-broadcast.c",
7826    "src/f32-gemm/gen-inc/4x16inc-minmax-avx512f-broadcast.c",
7827    "src/f32-gemm/gen-inc/5x16inc-minmax-avx512f-broadcast.c",
7828    "src/f32-gemm/gen-inc/6x16inc-minmax-avx512f-broadcast.c",
7829    "src/f32-gemm/gen-inc/7x16inc-minmax-avx512f-broadcast.c",
7830    "src/f32-gemm/gen-inc/8x16inc-minmax-avx512f-broadcast.c",
7831    "src/f32-gemm/gen/1x16-minmax-avx512f-broadcast.c",
7832    "src/f32-gemm/gen/4x16-minmax-avx512f-broadcast.c",
7833    "src/f32-gemm/gen/5x16-minmax-avx512f-broadcast.c",
7834    "src/f32-gemm/gen/6x16-minmax-avx512f-broadcast.c",
7835    "src/f32-gemm/gen/7x16-minmax-avx512f-broadcast.c",
7836    "src/f32-gemm/gen/8x16-minmax-avx512f-broadcast.c",
7837    "src/f32-igemm/gen/1x16-minmax-avx512f-broadcast.c",
7838    "src/f32-igemm/gen/4x16-minmax-avx512f-broadcast.c",
7839    "src/f32-igemm/gen/5x16-minmax-avx512f-broadcast.c",
7840    "src/f32-igemm/gen/6x16-minmax-avx512f-broadcast.c",
7841    "src/f32-igemm/gen/7x16-minmax-avx512f-broadcast.c",
7842    "src/f32-igemm/gen/8x16-minmax-avx512f-broadcast.c",
7843    "src/f32-prelu/gen/avx512f-2x16.c",
7844    "src/f32-prelu/gen/avx512f-2x32.c",
7845    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc2.c",
7846    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128-acc4.c",
7847    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x128.c",
7848    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144-acc3.c",
7849    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x144.c",
7850    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc2.c",
7851    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160-acc5.c",
7852    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x160.c",
7853    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc2.c",
7854    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc3.c",
7855    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192-acc6.c",
7856    "src/f32-raddexpminusmax/gen/avx512f-p5-scalef-x192.c",
7857    "src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc2.c",
7858    "src/f32-raddextexp/gen/avx512f-p5-scalef-x128-acc4.c",
7859    "src/f32-raddextexp/gen/avx512f-p5-scalef-x128.c",
7860    "src/f32-raddextexp/gen/avx512f-p5-scalef-x144-acc3.c",
7861    "src/f32-raddextexp/gen/avx512f-p5-scalef-x144.c",
7862    "src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc2.c",
7863    "src/f32-raddextexp/gen/avx512f-p5-scalef-x160-acc5.c",
7864    "src/f32-raddextexp/gen/avx512f-p5-scalef-x160.c",
7865    "src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc2.c",
7866    "src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc3.c",
7867    "src/f32-raddextexp/gen/avx512f-p5-scalef-x192-acc6.c",
7868    "src/f32-raddextexp/gen/avx512f-p5-scalef-x192.c",
7869    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x128-acc2.c",
7870    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x128-acc4.c",
7871    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x128.c",
7872    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x144-acc3.c",
7873    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x144.c",
7874    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x160-acc2.c",
7875    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x160-acc5.c",
7876    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x160.c",
7877    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x192-acc2.c",
7878    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x192-acc3.c",
7879    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x192-acc6.c",
7880    "src/f32-raddstoreexpminusmax/gen/avx512f-rr1-p5-scalef-x192.c",
7881    "src/f32-rmax/avx512f.c",
7882    "src/f32-vbinary/gen/vadd-minmax-avx512f-x16.c",
7883    "src/f32-vbinary/gen/vadd-minmax-avx512f-x32.c",
7884    "src/f32-vbinary/gen/vaddc-minmax-avx512f-x16.c",
7885    "src/f32-vbinary/gen/vaddc-minmax-avx512f-x32.c",
7886    "src/f32-vbinary/gen/vdiv-minmax-avx512f-x16.c",
7887    "src/f32-vbinary/gen/vdiv-minmax-avx512f-x32.c",
7888    "src/f32-vbinary/gen/vdivc-minmax-avx512f-x16.c",
7889    "src/f32-vbinary/gen/vdivc-minmax-avx512f-x32.c",
7890    "src/f32-vbinary/gen/vmax-avx512f-x16.c",
7891    "src/f32-vbinary/gen/vmax-avx512f-x32.c",
7892    "src/f32-vbinary/gen/vmaxc-avx512f-x16.c",
7893    "src/f32-vbinary/gen/vmaxc-avx512f-x32.c",
7894    "src/f32-vbinary/gen/vmin-avx512f-x16.c",
7895    "src/f32-vbinary/gen/vmin-avx512f-x32.c",
7896    "src/f32-vbinary/gen/vminc-avx512f-x16.c",
7897    "src/f32-vbinary/gen/vminc-avx512f-x32.c",
7898    "src/f32-vbinary/gen/vmul-minmax-avx512f-x16.c",
7899    "src/f32-vbinary/gen/vmul-minmax-avx512f-x32.c",
7900    "src/f32-vbinary/gen/vmulc-minmax-avx512f-x16.c",
7901    "src/f32-vbinary/gen/vmulc-minmax-avx512f-x32.c",
7902    "src/f32-vbinary/gen/vrdivc-minmax-avx512f-x16.c",
7903    "src/f32-vbinary/gen/vrdivc-minmax-avx512f-x32.c",
7904    "src/f32-vbinary/gen/vrsubc-minmax-avx512f-x16.c",
7905    "src/f32-vbinary/gen/vrsubc-minmax-avx512f-x32.c",
7906    "src/f32-vbinary/gen/vsqrdiff-avx512f-x16.c",
7907    "src/f32-vbinary/gen/vsqrdiff-avx512f-x32.c",
7908    "src/f32-vbinary/gen/vsqrdiffc-avx512f-x16.c",
7909    "src/f32-vbinary/gen/vsqrdiffc-avx512f-x32.c",
7910    "src/f32-vbinary/gen/vsub-minmax-avx512f-x16.c",
7911    "src/f32-vbinary/gen/vsub-minmax-avx512f-x32.c",
7912    "src/f32-vbinary/gen/vsubc-minmax-avx512f-x16.c",
7913    "src/f32-vbinary/gen/vsubc-minmax-avx512f-x32.c",
7914    "src/f32-vclamp/gen/vclamp-avx512f-x16.c",
7915    "src/f32-vclamp/gen/vclamp-avx512f-x32.c",
7916    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x16.c",
7917    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x32.c",
7918    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x48.c",
7919    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x64.c",
7920    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x80.c",
7921    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x96.c",
7922    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x112.c",
7923    "src/f32-velu/gen/velu-avx512f-rr1-lut16-p3-perm-x128.c",
7924    "src/f32-velu/gen/velu-avx512f-rr1-p6-x16.c",
7925    "src/f32-velu/gen/velu-avx512f-rr1-p6-x32.c",
7926    "src/f32-velu/gen/velu-avx512f-rr1-p6-x48.c",
7927    "src/f32-velu/gen/velu-avx512f-rr1-p6-x64.c",
7928    "src/f32-velu/gen/velu-avx512f-rr1-p6-x80.c",
7929    "src/f32-velu/gen/velu-avx512f-rr1-p6-x96.c",
7930    "src/f32-velu/gen/velu-avx512f-rr1-p6-x112.c",
7931    "src/f32-velu/gen/velu-avx512f-rr1-p6-x128.c",
7932    "src/f32-vhswish/gen/vhswish-avx512f-x16.c",
7933    "src/f32-vhswish/gen/vhswish-avx512f-x32.c",
7934    "src/f32-vlrelu/gen/vlrelu-avx512f-x16.c",
7935    "src/f32-vlrelu/gen/vlrelu-avx512f-x32.c",
7936    "src/f32-vrelu/gen/vrelu-avx512f-x16.c",
7937    "src/f32-vrelu/gen/vrelu-avx512f-x32.c",
7938    "src/f32-vrnd/gen/vrndd-avx512f-x16.c",
7939    "src/f32-vrnd/gen/vrndd-avx512f-x32.c",
7940    "src/f32-vrnd/gen/vrndne-avx512f-x16.c",
7941    "src/f32-vrnd/gen/vrndne-avx512f-x32.c",
7942    "src/f32-vrnd/gen/vrndu-avx512f-x16.c",
7943    "src/f32-vrnd/gen/vrndu-avx512f-x32.c",
7944    "src/f32-vrnd/gen/vrndz-avx512f-x16.c",
7945    "src/f32-vrnd/gen/vrndz-avx512f-x32.c",
7946    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x16.c",
7947    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x32.c",
7948    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x48.c",
7949    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x64.c",
7950    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x80.c",
7951    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x96.c",
7952    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x112.c",
7953    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x128.c",
7954    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x144.c",
7955    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x160.c",
7956    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x176.c",
7957    "src/f32-vscaleexpminusmax/gen/avx512f-p5-scalef-x192.c",
7958    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x16.c",
7959    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x32.c",
7960    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x48.c",
7961    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x64.c",
7962    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x80.c",
7963    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x96.c",
7964    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x112.c",
7965    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x128.c",
7966    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x144.c",
7967    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x160.c",
7968    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x176.c",
7969    "src/f32-vscaleextexp/gen/avx512f-p5-scalef-x192.c",
7970    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x16.c",
7971    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x32.c",
7972    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x48.c",
7973    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x64.c",
7974    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x80.c",
7975    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x96.c",
7976    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x112.c",
7977    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-x128.c",
7978    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x16.c",
7979    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x32.c",
7980    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x48.c",
7981    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x64.c",
7982    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x80.c",
7983    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x96.c",
7984    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x112.c",
7985    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-x128.c",
7986    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x16.c",
7987    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x32.c",
7988    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x48.c",
7989    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x64.c",
7990    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x80.c",
7991    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x96.c",
7992    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x112.c",
7993    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-div-x128.c",
7994    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x16.c",
7995    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x32.c",
7996    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x48.c",
7997    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x64.c",
7998    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x80.c",
7999    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x96.c",
8000    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x112.c",
8001    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr1-p5-scalef-nr1fma-x128.c",
8002    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x16.c",
8003    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x32.c",
8004    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x48.c",
8005    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x64.c",
8006    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x80.c",
8007    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x96.c",
8008    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x112.c",
8009    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-x128.c",
8010    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x16.c",
8011    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x32.c",
8012    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x48.c",
8013    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x64.c",
8014    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x80.c",
8015    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x96.c",
8016    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x112.c",
8017    "src/f32-vsigmoid/gen/vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x128.c",
8018    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x16.c",
8019    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x32.c",
8020    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x48.c",
8021    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x64.c",
8022    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x80.c",
8023    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x96.c",
8024    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x112.c",
8025    "src/f32-vsqrt/gen/avx512f-nr1fma1adj-x128.c",
8026    "src/f32-vunary/gen/vabs-avx512f-x16.c",
8027    "src/f32-vunary/gen/vabs-avx512f-x32.c",
8028    "src/f32-vunary/gen/vneg-avx512f-x16.c",
8029    "src/f32-vunary/gen/vneg-avx512f-x32.c",
8030    "src/f32-vunary/gen/vsqr-avx512f-x16.c",
8031    "src/f32-vunary/gen/vsqr-avx512f-x32.c",
8032    "src/math/exp-f32-avx512f-rr2-lut16-p3-perm-scalef.c",
8033    "src/math/exp-f32-avx512f-rr2-lut16-p3-perm.c",
8034    "src/math/exp-f32-avx512f-rr2-lut32-p2-perm2-scalef.c",
8035    "src/math/exp-f32-avx512f-rr2-lut32-p2-perm2.c",
8036    "src/math/exp-f32-avx512f-rr2-p5-scalef.c",
8037    "src/math/exp-f32-avx512f-rr2-p5.c",
8038    "src/math/expm1minus-f32-avx512f-rr1-lut16-p3-perm.c",
8039    "src/math/expm1minus-f32-avx512f-rr1-p6.c",
8040    "src/math/extexp-avx512f-p5.c",
8041    "src/math/sigmoid-f32-avx512f-rr1-lut16-p3-perm-scalef-div.c",
8042    "src/math/sigmoid-f32-avx512f-rr1-lut16-p3-perm-scalef-nr1fma.c",
8043    "src/math/sigmoid-f32-avx512f-rr1-lut16-p3-perm-scalef-nr1fma1adj.c",
8044    "src/math/sigmoid-f32-avx512f-rr1-lut32-p2-perm2-scalef-div.c",
8045    "src/math/sigmoid-f32-avx512f-rr1-lut32-p2-perm2-scalef-nr1fma.c",
8046    "src/math/sigmoid-f32-avx512f-rr1-lut32-p2-perm2-scalef-nr1fma1adj.c",
8047    "src/math/sigmoid-f32-avx512f-rr1-lut64-p2-gather-scalef-div.c",
8048    "src/math/sigmoid-f32-avx512f-rr1-lut64-p2-gather-scalef-nr1fma.c",
8049    "src/math/sigmoid-f32-avx512f-rr1-lut64-p2-gather-scalef-nr1fma1adj.c",
8050    "src/math/sigmoid-f32-avx512f-rr1-p5-scalef-div.c",
8051    "src/math/sigmoid-f32-avx512f-rr1-p5-scalef-nr1fma.c",
8052    "src/math/sigmoid-f32-avx512f-rr1-p5-scalef-nr1fma1adj.c",
8053    "src/math/sigmoid-f32-avx512f-rr2-lut16-p3-perm-scalef-div.c",
8054    "src/math/sigmoid-f32-avx512f-rr2-lut16-p3-perm-scalef-nr1fma.c",
8055    "src/math/sigmoid-f32-avx512f-rr2-lut16-p3-perm-scalef-nr1fma1adj.c",
8056    "src/math/sigmoid-f32-avx512f-rr2-lut32-p2-perm2-scalef-div.c",
8057    "src/math/sigmoid-f32-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma.c",
8058    "src/math/sigmoid-f32-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma1adj.c",
8059    "src/math/sigmoid-f32-avx512f-rr2-lut64-p2-gather-scalef-div.c",
8060    "src/math/sigmoid-f32-avx512f-rr2-lut64-p2-gather-scalef-nr1fma.c",
8061    "src/math/sigmoid-f32-avx512f-rr2-lut64-p2-gather-scalef-nr1fma1adj.c",
8062    "src/math/sigmoid-f32-avx512f-rr2-p5-scalef-div.c",
8063    "src/math/sigmoid-f32-avx512f-rr2-p5-scalef-nr1fma.c",
8064    "src/math/sigmoid-f32-avx512f-rr2-p5-scalef-nr1fma1adj.c",
8065    "src/math/sqrt-avx512f-nr1fma.c",
8066    "src/math/sqrt-avx512f-nr1fma1adj.c",
8067    "src/math/sqrt-avx512f-nr2fma.c",
8068]
8069
// Source files of the AVX512SKX microkernels in the "PROD" set.
// Every path listed here also appears in ALL_AVX512SKX_MICROKERNEL_SRCS, so
// this list is a subset of that one.
// NOTE(review): "PROD" presumably marks the kernels selected for production
// builds -- confirm against the modules that consume this variable.
8070PROD_AVX512SKX_MICROKERNEL_SRCS = [
8071    "src/f16-f32-vcvt/gen/vcvt-avx512skx-x16.c",
8072    "src/f32-f16-vcvt/gen/vcvt-avx512skx-x16.c",
8073    "src/f32-qs8-vcvt/gen/vcvt-avx512skx-x128.c",
8074    "src/f32-qu8-vcvt/gen/vcvt-avx512skx-x128.c",
8075    "src/qc8-dwconv/gen/up32x3-minmax-fp32-avx512skx-mul32.c",
8076    "src/qc8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c",
8077    "src/qc8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c",
8078    "src/qc8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8079    "src/qc8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8080    "src/qc8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8081    "src/qc8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8082    "src/qs8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c",
8083    "src/qs8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c",
8084    "src/qs8-f32-vcvt/gen/vcvt-avx512skx-x32.c",
8085    "src/qs8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8086    "src/qs8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8087    "src/qs8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8088    "src/qs8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8089    "src/qs8-vadd/gen/minmax-avx512skx-mul32-ld128-x16.c",
8090    "src/qs8-vaddc/gen/minmax-avx512skx-mul32-ld128-x16.c",
8091    "src/qu8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c",
8092    "src/qu8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c",
8093    "src/qu8-f32-vcvt/gen/vcvt-avx512skx-x32.c",
8094    "src/qu8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8095    "src/qu8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8096    "src/qu8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8097    "src/qu8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8098    "src/qu8-vadd/gen/minmax-avx512skx-mul32-ld128-x16.c",
8099    "src/qu8-vaddc/gen/minmax-avx512skx-mul32-ld128-x16.c",
8100    "src/x8-lut/gen/lut-avx512skx-vpshufb-x64.c",
8101]
8102
// Source files of the full AVX512SKX microkernel set. The entries come from
// the *-vcvt, *-dwconv, *-gemm, *-igemm, *-vadd, *-vaddc and x8-lut
// directories, and every file name carries the "avx512skx" tag.
// This list contains every entry of PROD_AVX512SKX_MICROKERNEL_SRCS plus
// further variants of the same kernels.
8103ALL_AVX512SKX_MICROKERNEL_SRCS = [
8104    "src/f16-f32-vcvt/gen/vcvt-avx512skx-x16.c",
8105    "src/f16-f32-vcvt/gen/vcvt-avx512skx-x32.c",
8106    "src/f32-f16-vcvt/gen/vcvt-avx512skx-x16.c",
8107    "src/f32-f16-vcvt/gen/vcvt-avx512skx-x32.c",
8108    "src/f32-qs8-vcvt/gen/vcvt-avx512skx-x32.c",
8109    "src/f32-qs8-vcvt/gen/vcvt-avx512skx-x64.c",
8110    "src/f32-qs8-vcvt/gen/vcvt-avx512skx-x96.c",
8111    "src/f32-qs8-vcvt/gen/vcvt-avx512skx-x128.c",
8112    "src/f32-qu8-vcvt/gen/vcvt-avx512skx-x32.c",
8113    "src/f32-qu8-vcvt/gen/vcvt-avx512skx-x64.c",
8114    "src/f32-qu8-vcvt/gen/vcvt-avx512skx-x96.c",
8115    "src/f32-qu8-vcvt/gen/vcvt-avx512skx-x128.c",
8116    "src/qc8-dwconv/gen/up16x9-minmax-fp32-avx512skx-mul32.c",
8117    "src/qc8-dwconv/gen/up16x25-minmax-fp32-avx512skx-mul32.c",
8118    "src/qc8-dwconv/gen/up32x3-minmax-fp32-avx512skx-mul32.c",
8119    "src/qc8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c",
8120    "src/qc8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c",
8121    "src/qc8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8122    "src/qc8-gemm/gen/2x16c8-minmax-fp32-avx512skx.c",
8123    "src/qc8-gemm/gen/3x16c8-minmax-fp32-avx512skx.c",
8124    "src/qc8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8125    "src/qc8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8126    "src/qc8-igemm/gen/2x16c8-minmax-fp32-avx512skx.c",
8127    "src/qc8-igemm/gen/3x16c8-minmax-fp32-avx512skx.c",
8128    "src/qc8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8129    "src/qs8-dwconv/gen/up16x9-minmax-fp32-avx512skx-mul32.c",
8130    "src/qs8-dwconv/gen/up16x25-minmax-fp32-avx512skx-mul32.c",
8131    "src/qs8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c",
8132    "src/qs8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c",
8133    "src/qs8-f32-vcvt/gen/vcvt-avx512skx-x16.c",
8134    "src/qs8-f32-vcvt/gen/vcvt-avx512skx-x32.c",
8135    "src/qs8-f32-vcvt/gen/vcvt-avx512skx-x48.c",
8136    "src/qs8-f32-vcvt/gen/vcvt-avx512skx-x64.c",
8137    "src/qs8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8138    "src/qs8-gemm/gen/2x16c8-minmax-fp32-avx512skx.c",
8139    "src/qs8-gemm/gen/3x16c8-minmax-fp32-avx512skx.c",
8140    "src/qs8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8141    "src/qs8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8142    "src/qs8-igemm/gen/2x16c8-minmax-fp32-avx512skx.c",
8143    "src/qs8-igemm/gen/3x16c8-minmax-fp32-avx512skx.c",
8144    "src/qs8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8145    "src/qs8-vadd/gen/minmax-avx512skx-mul32-ld128-x16.c",
8146    "src/qs8-vadd/gen/minmax-avx512skx-mul32-ld128-x32.c",
8147    "src/qs8-vaddc/gen/minmax-avx512skx-mul32-ld128-x16.c",
8148    "src/qs8-vaddc/gen/minmax-avx512skx-mul32-ld128-x32.c",
8149    "src/qu8-dwconv/gen/up16x9-minmax-fp32-avx512skx-mul32.c",
8150    "src/qu8-dwconv/gen/up16x25-minmax-fp32-avx512skx-mul32.c",
8151    "src/qu8-dwconv/gen/up32x9-minmax-fp32-avx512skx-mul32.c",
8152    "src/qu8-dwconv/gen/up32x25-minmax-fp32-avx512skx-mul32.c",
8153    "src/qu8-f32-vcvt/gen/vcvt-avx512skx-x16.c",
8154    "src/qu8-f32-vcvt/gen/vcvt-avx512skx-x32.c",
8155    "src/qu8-f32-vcvt/gen/vcvt-avx512skx-x48.c",
8156    "src/qu8-f32-vcvt/gen/vcvt-avx512skx-x64.c",
8157    "src/qu8-gemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8158    "src/qu8-gemm/gen/2x16c8-minmax-fp32-avx512skx.c",
8159    "src/qu8-gemm/gen/3x16c8-minmax-fp32-avx512skx.c",
8160    "src/qu8-gemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8161    "src/qu8-igemm/gen/1x16c8-minmax-fp32-avx512skx.c",
8162    "src/qu8-igemm/gen/2x16c8-minmax-fp32-avx512skx.c",
8163    "src/qu8-igemm/gen/3x16c8-minmax-fp32-avx512skx.c",
8164    "src/qu8-igemm/gen/4x16c8-minmax-fp32-avx512skx.c",
8165    "src/qu8-vadd/gen/minmax-avx512skx-mul32-ld128-x16.c",
8166    "src/qu8-vadd/gen/minmax-avx512skx-mul32-ld128-x32.c",
8167    "src/qu8-vaddc/gen/minmax-avx512skx-mul32-ld128-x16.c",
8168    "src/qu8-vaddc/gen/minmax-avx512skx-mul32-ld128-x32.c",
8169    "src/x8-lut/gen/lut-avx512skx-vpshufb-x64.c",
8170    "src/x8-lut/gen/lut-avx512skx-vpshufb-x128.c",
8171    "src/x8-lut/gen/lut-avx512skx-vpshufb-x192.c",
8172    "src/x8-lut/gen/lut-avx512skx-vpshufb-x256.c",
8173]
8174
// Assembly (.S) sources of the WASM32 microkernel set. The list holds only
// the three f32-vrelu "wasm_shr" variants (x1, x2, x4).
// NOTE(review): which module consumes this list is not visible here --
// confirm before adding or removing entries.
8175WASM32_ASM_MICROKERNEL_SRCS = [
8176    "src/f32-vrelu/wasm_shr_x1.S",
8177    "src/f32-vrelu/wasm_shr_x2.S",
8178    "src/f32-vrelu/wasm_shr_x4.S",
8179]
8180
// Assembly (.S) sources of the AArch32 microkernel set. Entries come from the
// f32-gemm, f32-igemm, qc8-dwconv, qc8/qs8/qu8 gemm and igemm, and
// u32-filterbank-accumulate directories; every file name carries the
// "aarch32" tag.
// Most paths live in a gen/ subdirectory, while a few sit directly in the
// kernel directory.
// NOTE(review): gen/ presumably holds generated files and the others are
// hand-written -- confirm before editing.
8181AARCH32_ASM_MICROKERNEL_SRCS = [
8182    "src/f32-gemm/gen/4x8-minmax-aarch32-neon-cortex-a7.S",
8183    "src/f32-gemm/gen/4x8-minmax-aarch32-neon-cortex-a53.S",
8184    "src/f32-gemm/gen/4x8-minmax-aarch32-neon-cortex-a75.S",
8185    "src/f32-gemm/gen/4x8-minmax-aarch32-neon-ld64.S",
8186    "src/f32-gemm/gen/4x8-minmax-aarch32-neon-prfm-cortex-a53.S",
8187    "src/f32-gemm/gen/4x8-minmax-aarch32-neon-prfm-cortex-a75.S",
8188    "src/f32-gemm/4x4-aarch32-vfp-ld64.S",
8189    "src/f32-gemm/4x4-minmax-aarch32-vfp-ld64.S",
8190    "src/f32-gemm/4x8-minmax-aarch32-neon-cortex-a55.S",
8191    "src/f32-igemm/gen/4x8-minmax-aarch32-neon-cortex-a7.S",
8192    "src/f32-igemm/gen/4x8-minmax-aarch32-neon-cortex-a53.S",
8193    "src/f32-igemm/gen/4x8-minmax-aarch32-neon-cortex-a75.S",
8194    "src/f32-igemm/gen/4x8-minmax-aarch32-neon-ld64.S",
8195    "src/f32-igemm/gen/4x8-minmax-aarch32-neon-prfm-cortex-a53.S",
8196    "src/f32-igemm/gen/4x8-minmax-aarch32-neon-prfm-cortex-a75.S",
8197    "src/f32-igemm/4x8-minmax-aarch32-neon-cortex-a55.S",
8198    "src/qc8-dwconv/up8x3-minmax-fp32-aarch32-neonv8-mla8-cortex-a35.S",
8199    "src/qc8-dwconv/up16x3-minmax-fp32-aarch32-neonv8-mla8-cortex-a35.S",
8200    "src/qc8-gemm/gen/1x8-minmax-fp32-aarch32-neon-mlal-lane-cortex-a7.S",
8201    "src/qc8-gemm/gen/1x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8202    "src/qc8-gemm/gen/1x8-minmax-fp32-aarch32-neonv8-mlal-lane-cortex-a35.S",
8203    "src/qc8-gemm/gen/1x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-cortex-a35.S",
8204    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-cortex-a7.S",
8205    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-cortex-a53.S",
8206    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-ld64.S",
8207    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8208    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-cortex-a53.S",
8209    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-ld64.S",
8210    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-cortex-a35.S",
8211    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-cortex-a53.S",
8212    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-ld64.S",
8213    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-cortex-a35.S",
8214    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-cortex-a53.S",
8215    "src/qc8-gemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-ld64.S",
8216    "src/qc8-gemm/gen/4x8c4-minmax-fp32-aarch32-neondot-cortex-a55.S",
8217    "src/qc8-gemm/gen/4x8c4-minmax-fp32-aarch32-neondot-ld64.S",
8218    "src/qc8-igemm/gen/1x8-minmax-fp32-aarch32-neon-mlal-lane-cortex-a7.S",
8219    "src/qc8-igemm/gen/1x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8220    "src/qc8-igemm/gen/1x8-minmax-fp32-aarch32-neonv8-mlal-lane-cortex-a35.S",
8221    "src/qc8-igemm/gen/1x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-cortex-a35.S",
8222    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-cortex-a7.S",
8223    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-cortex-a53.S",
8224    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-ld64.S",
8225    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8226    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-cortex-a53.S",
8227    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neon-mlal-lane-prfm-ld64.S",
8228    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-cortex-a35.S",
8229    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-cortex-a53.S",
8230    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-ld64.S",
8231    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-cortex-a35.S",
8232    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-cortex-a53.S",
8233    "src/qc8-igemm/gen/4x8-minmax-fp32-aarch32-neonv8-mlal-lane-prfm-ld64.S",
8234    "src/qc8-igemm/gen/4x8c4-minmax-fp32-aarch32-neondot-cortex-a55.S",
8235    "src/qc8-igemm/gen/4x8c4-minmax-fp32-aarch32-neondot-ld64.S",
8236    "src/qs8-gemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8237    "src/qs8-gemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8238    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8239    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a53.S",
8240    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-ld64.S",
8241    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8242    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a53.S",
8243    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-ld64.S",
8244    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-aarch32-neondot-cortex-a55.S",
8245    "src/qs8-gemm/gen/4x8c4-minmax-rndnu-aarch32-neondot-ld64.S",
8246    "src/qs8-igemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8247    "src/qs8-igemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8248    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8249    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a53.S",
8250    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-ld64.S",
8251    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8252    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a53.S",
8253    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-ld64.S",
8254    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-aarch32-neondot-cortex-a55.S",
8255    "src/qs8-igemm/gen/4x8c4-minmax-rndnu-aarch32-neondot-ld64.S",
8256    "src/qu8-gemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8257    "src/qu8-gemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8258    "src/qu8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8259    "src/qu8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a53.S",
8260    "src/qu8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-ld64.S",
8261    "src/qu8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8262    "src/qu8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a53.S",
8263    "src/qu8-gemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-ld64.S",
8264    "src/qu8-igemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8265    "src/qu8-igemm/gen/1x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8266    "src/qu8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a7.S",
8267    "src/qu8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-cortex-a53.S",
8268    "src/qu8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-ld64.S",
8269    "src/qu8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a7.S",
8270    "src/qu8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-cortex-a53.S",
8271    "src/qu8-igemm/gen/4x8-minmax-rndnu-aarch32-neon-mlal-lane-prfm-ld64.S",
8272    "src/u32-filterbank-accumulate/aarch32-arm-x1.S",
8273    "src/u32-filterbank-accumulate/aarch32-neon-x1.S",
8274    "src/u32-filterbank-accumulate/aarch32-neon-x2.S",
8275]
8276
8277AARCH64_ASM_MICROKERNEL_SRCS = [
8278    "src/f16-gemm/gen-inc/1x8inc-minmax-aarch64-neonfp16arith-ld64.S",
8279    "src/f16-gemm/gen-inc/1x16inc-minmax-aarch64-neonfp16arith-ld32.S",
8280    "src/f16-gemm/gen-inc/4x8inc-minmax-aarch64-neonfp16arith-ld64.S",
8281    "src/f16-gemm/gen-inc/4x16inc-minmax-aarch64-neonfp16arith-ld32.S",
8282    "src/f16-gemm/gen-inc/6x8inc-minmax-aarch64-neonfp16arith-ld64.S",
8283    "src/f16-gemm/gen-inc/6x16inc-minmax-aarch64-neonfp16arith-cortex-a55.S",
8284    "src/f16-gemm/gen-inc/6x16inc-minmax-aarch64-neonfp16arith-cortex-a75.S",
8285    "src/f16-gemm/gen-inc/6x16inc-minmax-aarch64-neonfp16arith-ld32.S",
8286    "src/f16-gemm/gen-inc/8x8inc-minmax-aarch64-neonfp16arith-ld64.S",
8287    "src/f16-gemm/gen/1x8-minmax-aarch64-neonfp16arith-ld64.S",
8288    "src/f16-gemm/gen/1x16-minmax-aarch64-neonfp16arith-ld32.S",
8289    "src/f16-gemm/gen/1x16-minmax-aarch64-neonfp16arith-ld64.S",
8290    "src/f16-gemm/gen/4x8-minmax-aarch64-neonfp16arith-ld64.S",
8291    "src/f16-gemm/gen/4x16-minmax-aarch64-neonfp16arith-ld32.S",
8292    "src/f16-gemm/gen/4x16-minmax-aarch64-neonfp16arith-ld64.S",
8293    "src/f16-gemm/gen/6x8-minmax-aarch64-neonfp16arith-ld64.S",
8294    "src/f16-gemm/gen/6x16-minmax-aarch64-neonfp16arith-cortex-a55.S",
8295    "src/f16-gemm/gen/6x16-minmax-aarch64-neonfp16arith-cortex-a55r0.S",
8296    "src/f16-gemm/gen/6x16-minmax-aarch64-neonfp16arith-cortex-a75.S",
8297    "src/f16-gemm/gen/6x16-minmax-aarch64-neonfp16arith-ld32.S",
8298    "src/f16-gemm/gen/6x16-minmax-aarch64-neonfp16arith-ld64.S",
8299    "src/f16-gemm/gen/8x8-minmax-aarch64-neonfp16arith-ld64.S",
8300    "src/f16-igemm/1x16-minmax-aarch64-neonfp16arith-ld32.S",
8301    "src/f16-igemm/1x16-minmax-aarch64-neonfp16arith-ld64.S",
8302    "src/f16-igemm/4x16-minmax-aarch64-neonfp16arith-ld32.S",
8303    "src/f16-igemm/4x16-minmax-aarch64-neonfp16arith-ld64.S",
8304    "src/f16-igemm/6x16-minmax-aarch64-neonfp16arith-cortex-a55.S",
8305    "src/f16-igemm/6x16-minmax-aarch64-neonfp16arith-cortex-a55r0.S",
8306    "src/f16-igemm/6x16-minmax-aarch64-neonfp16arith-cortex-a75.S",
8307    "src/f16-igemm/6x16-minmax-aarch64-neonfp16arith-ld32.S",
8308    "src/f16-igemm/6x16-minmax-aarch64-neonfp16arith-ld64.S",
8309    "src/f32-dwconv/up4x9-minmax-aarch64-neonfma-cortex-a55.S",
8310    "src/f32-dwconv/up4x9-minmax-aarch64-neonfma.S",
8311    "src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a53.S",
8312    "src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-cortex-a75.S",
8313    "src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-ld64.S",
8314    "src/f32-gemm/gen-inc/1x8inc-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8315    "src/f32-gemm/gen-inc/1x12inc-minmax-aarch64-neonfma-cortex-a53.S",
8316    "src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a53.S",
8317    "src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a55.S",
8318    "src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-cortex-a75.S",
8319    "src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-ld64.S",
8320    "src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-ld128.S",
8321    "src/f32-gemm/gen-inc/4x8inc-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8322    "src/f32-gemm/gen-inc/4x12inc-minmax-aarch64-neonfma-cortex-a53.S",
8323    "src/f32-gemm/gen-inc/5x8inc-minmax-aarch64-neonfma-cortex-a75.S",
8324    "src/f32-gemm/gen-inc/5x8inc-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8325    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a53.S",
8326    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a55.S",
8327    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a73.S",
8328    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-cortex-a75.S",
8329    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ld64.S",
8330    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-ld128.S",
8331    "src/f32-gemm/gen-inc/6x8inc-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8332    "src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a53.S",
8333    "src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-cortex-a75.S",
8334    "src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-ld64.S",
8335    "src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-prfm-cortex-a53.S",
8336    "src/f32-gemm/gen/1x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8337    "src/f32-gemm/gen/1x12-minmax-aarch64-neonfma-cortex-a53.S",
8338    "src/f32-gemm/gen/4x2-minmax-aarch64-neonfma-cortex-a75.S",
8339    "src/f32-gemm/gen/4x2-minmax-aarch64-neonfma-ld64.S",
8340    "src/f32-gemm/gen/4x2-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8341    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a53.S",
8342    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a55.S",
8343    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-cortex-a75.S",
8344    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-ld64.S",
8345    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-ld128.S",
8346    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-prfm-cortex-a53.S",
8347    "src/f32-gemm/gen/4x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8348    "src/f32-gemm/gen/4x12-minmax-aarch64-neonfma-cortex-a53.S",
8349    "src/f32-gemm/gen/5x8-minmax-aarch64-neonfma-cortex-a75.S",
8350    "src/f32-gemm/gen/5x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8351    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a53.S",
8352    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a55.S",
8353    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a73.S",
8354    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-cortex-a75.S",
8355    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ld64.S",
8356    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-ld128.S",
8357    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-prfm-cortex-a53.S",
8358    "src/f32-gemm/gen/6x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8359    "src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-cortex-a53.S",
8360    "src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-cortex-a75.S",
8361    "src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-prfm-cortex-a53.S",
8362    "src/f32-igemm/gen/1x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8363    "src/f32-igemm/gen/4x2-minmax-aarch64-neonfma-cortex-a75.S",
8364    "src/f32-igemm/gen/4x2-minmax-aarch64-neonfma-ld64.S",
8365    "src/f32-igemm/gen/4x2-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8366    "src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-cortex-a53.S",
8367    "src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-cortex-a75.S",
8368    "src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-ld64.S",
8369    "src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-ld128.S",
8370    "src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-prfm-cortex-a53.S",
8371    "src/f32-igemm/gen/4x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8372    "src/f32-igemm/gen/5x8-minmax-aarch64-neonfma-cortex-a75.S",
8373    "src/f32-igemm/gen/5x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8374    "src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-cortex-a53.S",
8375    "src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-cortex-a75.S",
8376    "src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-ld64.S",
8377    "src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-ld128.S",
8378    "src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-prfm-cortex-a53.S",
8379    "src/f32-igemm/gen/6x8-minmax-aarch64-neonfma-prfm-cortex-a75.S",
8380    "src/f32-igemm/1x12-minmax-aarch64-neonfma-cortex-a53.S",
8381    "src/f32-igemm/4x8-minmax-aarch64-neonfma-cortex-a55.S",
8382    "src/f32-igemm/4x12-minmax-aarch64-neonfma-cortex-a53.S",
8383    "src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a55.S",
8384    "src/f32-igemm/6x8-minmax-aarch64-neonfma-cortex-a73.S",
8385    "src/qc8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8386    "src/qc8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8387    "src/qc8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8388    "src/qc8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal.S",
8389    "src/qc8-gemm/gen/1x16c4-minmax-fp32-aarch64-neondot-ld32.S",
8390    "src/qc8-gemm/gen/1x16c4-minmax-fp32-aarch64-neondot-ld64.S",
8391    "src/qc8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8392    "src/qc8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8393    "src/qc8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8394    "src/qc8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal.S",
8395    "src/qc8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mull.S",
8396    "src/qc8-gemm/gen/2x8c16-minmax-fp32-aarch64-neon-mlal.S",
8397    "src/qc8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-cortex-a53.S",
8398    "src/qc8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-ld64.S",
8399    "src/qc8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8400    "src/qc8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-ld64.S",
8401    "src/qc8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-cortex-a55.S",
8402    "src/qc8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld32.S",
8403    "src/qc8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld64.S",
8404    "src/qc8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld128.S",
8405    "src/qc8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8406    "src/qc8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8407    "src/qc8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8408    "src/qc8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal.S",
8409    "src/qc8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8410    "src/qc8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8411    "src/qc8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8412    "src/qc8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal.S",
8413    "src/qc8-igemm/gen/2x8c16-minmax-fp32-aarch64-neon-mlal.S",
8414    "src/qc8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-cortex-a53.S",
8415    "src/qc8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-ld64.S",
8416    "src/qc8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8417    "src/qc8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-ld64.S",
8418    "src/qc8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-cortex-a55.S",
8419    "src/qc8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld64.S",
8420    "src/qc8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld128.S",
8421    "src/qs8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8422    "src/qs8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8423    "src/qs8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8424    "src/qs8-gemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal.S",
8425    "src/qs8-gemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal-cortex-a53.S",
8426    "src/qs8-gemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal-prfm-cortex-a53.S",
8427    "src/qs8-gemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal-prfm.S",
8428    "src/qs8-gemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal.S",
8429    "src/qs8-gemm/gen/1x16c4-minmax-fp32-aarch64-neondot-ld32.S",
8430    "src/qs8-gemm/gen/1x16c4-minmax-fp32-aarch64-neondot-ld64.S",
8431    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-aarch64-neondot-ld32.S",
8432    "src/qs8-gemm/gen/1x16c4-minmax-rndnu-aarch64-neondot-ld64.S",
8433    "src/qs8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8434    "src/qs8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8435    "src/qs8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8436    "src/qs8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal.S",
8437    "src/qs8-gemm/gen/2x8c8-minmax-fp32-aarch64-neon-mull.S",
8438    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal-cortex-a53.S",
8439    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal-prfm-cortex-a53.S",
8440    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal-prfm.S",
8441    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal.S",
8442    "src/qs8-gemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mull.S",
8443    "src/qs8-gemm/gen/2x8c16-minmax-fp32-aarch64-neon-mlal.S",
8444    "src/qs8-gemm/gen/2x8c16-minmax-rndnu-aarch64-neon-mlal.S",
8445    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch64-neon-mlal-lane-ld64.S",
8446    "src/qs8-gemm/gen/4x8-minmax-rndnu-aarch64-neon-mlal-lane-prfm-ld64.S",
8447    "src/qs8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-cortex-a53.S",
8448    "src/qs8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-ld64.S",
8449    "src/qs8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8450    "src/qs8-gemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-ld64.S",
8451    "src/qs8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-cortex-a53.S",
8452    "src/qs8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-ld64.S",
8453    "src/qs8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8454    "src/qs8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-ld64.S",
8455    "src/qs8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-cortex-a55.S",
8456    "src/qs8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld32.S",
8457    "src/qs8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld64.S",
8458    "src/qs8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld128.S",
8459    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-cortex-a55.S",
8460    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld32.S",
8461    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld64.S",
8462    "src/qs8-gemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld128.S",
8463    "src/qs8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8464    "src/qs8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8465    "src/qs8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8466    "src/qs8-igemm/gen/1x8c8-minmax-fp32-aarch64-neon-mlal.S",
8467    "src/qs8-igemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal-cortex-a53.S",
8468    "src/qs8-igemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal-prfm-cortex-a53.S",
8469    "src/qs8-igemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal-prfm.S",
8470    "src/qs8-igemm/gen/1x8c8-minmax-rndnu-aarch64-neon-mlal.S",
8471    "src/qs8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-cortex-a53.S",
8472    "src/qs8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm-cortex-a53.S",
8473    "src/qs8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal-prfm.S",
8474    "src/qs8-igemm/gen/2x8c8-minmax-fp32-aarch64-neon-mlal.S",
8475    "src/qs8-igemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal-cortex-a53.S",
8476    "src/qs8-igemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal-prfm-cortex-a53.S",
8477    "src/qs8-igemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal-prfm.S",
8478    "src/qs8-igemm/gen/2x8c8-minmax-rndnu-aarch64-neon-mlal.S",
8479    "src/qs8-igemm/gen/2x8c16-minmax-fp32-aarch64-neon-mlal.S",
8480    "src/qs8-igemm/gen/2x8c16-minmax-rndnu-aarch64-neon-mlal.S",
8481    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch64-neon-mlal-lane-ld64.S",
8482    "src/qs8-igemm/gen/4x8-minmax-rndnu-aarch64-neon-mlal-lane-prfm-ld64.S",
8483    "src/qs8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-cortex-a53.S",
8484    "src/qs8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-ld64.S",
8485    "src/qs8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8486    "src/qs8-igemm/gen/4x16-minmax-fp32-aarch64-neon-mlal-lane-prfm-ld64.S",
8487    "src/qs8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-cortex-a53.S",
8488    "src/qs8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-ld64.S",
8489    "src/qs8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8490    "src/qs8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-ld64.S",
8491    "src/qs8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-cortex-a55.S",
8492    "src/qs8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld64.S",
8493    "src/qs8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld128.S",
8494    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-cortex-a55.S",
8495    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld64.S",
8496    "src/qs8-igemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld128.S",
8497    "src/qu8-gemm/gen/4x8c4-minmax-rndnu-aarch64-neondot-cortex-a55.S",
8498    "src/qu8-gemm/gen/4x8c4-minmax-rndnu-aarch64-neondot-ld128.S",
8499    "src/qu8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-cortex-a53.S",
8500    "src/qu8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-cortex-a75.S",
8501    "src/qu8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-ld64.S",
8502    "src/qu8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8503    "src/qu8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-cortex-a75.S",
8504    "src/qu8-gemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-ld64.S",
8505    "src/qu8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-cortex-a55.S",
8506    "src/qu8-gemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld128.S",
8507    "src/qu8-gemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-cortex-a55.S",
8508    "src/qu8-gemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld128.S",
8509    "src/qu8-igemm/gen/4x8c4-minmax-rndnu-aarch64-neondot-cortex-a55.S",
8510    "src/qu8-igemm/gen/4x8c4-minmax-rndnu-aarch64-neondot-ld128.S",
8511    "src/qu8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-cortex-a53.S",
8512    "src/qu8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-cortex-a75.S",
8513    "src/qu8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-ld64.S",
8514    "src/qu8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-cortex-a53.S",
8515    "src/qu8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-cortex-a75.S",
8516    "src/qu8-igemm/gen/4x16-minmax-rndnu-aarch64-neon-mlal-lane-prfm-ld64.S",
8517    "src/qu8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-cortex-a55.S",
8518    "src/qu8-igemm/gen/4x16c4-minmax-fp32-aarch64-neondot-ld128.S",
8519    "src/qu8-igemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-cortex-a55.S",
8520    "src/qu8-igemm/gen/4x16c4-minmax-rndnu-aarch64-neondot-ld128.S",
8521]
8522
// C++ JIT code-generator sources compiled only for 32-bit ARM targets
// (consumed by the arch.arm section of xnnpack_jit). The list is assembled
// from one sub-list per kernel family; element order is unchanged.
JIT_AARCH32_SRCS = [
    // f32 GEMM generators
    "src/f32-gemm/4x8-aarch32-neon-cortex-a7.cc",
    "src/f32-gemm/4x8-aarch32-neon-cortex-a53.cc",
    "src/f32-gemm/4x8-aarch32-neon-cortex-a55.cc",
    "src/f32-gemm/4x8-aarch32-neon-cortex-a75.cc",
    "src/f32-gemm/4x8-aarch32-neon-ld64.cc",
] + [
    // f32 IGEMM generators
    "src/f32-igemm/4x8-aarch32-neon-cortex-a7.cc",
    "src/f32-igemm/4x8-aarch32-neon-cortex-a53.cc",
    "src/f32-igemm/4x8-aarch32-neon-cortex-a55.cc",
    "src/f32-igemm/4x8-aarch32-neon-cortex-a75.cc",
    "src/f32-igemm/4x8-aarch32-neon-ld64.cc",
] + [
    // qc8 GEMM / IGEMM generators
    "src/qc8-gemm/4x8-fp32-aarch32-neonv8-mlal-lane-ld64.cc",
    "src/qc8-gemm/4x8c4-fp32-aarch32-neondot-ld64.cc",
    "src/qc8-igemm/4x8-fp32-aarch32-neonv8-mlal-lane-ld64.cc",
    "src/qc8-igemm/4x8c4-fp32-aarch32-neondot-ld64.cc",
] + [
    // qs8 GEMM / IGEMM generators
    "src/qs8-gemm/4x8-rndnu-aarch32-neon-mlal-lane-ld64.cc",
    "src/qs8-gemm/4x8c4-rndnu-aarch32-neondot-ld64.cc",
    "src/qs8-igemm/4x8-rndnu-aarch32-neon-mlal-lane-ld64.cc",
    "src/qs8-igemm/4x8c4-rndnu-aarch32-neondot-ld64.cc",
]
8543
// C++ JIT code-generator sources compiled only for 64-bit ARM targets
// (consumed by the arch.arm64 section of xnnpack_jit). Built from a GEMM
// sub-list followed by an IGEMM sub-list; element order is unchanged.
JIT_AARCH64_SRCS = [
    // f32 GEMM generators
    "src/f32-gemm/upto6x8-aarch64-neonfma-cortex-a75.cc",
    "src/f32-gemm/1x8-aarch64-neonfma-cortex-a75.cc",
    "src/f32-gemm/4x8-aarch64-neonfma-cortex-a75.cc",
    "src/f32-gemm/6x8-aarch64-neonfma-ld128.cc",
] + [
    // f32 IGEMM generators
    "src/f32-igemm/upto6x8-aarch64-neonfma-cortex-a75.cc",
    "src/f32-igemm/1x8-aarch64-neonfma-cortex-a75.cc",
    "src/f32-igemm/4x8-aarch64-neonfma-cortex-a75.cc",
    "src/f32-igemm/6x8-aarch64-neonfma-ld128.cc",
]
8554
// Shared settings inherited by the internal XNNPACK static libraries in this
// file through `defaults: ["xnnpack_internal_default"]`.
cc_defaults {
    name: "xnnpack_internal_default",

    // Availability / platform settings.
    sdk_version: "current",
    vendor_available: true,
    stl: "libc++_static",

    // Header search roots, relative to this directory.
    local_include_dirs: [
        "include",
        "src",
    ],

    // NOTE: flag order is kept exactly as before.
    cflags: [
        // Language standard.
        "-std=c99",

        // XNN_* preprocessor switches passed to every translation unit.
        // NOTE(review): exact meaning of each value is defined by the
        // XNNPACK sources, not by this file - confirm before changing.
        "-DXNN_LOG_LEVEL=2",
        "-DXNN_ENABLE_GEMM_M_SPECIALIZATION=1",
        "-DXNN_ENABLE_JIT=0",
        "-DXNN_ENABLE_SPARSE=1",
        "-DXNN_ENABLE_ASSEMBLY=1",
        "-DXNN_ENABLE_ARM_DOTPROD=0",

        // Warnings silenced for this code base.
        "-Wno-unused-parameter",
        "-Wno-missing-field-initializers",
        "-Wno-pointer-arith",
        "-Wno-ignored-qualifiers",
    ],
}
8578
// Static library containing the sources listed in TABLE_SRCS.
cc_library_static {
    name: "xnnpack_tables",
    srcs: TABLE_SRCS,
    defaults: ["xnnpack_internal_default"],
}
8584
// Static library containing the sources listed in LOGGING_SRCS.
// Depends on the platform liblog shared library in addition to the
// statically linked clog and pthreadpool libraries.
cc_library_static {
    name: "xnnpack_logging",
    defaults: ["xnnpack_internal_default"],
    srcs: LOGGING_SRCS,
    shared_libs: ["liblog"],
    static_libs: [
        "libclog",
        "libpthreadpool",
    ],
    header_libs: ["fp16_headers"],
}
8600
// Static library built from src/params.c.
cc_library_static {
    name: "xnnpack_params",
    defaults: ["xnnpack_internal_default"],
    static_libs: ["libpthreadpool"],
    srcs: ["src/params.c"],
}
8611
// Static library built from src/microparams-init.c.
cc_library_static {
    name: "xnnpack_microparams_init",
    defaults: ["xnnpack_internal_default"],
    static_libs: ["libpthreadpool"],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
    srcs: ["src/microparams-init.c"],
}
8626
// Static library built from the allocator and memory sources.
cc_library_static {
    name: "xnnpack_allocator",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libclog",
        "libpthreadpool",
    ],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
    srcs: [
        "src/allocator.c",
        "src/memory.c",
    ],
}
8643
// Static library built from src/im2col.c; declares no library dependencies
// beyond what xnnpack_internal_default provides.
cc_library_static {
    name: "xnnpack_im2col",
    srcs: ["src/im2col.c"],
    defaults: ["xnnpack_internal_default"],
}
8651
// Static library built from src/indirection.c.
cc_library_static {
    name: "xnnpack_indirection",
    defaults: ["xnnpack_internal_default"],
    static_libs: ["libpthreadpool"],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
    srcs: ["src/indirection.c"],
}
8666
// Static library built from src/packing.c.
cc_library_static {
    name: "xnnpack_packing",
    defaults: ["xnnpack_internal_default"],
    static_libs: ["libpthreadpool"],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
    srcs: ["src/packing.c"],
}
8681
// Static library built from src/mutex.c; links against xnnpack_logging.
cc_library_static {
    name: "xnnpack_mutex",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_logging",
    ],
    srcs: ["src/mutex.c"],
}
8694
// Static library built from src/normalization.c; links against
// xnnpack_logging.
cc_library_static {
    name: "xnnpack_normalization",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_logging",
    ],
    srcs: ["src/normalization.c"],
}
8707
// Static library built from src/cache.c; links against the allocator,
// logging and mutex libraries declared in this file.
cc_library_static {
    name: "xnnpack_cache",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_allocator",
        "xnnpack_logging",
        "xnnpack_mutex",
    ],
    srcs: ["src/cache.c"],
}
8722
// Static library built from src/operators/post-operation.c; links against
// the allocator and params libraries declared in this file.
cc_library_static {
    name: "xnnpack_post_operation",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_allocator",
        "xnnpack_params",
    ],
    srcs: ["src/operators/post-operation.c"],
}
8736
// Static library with the JIT assembler sources. The three assembler files
// are built for every architecture; the per-kernel generator lists are added
// only for the matching ARM architecture.
cc_library_static {
    name: "xnnpack_jit",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_allocator",
        "xnnpack_logging",
        "xnnpack_params",
    ],
    srcs: [
        "src/jit/aarch32-assembler.cc",
        "src/jit/aarch64-assembler.cc",
        "src/jit/assembler.cc",
    ],
    arch: {
        arm64: {
            srcs: JIT_AARCH64_SRCS,
        },
        arm: {
            srcs: JIT_AARCH32_SRCS,
        },
    },
}
8761
// Static library containing the sources listed in OPERATOR_SRCS.
cc_library_static {
    name: "xnnpack_operators",
    defaults: ["xnnpack_internal_default"],
    srcs: OPERATOR_SRCS,
    // xnnpack_indirection is listed under whole_static_libs rather than
    // static_libs, so its objects are bundled into this library.
    whole_static_libs: ["xnnpack_indirection"],
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_allocator",
        "xnnpack_cache",
        "xnnpack_logging",
        "xnnpack_microparams_init",
        "xnnpack_normalization",
        "xnnpack_packing",
        "xnnpack_post_operation",
    ],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
}
8785
// Static library containing the sources listed in SUBGRAPH_SRCS.
cc_library_static {
    name: "xnnpack_subgraph",
    defaults: ["xnnpack_internal_default"],
    srcs: SUBGRAPH_SRCS,
    static_libs: [
        "libclog",
        "libpthreadpool",
        "xnnpack_allocator",
        "xnnpack_cache",
        "xnnpack_logging",
        "xnnpack_microparams_init",
        "xnnpack_normalization",
        "xnnpack_packing",
        "xnnpack_post_operation",
    ],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
}
8806
// Static library containing every source in ALL_SCALAR_MICROKERNEL_SRCS,
// built for all architectures.
cc_library_static {
    name: "xnnpack_scalar_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
    srcs: ALL_SCALAR_MICROKERNEL_SRCS,
}
8820
// Static library with the portable scalar production sources, plus an
// architecture-specific source list on arm, arm64 and riscv64.
cc_library_static {
    name: "xnnpack_scalar_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: [
        "fp16_headers",
        "fxdiv_headers",
    ],
    srcs: PROD_SCALAR_PORTABLE_MICROKERNEL_SRCS,
    arch: {
        riscv64: {
            srcs: PROD_SCALAR_RISCV_MICROKERNEL_SRCS,
        },
        // NOTE(review): arm64 reuses the AARCH32 source list - confirm this
        // is intentional.
        arm64: {
            srcs: PROD_SCALAR_AARCH32_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: PROD_SCALAR_AARCH32_MICROKERNEL_SRCS,
            cflags: ["-marm"],
        },
    },
}
8848
// Static library containing every source in ALL_ARMSIMD32_MICROKERNEL_SRCS.
// Only the 32-bit ARM variant is built: arm64, x86 and x86_64 are disabled.
cc_library_static {
    name: "xnnpack_armsimd32_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    srcs: ALL_ARMSIMD32_MICROKERNEL_SRCS,
    arch: {
        arm64: { enabled: false },
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm: {
            // Flag order preserved from the original definition.
            cflags: [
                "-marm",
                "-march=armv6",
                "-mfpu=vfp",
                "-munaligned-access",
            ],
        },
    },
}
8880
// Static library containing the sources in PROD_ARMSIMD32_MICROKERNEL_SRCS.
// Only the 32-bit ARM variant is built: arm64, x86 and x86_64 are disabled.
cc_library_static {
    name: "xnnpack_armsimd32_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    srcs: PROD_ARMSIMD32_MICROKERNEL_SRCS,
    arch: {
        arm64: { enabled: false },
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm: {
            // Flag order preserved from the original definition.
            cflags: [
                "-marm",
                "-march=armv6",
                "-mfpu=vfp",
                "-munaligned-access",
            ],
        },
    },
}
8912
// Static library containing every source in ALL_NEON_MICROKERNEL_SRCS; arm64
// additionally builds ALL_AARCH64_NEON_MICROKERNEL_SRCS. Disabled on x86 and
// x86_64.
cc_library_static {
    name: "xnnpack_neon_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    srcs: ALL_NEON_MICROKERNEL_SRCS,
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: ALL_AARCH64_NEON_MICROKERNEL_SRCS,
        },
        arm: {
            cflags: [
                "-marm",
                "-march=armv7-a",
                "-mfpu=neon",
            ],
        },
    },
}
8943
// Static library containing the sources in PROD_NEON_MICROKERNEL_SRCS; arm64
// additionally builds PROD_AARCH64_NEON_MICROKERNEL_SRCS. Disabled on x86
// and x86_64.
cc_library_static {
    name: "xnnpack_neon_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    srcs: PROD_NEON_MICROKERNEL_SRCS,
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_AARCH64_NEON_MICROKERNEL_SRCS,
        },
        arm: {
            cflags: [
                "-marm",
                "-march=armv7-a",
                "-mfpu=neon",
            ],
        },
    },
}
8974
// Static library containing every source in ALL_NEONFP16_MICROKERNEL_SRCS,
// built for arm (with -mfpu=neon-fp16) and arm64. Disabled on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonfp16_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: ALL_NEONFP16_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: ALL_NEONFP16_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv7-a",
                "-mfpu=neon-fp16",
            ],
        },
    },
}
9005
// Static library containing the sources in PROD_NEONFP16_MICROKERNEL_SRCS,
// built for arm (with -mfpu=neon-fp16) and arm64. Disabled on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonfp16_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_NEONFP16_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: PROD_NEONFP16_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv7-a",
                "-mfpu=neon-fp16",
            ],
        },
    },
}
9036
// Static library containing every source in ALL_NEONFMA_MICROKERNEL_SRCS,
// built for arm (with -mfpu=neon-vfpv4) and arm64. Disabled on x86 and
// x86_64.
cc_library_static {
    name: "xnnpack_neonfma_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: ALL_NEONFMA_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: ALL_NEONFMA_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv7-a",
                "-mfpu=neon-vfpv4",
            ],
        },
    },
}
9067
// Static library containing the sources in PROD_NEONFMA_MICROKERNEL_SRCS,
// built for arm (with -mfpu=neon-vfpv4) and arm64. Disabled on x86 and
// x86_64.
cc_library_static {
    name: "xnnpack_neonfma_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_NEONFMA_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: PROD_NEONFMA_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv7-a",
                "-mfpu=neon-vfpv4",
            ],
        },
    },
}
9098
// Static library containing every source in ALL_NEONV8_MICROKERNEL_SRCS,
// built for arm (targeting armv8-a with neon-fp-armv8) and arm64. Disabled
// on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonv8_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: ALL_NEONV8_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: ALL_NEONV8_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8-a",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9129
// Static library containing the sources in PROD_NEONV8_MICROKERNEL_SRCS,
// built for arm (targeting armv8-a with neon-fp-armv8) and arm64. Disabled
// on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonv8_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_NEONV8_MICROKERNEL_SRCS,
        },
        arm: {
            srcs: PROD_NEONV8_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8-a",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9160
// Static library containing every source in
// ALL_NEONFP16ARITH_MICROKERNEL_SRCS; arm64 also builds
// ALL_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS. Both ARM variants compile with
// -march=armv8.2-a+fp16. Disabled on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonfp16arith_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: ALL_NEONFP16ARITH_MICROKERNEL_SRCS + ALL_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS,
            cflags: ["-march=armv8.2-a+fp16"],
        },
        arm: {
            srcs: ALL_NEONFP16ARITH_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8.2-a+fp16",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9194
// Static library containing the sources in
// PROD_NEONFP16ARITH_MICROKERNEL_SRCS; arm64 also builds
// PROD_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS. Both ARM variants compile with
// -march=armv8.2-a+fp16. Disabled on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonfp16arith_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_NEONFP16ARITH_MICROKERNEL_SRCS + PROD_AARCH64_NEONFP16ARITH_MICROKERNEL_SRCS,
            cflags: ["-march=armv8.2-a+fp16"],
        },
        arm: {
            srcs: PROD_NEONFP16ARITH_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8.2-a+fp16",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9228
// Static library containing the sources in PROD_NEONBF16_MICROKERNEL_SRCS;
// arm64 also builds PROD_AARCH64_NEONBF16_MICROKERNEL_SRCS. Both ARM variants
// compile with -march=armv8.2-a+bf16. Disabled on x86 and x86_64.
cc_library_static {
    name: "xnnpack_neonbf16_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_NEONBF16_MICROKERNEL_SRCS + PROD_AARCH64_NEONBF16_MICROKERNEL_SRCS,
            cflags: ["-march=armv8.2-a+bf16"],
        },
        arm: {
            srcs: PROD_NEONBF16_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8.2-a+bf16",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9262
// Static library containing every source in ALL_NEONDOT_MICROKERNEL_SRCS,
// built for arm and arm64 with -march=armv8.2-a+dotprod. Disabled on x86 and
// x86_64.
cc_library_static {
    name: "xnnpack_neondot_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: ALL_NEONDOT_MICROKERNEL_SRCS,
            cflags: ["-march=armv8.2-a+dotprod"],
        },
        arm: {
            srcs: ALL_NEONDOT_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8.2-a+dotprod",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9296
// Static library containing the sources in PROD_NEONDOT_MICROKERNEL_SRCS,
// built for arm and arm64 with -march=armv8.2-a+dotprod. Disabled on x86 and
// x86_64.
cc_library_static {
    name: "xnnpack_neondot_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: PROD_NEONDOT_MICROKERNEL_SRCS,
            cflags: ["-march=armv8.2-a+dotprod"],
        },
        arm: {
            srcs: PROD_NEONDOT_MICROKERNEL_SRCS,
            cflags: [
                "-marm",
                "-march=armv8.2-a+dotprod",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9330
// Static library of hand-written assembly (.S) microkernels. Each ARM
// architecture assembles its own source list with architecture-specific
// assembler flags; the module is disabled on x86 and x86_64. It declares no
// header or library dependencies of its own.
cc_library_static {
    name: "xnnpack_asm_microkernels",
    defaults: ["xnnpack_internal_default"],
    arch: {
        x86: { enabled: false },
        x86_64: { enabled: false },
        arm64: {
            srcs: AARCH64_ASM_MICROKERNEL_SRCS,
            asflags: ["-march=armv8.2-a+fp16+dotprod"],
        },
        arm: {
            srcs: AARCH32_ASM_MICROKERNEL_SRCS,
            asflags: [
                "-marm",
                "-march=armv8.2-a+dotprod",
                "-mfpu=neon-fp-armv8",
            ],
        },
    },
}
9357
// Static library built from the amalgamated SSE and SSE2 source files
// (src/amalgam/sse.c and src/amalgam/sse2.c), compiled with -msse2 on x86
// and x86_64. Disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_sse2_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86_64: {
            srcs: [
                "src/amalgam/sse.c",
                "src/amalgam/sse2.c",
            ],
            cflags: ["-msse2"],
        },
        x86: {
            srcs: [
                "src/amalgam/sse.c",
                "src/amalgam/sse2.c",
            ],
            cflags: ["-msse2"],
        },
    },
}
9395
// Static library containing every source in ALL_SSE_MICROKERNEL_SRCS followed
// by ALL_SSE2_MICROKERNEL_SRCS, compiled with -msse2 on x86 and x86_64.
// Disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_sse2_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    header_libs: ["fp16_headers"],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86_64: {
            srcs: ALL_SSE_MICROKERNEL_SRCS + ALL_SSE2_MICROKERNEL_SRCS,
            cflags: ["-msse2"],
        },
        x86: {
            srcs: ALL_SSE_MICROKERNEL_SRCS + ALL_SSE2_MICROKERNEL_SRCS,
            cflags: ["-msse2"],
        },
    },
}
9427
// Prod variant of the SSE/SSE2 microkernels, compiled with -msse2.
// Built for x86 and x86_64 only; disabled on arm and arm64.
//
// The sources are the PROD_* lists, matching every other
// *_prod_microkernels module in this file. The ALL_* lists are what the
// corresponding *_bench_microkernels module compiles; using them here made
// the prod library identical to the bench one.
// NOTE(review): assumes PROD_SSE_MICROKERNEL_SRCS and
// PROD_SSE2_MICROKERNEL_SRCS are defined earlier in this file next to the
// other PROD_* source lists - confirm before landing.
cc_library_static {
    name: "xnnpack_sse2_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    arch: {
        arm: {
            enabled: false,
        },
        arm64: {
            enabled: false,
        },
        x86: {
            srcs: PROD_SSE_MICROKERNEL_SRCS + PROD_SSE2_MICROKERNEL_SRCS,
            cflags: [
                "-msse2",
            ],
        },
        x86_64: {
            srcs: PROD_SSE_MICROKERNEL_SRCS + PROD_SSE2_MICROKERNEL_SRCS,
            cflags: [
                "-msse2",
            ],
        },
    },
    header_libs: [
        "fp16_headers",
    ],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
}
9459
// Amalgamated SSSE3 microkernel source, compiled with -mssse3.
// Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_ssse3_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mssse3"],
            srcs: ["src/amalgam/ssse3.c"],
        },
        x86_64: {
            cflags: ["-mssse3"],
            srcs: ["src/amalgam/ssse3.c"],
        },
    },
}
9495
// Bench variant of the SSSE3 microkernels: compiles the ALL_SSSE3 source
// list with -mssse3. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_ssse3_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mssse3"],
            srcs: ALL_SSSE3_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mssse3"],
            srcs: ALL_SSSE3_MICROKERNEL_SRCS,
        },
    },
}
9527
// Prod variant of the SSSE3 microkernels: compiles the PROD_SSSE3 source
// list with -mssse3. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_ssse3_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mssse3"],
            srcs: PROD_SSSE3_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mssse3"],
            srcs: PROD_SSSE3_MICROKERNEL_SRCS,
        },
    },
}
9559
// Amalgamated SSE4.1 microkernel source, compiled with -msse4.1.
// Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_sse41_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-msse4.1"],
            srcs: ["src/amalgam/sse41.c"],
        },
        x86_64: {
            cflags: ["-msse4.1"],
            srcs: ["src/amalgam/sse41.c"],
        },
    },
}
9595
// Bench variant of the SSE4.1 microkernels: compiles the ALL_SSE41 source
// list with -msse4.1. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_sse41_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-msse4.1"],
            srcs: ALL_SSE41_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-msse4.1"],
            srcs: ALL_SSE41_MICROKERNEL_SRCS,
        },
    },
}
9627
// Prod variant of the SSE4.1 microkernels: compiles the PROD_SSE41 source
// list with -msse4.1. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_sse41_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-msse4.1"],
            srcs: PROD_SSE41_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-msse4.1"],
            srcs: PROD_SSE41_MICROKERNEL_SRCS,
        },
    },
}
9659
// Amalgamated AVX microkernel source, compiled with -mavx.
// Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_avx_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mavx"],
            srcs: ["src/amalgam/avx.c"],
        },
        x86_64: {
            cflags: ["-mavx"],
            srcs: ["src/amalgam/avx.c"],
        },
    },
}
9695
// Bench variant of the AVX microkernels: compiles the ALL_AVX source list
// with -mavx. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mavx"],
            srcs: ALL_AVX_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mavx"],
            srcs: ALL_AVX_MICROKERNEL_SRCS,
        },
    },
}
9727
// Prod variant of the AVX microkernels: compiles the PROD_AVX source list
// with -mavx. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mavx"],
            srcs: PROD_AVX_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mavx"],
            srcs: PROD_AVX_MICROKERNEL_SRCS,
        },
    },
}
9759
// Amalgamated F16C microkernel source, compiled with -mf16c.
// Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_f16c_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mf16c"],
            srcs: ["src/amalgam/f16c.c"],
        },
        x86_64: {
            cflags: ["-mf16c"],
            srcs: ["src/amalgam/f16c.c"],
        },
    },
}
9795
// Bench variant of the F16C microkernels: compiles the ALL_F16C source list
// with -mf16c. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_f16c_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mf16c"],
            srcs: ALL_F16C_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mf16c"],
            srcs: ALL_F16C_MICROKERNEL_SRCS,
        },
    },
}
9827
// Prod variant of the F16C microkernels: compiles the PROD_F16C source list
// with -mf16c. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_f16c_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mf16c"],
            srcs: PROD_F16C_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mf16c"],
            srcs: PROD_F16C_MICROKERNEL_SRCS,
        },
    },
}
9859
// Bench variant of the XOP microkernels: compiles the ALL_XOP source list
// with -mxop. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_xop_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mxop"],
            srcs: ALL_XOP_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mxop"],
            srcs: ALL_XOP_MICROKERNEL_SRCS,
        },
    },
}
9891
// Prod variant of the XOP microkernels: compiles the PROD_XOP source list
// with -mxop. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_xop_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mxop"],
            srcs: PROD_XOP_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mxop"],
            srcs: PROD_XOP_MICROKERNEL_SRCS,
        },
    },
}
9923
// Amalgamated FMA3 microkernel source, compiled with -mf16c and -mfma.
// Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_fma3_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mf16c",
                "-mfma",
            ],
            srcs: ["src/amalgam/fma3.c"],
        },
        x86_64: {
            cflags: [
                "-mf16c",
                "-mfma",
            ],
            srcs: ["src/amalgam/fma3.c"],
        },
    },
}
9961
// Bench variant of the FMA3 microkernels: compiles the ALL_FMA3 source list
// with -mf16c and -mfma. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_fma3_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mf16c",
                "-mfma",
            ],
            srcs: ALL_FMA3_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: [
                "-mf16c",
                "-mfma",
            ],
            srcs: ALL_FMA3_MICROKERNEL_SRCS,
        },
    },
}
9995
// Prod variant of the FMA3 microkernels: compiles the PROD_FMA3 source list
// with -mf16c and -mfma. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_fma3_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mf16c",
                "-mfma",
            ],
            srcs: PROD_FMA3_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: [
                "-mf16c",
                "-mfma",
            ],
            srcs: PROD_FMA3_MICROKERNEL_SRCS,
        },
    },
}
10029
// Amalgamated AVX2 microkernel source, compiled with -mf16c, -mfma and
// -mavx2. Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_avx2_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mf16c",
                "-mfma",
                "-mavx2",
            ],
            srcs: ["src/amalgam/avx2.c"],
        },
        x86_64: {
            cflags: [
                "-mf16c",
                "-mfma",
                "-mavx2",
            ],
            srcs: ["src/amalgam/avx2.c"],
        },
    },
}
10069
// Bench variant of the AVX2 microkernels: compiles the ALL_AVX2 source list
// with -mf16c, -mfma and -mavx2. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx2_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mf16c",
                "-mfma",
                "-mavx2",
            ],
            srcs: ALL_AVX2_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: [
                "-mf16c",
                "-mfma",
                "-mavx2",
            ],
            srcs: ALL_AVX2_MICROKERNEL_SRCS,
        },
    },
}
10105
// Prod variant of the AVX2 microkernels: compiles the PROD_AVX2 source list
// with -mf16c, -mfma and -mavx2. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx2_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mf16c",
                "-mfma",
                "-mavx2",
            ],
            srcs: PROD_AVX2_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: [
                "-mf16c",
                "-mfma",
                "-mavx2",
            ],
            srcs: PROD_AVX2_MICROKERNEL_SRCS,
        },
    },
}
10141
// Amalgamated AVX512SKX microkernel source, compiled with the AVX-512
// F/CD/BW/DQ/VL flags. Built for x86 and x86_64 only; disabled on arm and
// arm64.
cc_library_static {
    name: "xnnpack_avx512skx_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mavx512f",
                "-mavx512cd",
                "-mavx512bw",
                "-mavx512dq",
                "-mavx512vl",
            ],
            srcs: ["src/amalgam/avx512skx.c"],
        },
        x86_64: {
            cflags: [
                "-mavx512f",
                "-mavx512cd",
                "-mavx512bw",
                "-mavx512dq",
                "-mavx512vl",
            ],
            srcs: ["src/amalgam/avx512skx.c"],
        },
    },
}
10185
// Bench variant of the AVX512SKX microkernels: compiles the ALL_AVX512SKX
// source list with the AVX-512 F/CD/BW/DQ/VL flags. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx512skx_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mavx512f",
                "-mavx512cd",
                "-mavx512bw",
                "-mavx512dq",
                "-mavx512vl",
            ],
            srcs: ALL_AVX512SKX_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: [
                "-mavx512f",
                "-mavx512cd",
                "-mavx512bw",
                "-mavx512dq",
                "-mavx512vl",
            ],
            srcs: ALL_AVX512SKX_MICROKERNEL_SRCS,
        },
    },
}
10225
// Prod variant of the AVX512SKX microkernels: compiles the PROD_AVX512SKX
// source list with the AVX-512 F/CD/BW/DQ/VL flags. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx512skx_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: [
                "-mavx512f",
                "-mavx512cd",
                "-mavx512bw",
                "-mavx512dq",
                "-mavx512vl",
            ],
            srcs: PROD_AVX512SKX_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: [
                "-mavx512f",
                "-mavx512cd",
                "-mavx512bw",
                "-mavx512dq",
                "-mavx512vl",
            ],
            srcs: PROD_AVX512SKX_MICROKERNEL_SRCS,
        },
    },
}
10265
// Amalgamated AVX512F microkernel source, compiled with -mavx512f.
// Built for x86 and x86_64 only; disabled on arm and arm64.
cc_library_static {
    name: "xnnpack_avx512f_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mavx512f"],
            srcs: ["src/amalgam/avx512f.c"],
        },
        x86_64: {
            cflags: ["-mavx512f"],
            srcs: ["src/amalgam/avx512f.c"],
        },
    },
}
10301
// Bench variant of the AVX512F microkernels: compiles the ALL_AVX512F
// source list with -mavx512f. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx512f_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mavx512f"],
            srcs: ALL_AVX512F_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mavx512f"],
            srcs: ALL_AVX512F_MICROKERNEL_SRCS,
        },
    },
}
10333
// Prod variant of the AVX512F microkernels: compiles the PROD_AVX512F
// source list with -mavx512f. x86 and x86_64 only.
cc_library_static {
    name: "xnnpack_avx512f_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    header_libs: ["fp16_headers"],
    static_libs: [
        "libpthreadpool",
        "xnnpack_tables",
    ],
    arch: {
        arm: { enabled: false },
        arm64: { enabled: false },
        x86: {
            cflags: ["-mavx512f"],
            srcs: PROD_AVX512F_MICROKERNEL_SRCS,
        },
        x86_64: {
            cflags: ["-mavx512f"],
            srcs: PROD_AVX512F_MICROKERNEL_SRCS,
        },
    },
}
10365
// Aggregate library that re-exports (via whole_static_libs) the scalar
// kernels and lookup tables on every architecture, plus a per-architecture
// set: the *_prod_* and asm libraries on ARM, and the *_amalgam_* libraries
// on x86 / x86_64.
cc_library_static {
    name: "xnnpack_amalgam_microkernels",
    defaults: ["xnnpack_internal_default"],
    // Common to all architectures.
    whole_static_libs: [
        "xnnpack_scalar_prod_microkernels",
        "xnnpack_tables",
    ],
    arch: {
        arm: {
            whole_static_libs: [
                "xnnpack_armsimd32_prod_microkernels",
                "xnnpack_neon_prod_microkernels",
                "xnnpack_neonfp16_prod_microkernels",
                "xnnpack_neonfma_prod_microkernels",
                "xnnpack_neonv8_prod_microkernels",
                "xnnpack_asm_microkernels",
            ],
        },
        arm64: {
            whole_static_libs: [
                "xnnpack_neon_prod_microkernels",
                "xnnpack_neonfp16_prod_microkernels",
                "xnnpack_neonfma_prod_microkernels",
                "xnnpack_neonv8_prod_microkernels",
                "xnnpack_asm_microkernels",
            ],
        },
        // The x86 and x86_64 lists are identical.
        x86: {
            whole_static_libs: [
                "xnnpack_sse2_amalgam_microkernels",
                "xnnpack_ssse3_amalgam_microkernels",
                "xnnpack_sse41_amalgam_microkernels",
                "xnnpack_avx_amalgam_microkernels",
                "xnnpack_f16c_amalgam_microkernels",
                "xnnpack_fma3_amalgam_microkernels",
                "xnnpack_avx2_amalgam_microkernels",
                "xnnpack_avx512f_amalgam_microkernels",
                "xnnpack_avx512skx_amalgam_microkernels",
            ],
        },
        x86_64: {
            whole_static_libs: [
                "xnnpack_sse2_amalgam_microkernels",
                "xnnpack_ssse3_amalgam_microkernels",
                "xnnpack_sse41_amalgam_microkernels",
                "xnnpack_avx_amalgam_microkernels",
                "xnnpack_f16c_amalgam_microkernels",
                "xnnpack_fma3_amalgam_microkernels",
                "xnnpack_avx2_amalgam_microkernels",
                "xnnpack_avx512f_amalgam_microkernels",
                "xnnpack_avx512skx_amalgam_microkernels",
            ],
        },
    },
}
10421
// Aggregate library that re-exports (via whole_static_libs) the scalar
// bench kernels and lookup tables on every architecture, plus the
// per-architecture *_bench_* libraries (and the asm kernels on ARM).
cc_library_static {
    name: "xnnpack_bench_microkernels",
    defaults: ["xnnpack_internal_default"],
    // Common to all architectures.
    whole_static_libs: [
        "xnnpack_scalar_bench_microkernels",
        "xnnpack_tables",
    ],
    arch: {
        arm: {
            whole_static_libs: [
                "xnnpack_armsimd32_bench_microkernels",
                "xnnpack_neon_bench_microkernels",
                "xnnpack_neonfp16_bench_microkernels",
                "xnnpack_neonfma_bench_microkernels",
                "xnnpack_neonv8_bench_microkernels",
                "xnnpack_asm_microkernels",
            ],
        },
        arm64: {
            whole_static_libs: [
                "xnnpack_neon_bench_microkernels",
                "xnnpack_neonfp16_bench_microkernels",
                "xnnpack_neonfma_bench_microkernels",
                "xnnpack_neonv8_bench_microkernels",
                "xnnpack_asm_microkernels",
            ],
        },
        // The x86 and x86_64 lists are identical.
        x86: {
            whole_static_libs: [
                "xnnpack_sse2_bench_microkernels",
                "xnnpack_ssse3_bench_microkernels",
                "xnnpack_sse41_bench_microkernels",
                "xnnpack_avx_bench_microkernels",
                "xnnpack_f16c_bench_microkernels",
                "xnnpack_xop_bench_microkernels",
                "xnnpack_fma3_bench_microkernels",
                "xnnpack_avx2_bench_microkernels",
                "xnnpack_avx512f_bench_microkernels",
                "xnnpack_avx512skx_bench_microkernels",
            ],
        },
        x86_64: {
            whole_static_libs: [
                "xnnpack_sse2_bench_microkernels",
                "xnnpack_ssse3_bench_microkernels",
                "xnnpack_sse41_bench_microkernels",
                "xnnpack_avx_bench_microkernels",
                "xnnpack_f16c_bench_microkernels",
                "xnnpack_xop_bench_microkernels",
                "xnnpack_fma3_bench_microkernels",
                "xnnpack_avx2_bench_microkernels",
                "xnnpack_avx512f_bench_microkernels",
                "xnnpack_avx512skx_bench_microkernels",
            ],
        },
    },
}
10479
// Aggregate library that re-exports (via whole_static_libs) the scalar prod
// kernels and lookup tables on every architecture, plus the
// per-architecture *_prod_* libraries (and the asm kernels on ARM).
cc_library_static {
    name: "xnnpack_prod_microkernels",
    defaults: ["xnnpack_internal_default"],
    // Common to all architectures.
    whole_static_libs: [
        "xnnpack_scalar_prod_microkernels",
        "xnnpack_tables",
    ],
    arch: {
        arm: {
            whole_static_libs: [
                "xnnpack_armsimd32_prod_microkernels",
                "xnnpack_neon_prod_microkernels",
                "xnnpack_neonfp16_prod_microkernels",
                "xnnpack_neonfma_prod_microkernels",
                "xnnpack_neonv8_prod_microkernels",
                "xnnpack_asm_microkernels",
            ],
        },
        arm64: {
            whole_static_libs: [
                "xnnpack_neon_prod_microkernels",
                "xnnpack_neonfp16_prod_microkernels",
                "xnnpack_neonfma_prod_microkernels",
                "xnnpack_neonv8_prod_microkernels",
                "xnnpack_asm_microkernels",
            ],
        },
        // The x86 and x86_64 lists are identical.
        x86: {
            whole_static_libs: [
                "xnnpack_sse2_prod_microkernels",
                "xnnpack_ssse3_prod_microkernels",
                "xnnpack_sse41_prod_microkernels",
                "xnnpack_avx_prod_microkernels",
                "xnnpack_f16c_prod_microkernels",
                "xnnpack_xop_prod_microkernels",
                "xnnpack_fma3_prod_microkernels",
                "xnnpack_avx2_prod_microkernels",
                "xnnpack_avx512f_prod_microkernels",
                "xnnpack_avx512skx_prod_microkernels",
            ],
        },
        x86_64: {
            whole_static_libs: [
                "xnnpack_sse2_prod_microkernels",
                "xnnpack_ssse3_prod_microkernels",
                "xnnpack_sse41_prod_microkernels",
                "xnnpack_avx_prod_microkernels",
                "xnnpack_f16c_prod_microkernels",
                "xnnpack_xop_prod_microkernels",
                "xnnpack_fma3_prod_microkernels",
                "xnnpack_avx2_prod_microkernels",
                "xnnpack_avx512f_prod_microkernels",
                "xnnpack_avx512skx_prod_microkernels",
            ],
        },
    },
}
10537
// The libXNNPACK static library. Compiles src/init.c, exports the
// "include" directory to dependents, and folds every listed component
// library into the archive through whole_static_libs.
cc_library_static {
    name: "libXNNPACK",
    defaults: ["xnnpack_internal_default"],
    srcs: ["src/init.c"],
    export_include_dirs: ["include"],
    header_libs: ["fp16_headers"],
    whole_static_libs: [
        "libclog",
        "libcpuinfo",
        "libpthreadpool",
        "xnnpack_allocator",
        "xnnpack_cache",
        "xnnpack_jit",
        "xnnpack_prod_microkernels",
        "xnnpack_operators",
        "xnnpack_logging",
        "xnnpack_microparams_init",
        "xnnpack_mutex",
        "xnnpack_normalization",
        "xnnpack_packing",
        "xnnpack_params",
        "xnnpack_subgraph",
    ],
}
10566
10567// Tests and benchmarks
// Shared defaults for the modules that list "xnnpack_tests_default" in
// their defaults: include paths, warning suppressions, the static C++
// runtime, and the libraries they link against.
cc_defaults {
    name: "xnnpack_tests_default",
    vendor_available: true,
    stl: "libc++_static",
    cflags: [
        "-Wno-missing-field-initializers",
        "-Wno-unused-function",
        "-Wno-unused-parameter",
        "-Wno-unused-private-field",
    ],
    local_include_dirs: [
        "bench",
        "models",
        "test",
        "src",
    ],
    header_libs: ["fp16_headers"],
    shared_libs: ["liblog"],
    static_libs: [
        "libXNNPACK",
        "libpthreadpool",
        "libgmock",
        "xnnpack_allocator",
        "xnnpack_cache",
        "xnnpack_microparams_init",
        "xnnpack_mutex",
        "xnnpack_normalization",
        "xnnpack_params",
    ],
}
10602
// Static library built from models/fp32-mobilenet-v1.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v1_fp32",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-mobilenet-v1.cc"],
}
10610
// Static library built from models/fp32-sparse-mobilenet-v1.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v1_fp32_sparse",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-sparse-mobilenet-v1.cc"],
}
10618
// Static library built from models/qc8-mobilenet-v1.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_qc8_mobilenet_v1",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/qc8-mobilenet-v1.cc"],
}
10626
// Static library built from models/qc8-mobilenet-v2.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_qc8_mobilenet_v2",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/qc8-mobilenet-v2.cc"],
}
10634
// Static library built from models/qs8-mobilenet-v1.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_qs8_mobilenet_v1",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/qs8-mobilenet-v1.cc"],
}
10642
// Static library built from models/qu8-mobilenet-v1.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_qu8_mobilenet_v1",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/qu8-mobilenet-v1.cc"],
}
10650
// Static library built from models/qu8-mobilenet-v2.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_qu8_mobilenet_v2",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/qu8-mobilenet-v2.cc"],
}
10658
// Static library built from models/fp16-mobilenet-v1.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v1_fp16",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp16-mobilenet-v1.cc"],
}
10666
// Static library built from models/qs8-mobilenet-v2.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_qs8_mobilenet_v2",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/qs8-mobilenet-v2.cc"],
}
10674
// Static library built from models/fp32-mobilenet-v2.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v2_fp32",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-mobilenet-v2.cc"],
}
10682
// Static library built from models/fp32-sparse-mobilenet-v2.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v2_fp32_sparse",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-sparse-mobilenet-v2.cc"],
}
10690
// Static library built from models/fp16-mobilenet-v2.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v2_fp16",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp16-mobilenet-v2.cc"],
}
10698
// Static library built from models/fp32-mobilenet-v3-large.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v3_large_fp32",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-mobilenet-v3-large.cc"],
}
10706
// Static library built from models/fp32-sparse-mobilenet-v3-large.cc; linked
// into xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v3_large_fp32_sparse",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-sparse-mobilenet-v3-large.cc"],
}
10714
// Static library built from models/fp16-mobilenet-v3-large.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v3_large_fp16",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp16-mobilenet-v3-large.cc"],
}
10722
// Static library built from models/fp32-mobilenet-v3-small.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v3_small_fp32",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-mobilenet-v3-small.cc"],
}
10730
// Static library built from models/fp32-sparse-mobilenet-v3-small.cc; linked
// into xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v3_small_fp32_sparse",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp32-sparse-mobilenet-v3-small.cc"],
}
10738
// Static library built from models/fp16-mobilenet-v3-small.cc; linked into
// xnnpack_end2end_bench.
cc_library_static {
    name: "xnnpack_mobilenet_v3_small_fp16",
    defaults: ["xnnpack_tests_default"],
    srcs: ["models/fp16-mobilenet-v3-small.cc"],
}
10746
// End-to-end benchmark binary.
// Built from bench/end2end.cc and bench/utils.cc, and linked against every
// MobileNet model library declared in this file.
cc_benchmark {
    name: "xnnpack_end2end_bench",
    defaults: ["xnnpack_tests_default"],
    srcs: [
        "bench/end2end.cc",
        "bench/utils.cc",
    ],
    // Added on top of the warning suppressions inherited from the defaults.
    cflags: ["-Wno-unused-result"],
    static_libs: [
        "libcpuinfo",
        "libgoogle-benchmark",
        "xnnpack_qc8_mobilenet_v1",
        "xnnpack_qc8_mobilenet_v2",
        "xnnpack_qs8_mobilenet_v1",
        "xnnpack_mobilenet_v1_fp32",
        "xnnpack_mobilenet_v1_fp32_sparse",
        "xnnpack_mobilenet_v1_fp16",
        "xnnpack_qs8_mobilenet_v2",
        "xnnpack_mobilenet_v2_fp32",
        "xnnpack_mobilenet_v2_fp32_sparse",
        "xnnpack_mobilenet_v2_fp16",
        "xnnpack_mobilenet_v3_large_fp32",
        "xnnpack_mobilenet_v3_large_fp32_sparse",
        "xnnpack_mobilenet_v3_large_fp16",
        "xnnpack_mobilenet_v3_small_fp32",
        "xnnpack_mobilenet_v3_small_fp32_sparse",
        "xnnpack_mobilenet_v3_small_fp16",
        "xnnpack_qu8_mobilenet_v1",
        "xnnpack_qu8_mobilenet_v2",
    ],
}
10780
// Test binary built from test/abs-nc.cc; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_abs_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/abs-nc.cc"],
    test_suites: ["general-tests"],
}
10791
// Test binary built from test/add-nd.cc; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_add_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/add-nd.cc"],
    test_suites: ["general-tests"],
}
10802
// Test binary built from test/argmax-pooling-nhwc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_argmax_pooling_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/argmax-pooling-nhwc.cc"],
    test_suites: ["general-tests"],
}
10813
// Test binary built from test/average-pooling-nhwc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_average_pooling_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/average-pooling-nhwc.cc"],
    test_suites: ["general-tests"],
}
10824
// Test binary built from test/bankers-rounding-nc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_bankers_rounding_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/bankers-rounding-nc.cc"],
    test_suites: ["general-tests"],
}
10835
// Test binary built from test/ceiling-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_ceiling_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/ceiling-nc.cc"],
    test_suites: ["general-tests"],
}
10846
// Test binary built from test/channel-shuffle-nc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_channel_shuffle_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/channel-shuffle-nc.cc"],
    test_suites: ["general-tests"],
}
10857
// Test binary built from test/clamp-nc.cc; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_clamp_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/clamp-nc.cc"],
    test_suites: ["general-tests"],
}
10868
// Test binary built from test/constant-pad-nd.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_constant_pad_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/constant-pad-nd.cc"],
    test_suites: ["general-tests"],
}
10879
// Test binary built from test/convolution-nhwc.cc together with the shared
// convolution test helpers; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_convolution_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: [
        "test/convolution-nhwc.cc",
        "test/convolution-test-helpers.cc",
    ],
    test_suites: ["general-tests"],
}
10891
// Test binary built from test/convolution-nchw.cc together with the shared
// convolution test helpers; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_convolution_nchw_test",
    defaults: ["xnnpack_tests_default"],
    srcs: [
        "test/convolution-nchw.cc",
        "test/convolution-test-helpers.cc",
    ],
    test_suites: ["general-tests"],
}
10903
// Test binary built from test/copy-nc.cc; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_copy_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/copy-nc.cc"],
    test_suites: ["general-tests"],
}
10914
// Test binary built from test/deconvolution-nhwc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_deconvolution_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/deconvolution-nhwc.cc"],
    test_suites: ["general-tests"],
}
10925
// Test binary built from test/divide-nd.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_divide_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/divide-nd.cc"],
    test_suites: ["general-tests"],
}
10936
// Test binary built from test/fully-connected-nc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_fully_connected_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/fully-connected-nc.cc"],
    test_suites: ["general-tests"],
}
10947
// Test binary built from test/floor-nc.cc; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_floor_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/floor-nc.cc"],
    test_suites: ["general-tests"],
}
10958
// Test binary built from test/global-average-pooling-nwc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_global_average_pooling_nwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/global-average-pooling-nwc.cc"],
    test_suites: ["general-tests"],
}
10969
// Test binary built from test/global-average-pooling-ncw.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_global_average_pooling_ncw_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/global-average-pooling-ncw.cc"],
    test_suites: ["general-tests"],
}
10980
// Test binary built from test/hardswish-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_hardswish_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/hardswish-nc.cc"],
    test_suites: ["general-tests"],
}
10991
// Test binary built from test/leaky-relu-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_leaky_relu_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/leaky-relu-nc.cc"],
    test_suites: ["general-tests"],
}
11002
// Test binary built from test/max-pooling-nhwc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_max_pooling_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/max-pooling-nhwc.cc"],
    test_suites: ["general-tests"],
}
11013
// Test binary built from test/maximum-nd.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_maximum_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/maximum-nd.cc"],
    test_suites: ["general-tests"],
}
11024
// Test binary built from test/minimum-nd.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_minimum_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/minimum-nd.cc"],
    test_suites: ["general-tests"],
}
11035
// Test binary built from test/multiply-nd.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_multiply_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/multiply-nd.cc"],
    test_suites: ["general-tests"],
}
11046
// Test binary built from test/negate-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_negate_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/negate-nc.cc"],
    test_suites: ["general-tests"],
}
11057
// Test binary built from test/prelu-nc.cc; part of the "general-tests" suite.
cc_test {
    name: "xnnpack_prelu_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/prelu-nc.cc"],
    test_suites: ["general-tests"],
}
11068
// Test binary built from test/resize-bilinear-nhwc.cc; part of the
// "general-tests" suite.
cc_test {
    name: "xnnpack_resize_bilinear_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/resize-bilinear-nhwc.cc"],
    test_suites: ["general-tests"],
}
11079
// Test binary built from test/sigmoid-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_sigmoid_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/sigmoid-nc.cc"],
    test_suites: ["general-tests"],
}
11090
// Test binary built from test/softmax-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_softmax_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/softmax-nc.cc"],
    test_suites: ["general-tests"],
}
11101
// Test binary built from test/square-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_square_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/square-nc.cc"],
    test_suites: ["general-tests"],
}
11112
// Test binary built from test/square-root-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_square_root_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/square-root-nc.cc"],
    test_suites: ["general-tests"],
}
11123
// Test binary built from test/squared-difference-nd.cc; part of the
// "general-tests" suite.
// NOTE(review): the module name says "square_difference" while the source
// file is "squared-difference". The name is left as-is because other build or
// test configuration may refer to it -- confirm before renaming.
cc_test {
    name: "xnnpack_square_difference_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/squared-difference-nd.cc"],
    test_suites: ["general-tests"],
}
11134
// Test binary built from test/subtract-nd.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_subtract_nd_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/subtract-nd.cc"],
    test_suites: ["general-tests"],
}
11145
// Test binary built from test/truncation-nc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_truncation_nc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/truncation-nc.cc"],
    test_suites: ["general-tests"],
}
11156
// Test binary built from test/unpooling-nhwc.cc; part of the "general-tests"
// suite.
cc_test {
    name: "xnnpack_unpooling_nhwc_test",
    defaults: ["xnnpack_tests_default"],
    srcs: ["test/unpooling-nhwc.cc"],
    test_suites: ["general-tests"],
}
11167