forked from google/XNNPACK
-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathavx512f_microkernels.bzl
316 lines (314 loc) · 20.5 KB
/
avx512f_microkernels.bzl
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
"""
Microkernel filenames lists for avx512f.
Auto-generated file. Do not edit!
Generator: tools/update-microkernels.py
"""
ALL_AVX512F_MICROKERNEL_SRCS = [
"src/f32-dwconv/gen/f32-dwconv-3p16c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-3p16c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-3p32c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-3p32c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-4p16c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-4p16c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-4p32c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-4p32c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-5f5m5l16c16s1r-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-5f5m5l16c16s1r-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-5f5m5l32c16s1r-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-5f5m5l32c16s1r-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-9p16c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-9p16c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-9p32c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-9p32c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-25p16c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-25p16c-minmax-avx512f.c",
"src/f32-dwconv/gen/f32-dwconv-25p32c-minmax-avx512f-acc2.c",
"src/f32-dwconv/gen/f32-dwconv-25p32c-minmax-avx512f.c",
"src/f32-gemm/gen/f32-gemm-1x16-minmax-avx512f-broadcast.c",
"src/f32-gemm/gen/f32-gemm-4x16-minmax-avx512f-broadcast.c",
"src/f32-gemm/gen/f32-gemm-5x16-minmax-avx512f-broadcast.c",
"src/f32-gemm/gen/f32-gemm-6x16-minmax-avx512f-broadcast.c",
"src/f32-gemm/gen/f32-gemm-7x16-minmax-avx512f-broadcast.c",
"src/f32-gemm/gen/f32-gemm-8x16-minmax-avx512f-broadcast.c",
"src/f32-gemminc/gen/f32-gemminc-1x16-minmax-avx512f-broadcast.c",
"src/f32-gemminc/gen/f32-gemminc-4x16-minmax-avx512f-broadcast.c",
"src/f32-gemminc/gen/f32-gemminc-5x16-minmax-avx512f-broadcast.c",
"src/f32-gemminc/gen/f32-gemminc-6x16-minmax-avx512f-broadcast.c",
"src/f32-gemminc/gen/f32-gemminc-7x16-minmax-avx512f-broadcast.c",
"src/f32-gemminc/gen/f32-gemminc-8x16-minmax-avx512f-broadcast.c",
"src/f32-igemm/gen/f32-igemm-1x16-minmax-avx512f-broadcast.c",
"src/f32-igemm/gen/f32-igemm-4x16-minmax-avx512f-broadcast.c",
"src/f32-igemm/gen/f32-igemm-5x16-minmax-avx512f-broadcast.c",
"src/f32-igemm/gen/f32-igemm-6x16-minmax-avx512f-broadcast.c",
"src/f32-igemm/gen/f32-igemm-7x16-minmax-avx512f-broadcast.c",
"src/f32-igemm/gen/f32-igemm-8x16-minmax-avx512f-broadcast.c",
"src/f32-prelu/gen/f32-prelu-avx512f-2x16.c",
"src/f32-prelu/gen/f32-prelu-avx512f-2x32.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u64-acc2.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u64-acc4.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u64.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u128-acc2.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u128-acc4.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u128.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u144-acc3.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u144.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u160-acc2.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u160-acc5.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u160.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u192-acc2.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u192-acc3.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u192-acc6.c",
"src/f32-raddexpminusmax/gen/f32-raddexpminusmax-avx512f-p5-scalef-u192.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u64-acc2.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u64-acc4.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u64.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u128-acc2.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u128-acc4.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u128.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u144-acc3.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u144.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u160-acc2.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u160-acc5.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u160.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u192-acc2.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u192-acc3.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u192-acc6.c",
"src/f32-raddextexp/gen/f32-raddextexp-avx512f-p5-scalef-u192.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u64-acc2.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u64-acc4.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u64.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u128-acc2.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u128-acc4.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u128.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u144-acc3.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u144.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u160-acc2.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u160-acc5.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u160.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u192-acc2.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u192-acc3.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u192-acc6.c",
"src/f32-raddstoreexpminusmax/gen/f32-raddstoreexpminusmax-avx512f-rr1-p5-scalef-u192.c",
"src/f32-rdsum/gen/f32-rdsum-7p7x-minmax-avx512f-c16.c",
"src/f32-rdsum/gen/f32-rdsum-7p7x-minmax-avx512f-c32.c",
"src/f32-rdsum/gen/f32-rdsum-7p7x-minmax-avx512f-c64.c",
"src/f32-rdsum/gen/f32-rdsum-7p7x-minmax-avx512f-c128.c",
"src/f32-rminmax/gen/f32-rmax-avx512f-u16.c",
"src/f32-rminmax/gen/f32-rmax-avx512f-u32-acc2.c",
"src/f32-rminmax/gen/f32-rmax-avx512f-u48-acc3.c",
"src/f32-rminmax/gen/f32-rmax-avx512f-u64-acc2.c",
"src/f32-rminmax/gen/f32-rmax-avx512f-u64-acc4.c",
"src/f32-rminmax/gen/f32-rmin-avx512f-u16.c",
"src/f32-rminmax/gen/f32-rmin-avx512f-u32-acc2.c",
"src/f32-rminmax/gen/f32-rmin-avx512f-u48-acc3.c",
"src/f32-rminmax/gen/f32-rmin-avx512f-u64-acc2.c",
"src/f32-rminmax/gen/f32-rmin-avx512f-u64-acc4.c",
"src/f32-rminmax/gen/f32-rminmax-avx512f-u16.c",
"src/f32-rminmax/gen/f32-rminmax-avx512f-u32-acc2.c",
"src/f32-rminmax/gen/f32-rminmax-avx512f-u48-acc3.c",
"src/f32-rminmax/gen/f32-rminmax-avx512f-u64-acc2.c",
"src/f32-rminmax/gen/f32-rminmax-avx512f-u64-acc4.c",
"src/f32-rsum/gen/f32-rsum-avx512f-u16.c",
"src/f32-rsum/gen/f32-rsum-avx512f-u32-acc2.c",
"src/f32-rsum/gen/f32-rsum-avx512f-u48-acc3.c",
"src/f32-rsum/gen/f32-rsum-avx512f-u64-acc2.c",
"src/f32-rsum/gen/f32-rsum-avx512f-u64-acc4.c",
"src/f32-vbinary/gen/f32-vadd-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vadd-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vaddc-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vaddc-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vdiv-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vdiv-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vdivc-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vdivc-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vmaxc-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vmaxc-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vmin-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vmin-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vminc-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vminc-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vmul-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vmul-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vmulc-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vmulc-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vrdivc-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vrdivc-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vrsubc-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vrsubc-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vsqrdiff-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vsqrdiff-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vsqrdiffc-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vsqrdiffc-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vsub-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vsub-minmax-avx512f-u32.c",
"src/f32-vbinary/gen/f32-vsubc-minmax-avx512f-u16.c",
"src/f32-vbinary/gen/f32-vsubc-minmax-avx512f-u32.c",
"src/f32-vclamp/gen/f32-vclamp-avx512f-u16.c",
"src/f32-vclamp/gen/f32-vclamp-avx512f-u32.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u16.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u32.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u48.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u64.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u80.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u96.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u112.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-lut16-p3-perm-u128.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u16.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u32.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u48.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u64.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u80.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u96.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u112.c",
"src/f32-velu/gen/f32-velu-avx512f-rr1-p6-u128.c",
"src/f32-vhswish/gen/f32-vhswish-avx512f-u16.c",
"src/f32-vhswish/gen/f32-vhswish-avx512f-u32.c",
"src/f32-vlrelu/gen/f32-vlrelu-avx512f-u16.c",
"src/f32-vlrelu/gen/f32-vlrelu-avx512f-u32.c",
"src/f32-vrelu/gen/f32-vrelu-avx512f-u16.c",
"src/f32-vrelu/gen/f32-vrelu-avx512f-u32.c",
"src/f32-vrnd/gen/f32-vrndd-avx512f-u16.c",
"src/f32-vrnd/gen/f32-vrndd-avx512f-u32.c",
"src/f32-vrnd/gen/f32-vrndne-avx512f-u16.c",
"src/f32-vrnd/gen/f32-vrndne-avx512f-u32.c",
"src/f32-vrnd/gen/f32-vrndu-avx512f-u16.c",
"src/f32-vrnd/gen/f32-vrndu-avx512f-u32.c",
"src/f32-vrnd/gen/f32-vrndz-avx512f-u16.c",
"src/f32-vrnd/gen/f32-vrndz-avx512f-u32.c",
"src/f32-vrsqrt/gen/f32-vrsqrt-avx512f-rsqrt-u16.c",
"src/f32-vrsqrt/gen/f32-vrsqrt-avx512f-rsqrt-u32.c",
"src/f32-vrsqrt/gen/f32-vrsqrt-avx512f-rsqrt-u64.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u16.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u32.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u48.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u64.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u80.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u96.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u112.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u128.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u144.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u160.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u176.c",
"src/f32-vscaleexpminusmax/gen/f32-vscaleexpminusmax-avx512f-p5-scalef-u192.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u16.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u32.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u48.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u64.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u80.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u96.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u112.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u128.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u144.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u160.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u176.c",
"src/f32-vscaleextexp/gen/f32-vscaleextexp-avx512f-p5-scalef-u192.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u16.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u32.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u48.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u64.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u80.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u96.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u112.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-div-u128.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u16.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u32.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u48.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u64.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u80.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u96.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u112.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma-u128.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u16.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u32.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u48.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u64.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u80.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u96.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u112.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-div-u128.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u16.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u32.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u48.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u64.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u80.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u96.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u112.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr1-p5-scalef-nr1fma-u128.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u16.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u32.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u48.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u64.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u80.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u96.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u112.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div-u128.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u16.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u32.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u48.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u64.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u80.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u96.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u112.c",
"src/f32-vsigmoid/gen/f32-vsigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma-u128.c",
"src/f32-vsqrt/gen/f32-vsqrt-avx512f-rsqrt-u16.c",
"src/f32-vsqrt/gen/f32-vsqrt-avx512f-rsqrt-u32.c",
"src/f32-vsqrt/gen/f32-vsqrt-avx512f-rsqrt-u48.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-div-u8.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-div-u16.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-div-u24.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-div-u32.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-nr-u8.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-nr-u16.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-nr-u24.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-nr-u32.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-u8.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-u16.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-u24.c",
"src/f32-vtanh/gen/f32-vtanh-avx512f-rational-9-6-u32.c",
"src/f32-vunary/gen/f32-vabs-avx512f-u16.c",
"src/f32-vunary/gen/f32-vabs-avx512f-u32.c",
"src/f32-vunary/gen/f32-vneg-avx512f-u16.c",
"src/f32-vunary/gen/f32-vneg-avx512f-u32.c",
"src/f32-vunary/gen/f32-vsqr-avx512f-u16.c",
"src/f32-vunary/gen/f32-vsqr-avx512f-u32.c",
"src/math/f32-exp-avx512f-rr2-lut16-p3-perm-scalef.c",
"src/math/f32-exp-avx512f-rr2-lut16-p3-perm.c",
"src/math/f32-exp-avx512f-rr2-lut32-p2-perm2-scalef.c",
"src/math/f32-exp-avx512f-rr2-lut32-p2-perm2.c",
"src/math/f32-exp-avx512f-rr2-p5-scalef.c",
"src/math/f32-exp-avx512f-rr2-p5.c",
"src/math/f32-expm1minus-avx512f-rr1-lut16-p3-perm.c",
"src/math/f32-expm1minus-avx512f-rr1-p6.c",
"src/math/f32-extexp-avx512f-p5.c",
"src/math/f32-sigmoid-avx512f-rr1-lut16-p3-perm-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr1-lut32-p2-perm2-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr1-lut32-p2-perm2-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr1-lut32-p2-perm2-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr1-lut64-p2-gather-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr1-lut64-p2-gather-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr1-lut64-p2-gather-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr1-p5-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr1-p5-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr1-p5-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr2-lut16-p3-perm-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr2-lut16-p3-perm-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr2-lut16-p3-perm-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr2-lut32-p2-perm2-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr2-lut64-p2-gather-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr2-lut64-p2-gather-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr2-lut64-p2-gather-scalef-nr1fma1adj.c",
"src/math/f32-sigmoid-avx512f-rr2-p5-scalef-div.c",
"src/math/f32-sigmoid-avx512f-rr2-p5-scalef-nr1fma.c",
"src/math/f32-sigmoid-avx512f-rr2-p5-scalef-nr1fma1adj.c",
"src/math/f32-sqrt-avx512f-nr1fma.c",
"src/math/f32-sqrt-avx512f-nr1fma1adj.c",
"src/math/f32-sqrt-avx512f-nr2fma.c",
"src/x32-packw/gen/x32-packw-x16-gemm-goi-avx512f-u4-prfm.c",
"src/x32-packw/gen/x32-packw-x16-gemm-goi-avx512f-u4.c",
]