aboutsummaryrefslogtreecommitdiff
path: root/Android.bp
blob: ab554a8ca2a6536037df42abe12ab644a422d7d1 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
1295
1296
1297
1298
1299
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
1370
1371
1372
1373
1374
//
// Copyright © 2020-2024 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//

// OpenCL kernel sources (.cl) together with the helper headers (.h) listed alongside them.
// Every entry lives under src/core/CL/cl_kernels: shared helpers at the top level, plus the
// common/, nchw/ and nhwc/ subdirectories.
// OpenCL sources are NOT required by ArmNN or its Android NNAPI driver and are used for CI purposes only.
// NOTE(review): no consumer of this variable is visible in this part of the file - confirm where it is referenced.
opencl_srcs = [
        "src/core/CL/cl_kernels/activation_float_helpers.h",
        "src/core/CL/cl_kernels/activation_quant_helpers.h",
        "src/core/CL/cl_kernels/common/activation_layer.cl",
        "src/core/CL/cl_kernels/common/activation_layer_quant.cl",
        "src/core/CL/cl_kernels/common/arg_min_max.cl",
        "src/core/CL/cl_kernels/common/batchnormalization_layer.cl",
        "src/core/CL/cl_kernels/common/bitwise_op.cl",
        "src/core/CL/cl_kernels/common/bounding_box_transform.cl",
        "src/core/CL/cl_kernels/common/bounding_box_transform_quantized.cl",
        "src/core/CL/cl_kernels/common/cast.cl",
        "src/core/CL/cl_kernels/common/col2im.cl",
        "src/core/CL/cl_kernels/common/comparisons.cl",
        "src/core/CL/cl_kernels/common/concatenate.cl",
        "src/core/CL/cl_kernels/common/convert_fc_weights.cl",
        "src/core/CL/cl_kernels/common/convolution_layer.cl",
        "src/core/CL/cl_kernels/common/copy_tensor.cl",
        "src/core/CL/cl_kernels/common/crop_tensor.cl",
        "src/core/CL/cl_kernels/common/deconvolution_layer.cl",
        "src/core/CL/cl_kernels/common/dequantization_layer.cl",
        "src/core/CL/cl_kernels/common/elementwise_operation.cl",
        "src/core/CL/cl_kernels/common/elementwise_operation_quantized.cl",
        "src/core/CL/cl_kernels/common/elementwise_unary.cl",
        "src/core/CL/cl_kernels/common/elementwise_unary_quantized.cl",
        "src/core/CL/cl_kernels/common/fft.cl",
        "src/core/CL/cl_kernels/common/fft_digit_reverse.cl",
        "src/core/CL/cl_kernels/common/fft_scale.cl",
        "src/core/CL/cl_kernels/common/fill_border.cl",
        "src/core/CL/cl_kernels/common/floor.cl",
        "src/core/CL/cl_kernels/common/gather.cl",
        "src/core/CL/cl_kernels/common/gemm.cl",
        "src/core/CL/cl_kernels/common/gemm_reshaped_only_rhs_mmul.cl",
        "src/core/CL/cl_kernels/common/gemm_utils.cl",
        "src/core/CL/cl_kernels/common/gemmlowp.cl",
        "src/core/CL/cl_kernels/common/gemmlowp_reshaped_only_rhs_mmul.cl",
        "src/core/CL/cl_kernels/common/gemv.cl",
        "src/core/CL/cl_kernels/common/generate_proposals.cl",
        "src/core/CL/cl_kernels/common/generate_proposals_quantized.cl",
        "src/core/CL/cl_kernels/common/instance_normalization.cl",
        "src/core/CL/cl_kernels/common/l2_normalize.cl",
        "src/core/CL/cl_kernels/common/mat_mul.cl",
        "src/core/CL/cl_kernels/common/mat_mul_mmul.cl",
        "src/core/CL/cl_kernels/common/mat_mul_quantized.cl",
        "src/core/CL/cl_kernels/common/mat_mul_quantized_mmul.cl",
        "src/core/CL/cl_kernels/common/mean_stddev_normalization.cl",
        "src/core/CL/cl_kernels/common/memset.cl",
        "src/core/CL/cl_kernels/common/minmax_layer.cl",
        "src/core/CL/cl_kernels/common/nonmax.cl",
        "src/core/CL/cl_kernels/common/pad_layer.cl",
        "src/core/CL/cl_kernels/common/permute.cl",
        "src/core/CL/cl_kernels/common/pixelwise_mul_float.cl",
        "src/core/CL/cl_kernels/common/pixelwise_mul_int.cl",
        "src/core/CL/cl_kernels/common/qlstm_layer_normalization.cl",
        "src/core/CL/cl_kernels/common/quantization_layer.cl",
        "src/core/CL/cl_kernels/common/range.cl",
        "src/core/CL/cl_kernels/common/reduction_operation.cl",
        "src/core/CL/cl_kernels/common/reshape_layer.cl",
        "src/core/CL/cl_kernels/common/reverse.cl",
        "src/core/CL/cl_kernels/common/roi_align_layer.cl",
        "src/core/CL/cl_kernels/common/roi_align_layer_quantized.cl",
        "src/core/CL/cl_kernels/common/roi_pooling_layer.cl",
        "src/core/CL/cl_kernels/common/scatter.cl",
        "src/core/CL/cl_kernels/common/select.cl",
        "src/core/CL/cl_kernels/common/slice_ops.cl",
        "src/core/CL/cl_kernels/common/softmax_layer.cl",
        "src/core/CL/cl_kernels/common/stack_layer.cl",
        "src/core/CL/cl_kernels/common/tile.cl",
        "src/core/CL/cl_kernels/common/transpose.cl",
        "src/core/CL/cl_kernels/common/unpooling_layer.cl",
        "src/core/CL/cl_kernels/gemm_helpers.h",
        "src/core/CL/cl_kernels/helpers.h",
        "src/core/CL/cl_kernels/helpers_asymm.h",
        "src/core/CL/cl_kernels/load_store_utility.h",
        "src/core/CL/cl_kernels/nchw/batch_to_space.cl",
        "src/core/CL/cl_kernels/nchw/batchnormalization_layer.cl",
        "src/core/CL/cl_kernels/nchw/channel_shuffle.cl",
        "src/core/CL/cl_kernels/nchw/depth_to_space.cl",
        "src/core/CL/cl_kernels/nchw/dequantization_layer.cl",
        "src/core/CL/cl_kernels/nchw/direct_convolution.cl",
        "src/core/CL/cl_kernels/nchw/im2col.cl",
        "src/core/CL/cl_kernels/nchw/normalization_layer.cl",
        "src/core/CL/cl_kernels/nchw/normalize_planar_yuv_layer.cl",
        "src/core/CL/cl_kernels/nchw/normalize_planar_yuv_layer_quantized.cl",
        "src/core/CL/cl_kernels/nchw/pooling_layer.cl",
        "src/core/CL/cl_kernels/nchw/prior_box_layer.cl",
        "src/core/CL/cl_kernels/nchw/reorg_layer.cl",
        "src/core/CL/cl_kernels/nchw/scale.cl",
        "src/core/CL/cl_kernels/nchw/space_to_batch.cl",
        "src/core/CL/cl_kernels/nchw/space_to_depth.cl",
        "src/core/CL/cl_kernels/nchw/upsample_layer.cl",
        "src/core/CL/cl_kernels/nchw/winograd_filter_transform.cl",
        "src/core/CL/cl_kernels/nchw/winograd_input_transform.cl",
        "src/core/CL/cl_kernels/nchw/winograd_output_transform.cl",
        "src/core/CL/cl_kernels/nhwc/batch_to_space.cl",
        "src/core/CL/cl_kernels/nhwc/batchnormalization_layer.cl",
        "src/core/CL/cl_kernels/nhwc/channel_shuffle.cl",
        "src/core/CL/cl_kernels/nhwc/depth_to_space.cl",
        "src/core/CL/cl_kernels/nhwc/dequantization_layer.cl",
        "src/core/CL/cl_kernels/nhwc/direct_convolution.cl",
        "src/core/CL/cl_kernels/nhwc/direct_convolution3d.cl",
        "src/core/CL/cl_kernels/nhwc/dwc_native_fp_nhwc.cl",
        "src/core/CL/cl_kernels/nhwc/dwc_native_quantized_nhwc.cl",
        "src/core/CL/cl_kernels/nhwc/im2col.cl",
        "src/core/CL/cl_kernels/nhwc/indirect_convolution.cl",
        "src/core/CL/cl_kernels/nhwc/normalization_layer.cl",
        "src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer.cl",
        "src/core/CL/cl_kernels/nhwc/normalize_planar_yuv_layer_quantized.cl",
        "src/core/CL/cl_kernels/nhwc/pooling_3d_layer.cl",
        "src/core/CL/cl_kernels/nhwc/pooling_3d_layer_quantized.cl",
        "src/core/CL/cl_kernels/nhwc/pooling_layer.cl",
        "src/core/CL/cl_kernels/nhwc/pooling_layer_quantized.cl",
        "src/core/CL/cl_kernels/nhwc/reorg_layer.cl",
        "src/core/CL/cl_kernels/nhwc/scale.cl",
        "src/core/CL/cl_kernels/nhwc/space_to_batch.cl",
        "src/core/CL/cl_kernels/nhwc/space_to_depth.cl",
        "src/core/CL/cl_kernels/nhwc/transposed_convolution.cl",
        "src/core/CL/cl_kernels/nhwc/upsample_layer.cl",
        "src/core/CL/cl_kernels/nhwc/winograd_filter_transform.cl",
        "src/core/CL/cl_kernels/nhwc/winograd_input_transform.cl",
        "src/core/CL/cl_kernels/nhwc/winograd_output_transform.cl",
        "src/core/CL/cl_kernels/repeat.h",
        "src/core/CL/cl_kernels/tile_helpers.h",
        "src/core/CL/cl_kernels/types.h",
        "src/core/CL/cl_kernels/warp_helpers.h",
        
]

// Go package built from scripts/arm_compute_library_nn_driver.go and
// registered as a plugin of soong_build (see pluginFor below).
// NOTE(review): presumably this plugin is what provides the custom
// arm_compute_library_defaults module type - confirm in the Go source.
bootstrap_go_package {
    name: "arm_compute_library_nn_driver",
    pkgPath: "arm_compute_library_nn_driver",
    // Go packages the plugin source is built against.
    deps: [
        "blueprint",
        "blueprint-pathtools",
        "blueprint-proptools",
        "soong",
        "soong-android",
        "soong-cc",
    ],
    srcs: ["scripts/arm_compute_library_nn_driver.go"],
    pluginFor: ["soong_build"],
}

// Defaults module named "acl-default-cppflags": a shared set of C++ compiler
// flags and preprocessor defines, with RTTI enabled.
// NOTE(review): arm_compute_library_defaults is not a stock Soong module type;
// it is presumably defined by the Go plugin package declared in this file - confirm.
arm_compute_library_defaults {
    name: "acl-default-cppflags",
    // Flag order is kept exactly as originally listed.
    cppflags: [
        "-std=c++14",
        "-fexceptions",
        "-DBOOST_NO_AUTO_PTR",
        "-DEMBEDDED_KERNELS",
        "-DARM_COMPUTE_ASSERTS_ENABLED",
        "-DARM_COMPUTE_CPP_SCHEDULER",
        "-DENABLE_NEON",
        "-DARM_COMPUTE_ENABLE_NEON",
        "-Wno-unused-parameter",
        "-DNO_DOT_IN_TOOLCHAIN",
        "-Wno-implicit-fallthrough",
        "-fPIC",
    ],
    rtti: true,
}

cc_library_static {
    name: "arm_compute_library",
    defaults: ["acl-default-cppflags"],
    proprietary: true,
    local_include_dirs: ["build/android-arm64v8a/src/core",
                         "build/android-arm64v8a/src/core/CL",
                         "compute_kernel_writer/include",
                         "src/core/common",
                         "src/core/helpers",
                         "src/core/NEON/kernels/arm_gemm",
                         "src/core/NEON/kernels/assembly",
                         "src/core/NEON/kernels/convolution/common",
                         "src/core/NEON/kernels/convolution/winograd",
                         "src/cpu/kernels/assembly"],
    export_include_dirs: [".", "./include"],
    srcs: [
        "src/c/AclContext.cpp",
        "src/c/AclOperator.cpp",
        "src/c/AclQueue.cpp",
        "src/c/AclTensor.cpp",
        "src/c/AclTensorPack.cpp",
        "src/c/AclVersion.cpp",
        "src/c/cl/AclOpenClExt.cpp",
        "src/c/operators/AclActivation.cpp",
        "src/common/AllocatorWrapper.cpp",
        "src/common/IOperator.cpp",
        "src/common/ITensorV2.cpp",
        "src/common/TensorPack.cpp",
        "src/common/cpuinfo/CpuInfo.cpp",
        "src/common/cpuinfo/CpuIsaInfo.cpp",
        "src/common/cpuinfo/CpuModel.cpp",
        "src/common/utils/LegacySupport.cpp",
        "src/core/AccessWindowAutoPadding.cpp",
        "src/core/AccessWindowStatic.cpp",
        "src/core/AccessWindowTranspose.cpp",
        "src/core/CL/CLCommandBuffer.cpp",
        "src/core/CL/CLCompatCommandBuffer.cpp",
        "src/core/CL/CLCompileContext.cpp",
        "src/core/CL/CLHelpers.cpp",
        "src/core/CL/CLKernelLibrary.cpp",
        "src/core/CL/CLMutableCommandBuffer.cpp",
        "src/core/CL/CLUtils.cpp",
        "src/core/CL/DefaultLWSHeuristics.cpp",
        "src/core/CL/ICLKernel.cpp",
        "src/core/CL/ICLSimple2DKernel.cpp",
        "src/core/CL/ICLSimple3DKernel.cpp",
        "src/core/CL/ICLSimpleKernel.cpp",
        "src/core/CL/ICLTensor.cpp",
        "src/core/CL/OpenCL.cpp",
        "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
        "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
        "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
        "src/core/CL/kernels/CLBitwiseKernel.cpp",
        "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
        "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
        "src/core/CL/kernels/CLComparisonKernel.cpp",
        "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
        "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
        "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
        "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
        "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
        "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
        "src/core/CL/kernels/CLFFTScaleKernel.cpp",
        "src/core/CL/kernels/CLFillBorderKernel.cpp",
        "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
        "src/core/CL/kernels/CLGatherKernel.cpp",
        "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
        "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
        "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
        "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
        "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
        "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
        "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
        "src/core/CL/kernels/CLPadLayerKernel.cpp",
        "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
        "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
        "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
        "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
        "src/core/CL/kernels/CLRangeKernel.cpp",
        "src/core/CL/kernels/CLReductionOperationKernel.cpp",
        "src/core/CL/kernels/CLReorgLayerKernel.cpp",
        "src/core/CL/kernels/CLReverseKernel.cpp",
        "src/core/CL/kernels/CLSelectKernel.cpp",
        "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
        "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
        "src/core/CL/kernels/CLStackLayerKernel.cpp",
        "src/core/CL/kernels/CLStridedSliceKernel.cpp",
        "src/core/CL/kernels/CLTileKernel.cpp",
        "src/core/CPP/CPPTypes.cpp",
        "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
        "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
        "src/core/CPP/kernels/CPPPermuteKernel.cpp",
        "src/core/CPP/kernels/CPPTopKVKernel.cpp",
        "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
        "src/core/Error.cpp",
        "src/core/GPUTarget.cpp",
        "src/core/Helpers.cpp",
        "src/core/IAccessWindow.cpp",
        "src/core/IKernel.cpp",
        "src/core/ITensor.cpp",
        "src/core/ITensorPack.cpp",
        "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
        "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
        "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
        "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
        "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
        "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
        "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
        "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
        "src/core/NEON/kernels/NECropKernel.cpp",
        "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
        "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
        "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
        "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
        "src/core/NEON/kernels/NEFillBorderKernel.cpp",
        "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
        "src/core/NEON/kernels/NEGatherKernel.cpp",
        "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
        "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
        "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
        "src/core/NEON/kernels/NELogicalKernel.cpp",
        "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
        "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
        "src/core/NEON/kernels/NEPadLayerKernel.cpp",
        "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
        "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
        "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
        "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
        "src/core/NEON/kernels/NERangeKernel.cpp",
        "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
        "src/core/NEON/kernels/NEReorderKernel.cpp",
        "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
        "src/core/NEON/kernels/NEReverseKernel.cpp",
        "src/core/NEON/kernels/NESelectKernel.cpp",
        "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
        "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
        "src/core/NEON/kernels/NEStackLayerKernel.cpp",
        "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
        "src/core/NEON/kernels/NETileKernel.cpp",
        "src/core/NEON/kernels/arm_conv/addressing.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_common.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp",
        "src/core/NEON/kernels/arm_conv/depthwise/premultiply.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
        "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_bf16bf16.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_s8fp32.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
        "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
        "src/core/NEON/kernels/arm_gemm/interleave-8way.cpp",
        "src/core/NEON/kernels/arm_gemm/interleave_indirect-sve.cpp",
        "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
        "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
        "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
        "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
        "src/core/NEON/kernels/arm_gemm/misc-sve.cpp",
        "src/core/NEON/kernels/arm_gemm/misc.cpp",
        "src/core/NEON/kernels/arm_gemm/quantized.cpp",
        "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
        "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
        "src/core/NEON/kernels/arm_gemm/transform-sve.cpp",
        "src/core/NEON/kernels/arm_gemm/transform.cpp",
        "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp",
        "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp",
        "src/core/NEON/kernels/convolution/common/padding.cpp",
        "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
        "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
        "src/core/NEON/kernels/convolution/common/utils.cpp",
        "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_1x8.cpp",
        "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_4x4.cpp",
        "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_6x6.cpp",
        "src/core/NEON/kernels/convolution/winograd/input_transforms_fp16.cpp",
        "src/core/NEON/kernels/convolution/winograd/input_transforms_fp32.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x2_1x7.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x4_1x5.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x6_1x3.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_3x3.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_5x5.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_4x4_3x3.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms_fp16.cpp",
        "src/core/NEON/kernels/convolution/winograd/output_transforms_fp32.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_3x3.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_5x5.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_4x4_3x3.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x2_1x7.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x4_1x5.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x6_1x3.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp16.cpp",
        "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp32.cpp",
        "src/core/NEON/kernels/convolution/winograd/winograd_fp16.cpp",
        "src/core/NEON/kernels/convolution/winograd/winograd_fp32.cpp",
        "src/core/Rounding.cpp",
        "src/core/Size2D.cpp",
        "src/core/Size3D.cpp",
        "src/core/SubTensorInfo.cpp",
        "src/core/TensorInfo.cpp",
        "src/core/Utils.cpp",
        "src/core/Validate.cpp",
        "src/core/Version.cpp",
        "src/core/helpers/LUTManager.cpp",
        "src/core/helpers/SoftmaxHelpers.cpp",
        "src/core/helpers/Utils.cpp",
        "src/core/helpers/WindowHelpers.cpp",
        "src/core/utils/ActivationFunctionUtils.cpp",
        "src/core/utils/AssemblyUtils.cpp",
        "src/core/utils/DataLayoutUtils.cpp",
        "src/core/utils/DataTypeUtils.cpp",
        "src/core/utils/FormatUtils.cpp",
        "src/core/utils/InterpolationPolicyUtils.cpp",
        "src/core/utils/Math.cpp",
        "src/core/utils/ScaleUtils.cpp",
        "src/core/utils/StringUtils.cpp",
        "src/core/utils/helpers/fft.cpp",
        "src/core/utils/helpers/tensor_transform.cpp",
        "src/core/utils/io/FileHandler.cpp",
        "src/core/utils/logging/FilePrinter.cpp",
        "src/core/utils/logging/Helpers.cpp",
        "src/core/utils/logging/Logger.cpp",
        "src/core/utils/logging/LoggerRegistry.cpp",
        "src/core/utils/misc/MMappedFile.cpp",
        "src/core/utils/quantization/AsymmHelpers.cpp",
        "src/cpu/CpuContext.cpp",
        "src/cpu/CpuQueue.cpp",
        "src/cpu/CpuTensor.cpp",
        "src/cpu/kernels/CpuActivationKernel.cpp",
        "src/cpu/kernels/CpuAddKernel.cpp",
        "src/cpu/kernels/CpuAddMulAddKernel.cpp",
        "src/cpu/kernels/CpuCastKernel.cpp",
        "src/cpu/kernels/CpuCol2ImKernel.cpp",
        "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
        "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
        "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
        "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
        "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
        "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
        "src/cpu/kernels/CpuCopyKernel.cpp",
        "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
        "src/cpu/kernels/CpuDequantizeKernel.cpp",
        "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
        "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
        "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
        "src/cpu/kernels/CpuElementwiseKernel.cpp",
        "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
        "src/cpu/kernels/CpuFillKernel.cpp",
        "src/cpu/kernels/CpuFloorKernel.cpp",
        "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
        "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
        "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
        "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
        "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
        "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
        "src/cpu/kernels/CpuIm2ColKernel.cpp",
        "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
        "src/cpu/kernels/CpuMulKernel.cpp",
        "src/cpu/kernels/CpuPermuteKernel.cpp",
        "src/cpu/kernels/CpuPool2dKernel.cpp",
        "src/cpu/kernels/CpuPool3dKernel.cpp",
        "src/cpu/kernels/CpuQuantizeKernel.cpp",
        "src/cpu/kernels/CpuReshapeKernel.cpp",
        "src/cpu/kernels/CpuScaleKernel.cpp",
        "src/cpu/kernels/CpuSoftmaxKernel.cpp",
        "src/cpu/kernels/CpuSubKernel.cpp",
        "src/cpu/kernels/CpuTransposeKernel.cpp",
        "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
        "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
        "src/cpu/kernels/activation/generic/neon/fp16.cpp",
        "src/cpu/kernels/activation/generic/neon/fp32.cpp",
        "src/cpu/kernels/activation/generic/neon/lut.cpp",
        "src/cpu/kernels/activation/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/activation/generic/neon/qsymm16.cpp",
        "src/cpu/kernels/add/generic/neon/fp16.cpp",
        "src/cpu/kernels/add/generic/neon/fp32.cpp",
        "src/cpu/kernels/add/generic/neon/impl.cpp",
        "src/cpu/kernels/add/generic/neon/integer.cpp",
        "src/cpu/kernels/add/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/add/generic/neon/qsymm16.cpp",
        "src/cpu/kernels/addmuladd/generic/neon/fp16.cpp",
        "src/cpu/kernels/addmuladd/generic/neon/fp32.cpp",
        "src/cpu/kernels/addmuladd/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/addmuladd/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp",
        "src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp",
        "src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp",
        "src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp",
        "src/cpu/kernels/cast/generic/neon/fp16.cpp",
        "src/cpu/kernels/crop/generic/neon/fp16.cpp",
        "src/cpu/kernels/crop/generic/neon/fp32.cpp",
        "src/cpu/kernels/crop/generic/neon/integer.cpp",
        "src/cpu/kernels/depth_to_space/nchw/any/impl.cpp",
        "src/cpu/kernels/depth_to_space/nhwc/any/impl.cpp",
        "src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp",
        "src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp",
        "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp",
        "src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/directconv2d/nchw/all.cpp",
        "src/cpu/kernels/directconv2d/nchw/fp16.cpp",
        "src/cpu/kernels/directconv2d/nhwc/neon/fp16.cpp",
        "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp",
        "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
        "src/cpu/kernels/directconv2d/nhwc/neon/qasymm8.cpp",
        "src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp",
        "src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp",
        "src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp",
        "src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp",
        "src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp",
        "src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp",
        "src/cpu/kernels/elementwise_unary/generic/neon/q8.cpp",
        "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/elementwise_unary/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/floor/neon/fp16.cpp",
        "src/cpu/kernels/floor/neon/fp32.cpp",
        "src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp",
        "src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp",
        "src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp",
        "src/cpu/kernels/fuse_batch_normalization/nchw/neon/fp16.cpp",
        "src/cpu/kernels/fuse_batch_normalization/nchw/neon/fp32.cpp",
        "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp",
        "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp",
        "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp",
        "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp",
        "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp",
        "src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
        "src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
        "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
        "src/cpu/kernels/genproposals/generic/neon/fp16.cpp",
        "src/cpu/kernels/genproposals/generic/neon/fp32.cpp",
        "src/cpu/kernels/genproposals/generic/neon/impl.cpp",
        "src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp",
        "src/cpu/kernels/instancenorm/generic/neon/fp16.cpp",
        "src/cpu/kernels/instancenorm/generic/neon/fp32.cpp",
        "src/cpu/kernels/instancenorm/generic/neon/impl.cpp",
        "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
        "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
        "src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp",
        "src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp",
        "src/cpu/kernels/lut/generic/neon/u8.cpp",
        "src/cpu/kernels/maxunpool/generic/neon/fp16.cpp",
        "src/cpu/kernels/maxunpool/generic/neon/fp32.cpp",
        "src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp",
        "src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp",
        "src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp",
        "src/cpu/kernels/meanstddevnorm/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/mul/generic/neon/fp16.cpp",
        "src/cpu/kernels/mul/generic/neon/fp32.cpp",
        "src/cpu/kernels/norm_layer/generic/neon/fp16.cpp",
        "src/cpu/kernels/norm_layer/generic/neon/fp32.cpp",
        "src/cpu/kernels/pool2d/neon/fp16.cpp",
        "src/cpu/kernels/pool2d/neon/fp32.cpp",
        "src/cpu/kernels/pool2d/neon/nchw/all.cpp",
        "src/cpu/kernels/pool2d/neon/qasymm8.cpp",
        "src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/pool3d/neon/fp16.cpp",
        "src/cpu/kernels/pool3d/neon/fp32.cpp",
        "src/cpu/kernels/pool3d/neon/qasymm8.cpp",
        "src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/range/generic/neon/fp16.cpp",
        "src/cpu/kernels/range/generic/neon/fp32.cpp",
        "src/cpu/kernels/range/generic/neon/integer.cpp",
        "src/cpu/kernels/roialign/generic/neon/fp16.cpp",
        "src/cpu/kernels/roialign/generic/neon/fp32.cpp",
        "src/cpu/kernels/roialign/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/scale/neon/fp16.cpp",
        "src/cpu/kernels/scale/neon/integer.cpp",
        "src/cpu/kernels/scale/neon/qasymm8.cpp",
        "src/cpu/kernels/scale/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/select/generic/neon/fp16.cpp",
        "src/cpu/kernels/select/generic/neon/fp32.cpp",
        "src/cpu/kernels/select/generic/neon/integer.cpp",
        "src/cpu/kernels/softmax/generic/neon/fp16.cpp",
        "src/cpu/kernels/softmax/generic/neon/fp32.cpp",
        "src/cpu/kernels/softmax/generic/neon/impl.cpp",
        "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp",
        "src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/sub/neon/fp16.cpp",
        "src/cpu/kernels/sub/neon/qasymm8.cpp",
        "src/cpu/kernels/sub/neon/qasymm8_signed.cpp",
        "src/cpu/kernels/sub/neon/qsymm16.cpp",
        "src/cpu/operators/CpuActivation.cpp",
        "src/cpu/operators/CpuAdd.cpp",
        "src/cpu/operators/CpuAddMulAdd.cpp",
        "src/cpu/operators/CpuCast.cpp",
        "src/cpu/operators/CpuConcatenate.cpp",
        "src/cpu/operators/CpuConv2d.cpp",
        "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
        "src/cpu/operators/CpuCopy.cpp",
        "src/cpu/operators/CpuDepthwiseConv2d.cpp",
        "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
        "src/cpu/operators/CpuDequantize.cpp",
        "src/cpu/operators/CpuDirectConv2d.cpp",
        "src/cpu/operators/CpuDirectConv3d.cpp",
        "src/cpu/operators/CpuElementwise.cpp",
        "src/cpu/operators/CpuElementwiseUnary.cpp",
        "src/cpu/operators/CpuFill.cpp",
        "src/cpu/operators/CpuFlatten.cpp",
        "src/cpu/operators/CpuFloor.cpp",
        "src/cpu/operators/CpuFullyConnected.cpp",
        "src/cpu/operators/CpuGemm.cpp",
        "src/cpu/operators/CpuGemmConv2d.cpp",
        "src/cpu/operators/CpuGemmDirectConv2d.cpp",
        "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
        "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
        "src/cpu/operators/CpuMatMul.cpp",
        "src/cpu/operators/CpuMaxUnpooling.cpp",
        "src/cpu/operators/CpuMul.cpp",
        "src/cpu/operators/CpuPermute.cpp",
        "src/cpu/operators/CpuPool2d.cpp",
        "src/cpu/operators/CpuPool3d.cpp",
        "src/cpu/operators/CpuQuantize.cpp",
        "src/cpu/operators/CpuReshape.cpp",
        "src/cpu/operators/CpuScale.cpp",
        "src/cpu/operators/CpuSoftmax.cpp",
        "src/cpu/operators/CpuSub.cpp",
        "src/cpu/operators/CpuTranspose.cpp",
        "src/cpu/operators/CpuWinogradConv2d.cpp",
        "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
        "src/dynamic_fusion/runtime/gpu/cl/ClKernelRuntime.cpp",
        "src/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.cpp",
        "src/dynamic_fusion/sketch/attributes/CastAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/ClampAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/Conv2dAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/DepthwiseConv2dAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/MatMulAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/Pool2dAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/ReshapeAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/ResizeAttributes.cpp",
        "src/dynamic_fusion/sketch/attributes/SoftmaxAttributes.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGraph.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGroup.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuKernelComponentStream.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuLogicalKernel.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuOperatorGroup.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuWorkloadContext.cpp",
        "src/dynamic_fusion/sketch/gpu/GpuWorkloadSketch.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentActivation.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentCast.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDepthwiseConv2d.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDirectConv2d.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentElementwiseBinary.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentMatMul.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentPool2d.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentReshape.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentResize.cpp",
        "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentStore.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuAdd.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuCast.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuClamp.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuConv2d.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuDepthwiseConv2d.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuMatMul.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuMul.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuOutput.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuPool2d.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuReshape.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuResize.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuSigmoid.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuSoftmax.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuSub.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/GpuTanh.cpp",
        "src/dynamic_fusion/sketch/gpu/operators/internal/GpuElementwiseBinaryCommon.cpp",
        "src/gpu/cl/ClContext.cpp",
        "src/gpu/cl/ClKernelLibrary.cpp",
        "src/gpu/cl/ClQueue.cpp",
        "src/gpu/cl/ClTensor.cpp",
        "src/gpu/cl/kernels/ClActivationKernel.cpp",
        "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
        "src/gpu/cl/kernels/ClCastKernel.cpp",
        "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
        "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
        "src/gpu/cl/kernels/ClCopyKernel.cpp",
        "src/gpu/cl/kernels/ClCropKernel.cpp",
        "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
        "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
        "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
        "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
        "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
        "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
        "src/gpu/cl/kernels/ClFillKernel.cpp",
        "src/gpu/cl/kernels/ClFloorKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
        "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
        "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
        "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
        "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
        "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
        "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
        "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
        "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
        "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
        "src/gpu/cl/kernels/ClIndirectConv2dAddressPrecalculationKernel.cpp",
        "src/gpu/cl/kernels/ClIndirectConv2dKernel.cpp",
        "src/gpu/cl/kernels/ClMatMulLowpNativeKernel.cpp",
        "src/gpu/cl/kernels/ClMatMulLowpNativeMMULKernel.cpp",
        "src/gpu/cl/kernels/ClMatMulNativeKernel.cpp",
        "src/gpu/cl/kernels/ClMatMulNativeMMULKernel.cpp",
        "src/gpu/cl/kernels/ClMulKernel.cpp",
        "src/gpu/cl/kernels/ClPermuteKernel.cpp",
        "src/gpu/cl/kernels/ClPool2dKernel.cpp",
        "src/gpu/cl/kernels/ClPool3dKernel.cpp",
        "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
        "src/gpu/cl/kernels/ClReshapeKernel.cpp",
        "src/gpu/cl/kernels/ClScaleKernel.cpp",
        "src/gpu/cl/kernels/ClScatterKernel.cpp",
        "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
        "src/gpu/cl/kernels/ClTransposeKernel.cpp",
        "src/gpu/cl/kernels/ClTransposedConvolutionKernel.cpp",
        "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
        "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
        "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
        "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
        "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
        "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
        "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
        "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
        "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
        "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
        "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
        "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
        "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
        "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
        "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
        "src/gpu/cl/kernels/helpers/MatMulKernelHelpers.cpp",
        "src/gpu/cl/operators/ClActivation.cpp",
        "src/gpu/cl/operators/ClAdd.cpp",
        "src/gpu/cl/operators/ClCast.cpp",
        "src/gpu/cl/operators/ClConcatenate.cpp",
        "src/gpu/cl/operators/ClConv2d.cpp",
        "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
        "src/gpu/cl/operators/ClCopy.cpp",
        "src/gpu/cl/operators/ClCrop.cpp",
        "src/gpu/cl/operators/ClDequantize.cpp",
        "src/gpu/cl/operators/ClDirectConv2d.cpp",
        "src/gpu/cl/operators/ClDirectConv3d.cpp",
        "src/gpu/cl/operators/ClElementwiseOperations.cpp",
        "src/gpu/cl/operators/ClElementwiseUnary.cpp",
        "src/gpu/cl/operators/ClFill.cpp",
        "src/gpu/cl/operators/ClFlatten.cpp",
        "src/gpu/cl/operators/ClFloor.cpp",
        "src/gpu/cl/operators/ClFullyConnected.cpp",
        "src/gpu/cl/operators/ClGemm.cpp",
        "src/gpu/cl/operators/ClGemmConv2d.cpp",
        "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
        "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
        "src/gpu/cl/operators/ClIndirectConv2d.cpp",
        "src/gpu/cl/operators/ClLogicalNot.cpp",
        "src/gpu/cl/operators/ClMatMul.cpp",
        "src/gpu/cl/operators/ClMul.cpp",
        "src/gpu/cl/operators/ClPRelu.cpp",
        "src/gpu/cl/operators/ClPermute.cpp",
        "src/gpu/cl/operators/ClPool2d.cpp",
        "src/gpu/cl/operators/ClPool3d.cpp",
        "src/gpu/cl/operators/ClQuantize.cpp",
        "src/gpu/cl/operators/ClReshape.cpp",
        "src/gpu/cl/operators/ClScale.cpp",
        "src/gpu/cl/operators/ClScatter.cpp",
        "src/gpu/cl/operators/ClSoftmax.cpp",
        "src/gpu/cl/operators/ClSub.cpp",
        "src/gpu/cl/operators/ClTranspose.cpp",
        "src/gpu/cl/operators/ClTransposedConvolution.cpp",
        "src/gpu/cl/operators/ClWinogradConv2d.cpp",
        "src/runtime/Allocator.cpp",
        "src/runtime/BlobLifetimeManager.cpp",
        "src/runtime/BlobMemoryPool.cpp",
        "src/runtime/CL/CLBufferAllocator.cpp",
        "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
        "src/runtime/CL/CLHelpers.cpp",
        "src/runtime/CL/CLMemory.cpp",
        "src/runtime/CL/CLMemoryRegion.cpp",
        "src/runtime/CL/CLOperator.cpp",
        "src/runtime/CL/CLRuntimeContext.cpp",
        "src/runtime/CL/CLScheduler.cpp",
        "src/runtime/CL/CLSubTensor.cpp",
        "src/runtime/CL/CLTensor.cpp",
        "src/runtime/CL/CLTensorAllocator.cpp",
        "src/runtime/CL/CLTuner.cpp",
        "src/runtime/CL/ICLSimpleFunction.cpp",
        "src/runtime/CL/Utils.cpp",
        "src/runtime/CL/functions/CLActivationLayer.cpp",
        "src/runtime/CL/functions/CLArgMinMaxLayer.cpp",
        "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
        "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp",
        "src/runtime/CL/functions/CLBitwiseAnd.cpp",
        "src/runtime/CL/functions/CLBitwiseNot.cpp",
        "src/runtime/CL/functions/CLBitwiseOr.cpp",
        "src/runtime/CL/functions/CLBitwiseXor.cpp",
        "src/runtime/CL/functions/CLBoundingBoxTransform.cpp",
        "src/runtime/CL/functions/CLCast.cpp",
        "src/runtime/CL/functions/CLChannelShuffleLayer.cpp",
        "src/runtime/CL/functions/CLComparison.cpp",
        "src/runtime/CL/functions/CLConcatenateLayer.cpp",
        "src/runtime/CL/functions/CLConv3D.cpp",
        "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
        "src/runtime/CL/functions/CLConvolutionLayer.cpp",
        "src/runtime/CL/functions/CLCopy.cpp",
        "src/runtime/CL/functions/CLCrop.cpp",
        "src/runtime/CL/functions/CLCropResize.cpp",
        "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
        "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
        "src/runtime/CL/functions/CLDepthConvertLayer.cpp",
        "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp",
        "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp",
        "src/runtime/CL/functions/CLDequantizationLayer.cpp",
        "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
        "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
        "src/runtime/CL/functions/CLElementwiseOperations.cpp",
        "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp",
        "src/runtime/CL/functions/CLFFT1D.cpp",
        "src/runtime/CL/functions/CLFFT2D.cpp",
        "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
        "src/runtime/CL/functions/CLFill.cpp",
        "src/runtime/CL/functions/CLFlattenLayer.cpp",
        "src/runtime/CL/functions/CLFloor.cpp",
        "src/runtime/CL/functions/CLFullyConnectedLayer.cpp",
        "src/runtime/CL/functions/CLFuseBatchNormalization.cpp",
        "src/runtime/CL/functions/CLGEMM.cpp",
        "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
        "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp",
        "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
        "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp",
        "src/runtime/CL/functions/CLGather.cpp",
        "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp",
        "src/runtime/CL/functions/CLIndirectConvolutionLayer.cpp",
        "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp",
        "src/runtime/CL/functions/CLL2NormalizeLayer.cpp",
        "src/runtime/CL/functions/CLLSTMLayer.cpp",
        "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp",
        "src/runtime/CL/functions/CLLogicalAnd.cpp",
        "src/runtime/CL/functions/CLLogicalNot.cpp",
        "src/runtime/CL/functions/CLLogicalOr.cpp",
        "src/runtime/CL/functions/CLMatMul.cpp",
        "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp",
        "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
        "src/runtime/CL/functions/CLNormalizationLayer.cpp",
        "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp",
        "src/runtime/CL/functions/CLPReluLayer.cpp",
        "src/runtime/CL/functions/CLPadLayer.cpp",
        "src/runtime/CL/functions/CLPermute.cpp",
        "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp",
        "src/runtime/CL/functions/CLPooling3dLayer.cpp",
        "src/runtime/CL/functions/CLPoolingLayer.cpp",
        "src/runtime/CL/functions/CLPriorBoxLayer.cpp",
        "src/runtime/CL/functions/CLQLSTMLayer.cpp",
        "src/runtime/CL/functions/CLQuantizationLayer.cpp",
        "src/runtime/CL/functions/CLRNNLayer.cpp",
        "src/runtime/CL/functions/CLROIAlignLayer.cpp",
        "src/runtime/CL/functions/CLROIPoolingLayer.cpp",
        "src/runtime/CL/functions/CLRange.cpp",
        "src/runtime/CL/functions/CLReduceMean.cpp",
        "src/runtime/CL/functions/CLReductionOperation.cpp",
        "src/runtime/CL/functions/CLReorgLayer.cpp",
        "src/runtime/CL/functions/CLReshapeLayer.cpp",
        "src/runtime/CL/functions/CLReverse.cpp",
        "src/runtime/CL/functions/CLScale.cpp",
        "src/runtime/CL/functions/CLScatter.cpp",
        "src/runtime/CL/functions/CLSelect.cpp",
        "src/runtime/CL/functions/CLSlice.cpp",
        "src/runtime/CL/functions/CLSoftmaxLayer.cpp",
        "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp",
        "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp",
        "src/runtime/CL/functions/CLSplit.cpp",
        "src/runtime/CL/functions/CLStackLayer.cpp",
        "src/runtime/CL/functions/CLStridedSlice.cpp",
        "src/runtime/CL/functions/CLTile.cpp",
        "src/runtime/CL/functions/CLTranspose.cpp",
        "src/runtime/CL/functions/CLUnstack.cpp",
        "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp",
        "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
        "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
        "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
        "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
        "src/runtime/CL/mlgo/HeuristicTree.cpp",
        "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
        "src/runtime/CL/mlgo/MLGOParser.cpp",
        "src/runtime/CL/mlgo/Utils.cpp",
        "src/runtime/CL/tuners/CLTuningParametersList.cpp",
        "src/runtime/CPP/CPPScheduler.cpp",
        "src/runtime/CPP/ICPPSimpleFunction.cpp",
        "src/runtime/CPP/SingleThreadScheduler.cpp",
        "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
        "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
        "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
        "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
        "src/runtime/CPP/functions/CPPPermute.cpp",
        "src/runtime/CPP/functions/CPPTopKV.cpp",
        "src/runtime/CPP/functions/CPPUpsample.cpp",
        "src/runtime/IScheduler.cpp",
        "src/runtime/ISimpleLifetimeManager.cpp",
        "src/runtime/ITensorAllocator.cpp",
        "src/runtime/IWeightsManager.cpp",
        "src/runtime/Memory.cpp",
        "src/runtime/MemoryManagerOnDemand.cpp",
        "src/runtime/NEON/INEOperator.cpp",
        "src/runtime/NEON/INESimpleFunction.cpp",
        "src/runtime/NEON/INESimpleFunctionNoBorder.cpp",
        "src/runtime/NEON/functions/NEActivationLayer.cpp",
        "src/runtime/NEON/functions/NEAddMulAdd.cpp",
        "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp",
        "src/runtime/NEON/functions/NEArithmeticAddition.cpp",
        "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp",
        "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
        "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp",
        "src/runtime/NEON/functions/NEBitwiseAnd.cpp",
        "src/runtime/NEON/functions/NEBitwiseNot.cpp",
        "src/runtime/NEON/functions/NEBitwiseOr.cpp",
        "src/runtime/NEON/functions/NEBitwiseXor.cpp",
        "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp",
        "src/runtime/NEON/functions/NECast.cpp",
        "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp",
        "src/runtime/NEON/functions/NEConcatenateLayer.cpp",
        "src/runtime/NEON/functions/NEConv3D.cpp",
        "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
        "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
        "src/runtime/NEON/functions/NECopy.cpp",
        "src/runtime/NEON/functions/NECropResize.cpp",
        "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp",
        "src/runtime/NEON/functions/NEDepthConvertLayer.cpp",
        "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp",
        "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp",
        "src/runtime/NEON/functions/NEDequantizationLayer.cpp",
        "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp",
        "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
        "src/runtime/NEON/functions/NEElementwiseOperations.cpp",
        "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp",
        "src/runtime/NEON/functions/NEFFT1D.cpp",
        "src/runtime/NEON/functions/NEFFT2D.cpp",
        "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
        "src/runtime/NEON/functions/NEFill.cpp",
        "src/runtime/NEON/functions/NEFillBorder.cpp",
        "src/runtime/NEON/functions/NEFlattenLayer.cpp",
        "src/runtime/NEON/functions/NEFloor.cpp",
        "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp",
        "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp",
        "src/runtime/NEON/functions/NEGEMM.cpp",
        "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
        "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
        "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
        "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp",
        "src/runtime/NEON/functions/NEGather.cpp",
        "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp",
        "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp",
        "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp",
        "src/runtime/NEON/functions/NELSTMLayer.cpp",
        "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
        "src/runtime/NEON/functions/NELogical.cpp",
        "src/runtime/NEON/functions/NEMatMul.cpp",
        "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
        "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp",
        "src/runtime/NEON/functions/NENormalizationLayer.cpp",
        "src/runtime/NEON/functions/NEPReluLayer.cpp",
        "src/runtime/NEON/functions/NEPadLayer.cpp",
        "src/runtime/NEON/functions/NEPermute.cpp",
        "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp",
        "src/runtime/NEON/functions/NEPooling3dLayer.cpp",
        "src/runtime/NEON/functions/NEPoolingLayer.cpp",
        "src/runtime/NEON/functions/NEPriorBoxLayer.cpp",
        "src/runtime/NEON/functions/NEQLSTMLayer.cpp",
        "src/runtime/NEON/functions/NEQuantizationLayer.cpp",
        "src/runtime/NEON/functions/NERNNLayer.cpp",
        "src/runtime/NEON/functions/NEROIAlignLayer.cpp",
        "src/runtime/NEON/functions/NEROIPoolingLayer.cpp",
        "src/runtime/NEON/functions/NERange.cpp",
        "src/runtime/NEON/functions/NEReduceMean.cpp",
        "src/runtime/NEON/functions/NEReductionOperation.cpp",
        "src/runtime/NEON/functions/NEReorderLayer.cpp",
        "src/runtime/NEON/functions/NEReorgLayer.cpp",
        "src/runtime/NEON/functions/NEReshapeLayer.cpp",
        "src/runtime/NEON/functions/NEReverse.cpp",
        "src/runtime/NEON/functions/NEScale.cpp",
        "src/runtime/NEON/functions/NESelect.cpp",
        "src/runtime/NEON/functions/NESlice.cpp",
        "src/runtime/NEON/functions/NESoftmaxLayer.cpp",
        "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp",
        "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp",
        "src/runtime/NEON/functions/NESplit.cpp",
        "src/runtime/NEON/functions/NEStackLayer.cpp",
        "src/runtime/NEON/functions/NEStridedSlice.cpp",
        "src/runtime/NEON/functions/NETile.cpp",
        "src/runtime/NEON/functions/NETranspose.cpp",
        "src/runtime/NEON/functions/NEUnstack.cpp",
        "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp",
        "src/runtime/OMP/OMPScheduler.cpp",
        "src/runtime/OffsetLifetimeManager.cpp",
        "src/runtime/OffsetMemoryPool.cpp",
        "src/runtime/OperatorTensor.cpp",
        "src/runtime/PoolManager.cpp",
        "src/runtime/RuntimeContext.cpp",
        "src/runtime/Scheduler.cpp",
        "src/runtime/SchedulerFactory.cpp",
        "src/runtime/SchedulerUtils.cpp",
        "src/runtime/SubTensor.cpp",
        "src/runtime/Tensor.cpp",
        "src/runtime/TensorAllocator.cpp",
        "src/runtime/Utils.cpp",
        "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigBifrost.cpp",
        "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigValhall.cpp",
        "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigBifrost.cpp",
        "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigValhall.cpp",
        "src/runtime/heuristics/dwc_native/ClDWCNativeHeuristicsHelpers.cpp",
        "src/runtime/heuristics/indirect_conv/ClIndirectConvDefaultConfigValhall.cpp",
        "src/runtime/heuristics/matmul_native/ClMatMulNativeDefaultConfigValhall.cpp",
        "src/runtime/heuristics/matmul_native/ClMatMulNativeDefaultVariantValhall.cpp",
        "src/runtime/heuristics/matmul_native/ClMatMulNativeHelpers.cpp",
        "utils/CommonGraphOptions.cpp",
        "utils/GraphUtils.cpp",
        "utils/Utils.cpp",
        
    ],
    arch: {
        arm: {
            srcs: [
                "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp",
                
            ],
        },
        arm64: {
            srcs: [
                "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s1_4rows_mla_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s2_4rows_mla_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s1_4rows_mla_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s2_4rows_mla_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_bf16fp32_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp32_mla_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_bf16fp32_dot_16VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp16fp32fp16_dot_16VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32_mla_16VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32bf16fp32_dot_16VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_s8qa_dot_16VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_u8qa_dot_16VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp16fp32fp16_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8qfp32_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8qfp32_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8qfp32_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_bf16fp32_mmla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_bf16fp32_mmla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
                "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
                "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp16_6x6.cpp",
                "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp32_6x6.cpp",
                "src/core/NEON/kernels/convolution/winograd/input_transforms/sme_fp32_mla_6x6.cpp",
                "src/core/NEON/kernels/convolution/winograd/input_transforms/sve_fp32_6x6.cpp",
                "src/core/NEON/kernels/convolution/winograd/output_transforms/a64_fp16_4x4_3x3.cpp",
                "src/core/NEON/kernels/convolution/winograd/output_transforms/sme_fp32_mopa_4x4_3x3.cpp",
                "src/core/NEON/kernels/convolution/winograd/weight_transforms/a64_fp16_4x4_3x3.cpp",
                
            ],
        },
    },
    rtti: true,
}