xref: /aosp_15_r20/external/ComputeLibrary/filelist.json (revision c217d954acce2dbc11938adb493fc0abd69584f3)
1*c217d954SCole Faust{
2*c217d954SCole Faust  "common": [
3*c217d954SCole Faust    "src/common/cpuinfo/CpuInfo.cpp",
4*c217d954SCole Faust    "src/common/cpuinfo/CpuModel.cpp",
5*c217d954SCole Faust    "src/common/cpuinfo/CpuIsaInfo.cpp",
6*c217d954SCole Faust    "src/common/utils/LegacySupport.cpp",
7*c217d954SCole Faust    "src/common/AllocatorWrapper.cpp",
8*c217d954SCole Faust    "src/common/ITensorV2.cpp",
9*c217d954SCole Faust    "src/common/TensorPack.cpp",
10*c217d954SCole Faust    "src/common/IOperator.cpp",
11*c217d954SCole Faust    "src/core/AccessWindowAutoPadding.cpp",
12*c217d954SCole Faust    "src/core/AccessWindowStatic.cpp",
13*c217d954SCole Faust    "src/core/AccessWindowTranspose.cpp",
14*c217d954SCole Faust    "src/core/Error.cpp",
15*c217d954SCole Faust    "src/core/GPUTarget.cpp",
16*c217d954SCole Faust    "src/core/Helpers.cpp",
17*c217d954SCole Faust    "src/core/IAccessWindow.cpp",
18*c217d954SCole Faust    "src/core/IKernel.cpp",
19*c217d954SCole Faust    "src/core/ITensor.cpp",
20*c217d954SCole Faust    "src/core/ITensorPack.cpp",
21*c217d954SCole Faust    "src/core/Rounding.cpp",
22*c217d954SCole Faust    "src/core/Size2D.cpp",
23*c217d954SCole Faust    "src/core/SubTensorInfo.cpp",
24*c217d954SCole Faust    "src/core/TensorInfo.cpp",
25*c217d954SCole Faust    "src/core/Utils.cpp",
26*c217d954SCole Faust    "src/core/Validate.cpp",
27*c217d954SCole Faust    "src/core/Version.cpp",
28*c217d954SCole Faust    "src/core/helpers/SoftmaxHelpers.cpp",
29*c217d954SCole Faust    "src/core/helpers/WindowHelpers.cpp",
30*c217d954SCole Faust    "src/core/utils/AssemblyUtils.cpp",
31*c217d954SCole Faust    "src/core/utils/ScaleUtils.cpp",
32*c217d954SCole Faust    "src/core/utils/helpers/fft.cpp",
33*c217d954SCole Faust    "src/core/utils/helpers/tensor_transform.cpp",
34*c217d954SCole Faust    "src/core/utils/io/FileHandler.cpp",
35*c217d954SCole Faust    "src/core/utils/misc/MMappedFile.cpp",
36*c217d954SCole Faust    "src/core/utils/quantization/AsymmHelpers.cpp",
37*c217d954SCole Faust    "src/core/CPP/CPPTypes.cpp",
38*c217d954SCole Faust    "src/core/CPP/kernels/CPPBoxWithNonMaximaSuppressionLimitKernel.cpp",
39*c217d954SCole Faust    "src/core/CPP/kernels/CPPNonMaximumSuppressionKernel.cpp",
40*c217d954SCole Faust    "src/core/CPP/kernels/CPPPermuteKernel.cpp",
41*c217d954SCole Faust    "src/core/CPP/kernels/CPPTopKVKernel.cpp",
42*c217d954SCole Faust    "src/core/CPP/kernels/CPPUpsampleKernel.cpp",
43*c217d954SCole Faust    "src/runtime/Allocator.cpp",
44*c217d954SCole Faust    "src/runtime/BlobLifetimeManager.cpp",
45*c217d954SCole Faust    "src/runtime/BlobMemoryPool.cpp",
46*c217d954SCole Faust    "src/runtime/ISimpleLifetimeManager.cpp",
47*c217d954SCole Faust    "src/runtime/ITensorAllocator.cpp",
48*c217d954SCole Faust    "src/runtime/IWeightsManager.cpp",
49*c217d954SCole Faust    "src/runtime/IScheduler.cpp",
50*c217d954SCole Faust    "src/runtime/Memory.cpp",
51*c217d954SCole Faust    "src/runtime/MemoryManagerOnDemand.cpp",
52*c217d954SCole Faust    "src/runtime/OffsetLifetimeManager.cpp",
53*c217d954SCole Faust    "src/runtime/OffsetMemoryPool.cpp",
54*c217d954SCole Faust    "src/runtime/OperatorTensor.cpp",
55*c217d954SCole Faust    "src/runtime/PoolManager.cpp",
56*c217d954SCole Faust    "src/runtime/RuntimeContext.cpp",
57*c217d954SCole Faust    "src/runtime/Scheduler.cpp",
58*c217d954SCole Faust    "src/runtime/SchedulerFactory.cpp",
59*c217d954SCole Faust    "src/runtime/SchedulerUtils.cpp",
60*c217d954SCole Faust    "src/runtime/SubTensor.cpp",
61*c217d954SCole Faust    "src/runtime/Tensor.cpp",
62*c217d954SCole Faust    "src/runtime/TensorAllocator.cpp",
63*c217d954SCole Faust    "src/runtime/Utils.cpp",
64*c217d954SCole Faust    "src/runtime/CPP/ICPPSimpleFunction.cpp",
65*c217d954SCole Faust    "src/runtime/CPP/functions/CPPBoxWithNonMaximaSuppressionLimit.cpp",
66*c217d954SCole Faust    "src/runtime/CPP/functions/CPPDetectionOutputLayer.cpp",
67*c217d954SCole Faust    "src/runtime/CPP/functions/CPPDetectionPostProcessLayer.cpp",
68*c217d954SCole Faust    "src/runtime/CPP/functions/CPPNonMaximumSuppression.cpp",
69*c217d954SCole Faust    "src/runtime/CPP/functions/CPPPermute.cpp",
70*c217d954SCole Faust    "src/runtime/CPP/functions/CPPTopKV.cpp",
71*c217d954SCole Faust    "src/runtime/CPP/functions/CPPUpsample.cpp"
72*c217d954SCole Faust  ],
73*c217d954SCole Faust  "logging": [
74*c217d954SCole Faust    "src/core/utils/logging/FilePrinter.cpp",
75*c217d954SCole Faust    "src/core/utils/logging/Helpers.cpp",
76*c217d954SCole Faust    "src/core/utils/logging/Logger.cpp",
77*c217d954SCole Faust    "src/core/utils/logging/LoggerRegistry.cpp"
78*c217d954SCole Faust  ],
79*c217d954SCole Faust  "scheduler": {
80*c217d954SCole Faust    "single": [ "src/runtime/CPP/SingleThreadScheduler.cpp" ],
81*c217d954SCole Faust    "threads": [ "src/runtime/CPP/CPPScheduler.cpp" ],
82*c217d954SCole Faust    "omp": [ "src/runtime/OMP/OMPScheduler.cpp"]
83*c217d954SCole Faust  },
84*c217d954SCole Faust  "c_api": {
85*c217d954SCole Faust    "common": [
86*c217d954SCole Faust      "src/c/AclContext.cpp",
87*c217d954SCole Faust      "src/c/AclOperator.cpp",
88*c217d954SCole Faust      "src/c/AclQueue.cpp",
89*c217d954SCole Faust      "src/c/AclTensor.cpp",
90*c217d954SCole Faust      "src/c/AclTensorPack.cpp",
91*c217d954SCole Faust      "src/c/AclVersion.cpp"
92*c217d954SCole Faust    ],
93*c217d954SCole Faust    "cpu": [
94*c217d954SCole Faust    ],
95*c217d954SCole Faust    "gpu": [
96*c217d954SCole Faust      "src/c/cl/AclOpenClExt.cpp"
97*c217d954SCole Faust    ],
98*c217d954SCole Faust    "operators":
99*c217d954SCole Faust    [
100*c217d954SCole Faust      "src/c/operators/AclActivation.cpp"
101*c217d954SCole Faust    ]
102*c217d954SCole Faust  },
103*c217d954SCole Faust  "high_priority": [
104*c217d954SCole Faust    "Activation",
105*c217d954SCole Faust    "DepthwiseConv2d",
106*c217d954SCole Faust    "Conv2d",
107*c217d954SCole Faust    "Permute",
108*c217d954SCole Faust    "Pool2d",
109*c217d954SCole Faust    "Reshape"
110*c217d954SCole Faust  ],
111*c217d954SCole Faust  "gpu": {
112*c217d954SCole Faust    "common": [
113*c217d954SCole Faust      "src/core/CL/CLCompileContext.cpp",
114*c217d954SCole Faust      "src/core/CL/DefaultLWSHeuristics.cpp",
115*c217d954SCole Faust      "src/core/CL/CLHelpers.cpp",
116*c217d954SCole Faust      "src/core/CL/CLKernelLibrary.cpp",
117*c217d954SCole Faust      "src/core/CL/CLUtils.cpp",
118*c217d954SCole Faust      "src/core/CL/ICLKernel.cpp",
119*c217d954SCole Faust      "src/core/CL/ICLSimple2DKernel.cpp",
120*c217d954SCole Faust      "src/core/CL/ICLSimple3DKernel.cpp",
121*c217d954SCole Faust      "src/core/CL/ICLSimpleKernel.cpp",
122*c217d954SCole Faust      "src/core/CL/ICLTensor.cpp",
123*c217d954SCole Faust      "src/core/CL/OpenCL.cpp",
124*c217d954SCole Faust      "src/gpu/cl/ClContext.cpp",
125*c217d954SCole Faust      "src/gpu/cl/ClKernelLibrary.cpp",
126*c217d954SCole Faust      "src/gpu/cl/ClQueue.cpp",
127*c217d954SCole Faust      "src/gpu/cl/ClTensor.cpp",
128*c217d954SCole Faust      "src/core/CL/kernels/CLFillBorderKernel.cpp",
129*c217d954SCole Faust      "src/runtime/CL/CLBufferAllocator.cpp",
130*c217d954SCole Faust      "src/runtime/CL/CLGEMMHeuristicsHandle.cpp",
131*c217d954SCole Faust      "src/runtime/CL/CLHelpers.cpp",
132*c217d954SCole Faust      "src/runtime/CL/CLMemory.cpp",
133*c217d954SCole Faust      "src/runtime/CL/CLMemoryRegion.cpp",
134*c217d954SCole Faust      "src/runtime/CL/CLOperator.cpp",
135*c217d954SCole Faust      "src/runtime/CL/CLRuntimeContext.cpp",
136*c217d954SCole Faust      "src/runtime/CL/CLScheduler.cpp",
137*c217d954SCole Faust      "src/runtime/CL/CLSubTensor.cpp",
138*c217d954SCole Faust      "src/runtime/CL/CLTensor.cpp",
139*c217d954SCole Faust      "src/runtime/CL/CLTensorAllocator.cpp",
140*c217d954SCole Faust      "src/runtime/CL/CLTuner.cpp",
141*c217d954SCole Faust      "src/runtime/CL/ICLSimpleFunction.cpp",
142*c217d954SCole Faust      "src/runtime/CL/Utils.cpp",
143*c217d954SCole Faust      "src/runtime/CL/mlgo/HeuristicTree.cpp",
144*c217d954SCole Faust      "src/runtime/CL/mlgo/MLGOHeuristics.cpp",
145*c217d954SCole Faust      "src/runtime/CL/mlgo/MLGOParser.cpp",
146*c217d954SCole Faust      "src/runtime/CL/mlgo/Utils.cpp",
147*c217d954SCole Faust      "src/runtime/CL/tuners/CLTuningParametersList.cpp"
148*c217d954SCole Faust    ],
149*c217d954SCole Faust    "operators": {
150*c217d954SCole Faust    "Activation":{
151*c217d954SCole Faust      "files": {
152*c217d954SCole Faust        "common": [
153*c217d954SCole Faust          "src/gpu/cl/kernels/ClActivationKernel.cpp",
154*c217d954SCole Faust          "src/gpu/cl/operators/ClActivation.cpp",
155*c217d954SCole Faust          "src/runtime/CL/functions/CLActivationLayer.cpp"
156*c217d954SCole Faust        ]
157*c217d954SCole Faust      }
158*c217d954SCole Faust    },
159*c217d954SCole Faust    "ArgMinMax": {
160*c217d954SCole Faust      "deps": [ "Reshape" ],
161*c217d954SCole Faust      "files": {
162*c217d954SCole Faust        "common": [
163*c217d954SCole Faust          "src/core/CL/kernels/CLArgMinMaxLayerKernel.cpp",
164*c217d954SCole Faust          "src/runtime/CL/functions/CLArgMinMaxLayer.cpp"
165*c217d954SCole Faust        ]
166*c217d954SCole Faust      }
167*c217d954SCole Faust    },
168*c217d954SCole Faust    "Add": {
169*c217d954SCole Faust      "files": {
170*c217d954SCole Faust        "common": [
171*c217d954SCole Faust          "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
172*c217d954SCole Faust          "src/gpu/cl/operators/ClAdd.cpp"
173*c217d954SCole Faust        ]
174*c217d954SCole Faust      }
175*c217d954SCole Faust    },
176*c217d954SCole Faust    "BatchNormalization": {
177*c217d954SCole Faust      "files": {
178*c217d954SCole Faust        "common": [
179*c217d954SCole Faust          "src/core/CL/kernels/CLBatchNormalizationLayerKernel.cpp",
180*c217d954SCole Faust          "src/core/CL/kernels/CLFuseBatchNormalizationKernel.cpp",
181*c217d954SCole Faust          "src/runtime/CL/functions/CLBatchNormalizationLayer.cpp",
182*c217d954SCole Faust          "src/runtime/CL/functions/CLFuseBatchNormalization.cpp"
183*c217d954SCole Faust        ]
184*c217d954SCole Faust      }
185*c217d954SCole Faust    },
186*c217d954SCole Faust    "BatchToSpace": {
187*c217d954SCole Faust      "files": {
188*c217d954SCole Faust        "common": [
189*c217d954SCole Faust          "src/core/CL/kernels/CLBatchToSpaceLayerKernel.cpp",
190*c217d954SCole Faust          "src/runtime/CL/functions/CLBatchToSpaceLayer.cpp"
191*c217d954SCole Faust         ]
192*c217d954SCole Faust      }
193*c217d954SCole Faust    },
194*c217d954SCole Faust    "Bitwise": {
195*c217d954SCole Faust      "files": {
196*c217d954SCole Faust        "common": [ "src/core/CL/kernels/CLBitwiseKernel.cpp" ]
197*c217d954SCole Faust      }
198*c217d954SCole Faust    },
199*c217d954SCole Faust    "BitwiseAnd": {
200*c217d954SCole Faust      "deps": [ "Bitwise" ],
201*c217d954SCole Faust      "files": {
202*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLBitwiseAnd.cpp" ]
203*c217d954SCole Faust      }
204*c217d954SCole Faust    },
205*c217d954SCole Faust    "BitwiseNot": {
206*c217d954SCole Faust      "deps": [ "Bitwise" ],
207*c217d954SCole Faust      "files": {
208*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLBitwiseNot.cpp" ]
209*c217d954SCole Faust      }
210*c217d954SCole Faust    },
211*c217d954SCole Faust    "BitwiseOr": {
212*c217d954SCole Faust      "deps": [ "Bitwise" ],
213*c217d954SCole Faust      "files": {
214*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLBitwiseOr.cpp" ]
215*c217d954SCole Faust      }
216*c217d954SCole Faust    },
217*c217d954SCole Faust    "BitwiseXor": {
218*c217d954SCole Faust      "deps": [ "Bitwise" ],
219*c217d954SCole Faust      "files": {
220*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLBitwiseXor.cpp" ]
221*c217d954SCole Faust      }
222*c217d954SCole Faust    },
223*c217d954SCole Faust    "BoundingBoxTransform": {
224*c217d954SCole Faust      "files": {
225*c217d954SCole Faust        "common": [
226*c217d954SCole Faust          "src/core/CL/kernels/CLBoundingBoxTransformKernel.cpp",
227*c217d954SCole Faust          "src/runtime/CL/functions/CLBoundingBoxTransform.cpp"
228*c217d954SCole Faust        ]
229*c217d954SCole Faust      }
230*c217d954SCole Faust    },
231*c217d954SCole Faust    "Cast": {
232*c217d954SCole Faust      "files": {
233*c217d954SCole Faust        "common": [
234*c217d954SCole Faust          "src/gpu/cl/kernels/ClCastKernel.cpp",
235*c217d954SCole Faust          "src/gpu/cl/operators/ClCast.cpp",
236*c217d954SCole Faust          "src/runtime/CL/functions/CLCast.cpp"
237*c217d954SCole Faust        ]
238*c217d954SCole Faust      }
239*c217d954SCole Faust    },
240*c217d954SCole Faust    "ChannelShuffle": {
241*c217d954SCole Faust      "files": {
242*c217d954SCole Faust        "common": [
243*c217d954SCole Faust          "src/core/CL/kernels/CLChannelShuffleLayerKernel.cpp",
244*c217d954SCole Faust          "src/runtime/CL/functions/CLChannelShuffleLayer.cpp"
245*c217d954SCole Faust        ]
246*c217d954SCole Faust      }
247*c217d954SCole Faust    },
248*c217d954SCole Faust    "Comparison":  {
249*c217d954SCole Faust      "files": {
250*c217d954SCole Faust        "common": [
251*c217d954SCole Faust          "src/core/CL/kernels/CLComparisonKernel.cpp",
252*c217d954SCole Faust          "src/runtime/CL/functions/CLComparison.cpp"
253*c217d954SCole Faust        ]
254*c217d954SCole Faust      }
255*c217d954SCole Faust    },
256*c217d954SCole Faust    "Concatenate": {
257*c217d954SCole Faust      "files": {
258*c217d954SCole Faust        "common": [
259*c217d954SCole Faust          "src/gpu/cl/kernels/ClBatchConcatenateKernel.cpp",
260*c217d954SCole Faust          "src/gpu/cl/kernels/ClDepthConcatenateKernel.cpp",
261*c217d954SCole Faust          "src/gpu/cl/kernels/ClHeightConcatenateKernel.cpp",
262*c217d954SCole Faust          "src/gpu/cl/kernels/ClWidthConcatenate2TensorsKernel.cpp",
263*c217d954SCole Faust          "src/gpu/cl/kernels/ClWidthConcatenate4TensorsKernel.cpp",
264*c217d954SCole Faust          "src/gpu/cl/kernels/ClWidthConcatenateKernel.cpp",
265*c217d954SCole Faust          "src/gpu/cl/operators/ClConcatenate.cpp",
266*c217d954SCole Faust          "src/runtime/CL/functions/CLConcatenateLayer.cpp"
267*c217d954SCole Faust        ]
268*c217d954SCole Faust      }
269*c217d954SCole Faust    },
270*c217d954SCole Faust    "Conv2d": {
271*c217d954SCole Faust      "deps": [
272*c217d954SCole Faust        "Activation",
273*c217d954SCole Faust        "ElementwiseBinary",
274*c217d954SCole Faust        "FFT2D",
275*c217d954SCole Faust        "Gemm",
276*c217d954SCole Faust        "Mul",
277*c217d954SCole Faust        "Pad",
278*c217d954SCole Faust        "Permute",
279*c217d954SCole Faust        "Reduction",
280*c217d954SCole Faust        "Reshape",
281*c217d954SCole Faust        "Reverse",
282*c217d954SCole Faust        "Slice"
283*c217d954SCole Faust      ],
284*c217d954SCole Faust      "files": {
285*c217d954SCole Faust        "common": [
286*c217d954SCole Faust          "src/gpu/cl/kernels/ClDirectConv2dKernel.cpp",
287*c217d954SCole Faust          "src/gpu/cl/kernels/ClWinogradFilterTransformKernel.cpp",
288*c217d954SCole Faust          "src/gpu/cl/kernels/ClWinogradInputTransformKernel.cpp",
289*c217d954SCole Faust          "src/gpu/cl/kernels/ClWinogradOutputTransformKernel.cpp",
290*c217d954SCole Faust          "src/gpu/cl/kernels/ClIm2ColKernel.cpp",
291*c217d954SCole Faust          "src/gpu/cl/kernels/ClIndirectConv2dKernel.cpp",
292*c217d954SCole Faust          "src/gpu/cl/kernels/ClIndirectConv2dAddressPrecalculationKernel.cpp",
293*c217d954SCole Faust          "src/gpu/cl/kernels/ClCol2ImKernel.cpp",
294*c217d954SCole Faust          "src/gpu/cl/operators/ClConv2d.cpp",
295*c217d954SCole Faust          "src/gpu/cl/operators/ClDirectConv2d.cpp",
296*c217d954SCole Faust          "src/gpu/cl/operators/ClGemmConv2d.cpp",
297*c217d954SCole Faust          "src/gpu/cl/operators/ClIndirectConv2d.cpp",
298*c217d954SCole Faust          "src/gpu/cl/operators/ClWinogradConv2d.cpp",
299*c217d954SCole Faust          "src/gpu/cl/kernels/ClWeightsReshapeKernel.cpp",
300*c217d954SCole Faust          "src/runtime/CL/functions/CLConvolutionLayer.cpp",
301*c217d954SCole Faust          "src/runtime/CL/functions/CLDirectConvolutionLayer.cpp",
302*c217d954SCole Faust          "src/runtime/CL/functions/CLFFTConvolutionLayer.cpp",
303*c217d954SCole Faust          "src/runtime/CL/functions/CLGEMMConvolutionLayer.cpp",
304*c217d954SCole Faust          "src/runtime/CL/functions/CLIndirectConvolutionLayer.cpp",
305*c217d954SCole Faust          "src/runtime/CL/functions/CLWinogradConvolutionLayer.cpp"
306*c217d954SCole Faust        ]
307*c217d954SCole Faust      }
308*c217d954SCole Faust    },
309*c217d954SCole Faust    "Conv3d": {
310*c217d954SCole Faust      "files": {
311*c217d954SCole Faust        "common": [
312*c217d954SCole Faust          "src/gpu/cl/kernels/ClDirectConv3dKernel.cpp",
313*c217d954SCole Faust          "src/gpu/cl/operators/ClDirectConv3d.cpp",
314*c217d954SCole Faust          "src/runtime/CL/functions/CLConv3D.cpp"
315*c217d954SCole Faust        ]
316*c217d954SCole Faust      }
317*c217d954SCole Faust    },
318*c217d954SCole Faust    "Copy": {
319*c217d954SCole Faust      "files": {
320*c217d954SCole Faust        "common": [
321*c217d954SCole Faust          "src/gpu/cl/kernels/ClCopyKernel.cpp",
322*c217d954SCole Faust          "src/gpu/cl/operators/ClCopy.cpp",
323*c217d954SCole Faust          "src/runtime/CL/functions/CLCopy.cpp"
324*c217d954SCole Faust        ]
325*c217d954SCole Faust      }
326*c217d954SCole Faust    },
327*c217d954SCole Faust    "CropResize": {
328*c217d954SCole Faust      "deps": [ "Copy", "Fill", "Scale" ],
329*c217d954SCole Faust      "files": {
330*c217d954SCole Faust        "common": [
331*c217d954SCole Faust          "src/gpu/cl/kernels/ClCropKernel.cpp",
332*c217d954SCole Faust          "src/gpu/cl/operators/ClCrop.cpp",
333*c217d954SCole Faust          "src/runtime/CL/functions/CLCrop.cpp",
334*c217d954SCole Faust          "src/runtime/CL/functions/CLCropResize.cpp"
335*c217d954SCole Faust        ]
336*c217d954SCole Faust      }
337*c217d954SCole Faust    },
338*c217d954SCole Faust    "Deconv2d": {
339*c217d954SCole Faust      "deps": [ "Conv2d", "Reverse", "Transpose"],
340*c217d954SCole Faust      "files": {
341*c217d954SCole Faust        "common": [
342*c217d954SCole Faust          "src/core/CL/kernels/CLDeconvolutionLayerUpsampleKernel.cpp",
343*c217d954SCole Faust          "src/core/CL/kernels/CLDeconvolutionReshapeOutputKernel.cpp",
344*c217d954SCole Faust          "src/gpu/cl/kernels/ClTransposedConvolutionKernel.cpp",
345*c217d954SCole Faust          "src/gpu/cl/operators/ClTransposedConvolution.cpp",
346*c217d954SCole Faust          "src/runtime/CL/functions/CLDeconvolutionLayer.cpp",
347*c217d954SCole Faust          "src/runtime/CL/functions/CLDeconvolutionLayerUpsample.cpp",
348*c217d954SCole Faust          "src/runtime/CL/functions/CLDirectDeconvolutionLayer.cpp",
349*c217d954SCole Faust          "src/runtime/CL/functions/CLGEMMDeconvolutionLayer.cpp"
350*c217d954SCole Faust        ]
351*c217d954SCole Faust      }
352*c217d954SCole Faust    },
353*c217d954SCole Faust    "DepthConvert": {
354*c217d954SCole Faust      "deps": [ "Cast"],
355*c217d954SCole Faust      "files": {
356*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLDepthConvertLayer.cpp" ]
357*c217d954SCole Faust      }
358*c217d954SCole Faust    },
359*c217d954SCole Faust    "DepthToSpace": {
360*c217d954SCole Faust      "files": {
361*c217d954SCole Faust        "common": [
362*c217d954SCole Faust          "src/core/CL/kernels/CLDepthToSpaceLayerKernel.cpp",
363*c217d954SCole Faust          "src/runtime/CL/functions/CLDepthToSpaceLayer.cpp"
364*c217d954SCole Faust        ]
365*c217d954SCole Faust      }
366*c217d954SCole Faust    },
367*c217d954SCole Faust    "DepthwiseConv2d": {
368*c217d954SCole Faust      "deps": [ "Permute" ],
369*c217d954SCole Faust      "files": {
370*c217d954SCole Faust        "common": [
371*c217d954SCole Faust          "src/core/CL/kernels/CLDepthwiseConvolutionLayerNativeKernel.cpp",
372*c217d954SCole Faust          "src/runtime/CL/functions/CLDepthwiseConvolutionLayer.cpp"
373*c217d954SCole Faust        ]
374*c217d954SCole Faust      }
375*c217d954SCole Faust    },
376*c217d954SCole Faust    "Dequantize": {
377*c217d954SCole Faust      "files": {
378*c217d954SCole Faust        "common": [
379*c217d954SCole Faust          "src/gpu/cl/kernels/ClDequantizeKernel.cpp",
380*c217d954SCole Faust          "src/gpu/cl/operators/ClDequantize.cpp",
381*c217d954SCole Faust          "src/runtime/CL/functions/CLDequantizationLayer.cpp"
382*c217d954SCole Faust        ]
383*c217d954SCole Faust      }
384*c217d954SCole Faust    },
385*c217d954SCole Faust    "ElementwiseBinary": {
386*c217d954SCole Faust      "deps": ["Add", "Sub"],
387*c217d954SCole Faust      "files": {
388*c217d954SCole Faust        "common": [
389*c217d954SCole Faust          "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
390*c217d954SCole Faust          "src/gpu/cl/operators/ClElementwiseOperations.cpp",
391*c217d954SCole Faust          "src/runtime/CL/functions/CLElementwiseOperations.cpp"
392*c217d954SCole Faust        ]
393*c217d954SCole Faust      }
394*c217d954SCole Faust    },
395*c217d954SCole Faust    "ElementwiseUnary":{
396*c217d954SCole Faust      "files": {
397*c217d954SCole Faust        "common": [
398*c217d954SCole Faust          "src/gpu/cl/kernels/ClElementwiseUnaryKernel.cpp",
399*c217d954SCole Faust          "src/gpu/cl/operators/ClElementwiseUnary.cpp",
400*c217d954SCole Faust          "src/runtime/CL/functions/CLElementwiseUnaryLayer.cpp"
401*c217d954SCole Faust        ]
402*c217d954SCole Faust      }
403*c217d954SCole Faust    },
404*c217d954SCole Faust    "FFT1D": {
405*c217d954SCole Faust      "files": {
406*c217d954SCole Faust        "common": [
407*c217d954SCole Faust          "src/core/CL/kernels/CLFFTDigitReverseKernel.cpp",
408*c217d954SCole Faust          "src/core/CL/kernels/CLFFTRadixStageKernel.cpp",
409*c217d954SCole Faust          "src/core/CL/kernels/CLFFTScaleKernel.cpp",
410*c217d954SCole Faust          "src/runtime/CL/functions/CLFFT1D.cpp"
411*c217d954SCole Faust        ]
412*c217d954SCole Faust      }
413*c217d954SCole Faust    },
414*c217d954SCole Faust    "FFT2D": {
415*c217d954SCole Faust      "deps": [ "FFT1D" ],
416*c217d954SCole Faust      "files": {
417*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLFFT2D.cpp" ]
418*c217d954SCole Faust      }
419*c217d954SCole Faust    },
420*c217d954SCole Faust    "Fill": {
421*c217d954SCole Faust      "files": {
422*c217d954SCole Faust        "common": [
423*c217d954SCole Faust          "src/gpu/cl/kernels/ClFillKernel.cpp",
424*c217d954SCole Faust          "src/gpu/cl/operators/ClFill.cpp",
425*c217d954SCole Faust          "src/runtime/CL/functions/CLFill.cpp"
426*c217d954SCole Faust        ]
427*c217d954SCole Faust      }
428*c217d954SCole Faust    },
429*c217d954SCole Faust    "Flatten": {
430*c217d954SCole Faust      "files": {
431*c217d954SCole Faust        "common": [
432*c217d954SCole Faust          "src/gpu/cl/operators/ClFlatten.cpp",
433*c217d954SCole Faust          "src/runtime/CL/functions/CLFlattenLayer.cpp"
434*c217d954SCole Faust        ]
435*c217d954SCole Faust      }
436*c217d954SCole Faust    },
437*c217d954SCole Faust    "Floor": {
438*c217d954SCole Faust      "files": {
439*c217d954SCole Faust        "common": [
440*c217d954SCole Faust          "src/gpu/cl/kernels/ClFloorKernel.cpp",
441*c217d954SCole Faust          "src/gpu/cl/operators/ClFloor.cpp",
442*c217d954SCole Faust          "src/runtime/CL/functions/CLFloor.cpp"
443*c217d954SCole Faust        ]
444*c217d954SCole Faust      }
445*c217d954SCole Faust    },
446*c217d954SCole Faust    "FullyConnected": {
447*c217d954SCole Faust      "deps": [ "Flatten", "Gemm", "Transpose"],
448*c217d954SCole Faust      "files": {
449*c217d954SCole Faust        "common": [
450*c217d954SCole Faust          "src/gpu/cl/kernels/ClConvertFullyConnectedWeightsKernel.cpp",
451*c217d954SCole Faust          "src/gpu/cl/operators/ClConvertFullyConnectedWeights.cpp",
452*c217d954SCole Faust          "src/gpu/cl/operators/ClFullyConnected.cpp",
453*c217d954SCole Faust          "src/runtime/CL/functions/CLConvertFullyConnectedWeights.cpp",
454*c217d954SCole Faust          "src/runtime/CL/functions/CLFullyConnectedLayer.cpp"
455*c217d954SCole Faust        ]
456*c217d954SCole Faust      }
457*c217d954SCole Faust    },
458*c217d954SCole Faust    "Gather": {
459*c217d954SCole Faust      "files": {
460*c217d954SCole Faust        "common": [
461*c217d954SCole Faust          "src/core/CL/kernels/CLGatherKernel.cpp",
462*c217d954SCole Faust          "src/runtime/CL/functions/CLGather.cpp"]
463*c217d954SCole Faust      }
464*c217d954SCole Faust    },
465*c217d954SCole Faust    "Gemm": {
466*c217d954SCole Faust      "deps": [ "Cast" ],
467*c217d954SCole Faust      "files": {
468*c217d954SCole Faust        "common": [
469*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/ClGemmHelpers.cpp",
470*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeBifrost.cpp",
471*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeMidgard.cpp",
472*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/native/ClGemmDefaultConfigNativeValhall.cpp",
473*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedBifrost.cpp",
474*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/reshaped/ClGemmDefaultConfigReshapedValhall.cpp",
475*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyBifrost.cpp",
476*c217d954SCole Faust          "src/gpu/cl/kernels/gemm/reshaped_only_rhs/ClGemmDefaultConfigReshapedRhsOnlyValhall.cpp",
477*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyNativeKernel.cpp",
478*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedKernel.cpp",
479*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsKernel.cpp",
480*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
481*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpOffsetContributionKernel.cpp",
482*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpOffsetContributionOutputStageKernel.cpp",
483*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFixedPointKernel.cpp",
484*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleByFloatKernel.cpp",
485*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpQuantizeDownInt32ScaleKernel.cpp",
486*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmMatrixMultiplyNativeKernel.cpp",
487*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsMMULKernel.cpp",
488*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedKernel.cpp",
489*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmMatrixMultiplyReshapedOnlyRhsKernel.cpp",
490*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmReshapeLhsMatrixKernel.cpp",
491*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmReshapeRhsMatrixKernel.cpp",
492*c217d954SCole Faust          "src/gpu/cl/kernels/ClGemmLowpReductionKernel.cpp",
493*c217d954SCole Faust          "src/gpu/cl/operators/ClGemm.cpp",
494*c217d954SCole Faust          "src/gpu/cl/operators/ClGemmLowpMatrixMultiplyCore.cpp",
495*c217d954SCole Faust          "src/gpu/cl/operators/ClGemmLowpOutputStage.cpp",
496*c217d954SCole Faust          "src/runtime/CL/gemm/CLGEMMDefaultTypeBifrost.cpp",
497*c217d954SCole Faust          "src/runtime/CL/gemm/CLGEMMDefaultTypeMidgard.cpp",
498*c217d954SCole Faust          "src/runtime/CL/gemm/CLGEMMDefaultTypeValhall.cpp",
499*c217d954SCole Faust          "src/runtime/CL/gemm_auto_heuristics/CLGEMMAutoHeuristics.cpp",
500*c217d954SCole Faust          "src/runtime/CL/functions/CLGEMM.cpp",
501*c217d954SCole Faust          "src/runtime/CL/functions/CLGEMMLowpMatrixMultiplyCore.cpp",
502*c217d954SCole Faust          "src/runtime/CL/functions/CLGEMMLowpOutputStage.cpp",
503*c217d954SCole Faust          "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigBifrost.cpp",
504*c217d954SCole Faust          "src/runtime/heuristics/direct_conv/ClDirectConvDefaultConfigValhall.cpp",
505*c217d954SCole Faust          "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigBifrost.cpp",
506*c217d954SCole Faust          "src/runtime/heuristics/dwc_native/ClDWCNativeDefaultConfigValhall.cpp",
507*c217d954SCole Faust          "src/runtime/heuristics/dwc_native/ClDWCNativeHeuristicsHelpers.cpp",
508*c217d954SCole Faust          "src/runtime/heuristics/indirect_conv/ClIndirectConvDefaultConfigValhall.cpp"
509*c217d954SCole Faust        ]
510*c217d954SCole Faust      }
511*c217d954SCole Faust    },
512*c217d954SCole Faust    "GenerateProposals": {
513*c217d954SCole Faust      "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
514*c217d954SCole Faust      "files": {
515*c217d954SCole Faust        "common": [
516*c217d954SCole Faust          "src/core/CL/kernels/CLGenerateProposalsLayerKernel.cpp",
517*c217d954SCole Faust          "src/runtime/CL/functions/CLGenerateProposalsLayer.cpp"
518*c217d954SCole Faust        ]
519*c217d954SCole Faust      }
520*c217d954SCole Faust    },
521*c217d954SCole Faust    "InstanceNormalize": {
522*c217d954SCole Faust      "files": {
523*c217d954SCole Faust        "common": [
524*c217d954SCole Faust          "src/core/CL/kernels/CLInstanceNormalizationLayerKernel.cpp",
525*c217d954SCole Faust          "src/runtime/CL/functions/CLInstanceNormalizationLayer.cpp"
526*c217d954SCole Faust        ]
527*c217d954SCole Faust      }
528*c217d954SCole Faust    },
529*c217d954SCole Faust    "L2Normalize": {
530*c217d954SCole Faust      "deps": [ "Reduction" ],
531*c217d954SCole Faust      "files": {
532*c217d954SCole Faust        "common": [
533*c217d954SCole Faust          "src/core/CL/kernels/CLL2NormalizeLayerKernel.cpp",
534*c217d954SCole Faust          "src/runtime/CL/functions/CLL2NormalizeLayer.cpp"
535*c217d954SCole Faust        ]
536*c217d954SCole Faust      }
537*c217d954SCole Faust    },
538*c217d954SCole Faust    "Logical": {
539*c217d954SCole Faust      "files": {
540*c217d954SCole Faust        "common": [
541*c217d954SCole Faust          "src/gpu/cl/operators/ClLogicalNot.cpp",
542*c217d954SCole Faust          "src/runtime/CL/functions/CLLogicalAnd.cpp",
543*c217d954SCole Faust          "src/runtime/CL/functions/CLLogicalNot.cpp",
544*c217d954SCole Faust          "src/runtime/CL/functions/CLLogicalOr.cpp"
545*c217d954SCole Faust        ]
546*c217d954SCole Faust      }
547*c217d954SCole Faust    },
548*c217d954SCole Faust    "LSTM": {
549*c217d954SCole Faust      "deps": [
550*c217d954SCole Faust        "Activation",
551*c217d954SCole Faust        "Concatenate",
552*c217d954SCole Faust        "Copy",
553*c217d954SCole Faust        "Dequantize",
554*c217d954SCole Faust        "ElementwiseBinary",
555*c217d954SCole Faust        "Fill",
556*c217d954SCole Faust        "FullyConnected",
557*c217d954SCole Faust        "Gemm",
558*c217d954SCole Faust        "MeanStdDevNormalize",
559*c217d954SCole Faust        "Mul",
560*c217d954SCole Faust        "Quantize",
561*c217d954SCole Faust        "Slice",
562*c217d954SCole Faust        "Transpose"
563*c217d954SCole Faust      ],
564*c217d954SCole Faust      "files": {
565*c217d954SCole Faust        "common": [
566*c217d954SCole Faust          "src/core/CL/kernels/CLQLSTMLayerNormalizationKernel.cpp",
567*c217d954SCole Faust          "src/runtime/CL/functions/CLQLSTMLayer.cpp",
568*c217d954SCole Faust          "src/runtime/CL/functions/CLLSTMLayer.cpp",
569*c217d954SCole Faust          "src/runtime/CL/functions/CLLSTMLayerQuantized.cpp"
570*c217d954SCole Faust        ]
571*c217d954SCole Faust      }
572*c217d954SCole Faust    },
573*c217d954SCole Faust    "MaxUnpool2d": {
574*c217d954SCole Faust      "deps": [ "Fill" ],
575*c217d954SCole Faust      "files": {
576*c217d954SCole Faust        "common": [
577*c217d954SCole Faust          "src/core/CL/kernels/CLMaxUnpoolingLayerKernel.cpp",
578*c217d954SCole Faust          "src/runtime/CL/functions/CLMaxUnpoolingLayer.cpp"
579*c217d954SCole Faust        ]
580*c217d954SCole Faust      }
581*c217d954SCole Faust    },
582*c217d954SCole Faust    "MeanStdDevNormalize": {
583*c217d954SCole Faust      "deps": [ "Reduction" ],
584*c217d954SCole Faust      "files": {
585*c217d954SCole Faust        "common": [
586*c217d954SCole Faust          "src/core/CL/kernels/CLMeanStdDevNormalizationKernel.cpp",
587*c217d954SCole Faust          "src/runtime/CL/functions/CLMeanStdDevNormalizationLayer.cpp",
588*c217d954SCole Faust          "src/runtime/CL/functions/CLReduceMean.cpp"
589*c217d954SCole Faust        ]
590*c217d954SCole Faust      }
591*c217d954SCole Faust    },
592*c217d954SCole Faust    "Mul": {
593*c217d954SCole Faust      "files": {
594*c217d954SCole Faust        "common": [
595*c217d954SCole Faust          "src/gpu/cl/kernels/ClMulKernel.cpp",
596*c217d954SCole Faust          "src/gpu/cl/operators/ClMul.cpp",
597*c217d954SCole Faust          "src/runtime/CL/functions/CLPixelWiseMultiplication.cpp"
598*c217d954SCole Faust        ]
599*c217d954SCole Faust      }
600*c217d954SCole Faust    },
601*c217d954SCole Faust    "Normalize": {
602*c217d954SCole Faust      "files": {
603*c217d954SCole Faust        "common": [
604*c217d954SCole Faust          "src/core/CL/kernels/CLNormalizationLayerKernel.cpp",
605*c217d954SCole Faust          "src/runtime/CL/functions/CLNormalizationLayer.cpp"
606*c217d954SCole Faust        ]
607*c217d954SCole Faust      }
608*c217d954SCole Faust    },
609*c217d954SCole Faust    "Pad": {
610*c217d954SCole Faust      "deps": [ "Copy" ],
611*c217d954SCole Faust      "files": {
612*c217d954SCole Faust        "common": [
613*c217d954SCole Faust          "src/core/CL/kernels/CLPadLayerKernel.cpp",
614*c217d954SCole Faust          "src/runtime/CL/functions/CLPadLayer.cpp"
615*c217d954SCole Faust        ]
616*c217d954SCole Faust      }
617*c217d954SCole Faust    },
618*c217d954SCole Faust    "Permute": {
619*c217d954SCole Faust      "files": {
620*c217d954SCole Faust        "common": [
621*c217d954SCole Faust          "src/gpu/cl/kernels/ClPermuteKernel.cpp",
622*c217d954SCole Faust          "src/gpu/cl/operators/ClPermute.cpp",
623*c217d954SCole Faust          "src/runtime/CL/functions/CLPermute.cpp"
624*c217d954SCole Faust        ]
625*c217d954SCole Faust      }
626*c217d954SCole Faust    },
627*c217d954SCole Faust    "Pool2d": {
628*c217d954SCole Faust      "files": {
629*c217d954SCole Faust        "common": [
630*c217d954SCole Faust          "src/gpu/cl/kernels/ClPool2dKernel.cpp",
631*c217d954SCole Faust          "src/gpu/cl/operators/ClPool2d.cpp",
632*c217d954SCole Faust          "src/runtime/CL/functions/CLPoolingLayer.cpp"
633*c217d954SCole Faust        ]
634*c217d954SCole Faust      }
635*c217d954SCole Faust    },
636*c217d954SCole Faust    "Pool3d": {
637*c217d954SCole Faust      "files": {
638*c217d954SCole Faust        "common": [
639*c217d954SCole Faust          "src/gpu/cl/kernels/ClPool3dKernel.cpp",
640*c217d954SCole Faust          "src/gpu/cl/operators/ClPool3d.cpp",
641*c217d954SCole Faust          "src/runtime/CL/functions/CLPooling3dLayer.cpp"
642*c217d954SCole Faust        ]
643*c217d954SCole Faust      }
644*c217d954SCole Faust    },
645*c217d954SCole Faust    "PRelu": {
646*c217d954SCole Faust      "deps": [ "ElementwiseBinary" ],
647*c217d954SCole Faust      "files": {
648*c217d954SCole Faust        "common": [
649*c217d954SCole Faust          "src/gpu/cl/operators/ClPRelu.cpp",
650*c217d954SCole Faust          "src/runtime/CL/functions/CLPReluLayer.cpp"
651*c217d954SCole Faust        ]
652*c217d954SCole Faust      }
653*c217d954SCole Faust    },
654*c217d954SCole Faust    "PriorBox": {
655*c217d954SCole Faust      "files": {
656*c217d954SCole Faust        "common": [
657*c217d954SCole Faust          "src/core/CL/kernels/CLPriorBoxLayerKernel.cpp",
658*c217d954SCole Faust          "src/runtime/CL/functions/CLPriorBoxLayer.cpp"
659*c217d954SCole Faust        ]
660*c217d954SCole Faust      }
661*c217d954SCole Faust    },
662*c217d954SCole Faust    "Quantize": {
663*c217d954SCole Faust      "files": {
664*c217d954SCole Faust        "common": [
665*c217d954SCole Faust          "src/gpu/cl/kernels/ClQuantizeKernel.cpp",
666*c217d954SCole Faust          "src/gpu/cl/operators/ClQuantize.cpp",
667*c217d954SCole Faust          "src/runtime/CL/functions/CLQuantizationLayer.cpp"
668*c217d954SCole Faust        ]
669*c217d954SCole Faust      }
670*c217d954SCole Faust    },
671*c217d954SCole Faust    "Range": {
672*c217d954SCole Faust      "files": {
673*c217d954SCole Faust        "common": [
674*c217d954SCole Faust          "src/core/CL/kernels/CLRangeKernel.cpp",
675*c217d954SCole Faust          "src/runtime/CL/functions/CLRange.cpp"
676*c217d954SCole Faust        ]
677*c217d954SCole Faust      }
678*c217d954SCole Faust    },
679*c217d954SCole Faust    "Reduction": {
680*c217d954SCole Faust      "deps": [ "Reshape" ],
681*c217d954SCole Faust      "files": {
682*c217d954SCole Faust        "common": [
683*c217d954SCole Faust          "src/core/CL/kernels/CLReductionOperationKernel.cpp",
684*c217d954SCole Faust          "src/runtime/CL/functions/CLReductionOperation.cpp"
685*c217d954SCole Faust        ]
686*c217d954SCole Faust      }
687*c217d954SCole Faust    },
688*c217d954SCole Faust    "Reorg": {
689*c217d954SCole Faust      "files": {
690*c217d954SCole Faust        "common": [
691*c217d954SCole Faust          "src/core/CL/kernels/CLReorgLayerKernel.cpp",
692*c217d954SCole Faust          "src/runtime/CL/functions/CLReorgLayer.cpp"
693*c217d954SCole Faust        ]
694*c217d954SCole Faust      }
695*c217d954SCole Faust    },
696*c217d954SCole Faust    "Reshape": {
697*c217d954SCole Faust      "files": {
698*c217d954SCole Faust        "common": [
699*c217d954SCole Faust          "src/gpu/cl/kernels/ClReshapeKernel.cpp",
700*c217d954SCole Faust          "src/gpu/cl/operators/ClReshape.cpp",
701*c217d954SCole Faust          "src/runtime/CL/functions/CLReshapeLayer.cpp"
702*c217d954SCole Faust        ]
703*c217d954SCole Faust      }
704*c217d954SCole Faust    },
705*c217d954SCole Faust    "Reverse": {
706*c217d954SCole Faust      "files": {
707*c217d954SCole Faust        "common": [
708*c217d954SCole Faust          "src/core/CL/kernels/CLReverseKernel.cpp",
709*c217d954SCole Faust          "src/runtime/CL/functions/CLReverse.cpp"
710*c217d954SCole Faust        ]
711*c217d954SCole Faust      }
712*c217d954SCole Faust    },
713*c217d954SCole Faust    "RNN": {
714*c217d954SCole Faust      "deps": [ "Activation", "Cast", "ElementwiseBinary", "FullyConnected", "Gemm"],
715*c217d954SCole Faust      "files": {
716*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLRNNLayer.cpp" ]
717*c217d954SCole Faust      }
718*c217d954SCole Faust    },
719*c217d954SCole Faust    "ROIAlign": {
720*c217d954SCole Faust      "files": {
721*c217d954SCole Faust        "common": [
722*c217d954SCole Faust          "src/core/CL/kernels/CLROIAlignLayerKernel.cpp",
723*c217d954SCole Faust          "src/runtime/CL/functions/CLROIAlignLayer.cpp"
724*c217d954SCole Faust        ]
725*c217d954SCole Faust      }
726*c217d954SCole Faust    },
727*c217d954SCole Faust    "ROIPool2d": {
728*c217d954SCole Faust      "files": {
729*c217d954SCole Faust        "common": [
730*c217d954SCole Faust          "src/core/CL/kernels/CLROIPoolingLayerKernel.cpp",
731*c217d954SCole Faust          "src/runtime/CL/functions/CLROIPoolingLayer.cpp"
732*c217d954SCole Faust        ]
733*c217d954SCole Faust      }
734*c217d954SCole Faust    },
735*c217d954SCole Faust    "Scale": {
736*c217d954SCole Faust      "files": {
737*c217d954SCole Faust        "common": [
738*c217d954SCole Faust          "src/gpu/cl/kernels/ClScaleKernel.cpp",
739*c217d954SCole Faust          "src/gpu/cl/operators/ClScale.cpp",
740*c217d954SCole Faust          "src/runtime/CL/functions/CLScale.cpp"
741*c217d954SCole Faust        ]
742*c217d954SCole Faust      }
743*c217d954SCole Faust    },
744*c217d954SCole Faust    "Select": {
745*c217d954SCole Faust      "files": {
746*c217d954SCole Faust        "common": [
747*c217d954SCole Faust          "src/core/CL/kernels/CLSelectKernel.cpp",
748*c217d954SCole Faust          "src/runtime/CL/functions/CLSelect.cpp"
749*c217d954SCole Faust        ]
750*c217d954SCole Faust      }
751*c217d954SCole Faust    },
752*c217d954SCole Faust    "Slice": {
753*c217d954SCole Faust      "deps": [ "StridedSlice" ],
754*c217d954SCole Faust      "files": {
755*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLSlice.cpp" ]
756*c217d954SCole Faust      }
757*c217d954SCole Faust    },
758*c217d954SCole Faust    "Softmax": {
759*c217d954SCole Faust      "deps": [ "Permute" ],
760*c217d954SCole Faust      "files": {
761*c217d954SCole Faust        "common": [
762*c217d954SCole Faust          "src/gpu/cl/kernels/ClSoftmaxKernel.cpp",
763*c217d954SCole Faust          "src/gpu/cl/operators/ClSoftmax.cpp",
764*c217d954SCole Faust          "src/runtime/CL/functions/CLSoftmaxLayer.cpp"
765*c217d954SCole Faust        ]
766*c217d954SCole Faust      }
767*c217d954SCole Faust    },
768*c217d954SCole Faust    "SpaceToBatch": {
769*c217d954SCole Faust      "files": {
770*c217d954SCole Faust        "common": [
771*c217d954SCole Faust          "src/core/CL/kernels/CLSpaceToBatchLayerKernel.cpp",
772*c217d954SCole Faust          "src/runtime/CL/functions/CLSpaceToBatchLayer.cpp"
773*c217d954SCole Faust        ]
774*c217d954SCole Faust      }
775*c217d954SCole Faust    },
776*c217d954SCole Faust    "SpaceToDepth": {
777*c217d954SCole Faust      "files": {
778*c217d954SCole Faust        "common": [
779*c217d954SCole Faust          "src/core/CL/kernels/CLSpaceToDepthLayerKernel.cpp",
780*c217d954SCole Faust          "src/runtime/CL/functions/CLSpaceToDepthLayer.cpp"
781*c217d954SCole Faust        ]
782*c217d954SCole Faust      }
783*c217d954SCole Faust    },
784*c217d954SCole Faust    "Split": {
785*c217d954SCole Faust      "deps": [ "StridedSlice" ],
786*c217d954SCole Faust      "files": {
787*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLSplit.cpp" ]
788*c217d954SCole Faust      }
789*c217d954SCole Faust    },
790*c217d954SCole Faust    "Stack": {
791*c217d954SCole Faust      "files": {
792*c217d954SCole Faust        "common": [
793*c217d954SCole Faust          "src/core/CL/kernels/CLStackLayerKernel.cpp",
794*c217d954SCole Faust          "src/runtime/CL/functions/CLStackLayer.cpp"
795*c217d954SCole Faust        ]
796*c217d954SCole Faust      }
797*c217d954SCole Faust    },
798*c217d954SCole Faust    "StridedSlice": {
799*c217d954SCole Faust      "files": {
800*c217d954SCole Faust        "common": [
801*c217d954SCole Faust          "src/core/CL/kernels/CLStridedSliceKernel.cpp",
802*c217d954SCole Faust          "src/runtime/CL/functions/CLStridedSlice.cpp"
803*c217d954SCole Faust        ]
804*c217d954SCole Faust      }
805*c217d954SCole Faust    },
806*c217d954SCole Faust    "Sub": {
807*c217d954SCole Faust      "files": {
808*c217d954SCole Faust        "common": [
809*c217d954SCole Faust          "src/gpu/cl/kernels/ClElementwiseKernel.cpp",
810*c217d954SCole Faust          "src/gpu/cl/operators/ClSub.cpp"
811*c217d954SCole Faust        ]
812*c217d954SCole Faust      }
813*c217d954SCole Faust    },
814*c217d954SCole Faust    "Tile": {
815*c217d954SCole Faust      "files": {
816*c217d954SCole Faust        "common": [
817*c217d954SCole Faust          "src/core/CL/kernels/CLTileKernel.cpp",
818*c217d954SCole Faust          "src/runtime/CL/functions/CLTile.cpp"
819*c217d954SCole Faust        ]
820*c217d954SCole Faust      }
821*c217d954SCole Faust    },
822*c217d954SCole Faust    "Transpose": {
823*c217d954SCole Faust      "files": {
824*c217d954SCole Faust        "common": [
825*c217d954SCole Faust          "src/gpu/cl/kernels/ClTransposeKernel.cpp",
826*c217d954SCole Faust          "src/gpu/cl/operators/ClTranspose.cpp",
827*c217d954SCole Faust          "src/runtime/CL/functions/CLTranspose.cpp"
828*c217d954SCole Faust        ]
829*c217d954SCole Faust      }
830*c217d954SCole Faust    },
831*c217d954SCole Faust    "Unstack": {
832*c217d954SCole Faust      "deps": [ "StridedSlice" ],
833*c217d954SCole Faust      "files": {
834*c217d954SCole Faust        "common": [ "src/runtime/CL/functions/CLUnstack.cpp" ]
835*c217d954SCole Faust      }
836*c217d954SCole Faust    },
837*c217d954SCole Faust    "YUVNormalize": {
838*c217d954SCole Faust      "files": {
839*c217d954SCole Faust        "common": [
840*c217d954SCole Faust          "src/core/CL/kernels/CLNormalizePlanarYUVLayerKernel.cpp",
841*c217d954SCole Faust          "src/runtime/CL/functions/CLNormalizePlanarYUVLayer.cpp"
842*c217d954SCole Faust        ]
843*c217d954SCole Faust      }
844*c217d954SCole Faust    }
845*c217d954SCole Faust  }
846*c217d954SCole Faust},
847*c217d954SCole Faust  "cpu": {
848*c217d954SCole Faust    "common": [
849*c217d954SCole Faust      "src/cpu/CpuContext.cpp",
850*c217d954SCole Faust      "src/cpu/CpuQueue.cpp",
851*c217d954SCole Faust      "src/cpu/CpuTensor.cpp",
852*c217d954SCole Faust      "src/core/NEON/kernels/NEFillBorderKernel.cpp",
853*c217d954SCole Faust      "src/runtime/NEON/INEOperator.cpp",
854*c217d954SCole Faust      "src/runtime/NEON/INESimpleFunction.cpp",
855*c217d954SCole Faust      "src/runtime/NEON/INESimpleFunctionNoBorder.cpp"
856*c217d954SCole Faust    ],
857*c217d954SCole Faust    "operators": {
858*c217d954SCole Faust      "Activation": {
859*c217d954SCole Faust        "files": {
860*c217d954SCole Faust          "common": [
861*c217d954SCole Faust            "src/cpu/operators/CpuActivation.cpp",
862*c217d954SCole Faust            "src/cpu/kernels/CpuActivationKernel.cpp",
863*c217d954SCole Faust            "src/runtime/NEON/functions/NEActivationLayer.cpp"
864*c217d954SCole Faust          ],
865*c217d954SCole Faust          "neon": {
866*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/activation/generic/neon/fp16.cpp" ],
867*c217d954SCole Faust            "fp32": [ "src/cpu/kernels/activation/generic/neon/fp32.cpp" ],
868*c217d954SCole Faust            "qasymm8": [
869*c217d954SCole Faust              "src/cpu/kernels/activation/generic/neon/qasymm8.cpp",
870*c217d954SCole Faust              "src/cpu/kernels/activation/generic/neon/lut.cpp"
871*c217d954SCole Faust            ],
872*c217d954SCole Faust            "qasymm8_signed": [
873*c217d954SCole Faust              "src/cpu/kernels/activation/generic/neon/qasymm8_signed.cpp",
874*c217d954SCole Faust              "src/cpu/kernels/activation/generic/neon/lut.cpp"
875*c217d954SCole Faust            ],
876*c217d954SCole Faust            "qsymm16": [ "src/cpu/kernels/activation/generic/neon/qsymm16.cpp" ]
877*c217d954SCole Faust          },
878*c217d954SCole Faust          "sve": {
879*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/activation/generic/sve/fp16.cpp" ],
880*c217d954SCole Faust            "fp32": [ "src/cpu/kernels/activation/generic/sve/fp32.cpp" ],
881*c217d954SCole Faust            "qasymm8": ["src/cpu/kernels/activation/generic/sve/lut.cpp"]
882*c217d954SCole Faust          },
883*c217d954SCole Faust          "sve2":{
884*c217d954SCole Faust            "qasymm8": [ "src/cpu/kernels/activation/generic/sve2/qasymm8.cpp" ],
885*c217d954SCole Faust            "qasymm8_signed": [ "src/cpu/kernels/activation/generic/sve2/qasymm8_signed.cpp" ],
886*c217d954SCole Faust            "qsymm16": [ "src/cpu/kernels/activation/generic/sve2/qsymm16.cpp" ]
887*c217d954SCole Faust          }
888*c217d954SCole Faust        }
889*c217d954SCole Faust      },
890*c217d954SCole Faust      "ArgMinMax": {
891*c217d954SCole Faust        "deps": [ "Reduction" ],
892*c217d954SCole Faust        "files": {
893*c217d954SCole Faust          "common": [ "src/runtime/NEON/functions/NEArgMinMaxLayer.cpp" ]
894*c217d954SCole Faust        }
895*c217d954SCole Faust      },
896*c217d954SCole Faust      "Add": {
897*c217d954SCole Faust        "files": {
898*c217d954SCole Faust          "common": [
899*c217d954SCole Faust            "src/cpu/operators/CpuAdd.cpp",
900*c217d954SCole Faust            "src/cpu/kernels/CpuAddKernel.cpp",
901*c217d954SCole Faust            "src/runtime/NEON/functions/NEArithmeticAddition.cpp"
902*c217d954SCole Faust          ],
903*c217d954SCole Faust          "neon": {
904*c217d954SCole Faust            "common": ["src/cpu/kernels/add/generic/neon/impl.cpp"],
905*c217d954SCole Faust            "fp32":["src/cpu/kernels/add/generic/neon/fp32.cpp"],
906*c217d954SCole Faust            "fp16":["src/cpu/kernels/add/generic/neon/fp16.cpp"],
907*c217d954SCole Faust            "integer":["src/cpu/kernels/add/generic/neon/integer.cpp"],
908*c217d954SCole Faust            "qasymm8": ["src/cpu/kernels/add/generic/neon/qasymm8.cpp"],
909*c217d954SCole Faust            "qasymm8_signed": ["src/cpu/kernels/add/generic/neon/qasymm8_signed.cpp"],
910*c217d954SCole Faust            "qsymm16": ["src/cpu/kernels/add/generic/neon/qsymm16.cpp"]
911*c217d954SCole Faust          },
912*c217d954SCole Faust          "sve": {
913*c217d954SCole Faust            "common": [ "src/cpu/kernels/add/generic/sve/impl.cpp" ],
914*c217d954SCole Faust            "integer":["src/cpu/kernels/add/generic/sve/integer.cpp"],
915*c217d954SCole Faust            "fp32":["src/cpu/kernels/add/generic/sve/fp32.cpp"],
916*c217d954SCole Faust            "fp16":["src/cpu/kernels/add/generic/sve/fp16.cpp"]
917*c217d954SCole Faust          },
918*c217d954SCole Faust          "sve2": {
919*c217d954SCole Faust            "qasymm8": [ "src/cpu/kernels/add/generic/sve2/qasymm8.cpp" ],
920*c217d954SCole Faust            "qasymm8_signed": [ "src/cpu/kernels/add/generic/sve2/qasymm8_signed.cpp" ],
921*c217d954SCole Faust            "qsymm16": [ "src/cpu/kernels/add/generic/sve2/qsymm16.cpp" ]
922*c217d954SCole Faust          }
923*c217d954SCole Faust        }
924*c217d954SCole Faust      },
925*c217d954SCole Faust      "AddMulAdd": {
926*c217d954SCole Faust        "files": {
927*c217d954SCole Faust          "common": [
928*c217d954SCole Faust            "src/cpu/operators/CpuAddMulAdd.cpp",
929*c217d954SCole Faust            "src/cpu/kernels/CpuAddMulAddKernel.cpp",
930*c217d954SCole Faust            "src/runtime/NEON/functions/NEAddMulAdd.cpp"
931*c217d954SCole Faust          ],
932*c217d954SCole Faust          "neon": {
933*c217d954SCole Faust            "fp32":["src/cpu/kernels/addmuladd/generic/neon/fp32.cpp"],
934*c217d954SCole Faust            "fp16":["src/cpu/kernels/addmuladd/generic/neon/fp16.cpp"],
935*c217d954SCole Faust            "qasymm8": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8.cpp"],
936*c217d954SCole Faust            "qasymm8_signed": ["src/cpu/kernels/addmuladd/generic/neon/qasymm8_signed.cpp"]
937*c217d954SCole Faust          }
938*c217d954SCole Faust        }
939*c217d954SCole Faust      },
940*c217d954SCole Faust      "BatchNormalize": {
941*c217d954SCole Faust        "files": {
942*c217d954SCole Faust          "common": [
943*c217d954SCole Faust            "src/core/NEON/kernels/NEBatchNormalizationLayerKernel.cpp",
944*c217d954SCole Faust            "src/core/NEON/kernels/NEFuseBatchNormalizationKernel.cpp",
945*c217d954SCole Faust            "src/runtime/NEON/functions/NEBatchNormalizationLayer.cpp",
946*c217d954SCole Faust            "src/runtime/NEON/functions/NEFuseBatchNormalization.cpp"
947*c217d954SCole Faust          ],
948*c217d954SCole Faust          "neon": {
949*c217d954SCole Faust            "common": [
950*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/generic/impl.cpp",
951*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/nchw/all.cpp",
952*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/impl.cpp"
953*c217d954SCole Faust            ],
954*c217d954SCole Faust            "fp16": [
955*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/generic/fp16.cpp",
956*c217d954SCole Faust              "src/core/NEON/kernels/batchnormalization/impl/NEON/fp16.cpp",
957*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp16.cpp"
958*c217d954SCole Faust            ],
959*c217d954SCole Faust            "fp32": [
960*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/generic/fp32.cpp",
961*c217d954SCole Faust              "src/core/NEON/kernels/batchnormalization/impl/NEON/fp32.cpp",
962*c217d954SCole Faust              "src/cpu/kernels/fuse_batch_normalization/nhwc/neon/fp32.cpp"
963*c217d954SCole Faust            ]
964*c217d954SCole Faust          },
965*c217d954SCole Faust          "sve": {
966*c217d954SCole Faust            "fp16": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp16.cpp" ],
967*c217d954SCole Faust            "fp32": [ "src/core/NEON/kernels/batchnormalization/impl/SVE/fp32.cpp" ]
968*c217d954SCole Faust          }
969*c217d954SCole Faust        }
970*c217d954SCole Faust      },
971*c217d954SCole Faust      "BatchToSpace": {
972*c217d954SCole Faust        "files": {
973*c217d954SCole Faust          "common": [
974*c217d954SCole Faust            "src/core/NEON/kernels/NEBatchToSpaceLayerKernel.cpp",
975*c217d954SCole Faust            "src/runtime/NEON/functions/NEBatchToSpaceLayer.cpp"
976*c217d954SCole Faust          ]
977*c217d954SCole Faust        }
978*c217d954SCole Faust      },
979*c217d954SCole Faust      "BitwiseAnd": {
980*c217d954SCole Faust        "files": {
981*c217d954SCole Faust          "common": [
982*c217d954SCole Faust            "src/core/NEON/kernels/NEBitwiseAndKernel.cpp",
983*c217d954SCole Faust            "src/runtime/NEON/functions/NEBitwiseAnd.cpp"
984*c217d954SCole Faust          ]
985*c217d954SCole Faust        }
986*c217d954SCole Faust      },
987*c217d954SCole Faust      "BitwiseNot": {
988*c217d954SCole Faust        "files": {
989*c217d954SCole Faust          "common": [
990*c217d954SCole Faust            "src/core/NEON/kernels/NEBitwiseNotKernel.cpp",
991*c217d954SCole Faust            "src/runtime/NEON/functions/NEBitwiseNot.cpp"
992*c217d954SCole Faust          ]
993*c217d954SCole Faust        }
994*c217d954SCole Faust      },
995*c217d954SCole Faust      "BitwiseOr": {
996*c217d954SCole Faust        "files": {
997*c217d954SCole Faust          "common": [
998*c217d954SCole Faust            "src/core/NEON/kernels/NEBitwiseOrKernel.cpp",
999*c217d954SCole Faust            "src/runtime/NEON/functions/NEBitwiseOr.cpp"
1000*c217d954SCole Faust          ]
1001*c217d954SCole Faust        }
1002*c217d954SCole Faust      },
1003*c217d954SCole Faust      "BitwiseXor": {
1004*c217d954SCole Faust        "files": {
1005*c217d954SCole Faust          "common": [
1006*c217d954SCole Faust            "src/core/NEON/kernels/NEBitwiseXorKernel.cpp",
1007*c217d954SCole Faust            "src/runtime/NEON/functions/NEBitwiseXor.cpp"
1008*c217d954SCole Faust          ]
1009*c217d954SCole Faust        }
1010*c217d954SCole Faust      },
1011*c217d954SCole Faust      "BoundingBoxTransform": {
1012*c217d954SCole Faust        "files": {
1013*c217d954SCole Faust          "common": [
1014*c217d954SCole Faust            "src/core/NEON/kernels/NEBoundingBoxTransformKernel.cpp",
1015*c217d954SCole Faust            "src/runtime/NEON/functions/NEBoundingBoxTransform.cpp"
1016*c217d954SCole Faust          ],
1017*c217d954SCole Faust          "neon":{
1018*c217d954SCole Faust            "common":["src/cpu/kernels/boundingboxtransform/generic/neon/impl.cpp"],
1019*c217d954SCole Faust            "fp32":["src/cpu/kernels/boundingboxtransform/generic/neon/fp32.cpp"],
1020*c217d954SCole Faust            "fp16":["src/cpu/kernels/boundingboxtransform/generic/neon/fp16.cpp"],
1021*c217d954SCole Faust            "qsymm16":["src/cpu/kernels/boundingboxtransform/generic/neon/qsymm16.cpp"]
1022*c217d954SCole Faust          }
1023*c217d954SCole Faust        }
1024*c217d954SCole Faust      },
1025*c217d954SCole Faust      "Cast": {
1026*c217d954SCole Faust        "files": {
1027*c217d954SCole Faust          "common": [
1028*c217d954SCole Faust            "src/cpu/operators/CpuCast.cpp",
1029*c217d954SCole Faust            "src/cpu/kernels/CpuCastKernel.cpp",
1030*c217d954SCole Faust            "src/runtime/NEON/functions/NECast.cpp",
1031*c217d954SCole Faust            "src/cpu/kernels/cast/generic/neon/bfloat16.cpp"
1032*c217d954SCole Faust          ],
1033*c217d954SCole Faust          "neon":{
1034*c217d954SCole Faust            "fp16":["src/cpu/kernels/cast/generic/neon/fp16.cpp"]
1035*c217d954SCole Faust          }
1036*c217d954SCole Faust        }
1037*c217d954SCole Faust      },
1038*c217d954SCole Faust      "ChannelShuffle": {
1039*c217d954SCole Faust        "files": {
1040*c217d954SCole Faust          "common": [
1041*c217d954SCole Faust            "src/core/NEON/kernels/NEChannelShuffleLayerKernel.cpp",
1042*c217d954SCole Faust            "src/runtime/NEON/functions/NEChannelShuffleLayer.cpp"
1043*c217d954SCole Faust          ]
1044*c217d954SCole Faust        }
1045*c217d954SCole Faust      },
1046*c217d954SCole Faust      "Concatenate": {
1047*c217d954SCole Faust        "files": {
1048*c217d954SCole Faust          "common": [
1049*c217d954SCole Faust            "src/cpu/operators/CpuConcatenate.cpp",
1050*c217d954SCole Faust            "src/cpu/kernels/CpuConcatenateWidthKernel.cpp",
1051*c217d954SCole Faust            "src/cpu/kernels/CpuConcatenateBatchKernel.cpp",
1052*c217d954SCole Faust            "src/cpu/kernels/CpuConcatenateDepthKernel.cpp",
1053*c217d954SCole Faust            "src/cpu/kernels/CpuConcatenateHeightKernel.cpp",
1054*c217d954SCole Faust            "src/runtime/NEON/functions/NEConcatenateLayer.cpp"
1055*c217d954SCole Faust          ]
1056*c217d954SCole Faust        }
1057*c217d954SCole Faust      },
1058*c217d954SCole Faust      "Conv2d": {
1059*c217d954SCole Faust        "deps": [
1060*c217d954SCole Faust          "Activation",
1061*c217d954SCole Faust          "ElementwiseBinary",
1062*c217d954SCole Faust          "FFT2D",
1063*c217d954SCole Faust          "Gemm",
1064*c217d954SCole Faust          "Mul",
1065*c217d954SCole Faust          "Pad",
1066*c217d954SCole Faust          "Permute",
1067*c217d954SCole Faust          "Reshape",
1068*c217d954SCole Faust          "Reverse",
1069*c217d954SCole Faust          "Slice"
1070*c217d954SCole Faust        ],
1071*c217d954SCole Faust        "files": {
1072*c217d954SCole Faust          "common": [
1073*c217d954SCole Faust            "src/cpu/operators/CpuConv2d.cpp",
1074*c217d954SCole Faust            "src/cpu/operators/CpuDirectConv2d.cpp",
1075*c217d954SCole Faust            "src/cpu/operators/CpuGemmDirectConv2d.cpp",
1076*c217d954SCole Faust            "src/cpu/operators/CpuGemmConv2d.cpp",
1077*c217d954SCole Faust            "src/cpu/operators/CpuWinogradConv2d.cpp",
1078*c217d954SCole Faust            "src/cpu/operators/internal/CpuGemmAssemblyDispatch.cpp",
1079*c217d954SCole Faust            "src/cpu/kernels/CpuDirectConv2dKernel.cpp",
1080*c217d954SCole Faust            "src/cpu/kernels/CpuDirectConv2dOutputStageKernel.cpp",
1081*c217d954SCole Faust            "src/cpu/kernels/CpuWinogradConv2dKernel.cpp",
1082*c217d954SCole Faust            "src/cpu/kernels/CpuCol2ImKernel.cpp",
1083*c217d954SCole Faust            "src/cpu/kernels/CpuIm2ColKernel.cpp",
1084*c217d954SCole Faust            "src/cpu/kernels/CpuWeightsReshapeKernel.cpp",
1085*c217d954SCole Faust            "src/runtime/NEON/functions/NEConvolutionLayer.cpp",
1086*c217d954SCole Faust            "src/runtime/NEON/functions/NEDirectConvolutionLayer.cpp",
1087*c217d954SCole Faust            "src/runtime/NEON/functions/NEFFTConvolutionLayer.cpp",
1088*c217d954SCole Faust            "src/runtime/NEON/functions/NEGEMMConv2d.cpp",
1089*c217d954SCole Faust            "src/runtime/NEON/functions/NEGEMMConvolutionLayer.cpp",
1090*c217d954SCole Faust            "src/runtime/NEON/functions/NEWinogradConvolutionLayer.cpp"
1091*c217d954SCole Faust          ],
1092*c217d954SCole Faust          "neon": {
1093*c217d954SCole Faust            "common": [
1094*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/padding.cpp",
1095*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1096*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1097*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/utils.cpp",
1098*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms_fp16.cpp",
1099*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms_fp32.cpp",
1100*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms_fp16.cpp",
1101*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms_fp32.cpp",
1102*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp16.cpp",
1103*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms_fp32.cpp",
1104*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/winograd_fp16.cpp",
1105*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/winograd_fp32.cpp",
1106*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp16_6x6.cpp",
1107*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/a64_fp32_6x6.cpp",
1108*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_1x8.cpp",
1109*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_4x4.cpp",
1110*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/arm_fp32_6x6.cpp",
1111*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/a64_fp16_4x4_3x3.cpp",
1112*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x2_1x7.cpp",
1113*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x4_1x5.cpp",
1114*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_1x6_1x3.cpp",
1115*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_3x3.cpp",
1116*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_2x2_5x5.cpp",
1117*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/arm_fp32_4x4_3x3.cpp",
1118*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/a64_fp16_4x4_3x3.cpp",
1119*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_3x3.cpp",
1120*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_2x2_5x5.cpp",
1121*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/arm_fp32_4x4_3x3.cpp",
1122*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x2_1x7.cpp",
1123*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x4_1x5.cpp",
1124*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/weight_transforms/cpp_fp32_1x6_1x3.cpp",
1125*c217d954SCole Faust              "src/cpu/kernels/directconv2d/nhwc/neon/impl.cpp",
1126*c217d954SCole Faust              "src/cpu/kernels/directconv2d/nchw/all.cpp"
1127*c217d954SCole Faust            ],
1128*c217d954SCole Faust            "fp32": [
1129*c217d954SCole Faust              "src/cpu/kernels/directconv2d/nhwc/neon/fp32.cpp"
1130*c217d954SCole Faust            ]
1131*c217d954SCole Faust          },
1132*c217d954SCole Faust          "sve": {
1133*c217d954SCole Faust            "common": [
1134*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/sve_fp32_6x6.cpp",
1135*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/input_transforms/sme_fp32_mla_6x6.cpp",
1136*c217d954SCole Faust              "src/core/NEON/kernels/convolution/winograd/output_transforms/sme_fp32_mopa_4x4_3x3.cpp"
1137*c217d954SCole Faust            ]
1138*c217d954SCole Faust          }
1139*c217d954SCole Faust        }
1140*c217d954SCole Faust      },
1141*c217d954SCole Faust      "Copy": {
1142*c217d954SCole Faust        "files": {
1143*c217d954SCole Faust          "common": [
1144*c217d954SCole Faust            "src/cpu/operators/CpuCopy.cpp",
1145*c217d954SCole Faust            "src/cpu/kernels/CpuCopyKernel.cpp",
1146*c217d954SCole Faust            "src/runtime/NEON/functions/NECopy.cpp"
1147*c217d954SCole Faust          ]
1148*c217d954SCole Faust        }
1149*c217d954SCole Faust      },
1150*c217d954SCole Faust      "CropResize": {
1151*c217d954SCole Faust        "deps": [ "Scale" ],
1152*c217d954SCole Faust        "files": {
1153*c217d954SCole Faust          "common": [
1154*c217d954SCole Faust            "src/core/NEON/kernels/NECropKernel.cpp",
1155*c217d954SCole Faust            "src/runtime/NEON/functions/NECropResize.cpp"
1156*c217d954SCole Faust          ],
1157*c217d954SCole Faust          "neon": {
1158*c217d954SCole Faust            "common":  [ "src/cpu/kernels/crop/generic/neon/impl.cpp" ],
1159*c217d954SCole Faust            "fp32":    [ "src/cpu/kernels/crop/generic/neon/fp32.cpp" ],
1160*c217d954SCole Faust            "fp16":    [ "src/cpu/kernels/crop/generic/neon/fp16.cpp" ],
1161*c217d954SCole Faust            "integer": [ "src/cpu/kernels/crop/generic/neon/integer.cpp"   ]
1162*c217d954SCole Faust          }
1163*c217d954SCole Faust        }
1164*c217d954SCole Faust      },
1165*c217d954SCole Faust      "Deconv2d": {
1166*c217d954SCole Faust        "deps": [ "Conv2d", "Reverse", "Transpose"],
1167*c217d954SCole Faust        "files": {
1168*c217d954SCole Faust          "common": [
1169*c217d954SCole Faust            "src/runtime/NEON/functions/NEDeconvolutionLayer.cpp"
1170*c217d954SCole Faust          ]
1171*c217d954SCole Faust        }
1172*c217d954SCole Faust      },
1173*c217d954SCole Faust      "DepthConvert": {
1174*c217d954SCole Faust        "deps": [ "Cast"],
1175*c217d954SCole Faust        "files": {
1176*c217d954SCole Faust          "common": [
1177*c217d954SCole Faust            "src/runtime/NEON/functions/NEDepthConvertLayer.cpp"
1178*c217d954SCole Faust          ]
1179*c217d954SCole Faust        }
1180*c217d954SCole Faust      },
1181*c217d954SCole Faust      "DepthToSpace": {
1182*c217d954SCole Faust        "files": {
1183*c217d954SCole Faust          "common": [
1184*c217d954SCole Faust            "src/core/NEON/kernels/NEDepthToSpaceLayerKernel.cpp",
1185*c217d954SCole Faust            "src/runtime/NEON/functions/NEDepthToSpaceLayer.cpp"
1186*c217d954SCole Faust          ]
1187*c217d954SCole Faust        }
1188*c217d954SCole Faust      },
1189*c217d954SCole Faust      "DepthwiseConv2d": {
1190*c217d954SCole Faust        "deps": [ "Activation", "Permute" ],
1191*c217d954SCole Faust        "files": {
1192*c217d954SCole Faust          "common": [
1193*c217d954SCole Faust            "src/cpu/operators/CpuDepthwiseConv2d.cpp",
1194*c217d954SCole Faust            "src/cpu/operators/CpuDepthwiseConv2dAssemblyDispatch.cpp",
1195*c217d954SCole Faust            "src/cpu/kernels/CpuDepthwiseConv2dNativeKernel.cpp",
1196*c217d954SCole Faust            "src/cpu/kernels/internal/CpuDepthwiseConv2dAssemblyWrapperKernel.cpp",
1197*c217d954SCole Faust            "src/runtime/NEON/functions/NEDepthwiseConvolutionLayer.cpp"
1198*c217d954SCole Faust          ],
1199*c217d954SCole Faust          "neon": {
1200*c217d954SCole Faust            "common": [
1201*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/padding.cpp",
1202*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/qasymm8.cpp",
1203*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/qsymm8.cpp",
1204*c217d954SCole Faust              "src/core/NEON/kernels/convolution/common/utils.cpp",
1205*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/addressing.cpp",
1206*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/depthwise_strategies_common.cpp",
1207*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8q.cpp",
1208*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/depthwise_u8s8u8q.cpp",
1209*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/8b_mla.cpp",
1210*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/depthwise_s8q.cpp",
1211*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp32.cpp",
1212*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1213*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1214*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1215*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1216*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1217*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1218*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1219*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1220*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1221*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1222*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1223*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/depthwise_fp16.cpp",
1224*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1225*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1226*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1227*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1228*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1229*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1230*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1231*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1232*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1233*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1234*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp16_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1235*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1236*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1237*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1238*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1239*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1240*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1241*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1242*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1243*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1244*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1245*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1246*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1247*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1248*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1249*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1250*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1251*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1252*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1253*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1254*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1255*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1256*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1257*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1258*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1259*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1260*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8s8u8q_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1261*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1262*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1263*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/a64_u8qa_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1264*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_s8q_3x3_dot.cpp",
1265*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/a64_u8q_3x3_dot.cpp",
1266*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic.cpp",
1267*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/generic_quantized_dot_product.cpp",
1268*c217d954SCole Faust              "src/cpu/kernels/depthwiseconv2d/generic/neon/impl.cpp"
1269*c217d954SCole Faust              ],
1270*c217d954SCole Faust              "fp16":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp16.cpp"],
1271*c217d954SCole Faust              "fp32":["src/cpu/kernels/depthwiseconv2d/generic/neon/fp32.cpp"],
1272*c217d954SCole Faust              "qasymm8":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8.cpp"],
1273*c217d954SCole Faust              "qasymm8_signed":["src/cpu/kernels/depthwiseconv2d/generic/neon/qasymm8_signed.cpp"]
1274*c217d954SCole Faust          },
1275*c217d954SCole Faust          "sve": {
1276*c217d954SCole Faust            "common": [
1277*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_8b_mla.cpp",
1278*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_s8q_3x3_dot.cpp",
1279*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/interleaves/sve_u8q_3x3_dot.cpp",
1280*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1281*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1282*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1283*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1284*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1285*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1286*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1287*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1288*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1289*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp16_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1290*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1291*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1292*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1293*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst_strided/generic.cpp",
1294*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1295*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1296*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1297*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1298*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1299*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1300*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1301*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_5x5_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1302*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_nhwc_generic_output9_mla_depthfirst/generic.cpp",
1303*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_3x3_s2_with_multiplier_output3x3_mla_depthfirst/generic.cpp",
1304*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_5x5_s1_with_multiplier_output2x4_mla_depthfirst/generic.cpp",
1305*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_fp32_packed_to_nhwc_generic_with_multiplier_output2x8_mla_depthfirst/generic.cpp",
1306*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1307*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1308*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1309*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1310*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1311*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1312*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_s8qs_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1313*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_dot_depthfirst/generic.cpp",
1314*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1315*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1316*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1317*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_3x3_s2_with_multiplier_output2x4_dot_depthfirst/generic.cpp",
1318*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8q_packed_to_nhwc_5x5_s1_with_multiplier_output4x2_dot_depthfirst/generic.cpp",
1319*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s1_output2x2_mla_depthfirst/generic.cpp",
1320*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_3x3_s2_output2x2_mla_depthfirst/generic.cpp",
1321*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sve_u8s8u8q_nhwc_5x5_s1_output2x2_mla_depthfirst/generic.cpp",
1322*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_direct.cpp",
1323*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output2x2_mla_depthfirst/generic_indirect.cpp",
1324*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_direct.cpp",
1325*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output3x3_mla_depthfirst/generic_indirect.cpp",
1326*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_direct.cpp",
1327*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s1_output4x4_mla_depthfirst/generic_indirect.cpp",
1328*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_direct.cpp",
1329*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_nhwc_3x3_s2_output2x2_mla_depthfirst/generic_indirect.cpp",
1330*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s1_4rows_mla_za/generic.cpp",
1331*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_3x3_s2_4rows_mla_za/generic.cpp",
1332*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s1_4rows_mla_za/generic.cpp",
1333*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32_planar_5x5_s2_4rows_mla_za/generic.cpp",
1334*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s1_4rows_dot_za/generic.cpp",
1335*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_3x3_s2_4rows_dot_za/generic.cpp",
1336*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s1_4rows_dot_za/generic.cpp",
1337*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_fp32bf16fp32_planar_5x5_s2_4rows_dot_za/generic.cpp",
1338*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
1339*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_2rows_dot_za/generic.cpp",
1340*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1341*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1342*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_s8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1343*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
1344*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_2rows_dot_za/generic.cpp",
1345*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1346*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1347*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8q_planar_5x5_s2_4rows_dot_za/generic.cpp",
1348*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s1_4rows_dot_za/generic.cpp",
1349*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_2rows_dot_za/generic.cpp",
1350*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_3x3_s2_4rows_dot_za/generic.cpp",
1351*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s1_4rows_dot_za/generic.cpp",
1352*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/depthwise/kernels/sme2_u8s8u8q_planar_5x5_s2_4rows_dot_za/generic.cpp"
1353*c217d954SCole Faust            ]
1354*c217d954SCole Faust          }
1355*c217d954SCole Faust        }
1356*c217d954SCole Faust      },
1357*c217d954SCole Faust      "Dequantize": {
1358*c217d954SCole Faust        "files": {
1359*c217d954SCole Faust          "common": [
1360*c217d954SCole Faust            "src/cpu/operators/CpuDequantize.cpp",
1361*c217d954SCole Faust            "src/cpu/kernels/CpuDequantizeKernel.cpp",
1362*c217d954SCole Faust            "src/runtime/NEON/functions/NEDequantizationLayer.cpp"
1363*c217d954SCole Faust          ]
1364*c217d954SCole Faust        }
1365*c217d954SCole Faust      },
1366*c217d954SCole Faust      "DetectionPostProcess": {
1367*c217d954SCole Faust        "deps": [ "Dequantize" ],
1368*c217d954SCole Faust        "files": {
1369*c217d954SCole Faust          "common" : [ "src/runtime/NEON/functions/NEDetectionPostProcessLayer.cpp" ]
1370*c217d954SCole Faust        }
1371*c217d954SCole Faust      },
1372*c217d954SCole Faust      "Conv3d": {
1373*c217d954SCole Faust        "deps": [
1374*c217d954SCole Faust          "Activation"
1375*c217d954SCole Faust        ],
1376*c217d954SCole Faust        "files": {
1377*c217d954SCole Faust          "common": [
1378*c217d954SCole Faust            "src/cpu/operators/CpuDirectConv3d.cpp",
1379*c217d954SCole Faust            "src/cpu/kernels/CpuDirectConv3dKernel.cpp",
1380*c217d954SCole Faust            "src/runtime/NEON/functions/NEConv3D.cpp"
1381*c217d954SCole Faust          ]
1382*c217d954SCole Faust        }
1383*c217d954SCole Faust      },
1384*c217d954SCole Faust      "ElementwiseBinary": {
1385*c217d954SCole Faust        "files": {
1386*c217d954SCole Faust          "common": [
1387*c217d954SCole Faust            "src/cpu/operators/CpuElementwise.cpp",
1388*c217d954SCole Faust            "src/cpu/kernels/CpuElementwiseKernel.cpp",
1389*c217d954SCole Faust            "src/runtime/NEON/functions/NEElementwiseOperations.cpp"
1390*c217d954SCole Faust          ],
1391*c217d954SCole Faust          "neon":{
1392*c217d954SCole Faust            "fp32": ["src/cpu/kernels/elementwise_binary/generic/neon/fp32.cpp"],
1393*c217d954SCole Faust            "fp16": ["src/cpu/kernels/elementwise_binary/generic/neon/fp16.cpp"],
1394*c217d954SCole Faust            "integer": ["src/cpu/kernels/elementwise_binary/generic/neon/integer.cpp"],
1395*c217d954SCole Faust            "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8.cpp"],
1396*c217d954SCole Faust            "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/neon/qasymm8_signed.cpp"]
1397*c217d954SCole Faust          },
1398*c217d954SCole Faust          "sve": {
1399*c217d954SCole Faust            "common": ["src/cpu/kernels/elementwise_binary/generic/sve/impl.cpp" ],
1400*c217d954SCole Faust            "integer": ["src/cpu/kernels/elementwise_binary/generic/sve/integer.cpp"],
1401*c217d954SCole Faust            "fp32": ["src/cpu/kernels/elementwise_binary/generic/sve/fp32.cpp"],
1402*c217d954SCole Faust            "fp16": ["src/cpu/kernels/elementwise_binary/generic/sve/fp16.cpp"]
1403*c217d954SCole Faust
1404*c217d954SCole Faust          },
1405*c217d954SCole Faust          "sve2":{
1406*c217d954SCole Faust            "qasymm8": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8.cpp"],
1407*c217d954SCole Faust            "qasymm8_signed": ["src/cpu/kernels/elementwise_binary/generic/sve2/qasymm8_signed.cpp"]
1408*c217d954SCole Faust          }
1409*c217d954SCole Faust        }
1410*c217d954SCole Faust      },
1411*c217d954SCole Faust      "ElementwiseUnary":{
1412*c217d954SCole Faust        "files": {
1413*c217d954SCole Faust          "common": [
1414*c217d954SCole Faust            "src/cpu/operators/CpuElementwiseUnary.cpp",
1415*c217d954SCole Faust            "src/cpu/kernels/CpuElementwiseUnaryKernel.cpp",
1416*c217d954SCole Faust            "src/runtime/NEON/functions/NEElementwiseUnaryLayer.cpp"
1417*c217d954SCole Faust          ],
1418*c217d954SCole Faust          "neon": {
1419*c217d954SCole Faust            "common":["src/cpu/kernels/elementwise_unary/generic/neon/impl.cpp"],
1420*c217d954SCole Faust            "integer": ["src/cpu/kernels/elementwise_unary/generic/neon/integer.cpp"],
1421*c217d954SCole Faust            "fp32": ["src/cpu/kernels/elementwise_unary/generic/neon/fp32.cpp"],
1422*c217d954SCole Faust            "fp16": ["src/cpu/kernels/elementwise_unary/generic/neon/fp16.cpp"]
1423*c217d954SCole Faust          },
1424*c217d954SCole Faust          "sve": {
1425*c217d954SCole Faust            "common": ["src/cpu/kernels/elementwise_unary/generic/sve/impl.cpp" ],
1426*c217d954SCole Faust            "integer": ["src/cpu/kernels/elementwise_unary/generic/sve/integer.cpp"],
1427*c217d954SCole Faust            "fp32": ["src/cpu/kernels/elementwise_unary/generic/sve/fp32.cpp"],
1428*c217d954SCole Faust            "fp16": ["src/cpu/kernels/elementwise_unary/generic/sve/fp16.cpp"]
1429*c217d954SCole Faust          }
1430*c217d954SCole Faust        }
1431*c217d954SCole Faust      },
1432*c217d954SCole Faust      "FFT1D": {
1433*c217d954SCole Faust        "deps": [ "Reduction" ],
1434*c217d954SCole Faust        "files": {
1435*c217d954SCole Faust          "common": [
1436*c217d954SCole Faust            "src/core/NEON/kernels/NEFFTDigitReverseKernel.cpp",
1437*c217d954SCole Faust            "src/core/NEON/kernels/NEFFTRadixStageKernel.cpp",
1438*c217d954SCole Faust            "src/core/NEON/kernels/NEFFTScaleKernel.cpp",
1439*c217d954SCole Faust            "src/runtime/NEON/functions/NEFFT1D.cpp"
1440*c217d954SCole Faust          ]
1441*c217d954SCole Faust        }
1442*c217d954SCole Faust      },
1443*c217d954SCole Faust      "FFT2D": {
1444*c217d954SCole Faust        "deps": [ "FFT1D" ],
1445*c217d954SCole Faust        "files": {
1446*c217d954SCole Faust          "common": [
1447*c217d954SCole Faust            "src/runtime/NEON/functions/NEFFT2D.cpp"
1448*c217d954SCole Faust          ]
1449*c217d954SCole Faust        }
1450*c217d954SCole Faust      },
1451*c217d954SCole Faust      "Fill": {
1452*c217d954SCole Faust        "files": {
1453*c217d954SCole Faust          "common": [
1454*c217d954SCole Faust            "src/cpu/operators/CpuFill.cpp",
1455*c217d954SCole Faust            "src/cpu/kernels/CpuFillKernel.cpp",
1456*c217d954SCole Faust            "src/runtime/NEON/functions/NEFill.cpp"
1457*c217d954SCole Faust          ]
1458*c217d954SCole Faust        }
1459*c217d954SCole Faust      },
1460*c217d954SCole Faust      "Flatten": {
1461*c217d954SCole Faust        "deps": [ "Reshape" ],
1462*c217d954SCole Faust        "files": {
1463*c217d954SCole Faust          "common": [
1464*c217d954SCole Faust            "src/cpu/operators/CpuFlatten.cpp",
1465*c217d954SCole Faust            "src/runtime/NEON/functions/NEFlattenLayer.cpp"
1466*c217d954SCole Faust          ]
1467*c217d954SCole Faust        }
1468*c217d954SCole Faust      },
1469*c217d954SCole Faust      "Floor": {
1470*c217d954SCole Faust        "files": {
1471*c217d954SCole Faust          "common": [
1472*c217d954SCole Faust            "src/cpu/operators/CpuFloor.cpp",
1473*c217d954SCole Faust            "src/cpu/kernels/CpuFloorKernel.cpp",
1474*c217d954SCole Faust            "src/runtime/NEON/functions/NEFloor.cpp"
1475*c217d954SCole Faust          ],
1476*c217d954SCole Faust          "neon": {
1477*c217d954SCole Faust            "fp32": [ "src/cpu/kernels/floor/neon/fp32.cpp" ],
1478*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/floor/neon/fp16.cpp" ]
1479*c217d954SCole Faust          }
1480*c217d954SCole Faust        }
1481*c217d954SCole Faust      },
1482*c217d954SCole Faust      "FullyConnected": {
1483*c217d954SCole Faust        "deps": [ "Flatten", "Gemm", "Transpose"],
1484*c217d954SCole Faust        "files": {
1485*c217d954SCole Faust          "common": [
1486*c217d954SCole Faust            "src/cpu/kernels/CpuConvertFullyConnectedWeightsKernel.cpp",
1487*c217d954SCole Faust            "src/cpu/operators/CpuConvertFullyConnectedWeights.cpp",
1488*c217d954SCole Faust            "src/cpu/operators/CpuFullyConnected.cpp",
1489*c217d954SCole Faust            "src/runtime/NEON/functions/NEConvertFullyConnectedWeights.cpp",
1490*c217d954SCole Faust            "src/runtime/NEON/functions/NEFullyConnectedLayer.cpp"
1491*c217d954SCole Faust          ]
1492*c217d954SCole Faust        }
1493*c217d954SCole Faust      },
1494*c217d954SCole Faust      "Gather": {
1495*c217d954SCole Faust        "files": {
1496*c217d954SCole Faust          "common": [
1497*c217d954SCole Faust            "src/core/NEON/kernels/NEGatherKernel.cpp",
1498*c217d954SCole Faust            "src/runtime/NEON/functions/NEGather.cpp"
1499*c217d954SCole Faust          ]
1500*c217d954SCole Faust        }
1501*c217d954SCole Faust      },
1502*c217d954SCole Faust      "Gemm": {
1503*c217d954SCole Faust        "deps": [ "Quantize", "Add"],
1504*c217d954SCole Faust        "files": {
1505*c217d954SCole Faust          "common": [
1506*c217d954SCole Faust            "src/cpu/kernels/CpuConvertQuantizedSignednessKernel.cpp",
1507*c217d954SCole Faust            "src/cpu/kernels/CpuGemmMatrixAdditionKernel.cpp",
1508*c217d954SCole Faust            "src/cpu/kernels/CpuGemmMatrixMultiplyKernel.cpp",
1509*c217d954SCole Faust            "src/cpu/kernels/CpuGemmTranspose1xWKernel.cpp",
1510*c217d954SCole Faust            "src/cpu/kernels/CpuGemmInterleave4x4Kernel.cpp",
1511*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ScaleKernel.cpp",
1512*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt16ScaleByFixedPointKernel.cpp",
1513*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToInt8ScaleByFixedPointKernel.cpp",
1514*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpQuantizeDownInt32ToUint8ScaleByFixedPointKernel.cpp",
1515*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpMatrixMultiplyKernel.cpp",
1516*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpMatrixReductionKernel.cpp",
1517*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpOffsetContributionOutputStageKernel.cpp",
1518*c217d954SCole Faust            "src/cpu/kernels/CpuGemmLowpOffsetContributionKernel.cpp",
1519*c217d954SCole Faust            "src/cpu/operators/CpuGemm.cpp",
1520*c217d954SCole Faust            "src/cpu/operators/CpuGemmLowpOutputStage.cpp",
1521*c217d954SCole Faust            "src/cpu/operators/CpuGemmLowpMatrixMultiplyCore.cpp",
1522*c217d954SCole Faust            "src/runtime/NEON/functions/NEGEMM.cpp",
1523*c217d954SCole Faust            "src/runtime/NEON/functions/NEGEMMLowpMatrixMultiplyCore.cpp",
1524*c217d954SCole Faust            "src/runtime/NEON/functions/NEGEMMLowpOutputStage.cpp"
1525*c217d954SCole Faust          ],
1526*c217d954SCole Faust          "neon": {
1527*c217d954SCole Faust            "common": [
1528*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_bf16.cpp",
1529*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_fp16.cpp",
1530*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_fp32.cpp",
1531*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_int16.cpp",
1532*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_int8.cpp",
1533*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_qint8.cpp",
1534*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_quint8.cpp",
1535*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_uint16.cpp",
1536*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/gemm_uint8.cpp",
1537*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/interleave_indirect.cpp",
1538*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/mergeresults-fp16.cpp",
1539*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/mergeresults.cpp",
1540*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/misc.cpp",
1541*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/quantized.cpp",
1542*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/rowsum_indirect_s8.cpp",
1543*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/rowsum_indirect_u8.cpp",
1544*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/transform.cpp",
1545*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s16_8x12/generic.cpp",
1546*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_4x4/generic.cpp",
1547*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/a55r1.cpp",
1548*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/generic.cpp",
1549*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_s8_8x12/x1.cpp",
1550*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u16_8x12/generic.cpp",
1551*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_4x4/generic.cpp",
1552*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/a55r1.cpp",
1553*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/generic.cpp",
1554*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_gemm_u8_8x12/x1.cpp",
1555*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/a55r1.cpp",
1556*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/generic.cpp",
1557*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hgemm_8x24/x1.cpp",
1558*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_dot_6x16/generic.cpp",
1559*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_bf16fp32_mmla_6x16/generic.cpp",
1560*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/a55.cpp",
1561*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp16_mla_6x32/generic.cpp",
1562*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/a55.cpp",
1563*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_4x24/generic.cpp",
1564*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/a55.cpp",
1565*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_6x16/generic.cpp",
1566*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/a55.cpp",
1567*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32_mla_8x4/generic.cpp",
1568*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1569*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_fp32bf16fp32_mmla_6x16/generic.cpp",
1570*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/a55.cpp",
1571*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_dot_4x16/generic.cpp",
1572*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qa_mmla_4x16/generic.cpp",
1573*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/a55.cpp",
1574*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_dot_6x16/generic.cpp",
1575*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8qs_mmla_6x16/generic.cpp",
1576*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/a55.cpp",
1577*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_dot_6x16/generic.cpp",
1578*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_s8s32_mmla_6x16/generic.cpp",
1579*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/a55.cpp",
1580*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_dot_4x16/generic.cpp",
1581*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8qa_mmla_4x16/generic.cpp",
1582*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/a55.cpp",
1583*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_dot_6x16/generic.cpp",
1584*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_hybrid_u8u32_mmla_6x16/generic.cpp",
1585*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/generic.cpp",
1586*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_dot_8x12/x1.cpp",
1587*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/generic.cpp",
1588*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_bf16fp32_mmla_8x12/a510.cpp",
1589*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/generic.cpp",
1590*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_s8s32_mmla_8x12/a510.cpp",
1591*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/generic.cpp",
1592*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_interleaved_u8u32_mmla_8x12/a510.cpp",
1593*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a53.cpp",
1594*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55.cpp",
1595*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/a55r1.cpp",
1596*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/generic.cpp",
1597*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x12/x1.cpp",
1598*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemm_8x6/generic.cpp",
1599*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_6x4/generic.cpp",
1600*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_fp32_mla_8x4/generic.cpp",
1601*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/a55.cpp",
1602*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_6x4/generic.cpp",
1603*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/a55.cpp",
1604*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_s8s32_dot_8x4/generic.cpp",
1605*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/a55.cpp",
1606*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_6x4/generic.cpp",
1607*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/a55.cpp",
1608*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_smallK_hybrid_u8u32_dot_8x4/generic.cpp",
1609*c217d954SCole Faust              "src/cpu/kernels/gemm_matrix_mul/generic/neon/impl.cpp",
1610*c217d954SCole Faust              "src/cpu/kernels/gemm_matrix_add/generic/neon/impl.cpp"
1611*c217d954SCole Faust            ],
1612*c217d954SCole Faust            "fp32":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp32.cpp",
1613*c217d954SCole Faust                    "src/cpu/kernels/gemm_matrix_add/generic/neon/fp32.cpp"],
1614*c217d954SCole Faust            "fp16":["src/cpu/kernels/gemm_matrix_mul/generic/neon/fp16.cpp",
1615*c217d954SCole Faust                    "src/cpu/kernels/gemm_matrix_add/generic/neon/fp16.cpp"],
1616*c217d954SCole Faust            "estate32": [
1617*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a53.cpp",
1618*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/a55r1.cpp",
1619*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a32_sgemm_8x6/generic.cpp"
1620*c217d954SCole Faust            ],
1621*c217d954SCole Faust            "estate64": [
1622*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_sgemv_pretransposed/generic.cpp"
1623*c217d954SCole Faust            ],
1624*c217d954SCole Faust            "experimental_fixed_format_kernels": [
1625*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_bf16fp32_mmla_6x16/generic.cpp",
1626*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp16_mla_6x32/generic.cpp",
1627*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32_mla_6x16/generic.cpp",
1628*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffhybrid_fp32bf16fp32_mmla_4x24/generic.cpp",
1629*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_dot_8x12/generic.cpp",
1630*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_bf16fp32_mmla_8x12/generic.cpp",
1631*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp16_mla_8x24/generic.cpp",
1632*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/a64_ffinterleaved_fp32_mla_8x12/generic.cpp"
1633*c217d954SCole Faust            ]
1634*c217d954SCole Faust          },
1635*c217d954SCole Faust          "sve": {
1636*c217d954SCole Faust            "common": [
1637*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/interleave_indirect-sve.cpp",
1638*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_bf16fp32_dot_16VL/generic.cpp",
1639*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32_mla_16VL/generic.cpp",
1640*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_fp32bf16fp32_dot_16VL/generic.cpp",
1641*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_s8qa_dot_16VL/generic.cpp",
1642*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_gemv_u8qa_dot_16VL/generic.cpp",
1643*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_1VLx4VL/generic.cpp",
1644*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_2VLx2VL/generic.cpp",
1645*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_bf16fp32_mopa_4VLx1VL/generic.cpp",
1646*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_1VLx4VL/generic.cpp",
1647*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_2VLx2VL/generic.cpp",
1648*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_fp32_mopa_4VLx1VL/generic.cpp",
1649*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_1VLx4VL/generic.cpp",
1650*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_2VLx2VL/generic.cpp",
1651*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8q_mopa_4VLx1VL/generic.cpp",
1652*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_1VLx4VL/generic.cpp",
1653*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_2VLx2VL/generic.cpp",
1654*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_s8s32_mopa_4VLx1VL/generic.cpp",
1655*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_1VLx4VL/generic.cpp",
1656*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_2VLx2VL/generic.cpp",
1657*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sme2_interleaved_nomerge_u8q_mopa_4VLx1VL/generic.cpp",
1658*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_dot_6x4VL/generic.cpp",
1659*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1660*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/a64fx.cpp",
1661*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp16_mla_6x4VL/generic.cpp",
1662*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/a64fx.cpp",
1663*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_6x4VL/generic.cpp",
1664*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/a64fx.cpp",
1665*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32_mla_8x1VL/generic.cpp",
1666*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1667*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_fp32bf16fp32_mmla_6x4VL/generic.cpp",
1668*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_dot_4x4VL/generic.cpp",
1669*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qa_mmla_4x4VL/generic.cpp",
1670*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_dot_6x4VL/generic.cpp",
1671*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8qs_mmla_6x4VL/generic.cpp",
1672*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/a64fx.cpp",
1673*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_dot_6x4VL/generic.cpp",
1674*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_s8s32_mmla_6x4VL/generic.cpp",
1675*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_dot_4x4VL/generic.cpp",
1676*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8qa_mmla_4x4VL/generic.cpp",
1677*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/a64fx.cpp",
1678*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_dot_6x4VL/generic.cpp",
1679*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_hybrid_u8u32_mmla_6x4VL/generic.cpp",
1680*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_dot_8x3VL/generic.cpp",
1681*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_bf16fp32_mmla_8x3VL/generic.cpp",
1682*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/a64fx.cpp",
1683*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp16_mla_8x3VL/generic.cpp",
1684*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/a64fx.cpp",
1685*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mla_8x3VL/generic.cpp",
1686*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_fp32_mmla_8x3VL/generic.cpp",
1687*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/a64fx.cpp",
1688*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_dot_8x3VL/generic.cpp",
1689*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_s8s32_mmla_8x3VL/generic.cpp",
1690*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/a64fx.cpp",
1691*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_dot_8x3VL/generic.cpp",
1692*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_interleaved_u8u32_mmla_8x3VL/generic.cpp",
1693*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_fp32_mla_8x1VL/generic.cpp",
1694*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_s8s32_dot_8x1VL/generic.cpp",
1695*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_smallK_hybrid_u8u32_dot_8x1VL/generic.cpp",
1696*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/mergeresults-sve.cpp",
1697*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/transform-sve.cpp",
1698*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/misc-sve.cpp"
1699*c217d954SCole Faust            ],
1700*c217d954SCole Faust            "experimental_fixed_format_kernels": [
1701*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_bf16fp32_mmla_6x4VL/generic.cpp",
1702*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/a64fx.cpp",
1703*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp16_mla_6x4VL/generic.cpp",
1704*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/a64fx.cpp",
1705*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32_mla_6x4VL/generic.cpp",
1706*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffhybrid_fp32bf16fp32_mmla_4x6VL/generic.cpp",
1707*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_bf16fp32_mmla_8x3VL/generic.cpp",
1708*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/a64fx.cpp",
1709*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp16_mla_8x3VL/generic.cpp",
1710*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/a64fx.cpp",
1711*c217d954SCole Faust              "src/core/NEON/kernels/arm_gemm/kernels/sve_ffinterleaved_fp32_mla_8x3VL/generic.cpp"
1712*c217d954SCole Faust            ]
1713*c217d954SCole Faust          }
1714*c217d954SCole Faust        }
1715*c217d954SCole Faust      },
1716*c217d954SCole Faust      "GenerateProposals": {
1717*c217d954SCole Faust        "deps": [ "BoundingBoxTransform", "Dequantize", "Pad", "Permute", "Quantize", "Reshape" ],
1718*c217d954SCole Faust        "files": {
1719*c217d954SCole Faust          "common": [
1720*c217d954SCole Faust            "src/core/NEON/kernels/NEGenerateProposalsLayerKernel.cpp",
1721*c217d954SCole Faust            "src/runtime/NEON/functions/NEGenerateProposalsLayer.cpp"
1722*c217d954SCole Faust          ],
1723*c217d954SCole Faust          "neon":{
1724*c217d954SCole Faust            "common":["src/cpu/kernels/genproposals/generic/neon/impl.cpp"],
1725*c217d954SCole Faust            "fp16":["src/cpu/kernels/genproposals/generic/neon/fp16.cpp"],
1726*c217d954SCole Faust            "fp32":["src/cpu/kernels/genproposals/generic/neon/fp32.cpp"],
1727*c217d954SCole Faust            "qsymm16":["src/cpu/kernels/genproposals/generic/neon/qsymm16.cpp"]
1728*c217d954SCole Faust          }
1729*c217d954SCole Faust        }
1730*c217d954SCole Faust      },
1731*c217d954SCole Faust      "InstanceNormalize": {
1732*c217d954SCole Faust        "deps": [ "Permute", "Reduction" ],
1733*c217d954SCole Faust        "files": {
1734*c217d954SCole Faust          "common": [
1735*c217d954SCole Faust            "src/core/NEON/kernels/NEInstanceNormalizationLayerKernel.cpp",
1736*c217d954SCole Faust            "src/runtime/NEON/functions/NEInstanceNormalizationLayer.cpp"
1737*c217d954SCole Faust          ],
1738*c217d954SCole Faust          "neon":{
1739*c217d954SCole Faust            "common":["src/cpu/kernels/instancenorm/generic/neon/impl.cpp"],
1740*c217d954SCole Faust            "fp16":["src/cpu/kernels/instancenorm/generic/neon/fp16.cpp"],
1741*c217d954SCole Faust            "fp32":["src/cpu/kernels/instancenorm/generic/neon/fp32.cpp"]
1742*c217d954SCole Faust          }
1743*c217d954SCole Faust        }
1744*c217d954SCole Faust      },
1745*c217d954SCole Faust      "L2Normalize": {
1746*c217d954SCole Faust        "deps": [ "Reduction" ],
1747*c217d954SCole Faust        "files": {
1748*c217d954SCole Faust          "common": [
1749*c217d954SCole Faust            "src/core/NEON/kernels/NEL2NormalizeLayerKernel.cpp",
1750*c217d954SCole Faust            "src/runtime/NEON/functions/NEL2NormalizeLayer.cpp"
1751*c217d954SCole Faust          ],
1752*c217d954SCole Faust          "neon":{
1753*c217d954SCole Faust            "common":["src/cpu/kernels/l2normlayer/generic/neon/impl.cpp"],
1754*c217d954SCole Faust            "fp32":["src/cpu/kernels/l2normlayer/generic/neon/fp32.cpp"],
1755*c217d954SCole Faust            "fp16":["src/cpu/kernels/l2normlayer/generic/neon/fp16.cpp"]
1756*c217d954SCole Faust          }
1757*c217d954SCole Faust        }
1758*c217d954SCole Faust      },
1759*c217d954SCole Faust      "Logical": {
1760*c217d954SCole Faust        "files": {
1761*c217d954SCole Faust          "common": [
1762*c217d954SCole Faust            "src/core/NEON/kernels/NELogicalKernel.cpp",
1763*c217d954SCole Faust            "src/runtime/NEON/functions/NELogical.cpp"
1764*c217d954SCole Faust          ]
1765*c217d954SCole Faust        }
1766*c217d954SCole Faust      },
1767*c217d954SCole Faust      "LSTM": {
1768*c217d954SCole Faust        "deps": [
1769*c217d954SCole Faust          "Activation",
1770*c217d954SCole Faust          "Concatenate",
1771*c217d954SCole Faust          "Copy",
1772*c217d954SCole Faust          "Dequantize",
1773*c217d954SCole Faust          "ElementwiseBinary",
1774*c217d954SCole Faust          "Fill",
1775*c217d954SCole Faust          "FullyConnected",
1776*c217d954SCole Faust          "Gemm",
1777*c217d954SCole Faust          "MeanStdDevNormalize",
1778*c217d954SCole Faust          "Mul",
1779*c217d954SCole Faust          "Quantize",
1780*c217d954SCole Faust          "Slice",
1781*c217d954SCole Faust          "Transpose"
1782*c217d954SCole Faust        ],
1783*c217d954SCole Faust        "files": {
1784*c217d954SCole Faust          "common": [
1785*c217d954SCole Faust            "src/core/NEON/kernels/NEQLSTMLayerNormalizationKernel.cpp",
1786*c217d954SCole Faust            "src/runtime/NEON/functions/NELSTMLayer.cpp",
1787*c217d954SCole Faust            "src/runtime/NEON/functions/NELSTMLayerQuantized.cpp",
1788*c217d954SCole Faust            "src/runtime/NEON/functions/NEQLSTMLayer.cpp"
1789*c217d954SCole Faust          ]
1790*c217d954SCole Faust        }
1791*c217d954SCole Faust      },
1792*c217d954SCole Faust      "MaxUnpool2d": {
1793*c217d954SCole Faust        "deps": [ "Fill" ],
1794*c217d954SCole Faust        "files": {
1795*c217d954SCole Faust          "common": [
1796*c217d954SCole Faust            "src/cpu/kernels/CpuMaxUnpoolingLayerKernel.cpp",
1797*c217d954SCole Faust            "src/runtime/NEON/functions/NEMaxUnpoolingLayer.cpp",
1798*c217d954SCole Faust            "src/cpu/operators/CpuMaxUnpooling.cpp"
1799*c217d954SCole Faust          ],
1800*c217d954SCole Faust          "neon":{
1801*c217d954SCole Faust            "fp32":["src/cpu/kernels/maxunpool/generic/neon/fp32.cpp"],
1802*c217d954SCole Faust            "fp16":["src/cpu/kernels/maxunpool/generic/neon/fp16.cpp"],
1803*c217d954SCole Faust            "qasymm8":["src/cpu/kernels/maxunpool/generic/neon/qasymm8.cpp"],
1804*c217d954SCole Faust            "qasymm8_signed":[ "src/cpu/kernels/maxunpool/generic/neon/qasymm8_signed.cpp"],
1805*c217d954SCole Faust            "common":["src/cpu/kernels/maxunpool/generic/neon/impl.cpp"]
1806*c217d954SCole Faust          }
1807*c217d954SCole Faust        }
1808*c217d954SCole Faust      },
1809*c217d954SCole Faust      "Mean": {
1810*c217d954SCole Faust        "deps" : [ "Reduction" ],
1811*c217d954SCole Faust        "files": {
1812*c217d954SCole Faust          "common": [ "src/runtime/NEON/functions/NEReduceMean.cpp" ]
1813*c217d954SCole Faust        }
1814*c217d954SCole Faust      },
1815*c217d954SCole Faust      "MeanStdDevNormalize": {
1816*c217d954SCole Faust        "files": {
1817*c217d954SCole Faust          "common": [
1818*c217d954SCole Faust            "src/core/NEON/kernels/NEMeanStdDevNormalizationKernel.cpp",
1819*c217d954SCole Faust            "src/runtime/NEON/functions/NEMeanStdDevNormalizationLayer.cpp"
1820*c217d954SCole Faust          ],
1821*c217d954SCole Faust        "neon":{
1822*c217d954SCole Faust          "common":["src/cpu/kernels/meanstddevnorm/generic/neon/impl.cpp"],
1823*c217d954SCole Faust          "fp32":["src/cpu/kernels/meanstddevnorm/generic/neon/fp32.cpp"],
1824*c217d954SCole Faust          "fp16":["src/cpu/kernels/meanstddevnorm/generic/neon/fp16.cpp"],
1825*c217d954SCole Faust          "qasymm8":["src/cpu/kernels/meanstddevnorm/generic/neon/qasymm8.cpp"]
1826*c217d954SCole Faust        }
1827*c217d954SCole Faust        }
1828*c217d954SCole Faust      },
1829*c217d954SCole Faust      "Mul": {
1830*c217d954SCole Faust        "files": {
1831*c217d954SCole Faust          "common": [
1832*c217d954SCole Faust            "src/cpu/operators/CpuMul.cpp",
1833*c217d954SCole Faust            "src/cpu/kernels/CpuMulKernel.cpp",
1834*c217d954SCole Faust            "src/runtime/NEON/functions/NEPixelWiseMultiplication.cpp"
1835*c217d954SCole Faust          ]
1836*c217d954SCole Faust        }
1837*c217d954SCole Faust      },
1838*c217d954SCole Faust      "Normalize": {
1839*c217d954SCole Faust        "deps": [ "Mul" ],
1840*c217d954SCole Faust        "files": {
1841*c217d954SCole Faust          "common": [
1842*c217d954SCole Faust            "src/core/NEON/kernels/NENormalizationLayerKernel.cpp",
1843*c217d954SCole Faust            "src/runtime/NEON/functions/NENormalizationLayer.cpp"
1844*c217d954SCole Faust          ]
1845*c217d954SCole Faust        }
1846*c217d954SCole Faust      },
1847*c217d954SCole Faust      "Pad": {
1848*c217d954SCole Faust        "deps": [ "Concatenate", "Copy", "StridedSlice" ],
1849*c217d954SCole Faust        "files": {
1850*c217d954SCole Faust          "common": [
1851*c217d954SCole Faust            "src/core/NEON/kernels/NEPadLayerKernel.cpp",
1852*c217d954SCole Faust            "src/runtime/NEON/functions/NEPadLayer.cpp"
1853*c217d954SCole Faust          ]
1854*c217d954SCole Faust        }
1855*c217d954SCole Faust      },
1856*c217d954SCole Faust      "Permute": {
1857*c217d954SCole Faust        "files": {
1858*c217d954SCole Faust          "common": [
1859*c217d954SCole Faust            "src/cpu/operators/CpuPermute.cpp",
1860*c217d954SCole Faust            "src/cpu/kernels/CpuPermuteKernel.cpp",
1861*c217d954SCole Faust            "src/runtime/NEON/functions/NEPermute.cpp"
1862*c217d954SCole Faust          ]
1863*c217d954SCole Faust        }
1864*c217d954SCole Faust      },
1865*c217d954SCole Faust      "Pool2d": {
1866*c217d954SCole Faust        "files": {
1867*c217d954SCole Faust          "common": [
1868*c217d954SCole Faust            "src/cpu/operators/CpuPool2d.cpp",
1869*c217d954SCole Faust            "src/cpu/kernels/CpuPool2dKernel.cpp",
1870*c217d954SCole Faust            "src/cpu/kernels/internal/CpuPool2dAssemblyWrapperKernel.cpp",
1871*c217d954SCole Faust            "src/runtime/NEON/functions/NEPoolingLayer.cpp"
1872*c217d954SCole Faust          ],
1873*c217d954SCole Faust          "neon": {
1874*c217d954SCole Faust            "common": [
1875*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/cpp_nhwc_1x1_stride_any_depthfirst/generic.cpp",
1876*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/pooling_fp16.cpp",
1877*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/pooling_fp32.cpp",
1878*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/pooling_s8.cpp",
1879*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/pooling_s8q.cpp",
1880*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/pooling_u8.cpp",
1881*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/pooling_u8q.cpp",
1882*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1883*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1884*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1885*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1886*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1887*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1888*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1889*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1890*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1891*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1892*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8_nhwc_max_generic_depthfirst/generic.cpp",
1893*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1894*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1895*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1896*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1897*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8_nhwc_max_generic_depthfirst/generic.cpp",
1898*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
1899*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/a64_u8q_nhwc_max_generic_depthfirst/generic.cpp"
1900*c217d954SCole Faust            ],
1901*c217d954SCole Faust            "nchw": [ "src/cpu/kernels/pool2d/neon/nchw/all.cpp" ],
1902*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/pool2d/neon/fp16.cpp" ],
1903*c217d954SCole Faust            "fp32": [ "src/cpu/kernels/pool2d/neon/fp32.cpp" ],
1904*c217d954SCole Faust            "qasymm8":[ "src/cpu/kernels/pool2d/neon/qasymm8.cpp" ],
1905*c217d954SCole Faust            "qasymm8_signed":["src/cpu/kernels/pool2d/neon/qasymm8_signed.cpp"]
1906*c217d954SCole Faust          },
1907*c217d954SCole Faust          "sve": {
1908*c217d954SCole Faust            "common": [
1909*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1910*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1911*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1912*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1913*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1914*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1915*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1916*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1917*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1918*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1919*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8_nhwc_max_generic_depthfirst/generic.cpp",
1920*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1921*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1922*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1923*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1924*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8_nhwc_max_generic_depthfirst/generic.cpp",
1925*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
1926*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sve_u8q_nhwc_max_generic_depthfirst/generic.cpp",
1927*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1928*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_avg_generic_depthfirst/generic.cpp",
1929*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1930*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp16_nhwc_max_generic_depthfirst/generic.cpp",
1931*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_3x3_s1_output2x2_depthfirst/generic.cpp",
1932*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_avg_generic_depthfirst/generic.cpp",
1933*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1934*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_fp32_nhwc_max_generic_depthfirst/generic.cpp",
1935*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_avg_generic_depthfirst/generic.cpp",
1936*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1937*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8_nhwc_max_generic_depthfirst/generic.cpp",
1938*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_avg_generic_depthfirst/generic.cpp",
1939*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_s8q_nhwc_max_generic_depthfirst/generic.cpp",
1940*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_avg_generic_depthfirst/generic.cpp",
1941*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_2x2_s1_output2x2_depthfirst/generic.cpp",
1942*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8_nhwc_max_generic_depthfirst/generic.cpp",
1943*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_avg_generic_depthfirst/generic.cpp",
1944*c217d954SCole Faust              "src/core/NEON/kernels/arm_conv/pooling/kernels/sme_u8q_nhwc_max_generic_depthfirst/generic.cpp"
1945*c217d954SCole Faust            ]
1946*c217d954SCole Faust          }
1947*c217d954SCole Faust        }
1948*c217d954SCole Faust      },
1949*c217d954SCole Faust      "Pool3d": {
1950*c217d954SCole Faust        "files": {
1951*c217d954SCole Faust          "common": [
1952*c217d954SCole Faust            "src/cpu/operators/CpuPool3d.cpp",
1953*c217d954SCole Faust            "src/cpu/kernels/CpuPool3dKernel.cpp",
1954*c217d954SCole Faust            "src/runtime/NEON/functions/NEPooling3dLayer.cpp"
1955*c217d954SCole Faust          ],
1956*c217d954SCole Faust          "neon": {
1957*c217d954SCole Faust            "common":         [ "src/cpu/kernels/pool3d/neon/impl.cpp" ],
1958*c217d954SCole Faust            "fp16":           [ "src/cpu/kernels/pool3d/neon/fp16.cpp" ],
1959*c217d954SCole Faust            "fp32":           [ "src/cpu/kernels/pool3d/neon/fp32.cpp" ],
1960*c217d954SCole Faust            "qasymm8":        [ "src/cpu/kernels/pool3d/neon/qasymm8.cpp" ],
1961*c217d954SCole Faust            "qasymm8_signed": [ "src/cpu/kernels/pool3d/neon/qasymm8_signed.cpp" ]
1962*c217d954SCole Faust          }
1963*c217d954SCole Faust        }
1964*c217d954SCole Faust      },
1965*c217d954SCole Faust      "PRelu": {
1966*c217d954SCole Faust        "deps": [ "ElementwiseBinary" ],
1967*c217d954SCole Faust        "files": {
1968*c217d954SCole Faust          "common": [
1969*c217d954SCole Faust            "src/runtime/NEON/functions/NEPReluLayer.cpp"
1970*c217d954SCole Faust          ]
1971*c217d954SCole Faust        }
1972*c217d954SCole Faust      },
1973*c217d954SCole Faust      "PriorBox": {
1974*c217d954SCole Faust        "files": {
1975*c217d954SCole Faust          "common": [
1976*c217d954SCole Faust            "src/core/NEON/kernels/NEPriorBoxLayerKernel.cpp",
1977*c217d954SCole Faust            "src/runtime/NEON/functions/NEPriorBoxLayer.cpp"
1978*c217d954SCole Faust          ]
1979*c217d954SCole Faust        }
1980*c217d954SCole Faust      },
1981*c217d954SCole Faust      "Quantize": {
1982*c217d954SCole Faust        "files": {
1983*c217d954SCole Faust          "common": [
1984*c217d954SCole Faust            "src/cpu/operators/CpuQuantize.cpp",
1985*c217d954SCole Faust            "src/cpu/kernels/CpuQuantizeKernel.cpp",
1986*c217d954SCole Faust            "src/runtime/NEON/functions/NEQuantizationLayer.cpp"
1987*c217d954SCole Faust          ]
1988*c217d954SCole Faust        }
1989*c217d954SCole Faust      },
1990*c217d954SCole Faust      "Range": {
1991*c217d954SCole Faust        "files": {
1992*c217d954SCole Faust          "common": [
1993*c217d954SCole Faust            "src/core/NEON/kernels/NERangeKernel.cpp",
1994*c217d954SCole Faust            "src/runtime/NEON/functions/NERange.cpp"
1995*c217d954SCole Faust          ],
1996*c217d954SCole Faust          "neon": {
1997*c217d954SCole Faust            "common":  [ "src/cpu/kernels/range/generic/neon/impl.cpp" ],
1998*c217d954SCole Faust            "fp32":    [ "src/cpu/kernels/range/generic/neon/fp32.cpp" ],
1999*c217d954SCole Faust            "fp16":    [ "src/cpu/kernels/range/generic/neon/fp16.cpp" ],
2000*c217d954SCole Faust            "integer": [ "src/cpu/kernels/range/generic/neon/integer.cpp"   ]
2001*c217d954SCole Faust          }
2002*c217d954SCole Faust        }
2003*c217d954SCole Faust      },
2004*c217d954SCole Faust      "Reduction":{
2005*c217d954SCole Faust        "deps": [ "Reshape" ],
2006*c217d954SCole Faust        "files": {
2007*c217d954SCole Faust          "common": [
2008*c217d954SCole Faust            "src/core/NEON/kernels/NEReductionOperationKernel.cpp",
2009*c217d954SCole Faust            "src/runtime/NEON/functions/NEReductionOperation.cpp"
2010*c217d954SCole Faust          ]
2011*c217d954SCole Faust        }
2012*c217d954SCole Faust      },
2013*c217d954SCole Faust      "Reorg": {
2014*c217d954SCole Faust        "files": {
2015*c217d954SCole Faust          "common": [
2016*c217d954SCole Faust            "src/core/NEON/kernels/NEReorgLayerKernel.cpp",
2017*c217d954SCole Faust            "src/runtime/NEON/functions/NEReorgLayer.cpp"
2018*c217d954SCole Faust          ]
2019*c217d954SCole Faust        }
2020*c217d954SCole Faust      },
2021*c217d954SCole Faust      "Reshape": {
2022*c217d954SCole Faust        "files": {
2023*c217d954SCole Faust          "common": [
2024*c217d954SCole Faust            "src/cpu/operators/CpuReshape.cpp",
2025*c217d954SCole Faust            "src/cpu/kernels/CpuReshapeKernel.cpp",
2026*c217d954SCole Faust            "src/runtime/NEON/functions/NEReshapeLayer.cpp"
2027*c217d954SCole Faust          ]
2028*c217d954SCole Faust        }
2029*c217d954SCole Faust      },
2030*c217d954SCole Faust      "Reverse": {
2031*c217d954SCole Faust        "files": {
2032*c217d954SCole Faust          "common": [
2033*c217d954SCole Faust            "src/core/NEON/kernels/NEReverseKernel.cpp",
2034*c217d954SCole Faust            "src/runtime/NEON/functions/NEReverse.cpp"
2035*c217d954SCole Faust          ]
2036*c217d954SCole Faust        }
2037*c217d954SCole Faust      },
2038*c217d954SCole Faust      "RNN": {
2039*c217d954SCole Faust        "deps": [ "Activation", "Add", "FullyConnected", "Gemm"],
2040*c217d954SCole Faust        "files": {
2041*c217d954SCole Faust          "common": [ "src/runtime/NEON/functions/NERNNLayer.cpp" ]
2042*c217d954SCole Faust        }
2043*c217d954SCole Faust      },
2044*c217d954SCole Faust      "ROIAlign": {
2045*c217d954SCole Faust        "files": {
2046*c217d954SCole Faust          "common": [
2047*c217d954SCole Faust            "src/core/NEON/kernels/NEROIAlignLayerKernel.cpp",
2048*c217d954SCole Faust            "src/runtime/NEON/functions/NEROIAlignLayer.cpp"
2049*c217d954SCole Faust          ],
2050*c217d954SCole Faust          "neon":{
2051*c217d954SCole Faust            "common":["src/cpu/kernels/roialign/generic/neon/impl.cpp"],
2052*c217d954SCole Faust            "fp32":["src/cpu/kernels/roialign/generic/neon/fp32.cpp"],
2053*c217d954SCole Faust            "fp16":["src/cpu/kernels/roialign/generic/neon/fp16.cpp"],
2054*c217d954SCole Faust            "qasymm8":["src/cpu/kernels/roialign/generic/neon/qasymm8.cpp"],
2055*c217d954SCole Faust            "qasymm8_signed":["src/cpu/kernels/roialign/generic/neon/qasymm8_signed.cpp"]
2056*c217d954SCole Faust          }
2057*c217d954SCole Faust        }
2058*c217d954SCole Faust      },
2059*c217d954SCole Faust      "ROIPool2d": {
2060*c217d954SCole Faust        "files": {
2061*c217d954SCole Faust          "common": [
2062*c217d954SCole Faust            "src/core/NEON/kernels/NEROIPoolingLayerKernel.cpp",
2063*c217d954SCole Faust            "src/runtime/NEON/functions/NEROIPoolingLayer.cpp"
2064*c217d954SCole Faust          ]
2065*c217d954SCole Faust        }
2066*c217d954SCole Faust      },
2067*c217d954SCole Faust      "Scale": {
2068*c217d954SCole Faust        "files": {
2069*c217d954SCole Faust          "common": [
2070*c217d954SCole Faust            "src/cpu/operators/CpuScale.cpp",
2071*c217d954SCole Faust            "src/cpu/kernels/CpuScaleKernel.cpp",
2072*c217d954SCole Faust            "src/runtime/NEON/functions/NEScale.cpp"
2073*c217d954SCole Faust          ],
2074*c217d954SCole Faust          "sve": {
2075*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/scale/sve/fp16.cpp" ],
2076*c217d954SCole Faust            "fp32": [ "src/cpu/kernels/scale/sve/fp32.cpp" ],
2077*c217d954SCole Faust            "integer": [ "src/cpu/kernels/scale/sve/integer.cpp" ],
2078*c217d954SCole Faust            "qasymm8": [ "src/cpu/kernels/scale/sve/qasymm8.cpp" ],
2079*c217d954SCole Faust            "qasymm8_signed": [ "src/cpu/kernels/scale/sve/qasymm8_signed.cpp" ]
2080*c217d954SCole Faust          },
2081*c217d954SCole Faust          "neon": {
2082*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/scale/neon/fp16.cpp" ],
2083*c217d954SCole Faust            "integer": [ "src/cpu/kernels/scale/neon/integer.cpp" ],
2084*c217d954SCole Faust            "qasymm8": [ "src/cpu/kernels/scale/neon/qasymm8.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ],
2085*c217d954SCole Faust            "qasymm8_signed": [ "src/cpu/kernels/scale/neon/qasymm8_signed.cpp", "src/cpu/kernels/scale/neon/integer.cpp" ]
2086*c217d954SCole Faust          }
2087*c217d954SCole Faust        }
2088*c217d954SCole Faust      },
2089*c217d954SCole Faust      "Select": {
2090*c217d954SCole Faust        "files": {
2091*c217d954SCole Faust          "common": [
2092*c217d954SCole Faust            "src/core/NEON/kernels/NESelectKernel.cpp",
2093*c217d954SCole Faust            "src/runtime/NEON/functions/NESelect.cpp"
2094*c217d954SCole Faust          ],
2095*c217d954SCole Faust          "neon": {
2096*c217d954SCole Faust            "common": [ "src/cpu/kernels/select/generic/neon/impl.cpp" ],
2097*c217d954SCole Faust            "fp32": [ "src/cpu/kernels/select/generic/neon/fp32.cpp" ],
2098*c217d954SCole Faust            "fp16": [ "src/cpu/kernels/select/generic/neon/fp16.cpp" ],
2099*c217d954SCole Faust            "integer": [ "src/cpu/kernels/select/generic/neon/integer.cpp"  ]
2100*c217d954SCole Faust          }
2101*c217d954SCole Faust        }
2102*c217d954SCole Faust      },
2103*c217d954SCole Faust      "Slice": {
2104*c217d954SCole Faust        "deps": [ "StridedSlice" ],
2105*c217d954SCole Faust        "files": {
2106*c217d954SCole Faust          "common": [ "src/runtime/NEON/functions/NESlice.cpp" ]
2107*c217d954SCole Faust        }
2108*c217d954SCole Faust      },
2109*c217d954SCole Faust      "Softmax": {
2110*c217d954SCole Faust        "deps": [
2111*c217d954SCole Faust          "Permute"
2112*c217d954SCole Faust        ],
2113*c217d954SCole Faust        "files": {
2114*c217d954SCole Faust          "common": [
2115*c217d954SCole Faust            "src/cpu/operators/CpuSoftmax.cpp",
2116*c217d954SCole Faust            "src/cpu/kernels/CpuSoftmaxKernel.cpp",
2117*c217d954SCole Faust            "src/runtime/NEON/functions/NESoftmaxLayer.cpp"
2118*c217d954SCole Faust          ],
2119*c217d954SCole Faust          "neon":{
2120*c217d954SCole Faust            "common":["src/cpu/kernels/softmax/generic/neon/impl.cpp"],
2121*c217d954SCole Faust            "fp32": ["src/cpu/kernels/softmax/generic/neon/fp32.cpp"],
2122*c217d954SCole Faust            "fp16": ["src/cpu/kernels/softmax/generic/neon/fp16.cpp"],
2123*c217d954SCole Faust            "qasymm8":[ "src/cpu/kernels/softmax/generic/neon/qasymm8.cpp"],
2124*c217d954SCole Faust            "qasymm8_signed":["src/cpu/kernels/softmax/generic/neon/qasymm8_signed.cpp"]
2125*c217d954SCole Faust          },
2126*c217d954SCole Faust          "sve": {
2127*c217d954SCole Faust            "common": [ "src/cpu/kernels/softmax/generic/sve/impl.cpp" ],
2128*c217d954SCole Faust            "fp32": ["src/cpu/kernels/softmax/generic/sve/fp32.cpp"],
2129*c217d954SCole Faust            "fp16": ["src/cpu/kernels/softmax/generic/sve/fp16.cpp"],
2130*c217d954SCole Faust            "qasymm8": ["src/cpu/kernels/softmax/generic/sve/qasymm8.cpp" ],
2131*c217d954SCole Faust            "qasymm8_signed": ["src/cpu/kernels/softmax/generic/sve/qasymm8_signed.cpp"]
2132*c217d954SCole Faust          },
2133*c217d954SCole Faust          "sve2":{
2134*c217d954SCole Faust            "common" :["src/cpu/kernels/softmax/generic/sve2/impl.cpp"],
2135*c217d954SCole Faust            "qasymm8":[ "src/cpu/kernels/softmax/generic/sve2/qasymm8.cpp"],
2136*c217d954SCole Faust            "qasymm8_signed":["src/cpu/kernels/softmax/generic/sve2/qasymm8_signed.cpp"]
2137*c217d954SCole Faust          }
2138*c217d954SCole Faust        }
2139*c217d954SCole Faust      },
2140*c217d954SCole Faust      "SpaceToBatch": {
2141*c217d954SCole Faust        "files": {
2142*c217d954SCole Faust          "common": [
2143*c217d954SCole Faust            "src/core/NEON/kernels/NESpaceToBatchLayerKernel.cpp",
2144*c217d954SCole Faust            "src/runtime/NEON/functions/NESpaceToBatchLayer.cpp"
2145*c217d954SCole Faust          ]
2146*c217d954SCole Faust        }
2147*c217d954SCole Faust      },
2148*c217d954SCole Faust      "SpaceToDepth": {
2149*c217d954SCole Faust        "files": {
2150*c217d954SCole Faust          "common": [
2151*c217d954SCole Faust            "src/core/NEON/kernels/NESpaceToDepthLayerKernel.cpp",
2152*c217d954SCole Faust            "src/runtime/NEON/functions/NESpaceToDepthLayer.cpp"
2153*c217d954SCole Faust          ]
2154*c217d954SCole Faust        }
2155*c217d954SCole Faust      },
2156*c217d954SCole Faust      "Split": {
2157*c217d954SCole Faust        "deps": [ "StridedSlice" ],
2158*c217d954SCole Faust        "files": {
2159*c217d954SCole Faust          "common": [
2160*c217d954SCole Faust            "src/runtime/NEON/functions/NESplit.cpp"
2161*c217d954SCole Faust          ]
2162*c217d954SCole Faust        }
2163*c217d954SCole Faust      },
2164*c217d954SCole Faust      "Stack": {
2165*c217d954SCole Faust        "files": {
2166*c217d954SCole Faust          "common": [
2167*c217d954SCole Faust            "src/core/NEON/kernels/NEStackLayerKernel.cpp",
2168*c217d954SCole Faust            "src/runtime/NEON/functions/NEStackLayer.cpp"
2169*c217d954SCole Faust          ]
2170*c217d954SCole Faust        }
2171*c217d954SCole Faust      },
2172*c217d954SCole Faust      "StridedSlice": {
2173*c217d954SCole Faust        "files": {
2174*c217d954SCole Faust          "common": [
2175*c217d954SCole Faust            "src/core/NEON/kernels/NEStridedSliceKernel.cpp",
2176*c217d954SCole Faust            "src/runtime/NEON/functions/NEStridedSlice.cpp"
2177*c217d954SCole Faust          ]
2178*c217d954SCole Faust        }
2179*c217d954SCole Faust      },
2180*c217d954SCole Faust      "Sub": {
2181*c217d954SCole Faust        "files": {
2182*c217d954SCole Faust          "common": [
2183*c217d954SCole Faust            "src/cpu/operators/CpuSub.cpp",
2184*c217d954SCole Faust            "src/cpu/kernels/CpuSubKernel.cpp",
2185*c217d954SCole Faust            "src/runtime/NEON/functions/NEArithmeticSubtraction.cpp",
2186*c217d954SCole Faust            "src/cpu/kernels/sub/neon/qasymm8.cpp",
2187*c217d954SCole Faust            "src/cpu/kernels/sub/neon/qasymm8_signed.cpp",
2188*c217d954SCole Faust            "src/cpu/kernels/sub/neon/qsymm16.cpp"
2189*c217d954SCole Faust          ]
2190*c217d954SCole Faust        }
2191*c217d954SCole Faust      },
2192*c217d954SCole Faust      "Tile": {
2193*c217d954SCole Faust        "files": {
2194*c217d954SCole Faust          "common": [
2195*c217d954SCole Faust            "src/core/NEON/kernels/NETileKernel.cpp",
2196*c217d954SCole Faust            "src/runtime/NEON/functions/NETile.cpp"
2197*c217d954SCole Faust          ]
2198*c217d954SCole Faust        }
2199*c217d954SCole Faust      },
2200*c217d954SCole Faust      "Transpose": {
2201*c217d954SCole Faust        "files": {
2202*c217d954SCole Faust          "common": [
2203*c217d954SCole Faust            "src/cpu/kernels/CpuTransposeKernel.cpp",
2204*c217d954SCole Faust            "src/cpu/operators/CpuTranspose.cpp",
2205*c217d954SCole Faust            "src/runtime/NEON/functions/NETranspose.cpp"
2206*c217d954SCole Faust          ]
2207*c217d954SCole Faust        }
2208*c217d954SCole Faust      },
2209*c217d954SCole Faust      "Unstack": {
2210*c217d954SCole Faust        "deps": [ "StridedSlice" ],
2211*c217d954SCole Faust        "files": {
2212*c217d954SCole Faust          "common": [ "src/runtime/NEON/functions/NEUnstack.cpp" ]
2213*c217d954SCole Faust        }
2214*c217d954SCole Faust      }
2215*c217d954SCole Faust    }
2216*c217d954SCole Faust  },
2217*c217d954SCole Faust  "experimental": {
2218*c217d954SCole Faust    "dynamic_fusion": [
2219*c217d954SCole Faust      "src/dynamic_fusion/runtime/gpu/cl/ClKernelRuntime.cpp",
2220*c217d954SCole Faust      "src/dynamic_fusion/runtime/gpu/cl/ClWorkloadRuntime.cpp",
2221*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/CastAttributes.cpp",
2222*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/ClampAttributes.cpp",
2223*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/Conv2dAttributes.cpp",
2224*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/DepthwiseConv2dAttributes.cpp",
2225*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/Pool2dAttributes.cpp",
2226*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/ResizeAttributes.cpp",
2227*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/SoftmaxAttributes.cpp",
2228*c217d954SCole Faust      "src/dynamic_fusion/sketch/attributes/ReshapeAttributes.cpp",
2229*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuKernelArgument.cpp",
2230*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGraph.cpp",
2231*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuKernelComponentGroup.cpp",
2232*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuKernelComponentStream.cpp",
2233*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuLogicalKernel.cpp",
2234*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuOperatorGroup.cpp",
2235*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuWorkloadContext.cpp",
2236*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/GpuWorkloadSketch.cpp",
2237*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentActivation.cpp",
2238*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentCast.cpp",
2239*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDepthwiseConv2d.cpp",
2240*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentDirectConv2d.cpp",
2241*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentPool2d.cpp",
2242*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentElementwiseBinary.cpp",
2243*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DMaxShiftExpSum.cpp",
2244*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentLogits1DNorm.cpp",
2245*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentReshape.cpp",
2246*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentResize.cpp",
2247*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/components/cl/ClComponentStore.cpp",
2248*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuAdd.cpp",
2249*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuCast.cpp",
2250*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuClamp.cpp",
2251*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuConv2d.cpp",
2252*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuDepthwiseConv2d.cpp",
2253*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuMul.cpp",
2254*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuReshape.cpp",
2255*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuPool2d.cpp",
2256*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuOutput.cpp",
2257*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuResize.cpp",
2258*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuSoftmax.cpp",
2259*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/GpuSub.cpp",
2260*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/operators/internal/GpuElementwiseBinaryCommon.cpp",
2261*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateActivation.cpp",
2262*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateCast.cpp",
2263*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDepthwiseConv2d.cpp",
2264*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp",
2265*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplatePool2d.cpp",
2266*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateElementwiseBinary.cpp",
2267*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DMaxShiftExpSum.cpp",
2268*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateLogits1DNorm.cpp",
2269*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateReshape.cpp",
2270*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateResize.cpp",
2271*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateStore.cpp",
2272*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateWriter.cpp",
2273*c217d954SCole Faust      "src/dynamic_fusion/sketch/gpu/template_writer/GpuKernelVariableTable.cpp"
2274*c217d954SCole Faust    ]
2275*c217d954SCole Faust  }
2276*c217d954SCole Faust}
2277