Home
last modified time | relevance | path

Searched refs:threadsPerThreadgroup (Results 1 – 25 of 28) sorted by relevance

12

/aosp_15_r20/external/pytorch/aten/src/ATen/native/metal/mpscnn/
H A DMPSImageUtils.mm60 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
83 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
145 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
165 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
197 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
229 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMPSCNNUtils.mm22 const auto threadsPerThreadgroup = MTLSizeMake(
27 divRoundUp(width, threadsPerThreadgroup.width),
28 divRoundUp(height, threadsPerThreadgroup.height),
32 return {threadsPerThreadgroup, threadgroupsPerGrid, threadsPerGrid};
H A DMPSCNNClampOp.mm41 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMPSCNNUtils.h26 MTLSize threadsPerThreadgroup; member
/aosp_15_r20/external/skia/src/gpu/graphite/mtl/
H A DMtlComputeCommandEncoder.h106 MTLSize threadsPerThreadgroup = in dispatchThreadgroups() local
109 threadsPerThreadgroup:threadsPerThreadgroup]; in dispatchThreadgroups()
115 MTLSize threadsPerThreadgroup = in dispatchThreadgroupsWithIndirectBuffer() local
119 threadsPerThreadgroup:threadsPerThreadgroup]; in dispatchThreadgroupsWithIndirectBuffer()
/aosp_15_r20/external/angle/src/libANGLE/renderer/metal/
H A DProvokingVertexHelper.mm220 auto threadsPerThreadgroup = MTLSizeMake(MIN(primCount, 64u), 1, 1);
231 MTLSizeMake((primCount + threadsPerThreadgroup.width - 1) / threadsPerThreadgroup.width, 1,
233 threadsPerThreadgroup);
270 auto threadsPerThreadgroup = MTLSizeMake(MIN(primCount, 64u), 1, 1);
280 MTLSizeMake((primCount + threadsPerThreadgroup.width - 1) / threadsPerThreadgroup.width, 1,
282 threadsPerThreadgroup);
H A Dmtl_render_utils.mm588 const MTLSize &threadsPerThreadgroup)
592 encoder->dispatchNonUniform(numThreads, threadsPerThreadgroup);
597 (numThreads.width + threadsPerThreadgroup.width - 1) / threadsPerThreadgroup.width,
598 (numThreads.height + threadsPerThreadgroup.height - 1) / threadsPerThreadgroup.height,
599 (numThreads.depth + threadsPerThreadgroup.depth - 1) / threadsPerThreadgroup.depth);
600 encoder->dispatch(groups, threadsPerThreadgroup);
611 MTLSize threadsPerThreadgroup = MTLSizeMake(w, 1, 1);
616 cmdEncoder->dispatchNonUniform(threads, threadsPerThreadgroup);
621 cmdEncoder->dispatch(groups, threadsPerThreadgroup);
1755 MTLSize threadsPerThreadgroup = MTLSizeMake(w, 1, 1);
[all …]
/aosp_15_r20/external/pytorch/aten/src/ATen/native/metal/ops/
H A DMetalConcat.mm46 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
122 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
155 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalLeakyReLU.mm42 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
77 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalHardshrink.mm44 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
79 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalHardswish.mm40 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
73 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalCopy.mm45 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalBinaryElementwise.mm93 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
131 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalPadding.mm80 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalChunk.mm53 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalTranspose.mm81 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
H A DMetalReshape.mm57 threadsPerThreadgroup:launchParams.threadsPerThreadgroup];
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/metal/
H A Dcompute_task.cc289 threadsPerThreadgroup:groupsSize]; in EncodeToICB()
325 [encoder dispatchThreadgroups:groupsCount threadsPerThreadgroup:groupsSize]; in Encode()
H A Dbuffer_convert.mm120 [encoder dispatchThreadgroups:groups_count threadsPerThreadgroup:group_size];
/aosp_15_r20/external/pytorch/aten/src/ATen/native/mps/operations/
H A DMultiTensorApply.h299 … [computeEncoder dispatchThreadgroups:gridSize threadsPerThreadgroup:threadGroupSize];
334 [computeEncoder dispatchThreadgroups:gridSize threadsPerThreadgroup:threadGroupSize];
H A DQuantized.mm750 …[computeEncoder dispatchThreads:MTLSizeMake(N, Kdiv2 / 4, 1) threadsPerThreadgroup:MTLSizeMake(64,…
809 …[computeEncoder dispatchThreads:MTLSizeMake(N / 4 * 32, 1, M) threadsPerThreadgroup:MTLSizeMake(64…
867 threadsPerThreadgroup:MTLSizeMake(64, 1, 1)];
871 threadsPerThreadgroup:MTLSizeMake(128, 1, 1)];
/aosp_15_r20/external/pytorch/test/cpp_extensions/
H A Dmps_extension.mm66 [computeEncoder dispatchThreads: gridSize threadsPerThreadgroup: threadGroupSize];
/aosp_15_r20/external/pytorch/aten/src/ATen/test/
H A Dmps_test_objc_interface.mm76 [computeEncoder dispatchThreads: gridSize threadsPerThreadgroup: threadGroupSize];
/aosp_15_r20/external/tensorflow/tensorflow/lite/delegates/gpu/
H A Dmetal_delegate.mm133 threadsPerThreadgroup:MTLSizeMake(1, 1, 1)];
555 threadsPerThreadgroup:MTLSizeMake(1, 1, 1)];
/aosp_15_r20/external/pytorch/aten/src/ATen/native/mps/
H A DOperationUtils.h397 [encoder dispatchThreads:size threadsPerThreadgroup:threadGroupSize]; in mtl_dispatch1DJob()

12