Home
last modified time | relevance | path

Searched refs:GPUModuleOp (Results 1 – 15 of 15) sorted by relevance

/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/mlir_hlo/lib/Transforms/
H A Dhlo_to_gpu_pipeline.cc37 using ::mlir::gpu::GPUModuleOp;
65 pm.addNestedPass<GPUModuleOp>(createForLoopSpecializationPass()); in createHloToGpuPipeline()
66 pm.addNestedPass<GPUModuleOp>(createLowerAffinePass()); in createHloToGpuPipeline()
67 pm.addNestedPass<GPUModuleOp>(createCanonicalizerPass()); in createHloToGpuPipeline()
68 pm.addNestedPass<GPUModuleOp>(createConvertSCFToCFPass()); in createHloToGpuPipeline()
71 pm.addNestedPass<GPUModuleOp>(createGpuKernelToRocdlPass()); in createHloToGpuPipeline()
73 pm.addNestedPass<GPUModuleOp>(createGpuKernelToNvvmPass()); in createHloToGpuPipeline()
78 pm.addNestedPass<GPUModuleOp>(createStripDebugInfoPass()); in createHloToGpuPipeline()
H A Dgpu_kernel_lowering_passes.cc91 std::unique_ptr<OperationPass<gpu::GPUModuleOp> >
96 std::unique_ptr<OperationPass<gpu::GPUModuleOp> >
H A Dpropagate_static_shapes_to_kernel.cc223 auto callback = [&](gpu::GPUModuleOp gpuModule) -> WalkResult { in runOnOperation()
H A Dgpu_fusion_rewrite.cc246 for (auto gpuModuleOp : moduleOp.getBodyRegion().getOps<gpu::GPUModuleOp>()) { in matchAndRewrite()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/mlir_hlo/include/mlir-hlo/Transforms/
H A Dgpu_passes.h27 class GPUModuleOp; variable
40 std::unique_ptr<OperationPass<mlir::gpu::GPUModuleOp>>
44 std::unique_ptr<OperationPass<mlir::gpu::GPUModuleOp>>
H A Dgpu_passes.td26 def GpuKernelToNVVMPass : Pass<"gpu-kernel-to-nvvm", "gpu::GPUModuleOp"> {
32 def GpuKernelToROCDLPass : Pass<"gpu-kernel-to-rocdl", "gpu::GPUModuleOp"> {
H A DGPUPassDetail.h27 class GPUModuleOp; variable
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/tools/kernel_gen/transforms/
H A Dtf_kernel_to_llvm_pass.cc165 auto kernel_module = SymbolTable::lookupNearestSymbolFrom<gpu::GPUModuleOp>( in matchAndRewrite()
289 target.addLegalOp<ModuleOp, gpu::GPUModuleOp>(); in runOnOperation()
291 target.markOpRecursivelyLegal<gpu::GPUModuleOp>(); in runOnOperation()
300 for (auto op : llvm::make_early_inc_range(m.getOps<gpu::GPUModuleOp>())) { in runOnOperation()
H A Dgpu_kernel_to_blob_pass.cc62 gpu::GPUModuleOp gpu_module = getOperation(); in runOnOperation()
77 gpu::GPUModuleOp gpu_module) { in GetGpuBinaryBlob()
259 std::unique_ptr<OperationPass<gpu::GPUModuleOp>> CreateGpuKernelToBlobPass( in CreateGpuKernelToBlobPass()
H A Dpasses.h70 std::unique_ptr<OperationPass<gpu::GPUModuleOp>> CreateGpuKernelToBlobPass(
H A Dpasses.td80 def GpuKernelToBlobPass : Pass<"gpu-kernel-to-blob", "gpu::GPUModuleOp"> {
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/tools/kernel_gen/
H A Dkernel_creator.cc317 auto gpu_modules = module.getOps<::mlir::gpu::GPUModuleOp>(); in LowerKernelBodiesToLowLevelIr()
318 for (::mlir::gpu::GPUModuleOp gpu_module : gpu_modules) { in LowerKernelBodiesToLowLevelIr()
334 auto& kernelPm = pm.nest<::mlir::gpu::GPUModuleOp>(); in LowerKernelBodiesToLowLevelIr()
378 auto& kernel_pm = pm.nest<mlir::gpu::GPUModuleOp>(); in GenerateDeviceCode()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/tfrt/transforms/lmhlo_to_gpu/
H A Dlmhlo_to_jitrt.cc82 using mlir::gpu::GPUModuleOp;
154 class GpuModuleOpLowering : public OpRewritePattern<GPUModuleOp> {
158 LogicalResult matchAndRewrite(GPUModuleOp op, in matchAndRewrite()
373 auto gpu_module = kernel->getParentOfType<mlir::gpu::GPUModuleOp>(); in matchAndRewrite()
H A Dkernel_ops_pattern.cc341 auto gpu_module = rewriter.create<mlir::gpu::GPUModuleOp>(loc, "gpu_module"); in Rewrite()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/
H A Dir_emitter_unnested.cc1600 auto gpu_module = kernel_func->getParentOfType<mlir::gpu::GPUModuleOp>(); in EmitLaunchFunc()