Home
last modified time | relevance | path

Searched refs:GetNumThreadsPerBlock (Results 1 – 2 of 2) sorted by relevance

/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/
H A Dkernel_mapping_scheme.h111 int64_t GetNumThreadsPerBlock() const { in GetNumThreadsPerBlock() function
127 return GetNumThreadsPerBlock() * thread_id_virtual_scaling_; in GetNumThreadsPerBlockPhysical()
H A Dir_emitter_unnested.cc3632 CHECK_EQ(tiling_scheme.GetNumThreadsPerBlock() % WarpSize(), 0); in GenerateReductionCodegenState()
3633 int num_warps = tiling_scheme.GetNumThreadsPerBlock() / WarpSize(); in GenerateReductionCodegenState()
3951 if (tiling_scheme.GetNumThreadsPerBlock() > WarpSize()) { in EmitReductionOutputForRowReduction()
3954 tiling_scheme.GetNumThreadsPerBlock()); in EmitReductionOutputForRowReduction()
4023 tiling_scheme.GetNumThreadsPerBlock()); in EmitReductionOutputForColumnReduction()
4084 thread_id_physical, constant(tiling_scheme.GetNumThreadsPerBlock())); in EmitThreadIdInfo()
4086 thread_id_physical, constant(tiling_scheme.GetNumThreadsPerBlock())); in EmitThreadIdInfo()