Home
last modified time | relevance | path

Searched refs:shared_memory_per_block (Results 1 – 12 of 12) sorted by relevance

/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/
H A Dgpu_device_info.cc27 gpu_device_info.shared_memory_per_block = in GetGpuDeviceInfo()
28 stream_exec->GetDeviceDescription().shared_memory_per_block(); in GetGpuDeviceInfo()
H A Dbuffer_comparator.cc662 gpu_device_info.shared_memory_per_block = in DeviceCompare()
663 executor->GetDeviceDescription().shared_memory_per_block(); in DeviceCompare()
H A Dgpu_device_info.h30 int shared_memory_per_block; member
H A Dir_emitter_unnested.cc2668 ir_emitter_context_->gpu_device_info().shared_memory_per_block; in EmitSort()
2677 ir_emitter_context_->gpu_device_info().shared_memory_per_block); in EmitSort()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/stream_executor/cuda/
H A Dcuda_gpu_executor.cc525 uint64_t shared_memory_per_block, in CalculateOccupancy() argument
532 shared_memory_per_block, 0); in CalculateOccupancy()
542 uint64_t shared_memory_per_block, in CompareOccupancy() argument
549 shared_memory_per_block, 0); in CompareOccupancy()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/stream_executor/gpu/
H A Dgpu_executor.h130 uint64_t shared_memory_per_block,
137 uint64_t shared_memory_per_block,
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/tfrt/transforms/lmhlo_to_gpu/
H A Dlmhlo_to_gpu_binary.h34 options.gpu_device_info.shared_memory_per_block = in DefaultGpuBinaryOptions()
/aosp_15_r20/external/tensorflow/tensorflow/core/kernels/
H A Dtensor_to_hash_bucket_op_gpu.cu.cc96 stream->parent()->GetDeviceDescription().shared_memory_per_block(); in operator ()()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/tests/
H A Dhlo_to_llvm_ir.cc60 gpu_device_info.shared_memory_per_block = 49152; in CompileAndPrintLlvmIr()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/stream_executor/tpu/
H A Dc_api_decl.h144 int64_t shared_memory_per_block; member
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/stream_executor/
H A Ddevice_description.h285 int64_t shared_memory_per_block() const { return shared_memory_per_block_; } in shared_memory_per_block() function
/aosp_15_r20/external/tensorflow/tensorflow/stream_executor/rocm/
H A Drocm_gpu_executor.cc352 uint64_t shared_memory_per_block, in CalculateOccupancy() argument
362 uint64_t shared_memory_per_block, in CompareOccupancy() argument