Home
last modified time | relevance | path

Searched refs:cuda_compute_capability (Results 1 – 25 of 35) sorted by relevance

12

/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/tests/
H A Dhlo_to_llvm_ir.cc67 tensorflow::se::CudaComputeCapability cuda_compute_capability; in CompileAndPrintLlvmIr() local
68 cuda_compute_capability.major = sm / 10; in CompileAndPrintLlvmIr()
69 cuda_compute_capability.minor = sm % 10; in CompileAndPrintLlvmIr()
83 cuda_compute_capability, rocm_compute_capability, in CompileAndPrintLlvmIr()
93 llvm_module.get(), cuda_compute_capability, in CompileAndPrintLlvmIr()
H A Dgpu_atomic_test.cc119 .cuda_compute_capability() in TEST_F()
H A Dmlir_gpu_test_base.cc62 stream_exec->GetDeviceDescription().cuda_compute_capability(), in CompileMlirModule()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/
H A Dnvptx_compiler.cc85 stream_exec->GetDeviceDescription().cuda_compute_capability()); in OptimizeHloConvolutionCanonicalization()
87 stream_exec->GetDeviceDescription().cuda_compute_capability()); in OptimizeHloConvolutionCanonicalization()
126 if (stream_exec->GetDeviceDescription().cuda_compute_capability().IsAtLeast( in OptimizeHloPostLayoutAssignment()
131 if (stream_exec->GetDeviceDescription().cuda_compute_capability().IsAtLeast( in OptimizeHloPostLayoutAssignment()
153 if (!stream_exec->GetDeviceDescription().cuda_compute_capability().IsAtLeast( in OptimizeHloPostLayoutAssignment()
324 return stream_exec->GetDeviceDescription().cuda_compute_capability(); in GetGpuVersion()
H A Dir_emitter_context.h42 se::CudaComputeCapability cuda_compute_capability, in IrEmitterContext() argument
49 cuda_compute_capability_(cuda_compute_capability), in IrEmitterContext()
64 se::CudaComputeCapability cuda_compute_capability() const { in cuda_compute_capability() function
H A Dgpu_compiler.cc263 .cuda_compute_capability() in IsConvBF16Supported()
406 .cuda_compute_capability() in OptimizeHloModule()
755 stream_exec->GetDeviceDescription().cuda_compute_capability()); in OptimizeHloPostLayoutAssignment()
899 options.cuda_compute_capability = in LowerToJitRt()
900 stream_exec->GetDeviceDescription().cuda_compute_capability(); in LowerToJitRt()
970 se::CudaComputeCapability cuda_compute_capability, in CompileModuleToLlvmIrImpl() argument
1001 absl::StrCat("sm_", cuda_compute_capability.ToString(), in CompileModuleToLlvmIrImpl()
1037 gpu_device_info, cuda_compute_capability, rocm_compute_capability, in CompileModuleToLlvmIrImpl()
1361 stream_exec->GetDeviceDescription().cuda_compute_capability(), in RunBackend()
1457 stream_exec->GetDeviceDescription().cuda_compute_capability(), in CompileAheadOfTime()
[all …]
H A Dtree_reduction_rewriter.h79 se::CudaComputeCapability cuda_compute_capability) in GpuTreeReductionRewriter() argument
80 : cuda_compute_capability_(cuda_compute_capability) {} in GpuTreeReductionRewriter()
H A Dtree_reduction_rewriter.cc49 se::CudaComputeCapability cuda_compute_capability) in ReductionRewriterVisitor() argument
50 : cuda_compute_capability_(cuda_compute_capability) {} in ReductionRewriterVisitor()
H A Dir_emission_utils.h101 se::CudaComputeCapability cuda_compute_capability);
H A Dgpu_compiler.h178 se::CudaComputeCapability cuda_compute_capability,
/aosp_15_r20/external/tensorflow/tensorflow/tools/tensorflow_builder/config_detector/
H A DBUILD20 ":cuda_compute_capability",
28 name = "cuda_compute_capability",
29 srcs = ["data/cuda_compute_capability.py"],
H A Dconfig_detector.py71 from tensorflow.tools.tensorflow_builder.config_detector.data import cuda_compute_capability
249 gpu_dict = cuda_compute_capability.retrieve_from_golden()
388 cuda_compute_capa = cuda_compute_capability.retrieve_from_web()
390 cuda_compute_capa = cuda_compute_capability.retrieve_from_golden()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/tfrt/transforms/lmhlo_to_gpu/
H A Dlmhlo_to_gpu_binary.h45 options.cuda_compute_capability = {5, 2}; in DefaultGpuBinaryOptions()
53 stream_executor::CudaComputeCapability cuda_compute_capability; member
H A Dkernel_ops_pattern.cc235 gpu_options.cuda_compute_capability, gpu_options.rocm_compute_capability, in Emit()
319 gpu_options.cuda_compute_capability, in Match()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/stream_executor/
H A Ddevice_description.cc92 result["CUDA Compute Capability"] = cuda_compute_capability().ToString(); in ToMap()
109 CudaComputeCapability DeviceDescription::cuda_compute_capability() const { in cuda_compute_capability() function in stream_executor::DeviceDescription
H A Dstream_executor_pimpl.cc283 GetDeviceDescription().cuda_compute_capability(), out_algorithms); in GetConvolveAlgorithms()
286 GetDeviceDescription().cuda_compute_capability(), out_algorithms); in GetConvolveAlgorithms()
289 GetDeviceDescription().cuda_compute_capability(), out_algorithms); in GetConvolveAlgorithms()
H A Ddnn.cc111 CudaComputeCapability cuda_compute_capability, in GetConvolveAlgorithms() argument
192 CudaComputeCapability cuda_compute_capability, in GetConvolveBackwardDataAlgorithms() argument
198 CudaComputeCapability cuda_compute_capability, in GetConvolveBackwardFilterAlgorithms() argument
H A Ddevice_description.h271 CudaComputeCapability cuda_compute_capability() const;
H A Ddnn.h1386 CudaComputeCapability cuda_compute_capability,
1497 CudaComputeCapability cuda_compute_capability,
1503 CudaComputeCapability cuda_compute_capability,
/aosp_15_r20/external/tensorflow/tensorflow/core/common_runtime/gpu/
H A Dgpu_device.cc1102 se->GetDeviceDescription().cuda_compute_capability(); in SingleVirtualDeviceMemoryLimit()
1263 (*details)["compute_capability"] = desc->cuda_compute_capability().ToString(); in GetDeviceDetails()
1550 ", compute capability: ", desc.cuda_compute_capability().ToString()); in GetShortDeviceDescription()
1905 << description->cuda_compute_capability().ToString() in GetValidDeviceIds()
1975 if (desc->cuda_compute_capability() < min_supported_capability) { in GetValidDeviceIds()
1980 << desc->cuda_compute_capability().ToString() in GetValidDeviceIds()
2020 auto device_capability = desc->cuda_compute_capability(); in GetValidDeviceIds()
/aosp_15_r20/external/tensorflow/tensorflow/core/grappler/
H A Ddevices.cc53 (*desc)->cuda_compute_capability().IsAtLeast( in GetNumAvailableGPUs()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/stream_executor/cuda/
H A Dcuda_dnn.h217 CudaComputeCapability cuda_compute_capability,
272 CudaComputeCapability cuda_compute_capability,
276 CudaComputeCapability cuda_compute_capability,
H A Dcuda_dnn.cc912 CudaComputeCapability cuda_compute_capability) { in TensorOpMathAvailable() argument
913 return cuda_compute_capability.IsAtLeast(7); in TensorOpMathAvailable()
4750 auto cuda_compute_capability = stream->GetCudaComputeCapability(); in GetConvolveRunners() local
4758 got_algos = GetConvolveAlgorithms(cuda_compute_capability, &algorithms); in GetConvolveRunners()
4761 got_algos = GetConvolveBackwardFilterAlgorithms(cuda_compute_capability, in GetConvolveRunners()
4765 got_algos = GetConvolveBackwardDataAlgorithms(cuda_compute_capability, in GetConvolveRunners()
5219 auto cuda_compute_capability = stream->GetCudaComputeCapability(); in GetFusedConvolveRunners() local
5220 if (!GetConvolveAlgorithms(cuda_compute_capability, &algorithms)) { in GetFusedConvolveRunners()
5275 CudaComputeCapability cuda_compute_capability, in GetConvolveAlgorithms() argument
5280 TensorOpMathAvailable(cuda_compute_capability); in GetConvolveAlgorithms()
[all …]
/aosp_15_r20/external/tensorflow/tensorflow/stream_executor/rocm/
H A Drocm_dnn.h237 CudaComputeCapability cuda_compute_capability,
276 CudaComputeCapability cuda_compute_capability,
280 CudaComputeCapability cuda_compute_capability,
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/
H A Dplatform_util.cc131 se::CudaComputeCapability cc = description.cuda_compute_capability(); in IsDeviceSupported()

12