/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/ |
H A D | all_reduce_blueconnect_test.cc | 73 auto reduce_scatter = AllOf(op::Shape("f32[4]"), op::ReduceScatter(bitcast), in TEST_F() local 159 auto reduce_scatter = AllOf(op::Shape("(f32[4], f32[8])"), in TEST_F() local
|
H A D | all_reduce_blueconnect.cc | 225 HloInstruction* reduce_scatter = in TryDecomposeAllReduce() local
|
/aosp_15_r20/external/tensorflow/tensorflow/dtensor/mlir/ |
H A D | dtensor_allreduce_scatter_optimization.cc | 138 auto reduce_scatter = builder.create<mlir::TF::DTensorReduceScatterOp>( in ApplyOptimization() local
|
/aosp_15_r20/external/pytorch/torch/cuda/ |
H A D | nccl.py | 142 def reduce_scatter( function
|
/aosp_15_r20/external/pytorch/test/cpp_extensions/ |
H A D | cpp_c10d_extension.cpp | 83 c10::intrusive_ptr<Work> ProcessGroupTest::reduce_scatter( in reduce_scatter() function in c10d::ProcessGroupTest
|
/aosp_15_r20/external/pytorch/torch/csrc/distributed/c10d/ |
H A D | PyProcessGroup.hpp | 155 c10::intrusive_ptr<Work> reduce_scatter( in reduce_scatter() function in c10d::PyProcessGroup
|
H A D | FakeProcessGroup.hpp | 120 c10::intrusive_ptr<Work> reduce_scatter( in reduce_scatter() function in c10d::FakeProcessGroup
|
H A D | Backend.hpp | 201 virtual c10::intrusive_ptr<Work> reduce_scatter( in reduce_scatter() function in c10d::Backend
|
H A D | ProcessGroup.hpp | 349 virtual c10::intrusive_ptr<Work> reduce_scatter( in reduce_scatter() function in c10d::ProcessGroup
|
H A D | ProcessGroupWrapper.cpp | 480 c10::intrusive_ptr<Work> ProcessGroupWrapper::reduce_scatter( in reduce_scatter() function in c10d::ProcessGroupWrapper
|
H A D | ProcessGroupMPI.cpp | 689 c10::intrusive_ptr<Work> ProcessGroupMPI::reduce_scatter( in reduce_scatter() function in c10d::ProcessGroupMPI
|
H A D | ProcessGroupUCC.cpp | 1378 c10::intrusive_ptr<Work> ProcessGroupUCC::reduce_scatter( in reduce_scatter() function in c10d::ProcessGroupUCC
|
H A D | ProcessGroupNCCL.cpp | 3857 c10::intrusive_ptr<Work> ProcessGroupNCCL::reduce_scatter( in checkForNCCLErrorsInternal() function in c10d::ProcessGroupNCCL
|
H A D | ProcessGroupGloo.cpp | 2602 c10::intrusive_ptr<Work> ProcessGroupGloo::reduce_scatter( in reduce_scatter() function in c10d::ProcessGroupGloo
|
/aosp_15_r20/external/pytorch/test/distributed/tensor/parallel/ |
H A D | test_tp_examples.py | 47 reduce_scatter, all_gather, all_reduce = ( variable
|
/aosp_15_r20/external/pytorch/torch/distributed/checkpoint/ |
H A D | utils.py | 147 def reduce_scatter( member in _DistWrapper
|
/aosp_15_r20/external/pytorch/test/inductor/ |
H A D | test_distributed_patterns.py | 24 def reduce_scatter(t): function
|
/aosp_15_r20/external/pytorch/test/distributed/ |
H A D | test_c10d_ops_nccl.py | 739 def reduce_scatter(outputs, input_lists, op): function
|
H A D | test_c10d_common.py | 1601 def reduce_scatter(self, output_tensor_list, input_tensor_lists, opts=None): member in DummyProcessGroup
|
/aosp_15_r20/external/pytorch/torch/distributed/nn/ |
H A D | functional.py | 88 def reduce_scatter(output, input_list, op=ReduceOp.SUM, group=group.WORLD): function
|
/aosp_15_r20/external/pytorch/torch/testing/_internal/distributed/ |
H A D | multi_threaded_pg.py | 379 def reduce_scatter(self, output_tensor, scatter_list, opts=ReduceScatterOptions()): member in ProcessLocalGroup
|
/aosp_15_r20/external/tensorflow/tensorflow/dtensor/mlir/utils/ |
H A D | collective_lowering.cc | 325 mlir::TF::DTensorReduceScatterOp reduce_scatter) { in LowerReduceScatterOp()
|
/aosp_15_r20/external/pytorch/torch/csrc/cuda/ |
H A D | nccl.cpp | 718 void reduce_scatter( in reduce_scatter() function
|
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/xla/ |
H A D | hlo_function_importer.cc | 1186 auto reduce_scatter = Cast<HloReduceScatterInstruction>(instruction); in ImportInstructionImpl() local
|
/aosp_15_r20/external/pytorch/torch/distributed/ |
H A D | distributed_c10d.py | 3727 def reduce_scatter(output, input_list, op=ReduceOp.SUM, group=None, async_op=False): function
|