Home
last modified time | relevance | path

Searched defs:all_reduce (Results 1 – 25 of 36) sorted by relevance

12

/aosp_15_r20/external/tensorflow/tensorflow/dtensor/mlir/
H A Ddtensor_allreduce_combine_optimization.cc197 mlir::TF::DTensorAllReduceOp& all_reduce = all_reduce_group[i]; in MergeAllReduceGroup() local
234 mlir::TF::DTensorAllReduceOp& all_reduce = all_reduce_group[i]; in MergeAllReduceGroup() local
257 mlir::TF::DTensorAllReduceOp& all_reduce = all_reduce_group[i]; in MergeAllReduceGroup() local
358 for (mlir::TF::DTensorAllReduceOp all_reduce : all_reduces) { in CombineAllReduceOpsOfSameTypeAndGroupAssignment() local
472 mlir::TF::DTensorAllReduceOp all_reduce = all_reduce_group[i]; in CombineAllReduceOpsOfSameTypeAndGroupAssignment() local
476 mlir::TF::DTensorAllReduceOp all_reduce = all_reduce_group[i]; in CombineAllReduceOpsOfSameTypeAndGroupAssignment() local
518 for (mlir::TF::DTensorAllReduceOp all_reduce : all_reduces) { in CombineAllReduceOpsOfSameType() local
554 cluster.GetBody().walk([&](mlir::TF::DTensorAllReduceOp all_reduce) { in runOnOperation()
H A Ddtensor_allreduce_sum_optimization.cc154 mlir::TF::DTensorAllReduceOp all_reduce = in OptimizeAllReduceAndSum() local
290 mlir::TF::DTensorAllReduceOp all_reduce = in CheckWhileLoopOptimizationCriteria() local
367 const int output_index, mlir::TF::DTensorAllReduceOp all_reduce, in ExtractAllReduceFromWhileOp()
427 mlir::TF::DTensorAllReduceOp all_reduce; in OptimizeWhileLoopLazyAllReduce() local
H A Ddtensor_allreduce_scatter_optimization.cc79 function.walk([&](mlir::TF::DTensorAllReduceOp all_reduce) { in ApplyOptimization()
H A Dcollectives.cc322 auto all_reduce = builder.create<mlir::TF::DTensorAllReduceOp>( in EmitAllReduce() local
/aosp_15_r20/external/tensorflow/tensorflow/dtensor/mlir/utils/
H A Dcollective_lowering.cc91 mlir::TF::DTensorAllReduceOp all_reduce, in EmitAllReduceForXla()
205 mlir::TF::DTensorAllReduceOp all_reduce, mlir::Value* value) { in LowerAllReduceOpImpl()
310 mlir::TF::DTensorAllReduceOp all_reduce) { in LowerAllReduceOp()
616 mlir::TF::DTensorAllReduceOp all_reduce = in LowerAllGatherOp() local
738 module.walk([&](mlir::TF::DTensorAllReduceOp all_reduce) { in runOnOperation()
743 for (auto& all_reduce : all_reduces) in runOnOperation() local
760 module.walk([&](mlir::TF::DTensorReduceScatterOp all_reduce) { in runOnOperation()
765 for (auto& all_reduce : all_reduces) in runOnOperation() local
/aosp_15_r20/external/tensorflow/tensorflow/python/kernel_tests/
H A Dcollective_ops_test.py47 def all_reduce(t, group_size, group_key, instance_key, *args, **kwargs): member in CollectiveOpsV1
65 def all_reduce(t, group_size, group_key, instance_key, *args, **kwargs): member in CollectiveOpsV2
571 def all_reduce(device): function
607 def all_reduce(device): function
644 def all_reduce(device, device_index): function
682 def all_reduce(device, device_index): function
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/gpu/
H A Dall_reduce_blueconnect_test.cc75 auto all_reduce = AllOf(op::Shape("f32[4]"), op::AllReduce(reduce_scatter), in TEST_F() local
117 auto all_reduce = AllOf(op::Shape("f32[2]"), op::AllReduce(reduce_scatter1), in TEST_F() local
162 auto all_reduce = AllOf(op::Shape("(f32[4], f32[8])"), in TEST_F() local
H A Dnvptx_compiler_test.cc53 HloInstruction* all_reduce = module->entry_computation()->root_instruction(); in TEST_F() local
83 HloInstruction* all_reduce = module->entry_computation()->root_instruction(); in TEST_F() local
H A Dall_reduce_blueconnect.cc111 const HloAllReduceInstruction& all_reduce, size_t num_devices_per_host) { in TryDecomposeReplicaGroups()
186 StatusOr<bool> TryDecomposeAllReduce(HloAllReduceInstruction* all_reduce, in TryDecomposeAllReduce()
/aosp_15_r20/external/tensorflow/tensorflow/compiler/xla/service/
H A Dwhile_loop_all_reduce_code_motion.cc159 HloInstruction* all_reduce, HloComputation* while_body, in IsAllReduceMovable()
170 auto all_reduce_is_summation = [](HloInstruction* all_reduce) -> bool { in IsAllReduceMovable()
464 HloComputation* while_body) -> MovableAllReduceContext { in IsAllReduceMovable()
829 HloInstruction* all_reduce = all_reduce_accumulations_pair.first; in Run() local
H A Dall_reduce_simplifier.cc41 [this](const HloInstruction* all_reduce) -> int64_t { in Run()
94 auto all_reduce = all_reduce_and_group_size.first; in Run() local
H A Dar_crs_combiner.cc95 auto all_reduce = Cast<HloAllReduceInstruction>(hlo); in HasCombinableReplicaGroup() local
544 auto all_reduce = pair.ar; in RewriteGraph() local
H A Dall_reduce_contiguous.cc31 Status ReplaceWithContiguousAllReduce(HloAllReduceInstruction* all_reduce) { in ReplaceWithContiguousAllReduce()
H A Dall_reduce_combiner_test.cc219 auto all_reduce = b.AddInstruction(HloInstruction::CreateAllReduce( in TEST_F() local
/aosp_15_r20/external/tensorflow/tensorflow/compiler/mlir/xla/transforms/
H A Dlegalize_tf_collective.cc142 auto all_reduce = builder.create<AllReduceOp>( in ConvertAllReduce() local
199 LogicalResult matchAndRewrite(TF::XlaAllReduceOp all_reduce, in matchAndRewrite()
251 LogicalResult matchAndRewrite(TF::CollectiveReduceV2Op all_reduce, in matchAndRewrite()
H A Dmhlo_to_lhlo_with_xla.cc1175 auto* all_reduce = xla::Cast<xla::HloAllReduceInstruction>(instr); in EmitAllReduceOp() local
1200 auto* all_reduce = xla::Cast<xla::HloAllReduceInstruction>(instr); in EmitAllReduceStartOp() local
/aosp_15_r20/external/pytorch/torch/cuda/
H A Dnccl.py71 def all_reduce(inputs, outputs=None, op=SUM, streams=None, comms=None): function
/aosp_15_r20/external/pytorch/test/distributed/tensor/parallel/
H A Dtest_tp_examples.py47 reduce_scatter, all_gather, all_reduce = ( variable
/aosp_15_r20/external/tensorflow/tensorflow/python/ops/
H A Dcollective_ops.py19 def all_reduce(t, function
/aosp_15_r20/external/tensorflow/tensorflow/python/distribute/
H A Dcross_device_utils.py332 def all_reduce( member in CollectiveReplicaLauncher
H A Dvars_test.py1012 def all_reduce(): function
/aosp_15_r20/external/pytorch/torch/distributed/checkpoint/
H A Dutils.py194 def all_reduce( member in _DistWrapper
/aosp_15_r20/external/pytorch/torch/distributed/nn/
H A Dfunctional.py205 def all_reduce(tensor, op=ReduceOp.SUM, group=group.WORLD): function
/aosp_15_r20/external/pytorch/torch/distributed/_tools/
H A Dfsdp2_mem_tracker.py517 def all_reduce( function
/aosp_15_r20/external/pytorch/torch/csrc/distributed/c10d/
H A DFunctional.cpp119 at::Tensor all_reduce( in all_reduce() function

12