#include <torch/csrc/distributed/c10d/Ops.hpp>
#include <ATen/core/dispatch/Dispatcher.h>
#include <torch/library.h>
namespace c10d {
namespace {
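// Dispatcher-facing implementation of c10d::broadcast. The dispatcher passes
// the BroadcastOptions fields as plain scalar arguments, so they are
// reassembled into a BroadcastOptions struct before forwarding to the
// ProcessGroup backend.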
c10::intrusive_ptr<ProcessGroup::Work> broadcast(
    const c10::intrusive_ptr<ProcessGroup>& process_group,
    at::TensorList tensors,
    int64_t root_rank = 0,
    int64_t root_tensor = 0,
    int64_t timeout = -1) {
  auto tensor_vec = tensors.vec();
  return process_group->broadcast(
      tensor_vec,
      BroadcastOptions{
          root_rank, root_tensor, std::chrono::milliseconds(timeout)});
}
TORCH_LIBRARY(c10d, m) {
  // The following ProcessGroup and Work definitions are more like
  // declarations; they don't expose the details of the two classes to
  // TorchScript.
  m.class_<ProcessGroup>("ProcessGroup").def(torch::init<int64_t, int64_t>());
  m.class_<ProcessGroup::Work>("Work").def(torch::init<>());
  // It's important to register the op to the CompositeExplicitAutograd key
  // to enable __torch_dispatch__.
  m.def(
      "broadcast",
      dispatch(c10::DispatchKey::CompositeExplicitAutograd, broadcast));
}
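// Once registered, the op is resolvable through the dispatcher by its schema
// name, and (an assumption, not shown in this file) surfaces in Python as
// torch.ops.c10d.broadcast. A minimal C++ lookup sketch:
//
//   auto handle =
//       c10::Dispatcher::singleton().findSchemaOrThrow("c10d::broadcast", "");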
} // namespace
namespace ops {
c10::intrusive_ptr<ProcessGroup::Work> broadcast(
    const c10::intrusive_ptr<ProcessGroup>& process_group,
    at::TensorList tensors,
    const BroadcastOptions& opts) {
  auto op = c10::Dispatcher::singleton()
                .findSchemaOrThrow("c10d::broadcast", "")
                .typed<c10::intrusive_ptr<::c10d::ProcessGroup::Work>(
                    const c10::intrusive_ptr<::c10d::ProcessGroup>&,
                    at::TensorList,
                    int64_t,
                    int64_t,
                    int64_t)>();
  // It's awkward to unbox the opts here and box them again in the custom C++
  // op, but it's also complicated to make opts a CustomClassHolder. Leave it
  // as is for now.
  return op.call(
      process_group,
      tensors,
      opts.rootRank,
      opts.rootTensor,
      opts.timeout.count());
}
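// A minimal usage sketch, assuming an existing ProcessGroup `pg` and an
// at::Tensor `t` (both hypothetical names):
//
//   std::vector<at::Tensor> tensors = {t};
//   auto work = ops::broadcast(pg, tensors, BroadcastOptions{});
//   work->wait();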
} // namespace ops
} // namespace c10d