torch/csrc/cuda/python_comm.cpp - platform/external/pytorch - Git at Google

 #include <torch/csrc/utils/pybind.h>
 #include <torch/csrc/cuda/comm.h>
 #include <torch/csrc/cuda/Stream.h>
 #include <torch/csrc/cuda/THCP.h>
 #include <torch/csrc/utils/auto_gil.h>
 #include <ATen/core/functional.h>

 #include <ATen/ATen.h>

 #include <THC/THC.h>

 #include <cstddef>
 #include <vector>

 namespace torch { namespace cuda { namespace python {
 void initCommMethods(PyObject *module) {
   auto m = py::cast<py::module>(module);
   m.def(
        "_broadcast_coalesced",
        [](std::vector<at::Tensor>& tensors,
           std::vector<int64_t> devices,
           size_t buffer_size) {
          return broadcast_coalesced(tensors, devices, buffer_size);
        },
        py::arg("tensors"),
        py::arg("devices"),
        py::arg("buffer_size"),
        py::call_guard<py::gil_scoped_release>())
       .def(
           "_broadcast",
           [](at::Tensor& tensor, std::vector<int64_t> devices) {
             return broadcast(tensor, devices);
           },
           py::call_guard<py::gil_scoped_release>())
       .def(
           "_scatter",
           [](at::Tensor& tensor,
              std::vector<int64_t>& devices,
              c10::optional<std::vector<int64_t>> chunk_sizes,
              int64_t dim,
              c10::optional<py::object> py_streams) {
             c10::optional<std::vector<c10::optional<at::cuda::CUDAStream>>> streams;
             if (py_streams) {
               py::handle handle = *py_streams;
               streams = THPUtils_PySequence_to_CUDAStreamList(handle.ptr());
             }
             // Note: We're holding the GIL up to here.
             AutoNoGIL no_gil;
             return scatter(tensor, devices, chunk_sizes, dim, streams);
           },
           py::arg("tensor"),
           py::arg("devices"),
           py::arg("chunk_sizes"),
           py::arg("dim"),
           py::arg("streams"))
       .def(
           "_gather",
           [](std::vector<at::Tensor>& tensors,
              int64_t dim,
              c10::optional<int32_t> destination_index) {
             return gather(tensors, dim, destination_index);
           },
           py::arg("tensors"),
           py::arg("dim"),
           py::arg("destination_index"),
           py::call_guard<py::gil_scoped_release>());
 }
 }}}
	#include <torch/csrc/utils/pybind.h>
	#include <torch/csrc/cuda/comm.h>
	#include <torch/csrc/cuda/Stream.h>
	#include <torch/csrc/cuda/THCP.h>
	#include <torch/csrc/utils/auto_gil.h>
	#include <ATen/core/functional.h>

	#include <ATen/ATen.h>

	#include <THC/THC.h>

	#include <cstddef>
	#include <vector>

	namespace torch { namespace cuda { namespace python {
	void initCommMethods(PyObject *module) {
	auto m = py::cast<py::module>(module);
	m.def(
	"_broadcast_coalesced",
	[](std::vector<at::Tensor>& tensors,
	std::vector<int64_t> devices,
	size_t buffer_size) {
	return broadcast_coalesced(tensors, devices, buffer_size);
	},
	py::arg("tensors"),
	py::arg("devices"),
	py::arg("buffer_size"),
	py::call_guard<py::gil_scoped_release>())
	.def(
	"_broadcast",
	[](at::Tensor& tensor, std::vector<int64_t> devices) {
	return broadcast(tensor, devices);
	},
	py::call_guard<py::gil_scoped_release>())
	.def(
	"_scatter",
	[](at::Tensor& tensor,
	std::vector<int64_t>& devices,
	c10::optional<std::vector<int64_t>> chunk_sizes,
	int64_t dim,
	c10::optional<py::object> py_streams) {
	c10::optional<std::vector<c10::optional<at::cuda::CUDAStream>>> streams;
	if (py_streams) {
	py::handle handle = *py_streams;
	streams = THPUtils_PySequence_to_CUDAStreamList(handle.ptr());
	}
	// Note: We're holding the GIL up to here.
	AutoNoGIL no_gil;
	return scatter(tensor, devices, chunk_sizes, dim, streams);
	},
	py::arg("tensor"),
	py::arg("devices"),
	py::arg("chunk_sizes"),
	py::arg("dim"),
	py::arg("streams"))
	.def(
	"_gather",
	[](std::vector<at::Tensor>& tensors,
	int64_t dim,
	c10::optional<int32_t> destination_index) {
	return gather(tensors, dim, destination_index);
	},
	py::arg("tensors"),
	py::arg("dim"),
	py::arg("destination_index"),
	py::call_guard<py::gil_scoped_release>());
	}
	}}}