#pragma once
#include <nccl.h>
#include <ATen/ATen.h>
#include <THC/THC.h>

#include <cstdint>  // std::uint64_t
#include <vector>   // std::vector
namespace torch { namespace cuda { namespace nccl {
// NOTE: this is exposed only so that python_nccl.cpp can use some of these
// helpers. Don't use them outside of these files.
namespace detail {
// Throws an exception describing the failed NCCL call.
void throw_nccl_error(ncclResult_t status);

static inline void CHECK(ncclResult_t status) {
  if (status != ncclSuccess) {
    throw_nccl_error(status);
  }
}
// RAII guard that brackets a sequence of NCCL calls with
// ncclGroupStart()/ncclGroupEnd() (group calls exist only in NCCL >= 2).
struct AutoNcclGroup {
  AutoNcclGroup() {
#if defined(NCCL_MAJOR) && (NCCL_MAJOR >= 2)
    CHECK(ncclGroupStart());
#endif
  }
  ~AutoNcclGroup() {
#if defined(NCCL_MAJOR) && (NCCL_MAJOR >= 2)
    CHECK(ncclGroupEnd());
#endif
  }
};
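
// Usage sketch (illustrative only; `comms`, `streams`, `send`, `recv`, and
// `count` are hypothetical variables set up elsewhere, e.g. via
// _get_communicators):
//
//   {
//     AutoNcclGroup guard;  // ncclGroupStart() on NCCL >= 2
//     for (size_t i = 0; i < comms.size(); ++i) {
//       CHECK(ncclAllReduce(send[i], recv[i], count, ncclFloat, ncclSum,
//                           comms[i], streams[i]));
//     }
//   }  // guard destructs here -> ncclGroupEnd() submits the whole group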

// Returns cached NCCL communicators for the devices on which `inputs` live.
at::ArrayRef<ncclComm_t> _get_communicators(at::TensorList inputs);

// Validates the tensor lists for a collective: matching lengths, types, and
// devices, with expected element counts scaled by the given multipliers.
void _check_inputs(at::TensorList inputs, at::TensorList outputs,
                   int input_multiplier, int output_multiplier);

// Maps an ATen type to the corresponding ncclDataType_t.
ncclDataType_t _get_data_type(const at::Type& type);
} // namespace detail
using comm_list = std::vector<ncclComm_t>;
using stream_list = std::vector<THCStream*>;

// Returns the NCCL version, encoded as a single integer.
std::uint64_t version();

// True if NCCL supports a collective over these tensors.
bool is_available(at::TensorList tensors);

// Broadcasts tensors[0] to all other tensors in the list (one tensor per
// device). Empty `streams`/`user_comms` fall back to per-device defaults.
void broadcast(at::TensorList tensors,
               const stream_list& streams = {},
               const comm_list& user_comms = {});
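
// Usage sketch (illustrative only; `t0` and `t1` are hypothetical
// same-shaped CUDA tensors on two different devices):
//
//   std::vector<at::Tensor> tensors = {t0, t1};
//   if (torch::cuda::nccl::is_available(tensors)) {
//     torch::cuda::nccl::broadcast(tensors);  // copies t0's data into t1
//   }
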
}}} // namespace torch::cuda::nccl