c10/util/Logging.h - platform/external/pytorch - Git at Google

 #ifndef C10_UTIL_LOGGING_H_
 #define C10_UTIL_LOGGING_H_

 #include <climits>
 #include <exception>
 #include <functional>
 #include <limits>
 #include <sstream>

 #include <c10/macros/Macros.h>
 #include <c10/util/Exception.h>
 #include <c10/util/Flags.h>
 #include <c10/util/StringUtil.h>

 // CAFFE2_LOG_THRESHOLD is a compile time flag that would allow us to turn off
 // logging at compile time so no logging message below that level is produced
 // at all. The value should be between INT_MIN and CAFFE_FATAL.
 #ifndef CAFFE2_LOG_THRESHOLD
 // If we have not defined the compile time log threshold, we keep all the
 // log cases.
 #define CAFFE2_LOG_THRESHOLD INT_MIN
 #endif // CAFFE2_LOG_THRESHOLD

 // Below are different implementations for glog and non-glog cases.
 #ifdef C10_USE_GLOG
 #include <c10/util/logging_is_google_glog.h>
 #else // !C10_USE_GLOG
 #include <c10/util/logging_is_not_google_glog.h>
 #endif // C10_USE_GLOG

 C10_DECLARE_int(caffe2_log_level);
 C10_DECLARE_bool(caffe2_use_fatal_for_enforce);

 // Some versions of GLOG support less-spammy version of LOG_EVERY_MS. If it's
 // not available - just short-circuit to the always working one one.
 // We define the C10_ name to avoid confusing other files
 #ifdef LOG_EVERY_MS
 #define C10_LOG_EVERY_MS(severity, ms) LOG_EVERY_MS(severity, ms)
 #else
 #define C10_LOG_EVERY_MS(severity, ms) LOG(severity)
 #endif

 // Same for LOG_FIRST_N
 #ifdef LOG_FIRST_N
 #define C10_LOG_FIRST_N(severity, n) LOG_FIRST_N(severity, n)
 #else
 #define C10_LOG_FIRST_N(severity, n) LOG(severity)
 #endif

 // Same for LOG_EVERY_N
 #ifdef LOG_EVERY_N
 #define C10_LOG_EVERY_N(severity, n) LOG_EVERY_N(severity, n)
 #else
 #define C10_LOG_EVERY_N(severity, n) LOG(severity)
 #endif

 namespace c10 {

 using std::string;

 // Functions that we use for initialization.
 C10_API bool InitCaffeLogging(int* argc, char** argv);
 C10_API void UpdateLoggingLevelsFromFlags();

 [[noreturn]] C10_API void ThrowEnforceNotMet(
     const char* file,
     const int line,
     const char* condition,
     const std::string& msg,
     const void* caller = nullptr);

 [[noreturn]] C10_API void ThrowEnforceNotMet(
     const char* file,
     const int line,
     const char* condition,
     const char* msg,
     const void* caller = nullptr);

 [[noreturn]] C10_API inline void ThrowEnforceNotMet(
     const char* file,
     const int line,
     const char* condition,
     detail::CompileTimeEmptyString msg,
     const void* caller = nullptr) {
   ThrowEnforceNotMet(file, line, condition, "", caller);
 }

 [[noreturn]] C10_API void ThrowEnforceFiniteNotMet(
     const char* file,
     const int line,
     const char* condition,
     const std::string& msg,
     const void* caller = nullptr);

 [[noreturn]] C10_API void ThrowEnforceFiniteNotMet(
     const char* file,
     const int line,
     const char* condition,
     const char* msg,
     const void* caller = nullptr);

 [[noreturn]] C10_API inline void ThrowEnforceFiniteNotMet(
     const char* file,
     const int line,
     const char* condition,
     detail::CompileTimeEmptyString msg,
     const void* caller = nullptr) {
   ThrowEnforceFiniteNotMet(file, line, condition, "", caller);
 }

 constexpr bool IsUsingGoogleLogging() {
 #ifdef C10_USE_GLOG
   return true;
 #else
   return false;
 #endif
 }

 /**
  * A utility to allow one to show log info to stderr after the program starts.
  *
  * This is similar to calling GLOG's --logtostderr, or setting caffe2_log_level
  * to smaller than INFO. You are recommended to only use this in a few sparse
  * cases, such as when you want to write a tutorial or something. Normally, use
  * the commandline flags to set the log level.
  */
 C10_API void ShowLogInfoToStderr();

 C10_API void SetStackTraceFetcher(std::function<string(void)> fetcher);

 using EnforceNotMet = ::c10::Error;

 #define CAFFE_ENFORCE(condition, ...)                               \
   do {                                                              \
     if (C10_UNLIKELY(!(condition))) {                               \
       ::c10::ThrowEnforceNotMet(                                    \
           __FILE__, __LINE__, #condition, ::c10::str(__VA_ARGS__)); \
     }                                                               \
   } while (false)

 #define CAFFE_ENFORCE_FINITE(condition, ...)                        \
     do {                                                            \
       if (C10_UNLIKELY(!(condition))) {                             \
         ::c10::ThrowEnforceFiniteNotMet(                            \
           __FILE__, __LINE__, #condition, ::c10::str(__VA_ARGS__)); \
       }                                                             \
     } while (false)

 #define CAFFE_ENFORCE_WITH_CALLER(condition, ...)                         \
   do {                                                                    \
     if (C10_UNLIKELY(!(condition))) {                                     \
       ::c10::ThrowEnforceNotMet(                                          \
           __FILE__, __LINE__, #condition, ::c10::str(__VA_ARGS__), this); \
     }                                                                     \
   } while (false)

 #define CAFFE_THROW(...) \
   ::c10::ThrowEnforceNotMet(__FILE__, __LINE__, "", ::c10::str(__VA_ARGS__))

 /**
  * Rich logging messages
  *
  * CAFFE_ENFORCE_THAT can be used with one of the "checker functions" that
  * capture input argument values and add it to the exception message. E.g.
  * `CAFFE_ENFORCE_THAT(Equals(foo(x), bar(y)), "Optional additional message")`
  * would evaluate both foo and bar only once and if the results are not equal -
  * include them in the exception message.
  *
  * Some of the basic checker functions like Equals or Greater are already
  * defined below. Other header might define customized checkers by adding
  * functions to caffe2::enforce_detail namespace. For example:
  *
  *   namespace caffe2 { namespace enforce_detail {
  *   inline EnforceFailMessage IsVector(const vector<int64_t>& shape) {
  *     if (shape.size() == 1) { return EnforceOK(); }
  *     return c10::str("Shape ", shape, " is not a vector");
  *   }
  *   }}
  *
  * With further usages like `CAFFE_ENFORCE_THAT(IsVector(Input(0).dims()))`
  *
  * Convenient wrappers for binary operations like CAFFE_ENFORCE_EQ are provided
  * too. Please use them instead of CHECK_EQ and friends for failures in
  * user-provided input.
  */

 namespace enforce_detail {

 template <typename T1, typename T2>
 std::string enforceFailMsgImpl(const T1& x, const T2& y) {
   return c10::str(x, " vs ", y);
 }

 template <typename T1, typename T2, typename... Args>
 std::string enforceFailMsgImpl(const T1& x, const T2& y, const Args&... args) {
   return c10::str(x, " vs ", y, ". ", args...);
 }

 template <typename Pred, typename T1, typename T2, typename... Args>
 void enforceThatImpl(Pred p, const T1& lhs, const T2& rhs, const char* file,
                      int line, const char* expr, const void* caller,
                      const Args&... args) {
   if (C10_UNLIKELY(!(p(lhs, rhs)))) {
     ::c10::ThrowEnforceNotMet(
         file,
         line,
         expr,
         ::c10::enforce_detail::enforceFailMsgImpl(
             lhs,
             rhs,
             args...),
         caller);
   }
 }
 #define CAFFE_ENFORCE_THAT_IMPL(op, lhs, rhs, expr, ...)        \
   ::c10::enforce_detail::enforceThatImpl(                       \
       op,                                                       \
       lhs,                                                      \
       rhs,                                                      \
       __FILE__,                                                 \
       __LINE__,                                                 \
       expr,                                                     \
       nullptr,                                                  \
       ##__VA_ARGS__)

 #define CAFFE_ENFORCE_THAT_IMPL_WITH_CALLER(op, lhs, rhs, expr, ...)    \
   ::c10::enforce_detail::enforceThatImpl(                               \
       op,                                                               \
       (lhs),                                                            \
       (rhs),                                                            \
       __FILE__,                                                         \
       __LINE__,                                                         \
       expr,                                                             \
       this,                                                             \
       ##__VA_ARGS__)

 } // namespace enforce_detail

 #define CAFFE_ENFORCE_THAT(cmp, op, lhs, rhs,...)                        \
   CAFFE_ENFORCE_THAT_IMPL(cmp, lhs, rhs,  #lhs " " #op " " #rhs, ##__VA_ARGS__)

 #define CAFFE_ENFORCE_BINARY_OP(cmp, op, x, y, ...)                      \
   CAFFE_ENFORCE_THAT_IMPL(cmp, x, y, #x " " #op " " #y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_EQ(x, y, ...)                     \
   CAFFE_ENFORCE_BINARY_OP(std::equal_to<void>(), ==, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_NE(x, y, ...)                     \
   CAFFE_ENFORCE_BINARY_OP(std::not_equal_to<void>(), !=, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_LE(x, y, ...)                     \
   CAFFE_ENFORCE_BINARY_OP(std::less_equal<void>(), <=, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_LT(x, y, ...)                     \
   CAFFE_ENFORCE_BINARY_OP(std::less<void>(), <, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_GE(x, y, ...)                     \
   CAFFE_ENFORCE_BINARY_OP(std::greater_equal<void>(), >=, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_GT(x, y, ...)                     \
   CAFFE_ENFORCE_BINARY_OP(std::greater<void>(), >, x, y, ##__VA_ARGS__)

 #define CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(cmp, op, x, y, ...)          \
   CAFFE_ENFORCE_THAT_IMPL_WITH_CALLER(cmp, x, y, #x " " #op " " #y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_EQ_WITH_CALLER(x, y, ...)                 \
   CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::equal_to<void>(), ==, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_NE_WITH_CALLER(x, y, ...)                 \
   CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::not_equal_to<void>(), !=, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_LE_WITH_CALLER(x, y, ...)                 \
   CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::less_equal<void>(), <=, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_LT_WITH_CALLER(x, y, ...)                 \
   CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::less<void>(), <, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_GE_WITH_CALLER(x, y, ...)                 \
   CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::greater_equal<void>(), >=, x, y, ##__VA_ARGS__)
 #define CAFFE_ENFORCE_GT_WITH_CALLER(x, y, ...)                 \
   CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::greater<void>(), >, x, y, ##__VA_ARGS__)

 /**
  * Very lightweight logging for the first time API usage. It's beneficial for
  * tracking of individual functionality usage in larger applications.
  *
  * In order to ensure light-weightedness of logging, we utilize static variable
  * trick - LogAPIUsage will be invoked only once and further invocations will
  * just do an atomic check.
  *
  * Example:
  *   // Logs caller info with an arbitrary text event, if there is a usage.
  *   C10_LOG_API_USAGE_ONCE("my_api");
  */
 #define C10_LOG_API_USAGE_ONCE(...)             \
   C10_UNUSED static bool C10_ANONYMOUS_VARIABLE(logFlag) = \
       ::c10::detail::LogAPIUsageFakeReturn(__VA_ARGS__);

 // API usage logging capabilities
 C10_API void SetAPIUsageLogger(std::function<void(const std::string&)> logger);
 C10_API void LogAPIUsage(const std::string& context);

 // PyTorch ddp usage logging capabilities
 // DDPLoggingData holds data that can be logged in applications
 // for analysis and debugging. Data structure is defined in
 // c10 directory so that it can be easily imported by both c10
 // and torch files.
 struct DDPLoggingData {
   // Data that can be got during DistributedDataParallel construction time
   int world_size = -1;
   int rank = -1;
   std::string module_name = "";
   std::vector<int> device_ids = std::vector<int>();
   int output_device = -1;
   std::string backend_name = "";
   // Parameters' data types, there may be multiple data
   // types for mixed precision training.
   std::vector<std::string> dtypes = std::vector<std::string>();
   // Total parameters size (Bytes)
   int64_t total_parameter_size_bytes = -1;
   // The number of parameter tensors
   int num_parameter_tensors = -1;
   // A list of bucket sizes (Bytes) calculated during construction time
   std::vector<int> bucket_sizes = std::vector<int>();
   bool is_multi_device_module = false;

   // Environment variables
   std::string master_port = "";
   std::string master_addr = "";
   std::string cuda_visible_devices = "";
   std::string gloo_socket_ifname = "";
   std::string gloo_device_transport = "";
   std::string nccl_socket_ifname = "";
   std::string nccl_blocking_wait = "";
   std::string nccl_async_error_handling = "";
   std::string nccl_debug = "";
   std::string nccl_nthreads = "";
   std::string nccl_ib_timeout = "";

   // DistributedDataParallel constructor input parameters
   bool broadcast_buffers = false;
   float bucket_cap_mb = -1.0;
   bool find_unused_parameters = false;
   bool gradient_as_bucket_view = false;

   // Communication hook. Empty string if not set, in which case it will not be
   // logged.
   std::string comm_hook = "";
   // Whether we are running under model.join() context manager for DDP uneven
   // inputs.
   bool join_uneven_inputs = false;

   // The following runtime stats are collected for the first 10 iterations
   // and then are collected every kDDPRuntimeLoggingSampleRate=100 iterations.
   // Users can get these stats at any iteration of training
   // loop by calling get_ddp_logging_data() in python.

   // In which iteration of the training loop the get_ddp_logging_data()
   // is called to fetch the DDPLoggingData, 0 if the data is fetched
   // before training loop.
   int64_t iteration = -1;

   // When get_ddp_logging_data() is called, "unused_parameter_size",
   // "has_rebuilt_buckets" and "rebuilt_bucket_sizes" are updated in the latest
   // sampling iteration.
   // Total unused parameter size (Bytes)
   int64_t unused_parameter_size = 0;
   // Rebuild buckets stats after 1st iteration
   bool has_rebuilt_buckets = false;
   std::vector<int> rebuilt_bucket_sizes = std::vector<int>();
   // Average performance stats for the number of sampling iterations
   // when time is recorded (ns).
   // e.g., training loop has ran "DDPLoggingData::iteration=1000" iterations,
   // time is recorded every kDDPRuntimeLoggingSampleRate=100 iterations,
   // the following performance stats are averaged among the
   // "DDPLoggingData::iteration"/"kDDPRuntimeLoggingSampleRate"=10 sampling
   // iterations.
   int64_t avg_forward_compute_time = 0;
   int64_t avg_backward_compute_time = 0;
   int64_t avg_backward_comm_time = 0;
   int64_t avg_backward_compute_comm_overlap_time = 0;

   // Performance stats for the current iteration.
   int64_t forward_compute_time = 0;
   int64_t backward_compute_time = 0;
   int64_t backward_comm_time = 0;
   int64_t backward_compute_comm_overlap_time = 0;

   // Stream insertion operator for logging i.e. to standard output/error.
   friend std::ostream& operator<<(
     std::ostream& output,
     const DDPLoggingData& ddp_logging_data
   ) {

     std::string devicesStr = c10::Join(", ", ddp_logging_data.device_ids);
     std::string bucketSizesStr = c10::Join(", ", ddp_logging_data.bucket_sizes);
     std::string dtypesStr = c10::Join(" ", ddp_logging_data.dtypes);

     std::string ddpLoggingDataInfo = c10::str(
       "world_size: ", ddp_logging_data.world_size, ", module_name: ",
       ddp_logging_data.module_name, ", device_ids: ", devicesStr, ", output_device: ",
       ddp_logging_data.output_device, ", backend_name: ", ddp_logging_data.backend_name,
       ", parameter_dtype: ", dtypesStr, ", total_parameter_size_in_bytes: ",
       ddp_logging_data.total_parameter_size_bytes, ", num_parameter_tensors: ",
       ddp_logging_data.num_parameter_tensors, " bucket_sizes: ", bucketSizesStr,
       ", CUDA_VISIBLE_DEVICES: ", ddp_logging_data.cuda_visible_devices, ", broadcast_buffers: ",
       ddp_logging_data.broadcast_buffers, ", bucket_cap_mb: ", ddp_logging_data.bucket_cap_mb,
       ", find_unused_parameters: ", ddp_logging_data.find_unused_parameters,
       ", gradient_as_bucket_view: ", ddp_logging_data.gradient_as_bucket_view,
       "\n"
     );
     std::string backendInfo = " Backend Info: ";
     if (ddp_logging_data.backend_name == "nccl") {
       backendInfo += c10::str(
         "nccl_socket_ifname: ", ddp_logging_data.nccl_socket_ifname,
         " nccl_blocking_wait: ", ddp_logging_data.nccl_blocking_wait,
         " nccl_debug: ", ddp_logging_data.nccl_debug,
         " nccl_async_error_handling: ", ddp_logging_data.nccl_async_error_handling,
         " nccl_nthreads: ", ddp_logging_data.nccl_nthreads,
         " nccl_ib_timeout: ", ddp_logging_data.nccl_ib_timeout,
         "\n"
       );
     } else if (ddp_logging_data.backend_name == "gloo") {
       backendInfo += c10::str(
         "gloo_socket_ifname: ", ddp_logging_data.gloo_socket_ifname,
         " gloo_device_transport: ", ddp_logging_data.gloo_device_transport,
         "\n"
       );
     }
     ddpLoggingDataInfo += backendInfo;

     if (ddp_logging_data.comm_hook != "") {
       auto commHookInfo = c10::str(
         "comm_hook: ", ddp_logging_data.comm_hook
       );
       ddpLoggingDataInfo += commHookInfo;
     }

     if (ddp_logging_data.join_uneven_inputs) {
       auto joinInfo = c10::str("join_uneven_inputs: ", ddp_logging_data.join_uneven_inputs);
       ddpLoggingDataInfo += joinInfo;
     }

     return output << ddpLoggingDataInfo;
   }
 };

 C10_API void SetPyTorchDDPUsageLogger(std::function<void(const c10::DDPLoggingData&)> logger);
 C10_API void LogPyTorchDDPUsage(const c10::DDPLoggingData& ddpData);

 namespace detail {
 // Return value is needed to do the static variable initialization trick
 C10_API bool LogAPIUsageFakeReturn(const std::string& context);
 }

 } // namespace c10

 #endif // C10_UTIL_LOGGING_H_
	#ifndef C10_UTIL_LOGGING_H_
	#define C10_UTIL_LOGGING_H_

	#include <climits>
	#include <exception>
	#include <functional>
	#include <limits>
	#include <sstream>

	#include <c10/macros/Macros.h>
	#include <c10/util/Exception.h>
	#include <c10/util/Flags.h>
	#include <c10/util/StringUtil.h>

	// CAFFE2_LOG_THRESHOLD is a compile time flag that would allow us to turn off
	// logging at compile time so no logging message below that level is produced
	// at all. The value should be between INT_MIN and CAFFE_FATAL.
	#ifndef CAFFE2_LOG_THRESHOLD
	// If we have not defined the compile time log threshold, we keep all the
	// log cases.
	#define CAFFE2_LOG_THRESHOLD INT_MIN
	#endif // CAFFE2_LOG_THRESHOLD

	// Below are different implementations for glog and non-glog cases.
	#ifdef C10_USE_GLOG
	#include <c10/util/logging_is_google_glog.h>
	#else // !C10_USE_GLOG
	#include <c10/util/logging_is_not_google_glog.h>
	#endif // C10_USE_GLOG

	C10_DECLARE_int(caffe2_log_level);
	C10_DECLARE_bool(caffe2_use_fatal_for_enforce);

	// Some versions of GLOG support less-spammy version of LOG_EVERY_MS. If it's
	// not available - just short-circuit to the always working one one.
	// We define the C10_ name to avoid confusing other files
	#ifdef LOG_EVERY_MS
	#define C10_LOG_EVERY_MS(severity, ms) LOG_EVERY_MS(severity, ms)
	#else
	#define C10_LOG_EVERY_MS(severity, ms) LOG(severity)
	#endif

	// Same for LOG_FIRST_N
	#ifdef LOG_FIRST_N
	#define C10_LOG_FIRST_N(severity, n) LOG_FIRST_N(severity, n)
	#else
	#define C10_LOG_FIRST_N(severity, n) LOG(severity)
	#endif

	// Same for LOG_EVERY_N
	#ifdef LOG_EVERY_N
	#define C10_LOG_EVERY_N(severity, n) LOG_EVERY_N(severity, n)
	#else
	#define C10_LOG_EVERY_N(severity, n) LOG(severity)
	#endif

	namespace c10 {

	using std::string;

	// Functions that we use for initialization.
	C10_API bool InitCaffeLogging(int* argc, char** argv);
	C10_API void UpdateLoggingLevelsFromFlags();

	[[noreturn]] C10_API void ThrowEnforceNotMet(
	const char* file,
	const int line,
	const char* condition,
	const std::string& msg,
	const void* caller = nullptr);

	[[noreturn]] C10_API void ThrowEnforceNotMet(
	const char* file,
	const int line,
	const char* condition,
	const char* msg,
	const void* caller = nullptr);

	[[noreturn]] C10_API inline void ThrowEnforceNotMet(
	const char* file,
	const int line,
	const char* condition,
	detail::CompileTimeEmptyString msg,
	const void* caller = nullptr) {
	ThrowEnforceNotMet(file, line, condition, "", caller);
	}

	[[noreturn]] C10_API void ThrowEnforceFiniteNotMet(
	const char* file,
	const int line,
	const char* condition,
	const std::string& msg,
	const void* caller = nullptr);

	[[noreturn]] C10_API void ThrowEnforceFiniteNotMet(
	const char* file,
	const int line,
	const char* condition,
	const char* msg,
	const void* caller = nullptr);

	[[noreturn]] C10_API inline void ThrowEnforceFiniteNotMet(
	const char* file,
	const int line,
	const char* condition,
	detail::CompileTimeEmptyString msg,
	const void* caller = nullptr) {
	ThrowEnforceFiniteNotMet(file, line, condition, "", caller);
	}

	constexpr bool IsUsingGoogleLogging() {
	#ifdef C10_USE_GLOG
	return true;
	#else
	return false;
	#endif
	}

	/**
	* A utility to allow one to show log info to stderr after the program starts.
	*
	* This is similar to calling GLOG's --logtostderr, or setting caffe2_log_level
	* to smaller than INFO. You are recommended to only use this in a few sparse
	* cases, such as when you want to write a tutorial or something. Normally, use
	* the commandline flags to set the log level.
	*/
	C10_API void ShowLogInfoToStderr();

	C10_API void SetStackTraceFetcher(std::function<string(void)> fetcher);

	using EnforceNotMet = ::c10::Error;

	#define CAFFE_ENFORCE(condition, ...) \
	do { \
	if (C10_UNLIKELY(!(condition))) { \
	::c10::ThrowEnforceNotMet( \
	__FILE__, __LINE__, #condition, ::c10::str(__VA_ARGS__)); \
	} \
	} while (false)

	#define CAFFE_ENFORCE_FINITE(condition, ...) \
	do { \
	if (C10_UNLIKELY(!(condition))) { \
	::c10::ThrowEnforceFiniteNotMet( \
	__FILE__, __LINE__, #condition, ::c10::str(__VA_ARGS__)); \
	} \
	} while (false)

	#define CAFFE_ENFORCE_WITH_CALLER(condition, ...) \
	do { \
	if (C10_UNLIKELY(!(condition))) { \
	::c10::ThrowEnforceNotMet( \
	__FILE__, __LINE__, #condition, ::c10::str(__VA_ARGS__), this); \
	} \
	} while (false)

	#define CAFFE_THROW(...) \
	::c10::ThrowEnforceNotMet(__FILE__, __LINE__, "", ::c10::str(__VA_ARGS__))

	/**
	* Rich logging messages
	*
	* CAFFE_ENFORCE_THAT can be used with one of the "checker functions" that
	* capture input argument values and add it to the exception message. E.g.
	* `CAFFE_ENFORCE_THAT(Equals(foo(x), bar(y)), "Optional additional message")`
	* would evaluate both foo and bar only once and if the results are not equal -
	* include them in the exception message.
	*
	* Some of the basic checker functions like Equals or Greater are already
	* defined below. Other header might define customized checkers by adding
	* functions to caffe2::enforce_detail namespace. For example:
	*
	* namespace caffe2 { namespace enforce_detail {
	* inline EnforceFailMessage IsVector(const vector<int64_t>& shape) {
	* if (shape.size() == 1) { return EnforceOK(); }
	* return c10::str("Shape ", shape, " is not a vector");
	* }
	* }}
	*
	* With further usages like `CAFFE_ENFORCE_THAT(IsVector(Input(0).dims()))`
	*
	* Convenient wrappers for binary operations like CAFFE_ENFORCE_EQ are provided
	* too. Please use them instead of CHECK_EQ and friends for failures in
	* user-provided input.
	*/

	namespace enforce_detail {

	template <typename T1, typename T2>
	std::string enforceFailMsgImpl(const T1& x, const T2& y) {
	return c10::str(x, " vs ", y);
	}

	template <typename T1, typename T2, typename... Args>
	std::string enforceFailMsgImpl(const T1& x, const T2& y, const Args&... args) {
	return c10::str(x, " vs ", y, ". ", args...);
	}

	template <typename Pred, typename T1, typename T2, typename... Args>
	void enforceThatImpl(Pred p, const T1& lhs, const T2& rhs, const char* file,
	int line, const char* expr, const void* caller,
	const Args&... args) {
	if (C10_UNLIKELY(!(p(lhs, rhs)))) {
	::c10::ThrowEnforceNotMet(
	file,
	line,
	expr,
	::c10::enforce_detail::enforceFailMsgImpl(
	lhs,
	rhs,
	args...),
	caller);
	}
	}
	#define CAFFE_ENFORCE_THAT_IMPL(op, lhs, rhs, expr, ...) \
	::c10::enforce_detail::enforceThatImpl( \
	op, \
	lhs, \
	rhs, \
	__FILE__, \
	__LINE__, \
	expr, \
	nullptr, \
	##__VA_ARGS__)

	#define CAFFE_ENFORCE_THAT_IMPL_WITH_CALLER(op, lhs, rhs, expr, ...) \
	::c10::enforce_detail::enforceThatImpl( \
	op, \
	(lhs), \
	(rhs), \
	__FILE__, \
	__LINE__, \
	expr, \
	this, \
	##__VA_ARGS__)

	} // namespace enforce_detail

	#define CAFFE_ENFORCE_THAT(cmp, op, lhs, rhs,...) \
	CAFFE_ENFORCE_THAT_IMPL(cmp, lhs, rhs, #lhs " " #op " " #rhs, ##__VA_ARGS__)

	#define CAFFE_ENFORCE_BINARY_OP(cmp, op, x, y, ...) \
	CAFFE_ENFORCE_THAT_IMPL(cmp, x, y, #x " " #op " " #y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_EQ(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP(std::equal_to<void>(), ==, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_NE(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP(std::not_equal_to<void>(), !=, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_LE(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP(std::less_equal<void>(), <=, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_LT(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP(std::less<void>(), <, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_GE(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP(std::greater_equal<void>(), >=, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_GT(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP(std::greater<void>(), >, x, y, ##__VA_ARGS__)

	#define CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(cmp, op, x, y, ...) \
	CAFFE_ENFORCE_THAT_IMPL_WITH_CALLER(cmp, x, y, #x " " #op " " #y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_EQ_WITH_CALLER(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::equal_to<void>(), ==, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_NE_WITH_CALLER(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::not_equal_to<void>(), !=, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_LE_WITH_CALLER(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::less_equal<void>(), <=, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_LT_WITH_CALLER(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::less<void>(), <, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_GE_WITH_CALLER(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::greater_equal<void>(), >=, x, y, ##__VA_ARGS__)
	#define CAFFE_ENFORCE_GT_WITH_CALLER(x, y, ...) \
	CAFFE_ENFORCE_BINARY_OP_WITH_CALLER(std::greater<void>(), >, x, y, ##__VA_ARGS__)

	/**
	* Very lightweight logging for the first time API usage. It's beneficial for
	* tracking of individual functionality usage in larger applications.
	*
	* In order to ensure light-weightedness of logging, we utilize static variable
	* trick - LogAPIUsage will be invoked only once and further invocations will
	* just do an atomic check.
	*
	* Example:
	* // Logs caller info with an arbitrary text event, if there is a usage.
	* C10_LOG_API_USAGE_ONCE("my_api");
	*/
	#define C10_LOG_API_USAGE_ONCE(...) \
	C10_UNUSED static bool C10_ANONYMOUS_VARIABLE(logFlag) = \
	::c10::detail::LogAPIUsageFakeReturn(__VA_ARGS__);

	// API usage logging capabilities
	C10_API void SetAPIUsageLogger(std::function<void(const std::string&)> logger);
	C10_API void LogAPIUsage(const std::string& context);

	// PyTorch ddp usage logging capabilities
	// DDPLoggingData holds data that can be logged in applications
	// for analysis and debugging. Data structure is defined in
	// c10 directory so that it can be easily imported by both c10
	// and torch files.
	struct DDPLoggingData {
	// Data that can be got during DistributedDataParallel construction time
	int world_size = -1;
	int rank = -1;
	std::string module_name = "";
	std::vector<int> device_ids = std::vector<int>();
	int output_device = -1;
	std::string backend_name = "";
	// Parameters' data types, there may be multiple data
	// types for mixed precision training.
	std::vector<std::string> dtypes = std::vector<std::string>();
	// Total parameters size (Bytes)
	int64_t total_parameter_size_bytes = -1;
	// The number of parameter tensors
	int num_parameter_tensors = -1;
	// A list of bucket sizes (Bytes) calculated during construction time
	std::vector<int> bucket_sizes = std::vector<int>();
	bool is_multi_device_module = false;

	// Environment variables
	std::string master_port = "";
	std::string master_addr = "";
	std::string cuda_visible_devices = "";
	std::string gloo_socket_ifname = "";
	std::string gloo_device_transport = "";
	std::string nccl_socket_ifname = "";
	std::string nccl_blocking_wait = "";
	std::string nccl_async_error_handling = "";
	std::string nccl_debug = "";
	std::string nccl_nthreads = "";
	std::string nccl_ib_timeout = "";

	// DistributedDataParallel constructor input parameters
	bool broadcast_buffers = false;
	float bucket_cap_mb = -1.0;
	bool find_unused_parameters = false;
	bool gradient_as_bucket_view = false;

	// Communication hook. Empty string if not set, in which case it will not be
	// logged.
	std::string comm_hook = "";
	// Whether we are running under model.join() context manager for DDP uneven
	// inputs.
	bool join_uneven_inputs = false;

	// The following runtime stats are collected for the first 10 iterations
	// and then are collected every kDDPRuntimeLoggingSampleRate=100 iterations.
	// Users can get these stats at any iteration of training
	// loop by calling get_ddp_logging_data() in python.

	// In which iteration of the training loop the get_ddp_logging_data()
	// is called to fetch the DDPLoggingData, 0 if the data is fetched
	// before training loop.
	int64_t iteration = -1;

	// When get_ddp_logging_data() is called, "unused_parameter_size",
	// "has_rebuilt_buckets" and "rebuilt_bucket_sizes" are updated in the latest
	// sampling iteration.
	// Total unused parameter size (Bytes)
	int64_t unused_parameter_size = 0;
	// Rebuild buckets stats after 1st iteration
	bool has_rebuilt_buckets = false;
	std::vector<int> rebuilt_bucket_sizes = std::vector<int>();
	// Average performance stats for the number of sampling iterations
	// when time is recorded (ns).
	// e.g., training loop has ran "DDPLoggingData::iteration=1000" iterations,
	// time is recorded every kDDPRuntimeLoggingSampleRate=100 iterations,
	// the following performance stats are averaged among the
	// "DDPLoggingData::iteration"/"kDDPRuntimeLoggingSampleRate"=10 sampling
	// iterations.
	int64_t avg_forward_compute_time = 0;
	int64_t avg_backward_compute_time = 0;
	int64_t avg_backward_comm_time = 0;
	int64_t avg_backward_compute_comm_overlap_time = 0;

	// Performance stats for the current iteration.
	int64_t forward_compute_time = 0;
	int64_t backward_compute_time = 0;
	int64_t backward_comm_time = 0;
	int64_t backward_compute_comm_overlap_time = 0;

	// Stream insertion operator for logging i.e. to standard output/error.
	friend std::ostream& operator<<(
	std::ostream& output,
	const DDPLoggingData& ddp_logging_data
	) {

	std::string devicesStr = c10::Join(", ", ddp_logging_data.device_ids);
	std::string bucketSizesStr = c10::Join(", ", ddp_logging_data.bucket_sizes);
	std::string dtypesStr = c10::Join(" ", ddp_logging_data.dtypes);

	std::string ddpLoggingDataInfo = c10::str(
	"world_size: ", ddp_logging_data.world_size, ", module_name: ",
	ddp_logging_data.module_name, ", device_ids: ", devicesStr, ", output_device: ",
	ddp_logging_data.output_device, ", backend_name: ", ddp_logging_data.backend_name,
	", parameter_dtype: ", dtypesStr, ", total_parameter_size_in_bytes: ",
	ddp_logging_data.total_parameter_size_bytes, ", num_parameter_tensors: ",
	ddp_logging_data.num_parameter_tensors, " bucket_sizes: ", bucketSizesStr,
	", CUDA_VISIBLE_DEVICES: ", ddp_logging_data.cuda_visible_devices, ", broadcast_buffers: ",
	ddp_logging_data.broadcast_buffers, ", bucket_cap_mb: ", ddp_logging_data.bucket_cap_mb,
	", find_unused_parameters: ", ddp_logging_data.find_unused_parameters,
	", gradient_as_bucket_view: ", ddp_logging_data.gradient_as_bucket_view,
	"\n"
	);
	std::string backendInfo = " Backend Info: ";
	if (ddp_logging_data.backend_name == "nccl") {
	backendInfo += c10::str(
	"nccl_socket_ifname: ", ddp_logging_data.nccl_socket_ifname,
	" nccl_blocking_wait: ", ddp_logging_data.nccl_blocking_wait,
	" nccl_debug: ", ddp_logging_data.nccl_debug,
	" nccl_async_error_handling: ", ddp_logging_data.nccl_async_error_handling,
	" nccl_nthreads: ", ddp_logging_data.nccl_nthreads,
	" nccl_ib_timeout: ", ddp_logging_data.nccl_ib_timeout,
	"\n"
	);
	} else if (ddp_logging_data.backend_name == "gloo") {
	backendInfo += c10::str(
	"gloo_socket_ifname: ", ddp_logging_data.gloo_socket_ifname,
	" gloo_device_transport: ", ddp_logging_data.gloo_device_transport,
	"\n"
	);
	}
	ddpLoggingDataInfo += backendInfo;

	if (ddp_logging_data.comm_hook != "") {
	auto commHookInfo = c10::str(
	"comm_hook: ", ddp_logging_data.comm_hook
	);
	ddpLoggingDataInfo += commHookInfo;
	}

	if (ddp_logging_data.join_uneven_inputs) {
	auto joinInfo = c10::str("join_uneven_inputs: ", ddp_logging_data.join_uneven_inputs);
	ddpLoggingDataInfo += joinInfo;
	}

	return output << ddpLoggingDataInfo;
	}
	};

	C10_API void SetPyTorchDDPUsageLogger(std::function<void(const c10::DDPLoggingData&)> logger);
	C10_API void LogPyTorchDDPUsage(const c10::DDPLoggingData& ddpData);

	namespace detail {
	// Return value is needed to do the static variable initialization trick
	C10_API bool LogAPIUsageFakeReturn(const std::string& context);
	}

	} // namespace c10

	#endif // C10_UTIL_LOGGING_H_