#include <ATen/native/mkldnn/MKLDNNCommon.h>
#include <ATen/OpaqueTensorImpl.h>
#include <c10/core/Allocator.h>

#if AT_MKLDNN_ENABLED()

#include <ideep.hpp>

namespace at { namespace native {

/**
 * `IntrusivePtrTargetWrapper` wraps a custom storage handle of a tensor
 * (as its template parameter) and inherits from `c10::intrusive_ptr_target`
 * so that it can be used with `c10::intrusive_ptr`.
 *
 * It currently only supports wrapping a custom handle by:
 * - Construction from an existing custom handle via the copy/move constructor.
 *
 * See `OpaqueTensorImpl::opaque_handle_`.
 *
 * NOTE: if this turns out to be generally useful, we may want to move it to
 * its own header.
 */
template <typename T>
struct TORCH_API IntrusivePtrTargetWrapper : c10::intrusive_ptr_target {
private:
  T target_;

public:
  IntrusivePtrTargetWrapper() = delete;
  IntrusivePtrTargetWrapper(const T& target): target_(target) {}
  IntrusivePtrTargetWrapper(T&& target): target_(std::move(target)) {}

  T& get_target() {
    return target_;
  }
};
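
// Illustrative sketch (not part of the original file): an `ideep::tensor`
// can be handed to the wrapper and then reference-counted via
// `c10::intrusive_ptr`:
//
//   ideep::tensor it;
//   auto wrapped =
//       c10::make_intrusive<IntrusivePtrTargetWrapper<ideep::tensor>>(std::move(it));
//   ideep::tensor& inner = wrapped->get_target();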

using IDeepTensorWrapper = IntrusivePtrTargetWrapper<ideep::tensor>;
using IDeepTensorWrapperPtr = c10::intrusive_ptr<IDeepTensorWrapper>;
using MKLDNNTensorImpl = OpaqueTensorImpl<IDeepTensorWrapperPtr>;
using MKLDNNTensor = Tensor;

ideep::tensor::data_type get_mkldnn_dtype(ScalarType type) {
  switch (type) {
    case ScalarType::Float:
      return ideep::tensor::data_type::f32;
    case ScalarType::QInt32:
      return ideep::tensor::data_type::s32;
    case ScalarType::QInt8:
      return ideep::tensor::data_type::s8;
    case ScalarType::QUInt8:
    case ScalarType::Byte:
      return ideep::tensor::data_type::u8;
    case ScalarType::BFloat16:
      return ideep::tensor::data_type::bf16;
    default:
      TORCH_CHECK(false, "get_mkldnn_dtype: unsupported data type: ", type);
  }
}
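
// Illustrative sketch: this mapping is what backs MKL-DNN tensor creation,
// e.g.
//
//   TORCH_INTERNAL_ASSERT(get_mkldnn_dtype(ScalarType::BFloat16)
//       == ideep::tensor::data_type::bf16);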

Tensor new_with_itensor_mkldnn(ideep::tensor&& it, c10::optional<ScalarType> dtype, c10::optional<Device> device) {
  // NOTE: ideep::tensor's dims are int32_t, but aten sizes need int64_t
  // TODO: support int64_t dims in ideep::tensor to avoid the extra conversion
  auto dims = it.get_dims();
  IDeepTensorWrapperPtr handle = c10::make_intrusive<IDeepTensorWrapper>(std::move(it));
  caffe2::TypeMeta dtype_ = scalarTypeToTypeMeta(dtype_or_default(dtype));
  Device device_ = device_or_default(device);
  return detail::make_tensor<MKLDNNTensorImpl>(
    DispatchKeySet(DispatchKey::MkldnnCPU),
    dtype_, device_, handle,
    std::vector<int64_t>(dims.begin(), dims.end()));
}
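
// Illustrative sketch (not part of the original file): wrapping a raw
// ideep::tensor into an aten Tensor. `src` is a hypothetical, already
// initialized ideep::tensor; passing c10::nullopt falls back to the
// default dtype/device.
//
//   Tensor t = new_with_itensor_mkldnn(std::move(src), c10::nullopt, c10::nullopt);
//   TORCH_INTERNAL_ASSERT(t.is_mkldnn());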

ideep::tensor& itensor_from_mkldnn(const MKLDNNTensor& mkldnn_tensor) {
  TORCH_CHECK(mkldnn_tensor.is_mkldnn(),
             "itensor_from_mkldnn expects MKL-DNN tensor input");
  TORCH_INTERNAL_ASSERT(at::impl::variable_excluded_from_dispatch());
  MKLDNNTensorImpl *mklimpl = static_cast<MKLDNNTensorImpl *>(mkldnn_tensor.unsafeGetTensorImpl());
  return mklimpl->unsafe_opaque_handle()->get_target();
}

ideep::tensor itensor_view_from_dense(const Tensor& tensor) {
  TORCH_CHECK(
      tensor.device().type() == DeviceType::CPU,
      "itensor_view_from_dense expects CPU tensor input");
  TORCH_CHECK(
      tensor.layout() == Layout::Strided,
      "itensor_view_from_dense expects dense tensor input");
  TORCH_CHECK(tensor.scalar_type() == ScalarType::Float,
             "itensor_view_from_dense expects float tensor input");
  TORCH_INTERNAL_ASSERT(at::impl::variable_excluded_from_dispatch());
  return {{{tensor.sizes().cbegin(), tensor.sizes().cend()},
           ideep::tensor::data_type::f32},
          tensor.template data_ptr<float>()};
}
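
// Illustrative sketch: a zero-copy ideep view over a dense float CPU tensor.
// The view aliases `dense`'s storage, so `dense` must outlive `view`.
//
//   Tensor dense = at::empty({2, 3}, at::device(at::kCPU).dtype(at::kFloat));
//   ideep::tensor view = itensor_view_from_dense(dense);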

// Helper function for getting an ideep tensor out of an aten Tensor.
// Note: if the aten Tensor is a dense tensor, the returned ideep tensor
// is just a view of the dense tensor's storage, so the caller must ensure
// that the dense tensor outlives the ideep tensor.
ideep::tensor itensor_from_tensor(const Tensor& tensor) {
  if (tensor.is_mkldnn()) {
    return itensor_from_mkldnn(tensor);
  } else {
    return itensor_view_from_dense(tensor);
  }
}
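
// Illustrative sketch: both layouts go through the same entry point; only
// the dense branch returns a non-owning view (see the lifetime note above).
// `mkldnn_t` and `dense_t` are hypothetical tensors of the respective layouts.
//
//   ideep::tensor a = itensor_from_tensor(mkldnn_t); // copies the wrapped handle
//   ideep::tensor b = itensor_from_tensor(dense_t);  // non-owning view of dense_t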

}} // namespace at::native

#endif // AT_MKLDNN_ENABLED()