DistKLDivCriterion.cu - platform/external/pytorch - Git at Google

 #include "THCUNN.h"
 #include "common.h"
 #include "THCHalf.h"
 #include "THCHalfAutoNumerics.cuh"

 #include <thrust/fill.h>
 #include <thrust/functional.h>
 #include <thrust/device_ptr.h>
 #include <thrust/reduce.h>
 #include <thrust/inner_product.h>

 template <typename Dtype, typename Acctype>
 struct kl_functor
 {
   __host__ __device__ Acctype operator()(const Dtype& x, const Dtype& y) const
   {
       Acctype yAcc = ScalarConvert<Dtype, Acctype>::to(y);
       return y > 0 ? yAcc * (THCNumerics<Acctype>::log(yAcc) - x) : Acctype(0);
   }
 };

 template <typename Dtype>
 struct kl_updateGradInput_functor
 {
   const Dtype norm;

   kl_updateGradInput_functor(Dtype norm_)
     : norm(norm_)
   {}

   __host__ __device__ Dtype operator()(const Dtype& x, const Dtype& y) const
   {
       return y > 0 ? norm * (-y) : ScalarConvert<int, Dtype>::to(0);
   }
 };

 #include "generic/DistKLDivCriterion.cu"
 #include "THCGenerateFloatTypes.h"
	#include "THCUNN.h"
	#include "common.h"
	#include "THCHalf.h"
	#include "THCHalfAutoNumerics.cuh"

	#include <thrust/fill.h>
	#include <thrust/functional.h>
	#include <thrust/device_ptr.h>
	#include <thrust/reduce.h>
	#include <thrust/inner_product.h>

	template <typename Dtype, typename Acctype>
	struct kl_functor
	{
	__host__ __device__ Acctype operator()(const Dtype& x, const Dtype& y) const
	{
	Acctype yAcc = ScalarConvert<Dtype, Acctype>::to(y);
	return y > 0 ? yAcc * (THCNumerics<Acctype>::log(yAcc) - x) : Acctype(0);
	}
	};

	template <typename Dtype>
	struct kl_updateGradInput_functor
	{
	const Dtype norm;

	kl_updateGradInput_functor(Dtype norm_)
	: norm(norm_)
	{}

	__host__ __device__ Dtype operator()(const Dtype& x, const Dtype& y) const
	{
	return y > 0 ? norm * (-y) : ScalarConvert<int, Dtype>::to(0);
	}
	};

	#include "generic/DistKLDivCriterion.cu"
	#include "THCGenerateFloatTypes.h"