caffe2/contrib/warpctc/ctc_op.h - platform/external/pytorch - Git at Google

 #pragma once

 #include <ctc.h>

 #include "caffe2/core/context.h"
 #include "caffe2/core/operator.h"
 #include "caffe2/utils/math.h"
 #include "caffe2/core/common_cudnn.h"

 // Evaluates `condition` (an expression yielding a ctcStatus_t) exactly once,
 // stores the result in a local, and hands it to CAFFE_ENFORCE_EQ for
 // comparison against CTC_STATUS_SUCCESS. The extra arguments build the failure
 // text from the call site (__FILE__ / __LINE__) and the library's own
 // description obtained from ::ctcGetStatusString.
 // The do { ... } while (0) wrapper makes the expansion behave as a single
 // statement, so it can be followed by ';' inside unbraced if/else bodies.
 #define CTC_CHECK(condition)           \
   do {                                 \
     ctcStatus_t status = condition;    \
     CAFFE_ENFORCE_EQ(                  \
         status,                        \
         CTC_STATUS_SUCCESS,            \
         " Error at: ",                 \
         __FILE__,                      \
         ":",                           \
         __LINE__,                      \
         ": ",                          \
         ::ctcGetStatusString(status)); \
   } while (0)

 namespace caffe2 {

 namespace detail {

 // Produces the ctcComputeInfo value that CTCOp passes to both
 // get_workspace_size and compute_ctc_loss. Only the declaration lives here;
 // no definition for any Context is visible in this header.
 template <class Context>
 ctcComputeInfo workspaceInfo(const Context& context);

 } // namespace detail

 /**
  * Operator that computes CTC costs (and, outside test mode, gradients) by
  * calling warp-ctc's get_workspace_size and compute_ctc_loss.
  *
  * Inputs, by tag:
  *   INPUTS         activations of element type T; size(0), size(1) and size(2)
  *                  are used as max time steps, minibatch size and alphabet
  *                  size respectively.
  *   LABELS         int tensor, read from CPU.
  *   LABEL_LENGTHS  int tensor, read from CPU.
  *   INPUT_LENGTHS  optional 4th input, int tensor read from CPU. When absent,
  *                  every minibatch item is given length maxTimeSteps.
  *
  * Outputs:
  *   training (is_test == 0): [gradients, costs, workspace]
  *   test     (is_test != 0): [costs, workspace]
  * `costs` is a CPU tensor resized like LABEL_LENGTHS; `workspace` is resized
  * to the byte count reported by get_workspace_size.
  */
 template <typename T, typename Context>
 class CTCOp final : public Operator<Context> {
  public:
   USE_OPERATOR_CONTEXT_FUNCTIONS;

   // Reads the is_test argument (default 0) and enforces that the number of
   // outputs matches the mode: 2 in test mode, 3 otherwise.
   CTCOp(const OperatorDef& operator_def, Workspace* ws)
       : Operator<Context>(operator_def, ws),
         is_test_(
             OperatorBase::GetSingleArgument<int>(OpSchema::Arg_IsTest, 0)) {
     CAFFE_ENFORCE(
         (is_test_ && OutputSize() == 2) || (!is_test_ && OutputSize() == 3));
   }

   // Runs one CTC evaluation. Returns true on success; any non-success status
   // from warp-ctc is reported through CTC_CHECK.
   bool RunOnDevice() override {
     // inputs
     const auto& inputs = Input(INPUTS);
     const auto maxTimeSteps = inputs.size(0);
     const auto minibatchSize = inputs.size(1);
     const auto alphabetSize = inputs.size(2);
     const auto& labels = OperatorBase::template Input<Tensor>(LABELS, CPU);
     const auto& labelLengths =
         OperatorBase::template Input<Tensor>(LABEL_LENGTHS, CPU);

     const int* inputLengthsData = nullptr;
     if (InputSize() == 4) {
       const auto& inputLengths =
           OperatorBase::template Input<Tensor>(INPUT_LENGTHS, CPU);
       inputLengthsData = inputLengths.template data<int>();
     } else {
       // Input lengths not passed in. Default to max timesteps for
       // each item in minibatch.
       // assign() rather than resize(): resize() only initializes elements it
       // appends, so a buffer kept from an earlier run with a different
       // maxTimeSteps would otherwise keep its stale lengths.
       default_input_lengths_.assign(
           static_cast<size_t>(minibatchSize), static_cast<int>(maxTimeSteps));
       inputLengthsData = default_input_lengths_.data();
     }

     // outputs
     Tensor* gradients = nullptr;
     TensorCPU* costs = nullptr;
     Tensor* workspace = nullptr;
     if (!is_test_) {
       // [grads, costs, workspace] to maintain backward compatibility
       gradients = Output(0);
       gradients->ResizeLike(inputs);
       costs = OperatorBase::template Output<Tensor>(1, CPU);
       costs->ResizeLike(labelLengths);
       workspace = Output(2);
     } else {
       // [costs, workspace]
       costs = OperatorBase::template Output<Tensor>(0, CPU);
       costs->ResizeLike(labelLengths);
       workspace = Output(1);
     }

     // Ask warp-ctc how many scratch bytes this problem needs, then size the
     // workspace output accordingly.
     size_t workspaceSizeBytes;
     CTC_CHECK(get_workspace_size(
         labelLengths.template data<int>(),
         inputLengthsData,
         alphabetSize,
         minibatchSize,
         detail::workspaceInfo(context_),
         &workspaceSizeBytes));
     workspace->Resize(workspaceSizeBytes);
     auto* workspaceData = workspace->template mutable_data<uint8_t>();

     if (is_test_ && labels.size(0) == 0) {
       // compute_ctc_loss doesn't handle empty labels well
       T* costsData = costs->template mutable_data<T>();
       const int64_t numCosts = costs->numel();
       for (int64_t i = 0; i < numCosts; ++i) {
         costsData[i] = 0;
       }
       return true;
     }

     // gradients stays null in test mode, so a null gradient pointer is what
     // compute_ctc_loss receives there.
     CTC_CHECK(compute_ctc_loss(
         inputs.template data<T>(),
         gradients ? gradients->template mutable_data<T>() : nullptr,
         labels.template data<int>(),
         labelLengths.template data<int>(),
         inputLengthsData,
         alphabetSize,
         minibatchSize,
         costs->template mutable_data<T>(),
         workspaceData,
         detail::workspaceInfo(context_)));
     return true;
   }

  private:
   // True when the operator was created with a non-zero is_test argument.
   bool is_test_;
   // Backing storage for the per-item input lengths used when INPUT_LENGTHS is
   // not supplied; kept as a member so the buffer is reused across runs.
   std::vector<int> default_input_lengths_;

   INPUT_TAGS(INPUTS, LABELS, LABEL_LENGTHS, INPUT_LENGTHS);
 };
 }

 #undef CTC_CHECK
	#pragma once

	#include <ctc.h>

	#include "caffe2/core/context.h"
	#include "caffe2/core/operator.h"
	#include "caffe2/utils/math.h"
	#include "caffe2/core/common_cudnn.h"

	// Evaluates `condition` (an expression yielding a ctcStatus_t) exactly once,
	// stores the result in a local, and hands it to CAFFE_ENFORCE_EQ for
	// comparison against CTC_STATUS_SUCCESS. The extra arguments build the
	// failure text from the call site (__FILE__ / __LINE__) and the library's
	// own description obtained from ::ctcGetStatusString.
	// The do { ... } while (0) wrapper makes the expansion behave as a single
	// statement, so it can be followed by ';' inside unbraced if/else bodies.
	#define CTC_CHECK(condition) \
	do { \
	ctcStatus_t status = condition; \
	CAFFE_ENFORCE_EQ( \
	status, \
	CTC_STATUS_SUCCESS, \
	" Error at: ", \
	__FILE__, \
	":", \
	__LINE__, \
	": ", \
	::ctcGetStatusString(status)); \
	} while (0)

	namespace caffe2 {

	namespace detail {

	// Produces the ctcComputeInfo value that CTCOp passes to both
	// get_workspace_size and compute_ctc_loss. Only the declaration lives here;
	// no definition for any Context is visible in this header.
	template <class Context>
	ctcComputeInfo workspaceInfo(const Context& context);

	} // namespace detail

	/**
	 * Operator that computes CTC costs (and, outside test mode, gradients) by
	 * calling warp-ctc's get_workspace_size and compute_ctc_loss.
	 *
	 * Inputs, by tag:
	 *   INPUTS         activations of element type T; size(0), size(1) and
	 *                  size(2) are used as max time steps, minibatch size and
	 *                  alphabet size respectively.
	 *   LABELS         int tensor, read from CPU.
	 *   LABEL_LENGTHS  int tensor, read from CPU.
	 *   INPUT_LENGTHS  optional 4th input, int tensor read from CPU. When
	 *                  absent, every minibatch item is given length
	 *                  maxTimeSteps.
	 *
	 * Outputs:
	 *   training (is_test == 0): [gradients, costs, workspace]
	 *   test     (is_test != 0): [costs, workspace]
	 * `costs` is a CPU tensor resized like LABEL_LENGTHS; `workspace` is resized
	 * to the byte count reported by get_workspace_size.
	 */
	template <typename T, typename Context>
	class CTCOp final : public Operator<Context> {
	 public:
	  USE_OPERATOR_CONTEXT_FUNCTIONS;

	  // Reads the is_test argument (default 0) and enforces that the number of
	  // outputs matches the mode: 2 in test mode, 3 otherwise.
	  CTCOp(const OperatorDef& operator_def, Workspace* ws)
	      : Operator<Context>(operator_def, ws),
	        is_test_(
	            OperatorBase::GetSingleArgument<int>(OpSchema::Arg_IsTest, 0)) {
	    CAFFE_ENFORCE(
	        (is_test_ && OutputSize() == 2) || (!is_test_ && OutputSize() == 3));
	  }

	  // Runs one CTC evaluation. Returns true on success; any non-success status
	  // from warp-ctc is reported through CTC_CHECK.
	  bool RunOnDevice() override {
	    // inputs
	    const auto& inputs = Input(INPUTS);
	    const auto maxTimeSteps = inputs.size(0);
	    const auto minibatchSize = inputs.size(1);
	    const auto alphabetSize = inputs.size(2);
	    const auto& labels = OperatorBase::template Input<Tensor>(LABELS, CPU);
	    const auto& labelLengths =
	        OperatorBase::template Input<Tensor>(LABEL_LENGTHS, CPU);

	    const int* inputLengthsData = nullptr;
	    if (InputSize() == 4) {
	      const auto& inputLengths =
	          OperatorBase::template Input<Tensor>(INPUT_LENGTHS, CPU);
	      inputLengthsData = inputLengths.template data<int>();
	    } else {
	      // Input lengths not passed in. Default to max timesteps for
	      // each item in minibatch.
	      // assign() rather than resize(): resize() only initializes elements it
	      // appends, so a buffer kept from an earlier run with a different
	      // maxTimeSteps would otherwise keep its stale lengths.
	      default_input_lengths_.assign(
	          static_cast<size_t>(minibatchSize), static_cast<int>(maxTimeSteps));
	      inputLengthsData = default_input_lengths_.data();
	    }

	    // outputs
	    Tensor* gradients = nullptr;
	    TensorCPU* costs = nullptr;
	    Tensor* workspace = nullptr;
	    if (!is_test_) {
	      // [grads, costs, workspace] to maintain backward compatibility
	      gradients = Output(0);
	      gradients->ResizeLike(inputs);
	      costs = OperatorBase::template Output<Tensor>(1, CPU);
	      costs->ResizeLike(labelLengths);
	      workspace = Output(2);
	    } else {
	      // [costs, workspace]
	      costs = OperatorBase::template Output<Tensor>(0, CPU);
	      costs->ResizeLike(labelLengths);
	      workspace = Output(1);
	    }

	    // Ask warp-ctc how many scratch bytes this problem needs, then size the
	    // workspace output accordingly.
	    size_t workspaceSizeBytes;
	    CTC_CHECK(get_workspace_size(
	        labelLengths.template data<int>(),
	        inputLengthsData,
	        alphabetSize,
	        minibatchSize,
	        detail::workspaceInfo(context_),
	        &workspaceSizeBytes));
	    workspace->Resize(workspaceSizeBytes);
	    auto* workspaceData = workspace->template mutable_data<uint8_t>();

	    if (is_test_ && labels.size(0) == 0) {
	      // compute_ctc_loss doesn't handle empty labels well
	      T* costsData = costs->template mutable_data<T>();
	      const int64_t numCosts = costs->numel();
	      for (int64_t i = 0; i < numCosts; ++i) {
	        costsData[i] = 0;
	      }
	      return true;
	    }

	    // gradients stays null in test mode, so a null gradient pointer is what
	    // compute_ctc_loss receives there.
	    CTC_CHECK(compute_ctc_loss(
	        inputs.template data<T>(),
	        gradients ? gradients->template mutable_data<T>() : nullptr,
	        labels.template data<int>(),
	        labelLengths.template data<int>(),
	        inputLengthsData,
	        alphabetSize,
	        minibatchSize,
	        costs->template mutable_data<T>(),
	        workspaceData,
	        detail::workspaceInfo(context_)));
	    return true;
	  }

	 private:
	  // True when the operator was created with a non-zero is_test argument.
	  bool is_test_;
	  // Backing storage for the per-item input lengths used when INPUT_LENGTHS
	  // is not supplied; kept as a member so the buffer is reused across runs.
	  std::vector<int> default_input_lengths_;

	  INPUT_TAGS(INPUTS, LABELS, LABEL_LENGTHS, INPUT_LENGTHS);
	};
	}

	#undef CTC_CHECK