blob: 735836a731f8febb1e9147713f2a98a3123fd02a [file] [log] [blame]
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/
#ifndef TENSORFLOW_LITE_DELEGATES_HEXAGON_BUILDERS_CONV_2D_BUILDER_H_
#define TENSORFLOW_LITE_DELEGATES_HEXAGON_BUILDERS_CONV_2D_BUILDER_H_
#include <vector>
#include "tensorflow/lite/delegates/hexagon/builders/op_builder.h"
namespace tflite {
namespace delegates {
namespace hexagon {
// Stores quantization data for Conv/TransposeConv nodes.
// This information is used to handle the per-channel quantized weights & biases
// correctly in the Hexagon delegate.
struct PerChannelQuantData {
// This is initialized while processing quantized weights, and acts as an
// input to Hexagon Conv nodes.
OpBuilder* channel_scales_node = nullptr;
// Scale information is obtained from TfLiteAffineQuantization in the weights
// tensor.
float* scales_data = nullptr;
int num_scale_values = 1;
};
class Conv2dOpBuilder : public OpBuilder {
public:
explicit Conv2dOpBuilder(GraphBuilder* graph_builder, int op_type)
: OpBuilder(graph_builder, op_type) {}
TfLiteStatus PopulateSubGraph(const TfLiteIntArray* inputs,
const TfLiteIntArray* outputs,
TfLiteContext* context) override;
TfLiteStatus RegisterOutputs(const TfLiteIntArray* outputs,
TfLiteContext* context) override;
~Conv2dOpBuilder() override;
private:
TfLiteStatus InitializeWeightsNodes(const TfLiteIntArray* inputs,
const TfLiteIntArray* outputs,
TfLiteContext* context,
const int input_depth);
TfLiteStatus InitializeBiasNodes(const TfLiteIntArray* inputs,
const TfLiteIntArray* outputs,
TfLiteContext* context);
TensorID node_output_;
std::vector<float> transposed_weights_;
std::vector<int> stride_shape_;
std::vector<int> weight_shape_;
OpBuilder* weights_min_node_ = nullptr;
OpBuilder* weights_max_node_ = nullptr;
OpBuilder* bias_min_node_ = nullptr;
OpBuilder* bias_max_node_ = nullptr;
// Modified only if node has per-channel quantized weights/biases.
PerChannelQuantData per_channel_quant_;
// Only used for dilated Depthwise Conv.
std::vector<int> dilation_factors_h_w_;
std::vector<int> space_to_batch_paddings_;
std::vector<int> batch_to_space_crops_;
};
// ProcessPerChannelQuantizedWeights & ProcessPerChannelQuantizedBias can be
// used to pre-process per-channel quantized weights & biases for Hexagon.
// NOTE: ProcessPerChannelQuantizedWeights should be run before
// ProcessPerChannelQuantizedBias. This is becase we set PerChannelQuantData
// based on the weights tensor, which is utilized while preprocessing bias.
TfLiteStatus ProcessPerChannelQuantizedWeights(
const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
TfLiteContext* context, float* weights_min, float* weights_max,
GraphBuilder* graph_builder, PerChannelQuantData* per_channel_quant);
TfLiteStatus ProcessPerChannelQuantizedBias(
const TfLiteIntArray* inputs, const TfLiteIntArray* outputs,
TfLiteContext* context, float* bias_min, float* bias_max,
GraphBuilder* graph_builder, PerChannelQuantData* per_channel_quant,
OpBuilder** bias_const_node = nullptr);
} // namespace hexagon
} // namespace delegates
} // namespace tflite
#endif // TENSORFLOW_LITE_DELEGATES_HEXAGON_BUILDERS_CONV_2D_BUILDER_H_