| #pragma once |
| |
| #include <caffe2/core/workspace.h> |
| #include <caffe2/proto/caffe2_pb.h> |
| |
| namespace caffe2 { |
| /// Pass that freezes quantization params of 2-input Int8Quantize and 4-input |
| /// Int8FC ops, whose last input points to a blob holding y_scale/y_zero_point. |
| /// That variant originated from online snapshot update but complicates the |
| /// onnxifi flow, so the params are absorbed into the op itself and the last |
| /// input is removed. NOTE(review): presumably reads the blob from `ws`; confirm. |
| void freezeQuantizationParams(NetDef* net, Workspace* ws); |
| } // namespace caffe2 |