| /* Copyright 2019 The TensorFlow Authors. All Rights Reserved. |
| |
| Licensed under the Apache License, Version 2.0 (the "License"); |
| you may not use this file except in compliance with the License. |
| You may obtain a copy of the License at |
| |
| http://www.apache.org/licenses/LICENSE-2.0 |
| |
| Unless required by applicable law or agreed to in writing, software |
| distributed under the License is distributed on an "AS IS" BASIS, |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| See the License for the specific language governing permissions and |
| limitations under the License. |
| ==============================================================================*/ |
| |
| #ifndef TENSORFLOW_LITE_DELEGATES_GPU_COMMON_CONVERT_H_ |
| #define TENSORFLOW_LITE_DELEGATES_GPU_COMMON_CONVERT_H_ |
| |
| #include <vector> |
| |
| #include "absl/types/span.h" |
| #include "tensorflow/lite/delegates/gpu/common/shape.h" |
| #include "tensorflow/lite/delegates/gpu/common/status.h" |
| #include "tensorflow/lite/delegates/gpu/common/tensor.h" |
| #include "tensorflow/lite/delegates/gpu/common/types.h" |
| |
| namespace tflite { |
| namespace gpu { |
| |
| // PHWC4 layout is where channels are grouped by 4 in a row and P stands for |
| // a plane that was derived by dividing channels by 4. |
| Status ConvertToPHWC4(absl::Span<const float> in, const BHWC& shape, |
| absl::Span<float> out); |
| Status ConvertToPHWC4Half(absl::Span<const float> in, const BHWC& shape, |
| absl::Span<HalfBits> out); |
| |
| // @return number of elements when shape is converted into PHWC4. |
| uint32_t GetElementsSizeForPHWC4(const BHWC& shape); |
| |
| // Operation is opposite to ConvertToPHWC4. |
| Status ConvertFromPHWC4(absl::Span<const float> in, const BHWC& shape, |
| absl::Span<float> out); |
| Status ConvertFromPHWC4Half(absl::Span<const HalfBits> in, const BHWC& shape, |
| absl::Span<float> out); |
| |
| // Convenience wrapper around a method above. |
| std::vector<float> ConvertToPHWC4( |
| const Tensor<BHWC, DataType::FLOAT32>& tensor); |
| std::vector<float> ConvertToPHWC4(const Tensor<HWC, DataType::FLOAT32>& tensor); |
| |
| // @return number of elements when shape is converted into PIOHW4. |
| uint32_t GetElementsSizeForPIOHW4(const OHWI& shape); |
| |
| // PIOHW4 layout re-arranges weights in groups by 4, where outer dimension is |
| // P which is OxI/4. |
| Status ConvertToPIOHW4(absl::Span<const float> in, const OHWI& shape, |
| absl::Span<float> out); |
| |
| // Convenience wrapper around a method above. |
| std::vector<float> ConvertToPIOHW4( |
| const Tensor<OHWI, DataType::FLOAT32>& tensor); |
| |
| // @return number of elements when shape is converted into PHWO4I4. |
| uint32_t GetElementsSizeForPHWO4I4(const OHWI& shape); |
| |
| // Convenience wrapper around a method above. |
| std::vector<float> ConvertToPHWO4I4( |
| const Tensor<OHWI, DataType::FLOAT32>& tensor); |
| |
| // Convenience wrapper around a method above, for Transposed Convolution. |
| std::vector<float> ConvertToPHWO4I4Transposed( |
| const Tensor<OHWI, DataType::FLOAT32>& tensor); |
| |
| // @return (x,y,z) size for PHWO4I4 to access elements where each element |
| // consists of 4 values. |
| uint3 Get3DSizeForPHWO4I4(const OHWI& shape); |
| |
| // @return number of elements when shape is converted into PHWO4I4. |
| uint32_t GetElementsSizeForPHWO4I4(const IHWO& shape); |
| |
| // Layout is Po,H,W,OI4x4. |
| Status ConvertToPHWO4I4(absl::Span<const float> in, const IHWO& shape, |
| absl::Span<float> out); |
| |
| // Convenience wrapper around a method above. |
| std::vector<float> ConvertToPHWO4I4( |
| const Tensor<IHWO, DataType::FLOAT32>& tensor); |
| |
| } // namespace gpu |
| } // namespace tflite |
| |
| #endif // TENSORFLOW_LITE_DELEGATES_GPU_COMMON_CONVERT_H_ |