//
// Copyright © 2022 Arm Ltd and Contributors. All rights reserved.
// SPDX-License-Identifier: MIT
//
#pragma once

#include <armnn/backends/Workload.hpp>
#include <aclCommon/ArmComputeTensorUtils.hpp>
#include <neon/NeonTensorHandle.hpp>
#include <neon/NeonTimer.hpp>
#include <armnn/backends/TensorHandle.hpp>
#include <armnn/Utils.hpp>
#include <Half.hpp>
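
// Scoped profiling helpers for Neon workloads. Both macros time the enclosing
// scope on the CpuAcc backend using a NeonTimer together with a WallClockTimer;
// the _GUID variant additionally tags the event with a profiling GUID.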
#define ARMNN_SCOPED_PROFILING_EVENT_NEON(name) \
    ARMNN_SCOPED_PROFILING_EVENT_WITH_INSTRUMENTS(armnn::Compute::CpuAcc, \
                                                  armnn::EmptyOptional(), \
                                                  name, \
                                                  armnn::NeonTimer(), \
                                                  armnn::WallClockTimer())

#define ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID(name, guid) \
    ARMNN_SCOPED_PROFILING_EVENT_WITH_INSTRUMENTS(armnn::Compute::CpuAcc, \
                                                  guid, \
                                                  name, \
                                                  armnn::NeonTimer(), \
                                                  armnn::WallClockTimer())
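
// Illustrative usage inside a workload's Execute() (a sketch mirroring the
// pattern used by the Neon workloads; names are examples only):
//     void NeonAdditionWorkload::Execute() const
//     {
//         ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonAdditionWorkload_Execute", this->GetGuid());
//         m_AddLayer.run();
//     }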
using namespace armnn::armcomputetensorutils;

namespace armnn
{
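// Returns a human-readable name for the convolution method selected by ACL,
// suitable for logging and profiling output.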
inline std::string GetConvolutionMethodString(const arm_compute::ConvolutionMethod& convolutionMethod)
{
    switch (convolutionMethod)
    {
        case arm_compute::ConvolutionMethod::FFT:
            return "FFT";
        case arm_compute::ConvolutionMethod::DIRECT:
            return "Direct";
        case arm_compute::ConvolutionMethod::GEMM:
            return "GEMM";
        case arm_compute::ConvolutionMethod::WINOGRAD:
            return "Winograd";
        default:
            return "Unknown";
    }
}
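
// Allocates dstTensor's backing memory via its ACL allocator, then copies
// srcData into it; T must match the tensor's element type.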
template <typename T>
void CopyArmComputeTensorData(arm_compute::Tensor& dstTensor, const T* srcData)
{
    InitialiseArmComputeTensorEmpty(dstTensor);
    CopyArmComputeITensorData(srcData, dstTensor);
}

inline void InitializeArmComputeTensorData(arm_compute::Tensor& tensor,
                                           const ConstTensorHandle* handle)
{
    ARMNN_ASSERT(handle);

    switch (handle->GetTensorInfo().GetDataType())
    {
        case DataType::Float16:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<armnn::Half>());
            break;
        case DataType::Float32:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<float>());
            break;
        case DataType::QAsymmU8:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<uint8_t>());
            break;
        case DataType::QSymmS8:
        case DataType::QAsymmS8:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<int8_t>());
            break;
        case DataType::Signed32:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<int32_t>());
            break;
        case DataType::QSymmS16:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<int16_t>());
            break;
        case DataType::BFloat16:
            CopyArmComputeTensorData(tensor, handle->GetConstTensor<armnn::BFloat16>());
            break;
        default:
            // Throw an exception here; an assert alone would be compiled out in release builds.
            throw Exception("Unexpected tensor type during InitializeArmComputeTensorData().");
    }
}
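
// Illustrative call site (sketch; m_KernelTensor and m_Data.m_Weight stand in
// for the usual workload members and are examples only):
//     InitializeArmComputeTensorData(*m_KernelTensor, m_Data.m_Weight);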

inline auto SetNeonStridedSliceData(const std::vector<int>& m_begin,
                                    const std::vector<int>& m_end,
                                    const std::vector<int>& m_stride)
{
    arm_compute::Coordinates starts;
    arm_compute::Coordinates ends;
    arm_compute::Coordinates strides;

    unsigned int num_dims = static_cast<unsigned int>(m_begin.size());
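
    // ACL's Coordinates run in the opposite dimension order to armnn's tensors,
    // so the begin/end/stride vectors are written back-to-front.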
    for (unsigned int i = 0; i < num_dims; i++)
    {
        unsigned int revertedIndex = num_dims - i - 1;

        starts.set(i, static_cast<int>(m_begin[revertedIndex]));
        ends.set(i, static_cast<int>(m_end[revertedIndex]));
        strides.set(i, static_cast<int>(m_stride[revertedIndex]));
    }

    return std::make_tuple(starts, ends, strides);
}
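
// Illustrative call site (sketch; 'descriptor' stands for an
// armnn::StridedSliceDescriptor):
//     arm_compute::Coordinates starts, ends, strides;
//     std::tie(starts, ends, strides) = SetNeonStridedSliceData(descriptor.m_Begin,
//                                                               descriptor.m_End,
//                                                               descriptor.m_Stride);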

// Translates the size vector given by armnn into the end vector expected by
// the ACL NESlice workload.
inline auto SetNeonSliceData(const std::vector<unsigned int>& m_begin,
                             const std::vector<unsigned int>& m_size)
{
    arm_compute::Coordinates starts;
    arm_compute::Coordinates ends;

    unsigned int num_dims = static_cast<unsigned int>(m_begin.size());

    // For strided slices, size = (end - begin) / stride. For a plain slice the
    // stride is implicitly a vector of ones, so size = end - begin and
    // therefore end = begin + size.
    for (unsigned int i = 0; i < num_dims; i++)
    {
        unsigned int revertedIndex = num_dims - i - 1;

        starts.set(i, static_cast<int>(m_begin[revertedIndex]));
        ends.set(i, static_cast<int>(m_begin[revertedIndex] + m_size[revertedIndex]));
    }

    return std::make_tuple(starts, ends);
}
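
// For example, m_begin = {0, 1} and m_size = {2, 3} give starts = (1, 0) and
// ends = (4, 2) in ACL's reversed coordinate order.

// Maps the idx-th output tensor handle of the given workload payload and
// returns a typed pointer to its data.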
template <typename DataType, typename PayloadType>
DataType* GetOutputTensorData(unsigned int idx, const PayloadType& data)
{
    ITensorHandle* tensorHandle = data.m_Outputs[idx];
    return reinterpret_cast<DataType*>(tensorHandle->Map());
}

} // namespace armnn