// blob: 6431348bc282b45f3d129b271a321a82aeea9848 [file] [log] [blame]
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//
#include "RefElementwiseWorkload.hpp"
#include "Decoders.hpp"
#include "ElementwiseFunction.hpp"
#include "Encoders.hpp"
#include "Profiling.hpp"
#include "RefWorkloadUtils.hpp"
#include "StringMapping.hpp"
#include <ResolveType.hpp>
#include <vector>
namespace armnn
{
// Constructs the workload from its queue descriptor and workload info.
// Both arguments are passed straight through to the BaseWorkload<ParentDescriptor>
// constructor; no additional setup is performed here.
template <typename Functor, typename ParentDescriptor, typename armnn::StringMapping::Id DebugString>
RefElementwiseWorkload<Functor, ParentDescriptor, DebugString>::RefElementwiseWorkload(
    const ParentDescriptor& desc, const WorkloadInfo& info)
    : BaseWorkload<ParentDescriptor>(desc, info)
{}
// Creates the decoders for the two input tensors and the encoder for the output
// tensor, each built from the TensorInfo of the matching handle stored in m_Data.
// The resulting objects are kept in m_Input0, m_Input1 and m_Output.
template <typename Functor, typename ParentDescriptor, typename armnn::StringMapping::Id DebugString>
void RefElementwiseWorkload<Functor, ParentDescriptor, DebugString>::PostAllocationConfigure()
{
    // Tensor metadata for the left operand, right operand and result.
    const TensorInfo& lhsInfo    = GetTensorInfo(m_Data.m_Inputs[0]);
    const TensorInfo& rhsInfo    = GetTensorInfo(m_Data.m_Inputs[1]);
    const TensorInfo& resultInfo = GetTensorInfo(m_Data.m_Outputs[0]);

    // Inputs are read as InType, the output is written as OutType.
    m_Input0 = MakeDecoder<InType>(lhsInfo);
    m_Input1 = MakeDecoder<InType>(rhsInfo);
    m_Output = MakeEncoder<OutType>(resultInfo);
}
// Runs the elementwise operation selected by Functor on the two inputs and
// writes the result to the output.
//
// Steps:
//   1. open a scoped CpuRef profiling event labelled with the string that
//      StringMapping associates with DebugString;
//   2. read the shapes of both inputs and of the output;
//   3. reset each decoder/encoder with the pointer returned by Map() on the
//      corresponding tensor handle;
//   4. construct ElementwiseFunction<Functor> with the shapes and the
//      decoder/encoder objects.
//
// m_Input0, m_Input1 and m_Output are dereferenced without a null check; in this
// file they are only assigned in PostAllocationConfigure().
template <typename Functor, typename ParentDescriptor, typename armnn::StringMapping::Id DebugString>
void RefElementwiseWorkload<Functor, ParentDescriptor, DebugString>::Execute() const
{
    ARMNN_SCOPED_PROFILING_EVENT(Compute::CpuRef, StringMapping::Instance().Get(DebugString));

    // Tensor metadata for the left operand, right operand and result.
    const TensorInfo& lhsInfo    = GetTensorInfo(m_Data.m_Inputs[0]);
    const TensorInfo& rhsInfo    = GetTensorInfo(m_Data.m_Inputs[1]);
    const TensorInfo& resultInfo = GetTensorInfo(m_Data.m_Outputs[0]);

    const TensorShape& lhsShape    = lhsInfo.GetShape();
    const TensorShape& rhsShape    = rhsInfo.GetShape();
    const TensorShape& resultShape = resultInfo.GetShape();

    // Point the decoders/encoder at the mapped memory of their tensor handles.
    m_Input0->Reset(m_Data.m_Inputs[0]->Map());
    m_Input1->Reset(m_Data.m_Inputs[1]->Map());
    m_Output->Reset(m_Data.m_Outputs[0]->Map());

    // The work is done by constructing the ElementwiseFunction temporary.
    ElementwiseFunction<Functor>(lhsShape, rhsShape, resultShape, *m_Input0, *m_Input1, *m_Output);
}
} //namespace armnn
// Explicit instantiations of RefElementwiseWorkload for float operands.
// The member functions are defined in this source file, so each
// functor / queue descriptor / profiling label combination that is needed
// is instantiated here.

// Arithmetic: add, subtract, multiply, divide.
template class armnn::RefElementwiseWorkload<
    std::plus<float>,
    armnn::AdditionQueueDescriptor,
    armnn::StringMapping::RefAdditionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<
    std::minus<float>,
    armnn::SubtractionQueueDescriptor,
    armnn::StringMapping::RefSubtractionWorkload_Execute>;

template class armnn::RefElementwiseWorkload<
    std::multiplies<float>,
    armnn::MultiplicationQueueDescriptor,
    armnn::StringMapping::RefMultiplicationWorkload_Execute>;

template class armnn::RefElementwiseWorkload<
    std::divides<float>,
    armnn::DivisionQueueDescriptor,
    armnn::StringMapping::RefDivisionWorkload_Execute>;

// Selection: elementwise maximum and minimum.
template class armnn::RefElementwiseWorkload<
    armnn::maximum<float>,
    armnn::MaximumQueueDescriptor,
    armnn::StringMapping::RefMaximumWorkload_Execute>;

template class armnn::RefElementwiseWorkload<
    armnn::minimum<float>,
    armnn::MinimumQueueDescriptor,
    armnn::StringMapping::RefMinimumWorkload_Execute>;

// Comparison: equal and greater.
template class armnn::RefElementwiseWorkload<
    std::equal_to<float>,
    armnn::EqualQueueDescriptor,
    armnn::StringMapping::RefEqualWorkload_Execute>;

template class armnn::RefElementwiseWorkload<
    std::greater<float>,
    armnn::GreaterQueueDescriptor,
    armnn::StringMapping::RefGreaterWorkload_Execute>;