ArmNN 22.08
EthosnRefConvolution2dWorkload.cpp
//
// Copyright © 2017 Arm Ltd. All rights reserved.
// SPDX-License-Identifier: MIT
//

#include "EthosnRefConvolution2dWorkload.hpp"

#include "EthosnRefConvImpl.hpp"

#include <armnnUtils/DataLayoutIndexed.hpp>

#include <cassert>
#include <iostream>
#include <memory>
#include <string>

using namespace armnn::ethosnref;

namespace armnn
{

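// Returns the next token of s, splitting on delim starting at pos; advances pos
// past the delimiter and returns an empty string once the input is exhausted.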
static inline std::string Split(const std::string& s, const std::string& delim, std::size_t& pos)
{
    if (pos >= s.length())
    {
        return "";
    }

    std::size_t end = s.find(delim, pos);
    if (end == std::string::npos)
    {
        end = s.length();
    }

    std::string str = s.substr(pos, end - pos);
    pos = end + 1;

    return str;
}


EthosnRefConvolution2dWorkload::EthosnRefConvolution2dWorkload(
    const Convolution2dQueueDescriptor& descriptor, const WorkloadInfo& info, bool winograd, std::string BlockConfigs)
    : BaseWorkload<Convolution2dQueueDescriptor>(descriptor, info)
{
    m_Weight = std::make_unique<ScopedCpuTensorHandle>(*(descriptor.m_Weight));

    if (descriptor.m_Parameters.m_BiasEnabled)
    {
        m_Bias = std::make_unique<ScopedCpuTensorHandle>(*(descriptor.m_Bias));
    }

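    // Parse the comma-separated BlockConfigs string: 2D Winograd is only possible
    // when the allowed block configurations include 16x8, 8x16 or 8x8 (an empty
    // string places no restriction).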
    m_Winograd = winograd;

    m_IsBlockConfigsWinograd2dCompatible = false;
    std::string part;
    std::size_t pos = 0;
    while (!(part = Split(BlockConfigs, ",", pos)).empty())
    {
        if (part == "16x8" || part == "8x16" || part == "8x8")
        {
            m_IsBlockConfigsWinograd2dCompatible = true;
        }
    }
    if (BlockConfigs.empty())
    {
        m_IsBlockConfigsWinograd2dCompatible = true;
    }
}

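// Executes the convolution, choosing between the direct and Winograd reference
// implementations based on the heuristic below.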
void EthosnRefConvolution2dWorkload::Execute() const
{
    ARMNN_SCOPED_PROFILING_EVENT_ETHOSN("EthosnRefConvolution2dWorkload_Execute");

    const TensorInfo& inputInfo = GetTensorInfo(m_Data.m_Inputs[0]);
    const TensorInfo& weightsInfo = m_Weight->GetTensorInfo();

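    // Winograd is used only if it was requested, the block configuration allows it,
    // it reduces the estimated multiplication count, and the convolution is unstrided.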
    bool useWinograd = false;

    if (m_Winograd)
    {
        const armnnUtils::DataLayoutIndexed dataLayoutIndexed(m_Data.m_Parameters.m_DataLayout);
        unsigned int weightsHeight = weightsInfo.GetShape()[dataLayoutIndexed.GetHeightIndex()];
        unsigned int weightsWidth  = weightsInfo.GetShape()[dataLayoutIndexed.GetWidthIndex()];
        unsigned int xStride = m_Data.m_Parameters.m_StrideX;
        unsigned int yStride = m_Data.m_Parameters.m_StrideY;

        bool isWinograd1D  = weightsWidth == 1 || weightsHeight == 1;
        bool isBlockSizeOk = isWinograd1D ? true : m_IsBlockConfigsWinograd2dCompatible;

        uint32_t numMultsDirect, numMultsWinograd;

        if (isWinograd1D)
        {
            // 1D convolution kernel, dims w x 1 or 1 x h:
            // numOfMultiplications = 2 * w or 2 * h                  DIRECT
            //                      = 4 * CEIL(w/3) or 4 * CEIL(h/3)  WINOGRAD
            numMultsDirect   = weightsWidth * weightsHeight * 2;
            numMultsWinograd = 4 * DivideRoundUp(weightsWidth * weightsHeight, 3);
        }
        else
        {
            // 2D convolution kernel, dims w x h:
            // numOfMultiplications = 4 * w * h                       DIRECT
            //                      = 16 * CEIL(w/3) * CEIL(h/3)      WINOGRAD
            numMultsDirect   = weightsWidth * weightsHeight * 4;
            numMultsWinograd = 16 * DivideRoundUp(weightsWidth, 3) * DivideRoundUp(weightsHeight, 3);
        }
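        // Worked example: a 3x3 kernel gives numMultsDirect = 4 * 9 = 36 and
        // numMultsWinograd = 16 * 1 * 1 = 16, so Winograd wins if the stride is 1.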
        if (numMultsWinograd < numMultsDirect &&
            isBlockSizeOk &&
            // TODO: FENCHSW-922 Need to revisit this when
            // SW adds support for Winograd + Strided
            xStride == 1 && yStride == 1)
        {
            useWinograd = true;
        }
    }

    if (useWinograd)
    {
        std::cout << "[EthosNRef] Running in Winograd Mode.\n";
    }
    else
    {
        std::cout << "[EthosNRef] Running in Direct Mode.\n";
    }

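    // Dispatch on the input/weights data type; each branch fetches the raw tensor
    // data plus quantization parameters and invokes the direct or Winograd kernel.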
    if (CheckDataType(DataType::QSymmS16, inputInfo.GetDataType(), weightsInfo.GetDataType()))
    {
        const int16_t* inputData   = GetInputTensorData<int16_t>(0, m_Data);
        const int16_t* weightsData = m_Weight->template GetConstTensor<int16_t>();
        const int32_t* biasData    = m_Data.m_Parameters.m_BiasEnabled ? m_Bias->template GetConstTensor<int32_t>() : nullptr;
        const TensorInfo& outputInfo = GetTensorInfo(m_Data.m_Outputs[0]);

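        // The QSymmS16 path is instantiated with a 64-bit accumulator (final template
        // argument), while the 8-bit paths below use 32 bits; presumably this guards
        // against overflow when accumulating 16-bit x 16-bit products.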
        if (!useWinograd)
        {
            EthosnRefConvImpl<armnn::Convolution2dQueueDescriptor, int16_t, int16_t, int32_t, int64_t>(
                m_Data,
                inputData, inputInfo.GetQuantizationScale(), inputInfo.GetQuantizationOffset(),
                weightsData, weightsInfo.GetQuantizationScale(), weightsInfo.GetQuantizationOffset(),
                biasData,
                outputInfo.GetQuantizationScale(), outputInfo.GetQuantizationOffset(), weightsInfo);
        }
        else
        {
            EthosnRefWinogradConvImpl<armnn::Convolution2dQueueDescriptor, int16_t, int16_t, int32_t>(
                m_Data,
                inputData, inputInfo.GetQuantizationScale(), inputInfo.GetQuantizationOffset(),
                weightsData, weightsInfo.GetQuantizationScale(), weightsInfo.GetQuantizationOffset(),
                biasData,
                outputInfo.GetQuantizationScale(), outputInfo.GetQuantizationOffset(), weightsInfo);
        }
    }
    else if (CheckDataType(DataType::QSymmS8, inputInfo.GetDataType(), weightsInfo.GetDataType()))
    {
        const int8_t* inputData   = GetInputTensorData<int8_t>(0, m_Data);
        const int8_t* weightsData = m_Weight->template GetConstTensor<int8_t>();
        const int32_t* biasData   = m_Data.m_Parameters.m_BiasEnabled ? m_Bias->template GetConstTensor<int32_t>() : nullptr;
        const TensorInfo& outputInfo = GetTensorInfo(m_Data.m_Outputs[0]);

        if (!useWinograd)
        {
            EthosnRefConvImpl<armnn::Convolution2dQueueDescriptor, int8_t, int8_t, int32_t, int32_t>(
                m_Data,
                inputData, inputInfo.GetQuantizationScale(), inputInfo.GetQuantizationOffset(),
                weightsData, weightsInfo.GetQuantizationScale(), weightsInfo.GetQuantizationOffset(),
                biasData,
                outputInfo.GetQuantizationScale(), outputInfo.GetQuantizationOffset(), weightsInfo);
        }
        else
        {
            EthosnRefWinogradConvImpl<armnn::Convolution2dQueueDescriptor, int8_t, int8_t, int32_t>(
                m_Data,
                inputData, inputInfo.GetQuantizationScale(), inputInfo.GetQuantizationOffset(),
                weightsData, weightsInfo.GetQuantizationScale(), weightsInfo.GetQuantizationOffset(),
                biasData,
                outputInfo.GetQuantizationScale(), outputInfo.GetQuantizationOffset(), weightsInfo);
        }
    }
    else // QAsymmU8
    {
        assert(CheckDataType(DataType::QAsymmU8, inputInfo.GetDataType(), weightsInfo.GetDataType()));

        const uint8_t* inputData   = GetInputTensorData<uint8_t>(0, m_Data);
        const uint8_t* weightsData = m_Weight->template GetConstTensor<uint8_t>();
        const int32_t* biasData    = m_Data.m_Parameters.m_BiasEnabled ? m_Bias->template GetConstTensor<int32_t>() : nullptr;
        const TensorInfo& outputInfo = GetTensorInfo(m_Data.m_Outputs[0]);

        if (!useWinograd)
        {
            EthosnRefConvImpl<armnn::Convolution2dQueueDescriptor, uint8_t, uint8_t, int32_t, int32_t>(
                m_Data,
                inputData, inputInfo.GetQuantizationScale(), inputInfo.GetQuantizationOffset(),
                weightsData, weightsInfo.GetQuantizationScale(), weightsInfo.GetQuantizationOffset(),
                biasData,
                outputInfo.GetQuantizationScale(), outputInfo.GetQuantizationOffset(), weightsInfo);
        }
        else
        {
            EthosnRefWinogradConvImpl<armnn::Convolution2dQueueDescriptor, uint8_t, uint8_t, int32_t>(
                m_Data,
                inputData, inputInfo.GetQuantizationScale(), inputInfo.GetQuantizationOffset(),
                weightsData, weightsInfo.GetQuantizationScale(), weightsInfo.GetQuantizationOffset(),
                biasData,
                outputInfo.GetQuantizationScale(), outputInfo.GetQuantizationOffset(), weightsInfo);
        }
    }
}

} // namespace armnn