ArmNN
 24.02
NeonGatherNdWorkload Class Reference

#include <NeonGatherNdWorkload.hpp>

Inheritance diagram for NeonGatherNdWorkload:
[legend]
Collaboration diagram for NeonGatherNdWorkload:
[legend]

Public Member Functions

 NeonGatherNdWorkload (const GatherNdQueueDescriptor &descriptor, const WorkloadInfo &info)
 
virtual void Execute () const override
 
- Public Member Functions inherited from NeonBaseWorkload< GatherNdQueueDescriptor >
 NeonBaseWorkload (const GatherNdQueueDescriptor &descriptor, const WorkloadInfo &info)
 
void ReplaceInputTensorHandle (ITensorHandle *tensorHandle, unsigned int slot) override
 
void ReplaceOutputTensorHandle (ITensorHandle *tensorHandle, unsigned int slot) override
 
- Public Member Functions inherited from BaseWorkload< GatherNdQueueDescriptor >
 BaseWorkload (const GatherNdQueueDescriptor &descriptor, const WorkloadInfo &info)
 
virtual const std::string & GetName () const override
 
void ExecuteAsync (ExecutionData &executionData) override
 
void PostAllocationConfigure () override
 
const GatherNdQueueDescriptor & GetData () const
 
arm::pipe::ProfilingGuid GetGuid () const final
 
virtual bool SupportsTensorHandleReplacement () const override
 
- Public Member Functions inherited from IWorkload
virtual ~IWorkload ()
 
virtual arm::pipe::ProfilingGuid GetGuid () const =0
 
virtual bool SupportsTensorHandleReplacement () const =0
 
virtual const std::string & GetName () const =0
 
virtual void RegisterDebugCallback (const DebugCallbackFunction &)
 
virtual armnn::Optional< armnn::MemoryRequirements > GetMemoryRequirements ()
 

Additional Inherited Members

- Protected Member Functions inherited from NeonBaseWorkload< GatherNdQueueDescriptor >
virtual void Reconfigure ()
 
- Protected Attributes inherited from BaseWorkload< GatherNdQueueDescriptor >
GatherNdQueueDescriptor m_Data
 
const arm::pipe::ProfilingGuid m_Guid
 
const std::string m_Name
 

Detailed Description

Definition at line 22 of file NeonGatherNdWorkload.hpp.

Constructor & Destructor Documentation

◆ NeonGatherNdWorkload()

NeonGatherNdWorkload ( const GatherNdQueueDescriptor & descriptor,
const WorkloadInfo & info 
)

Calculate flattened indices: m_FlattenedIndices = indices * m_FlattenedCoeff. This could be done using MatMul instead of multiplication followed by reduce sum operation, but GeMM does not support s32 at the moment.

Call Gather with adequate shapes

Definition at line 97 of file NeonGatherNdWorkload.cpp.

99  : NeonBaseWorkload<GatherNdQueueDescriptor>(descriptor, info)
100 {
101  m_Data.ValidateInputsOutputs("NeonGatherNdWorkload", 2, 1);
102 
103  TensorInfo paramsInfo = info.m_InputTensorInfos[0];
104  TensorInfo indicesInfo = info.m_InputTensorInfos[1];
105  TensorInfo outputInfo = info.m_OutputTensorInfos[0];
106 
107  arm_compute::ITensor& input = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
108  arm_compute::ITensor& indices = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Inputs[1])->GetTensor();
109  arm_compute::ITensor& output = PolymorphicDowncast<IAclTensorHandle*>(m_Data.m_Outputs[0])->GetTensor();
110 
111  // Derive the GatherNd key dimensions ND, K, W, C from the params/indices shapes.
112  std::map<std::string, unsigned int> keyIndices = CalculateGatherNdKeyIndices(paramsInfo, indicesInfo);
113 
114  /// Calculate flattened indices: m_FlattenedIndices = indices * m_FlattenedCoeff.
115  /// This could be done using MatMul instead of multiplication followed by reduce sum operation,
116  /// but GeMM does not support s32 at the moment.
117 
118  // Prepare the tensor to store the output of the reduce_sum operation
119  armnn::TensorInfo flattenedIndices_Info = indicesInfo;
120  flattenedIndices_Info.SetShape({ keyIndices["W"] });
121  BuildArmComputeTensor(m_FlattenedIndices, flattenedIndices_Info);
122  armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_FlattenedIndices);
123 
124  // Reshape indices into { W, ND }
125  indices.info()->set_tensor_shape(BuildArmComputeTensorShape({ keyIndices["W"], keyIndices["ND"] }));
126 
127  // Calculate m_FlattenedCoeff: row-major strides of params over the first ND
127  // dimensions, i.e. flattenedCoeff[i] = product of paramsShape[i+1 .. ND-1].
128  TensorShape paramsShape = paramsInfo.GetShape();
129  std::vector<int32_t> flattenedCoeff(keyIndices["ND"], 1);
130  for (unsigned int i = 1; i < keyIndices["ND"]; ++i)
131  {
132  flattenedCoeff[i - 1] = static_cast<int32_t>(paramsShape[i]);
133  }
134  for (unsigned int i = keyIndices["ND"] - 1; i > 0; --i)
135  {
136  flattenedCoeff[i - 1] *= flattenedCoeff[i];
137  }
138  armnn::TensorInfo flattenedCoeff_Info = indicesInfo;
139  flattenedCoeff_Info.SetShape({ keyIndices["ND"] });
140  BuildArmComputeTensor(m_FlattenedCoeff, flattenedCoeff_Info);
141  armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_FlattenedCoeff);
142  ARMNN_ASSERT_MSG(indicesInfo.GetDataType() == DataType::Signed32,
143  "flattenedCoeff must be same data type as m_FlattenedCoeff");
144  CopyArmComputeITensorData<int32_t>(flattenedCoeff.data(), m_FlattenedCoeff);
145 
146  // Prepare the tensor to store the output of the multiplication
147  armnn::TensorInfo outputMul_Info = indicesInfo;
148  outputMul_Info.SetShape({ keyIndices["W"], keyIndices["ND"] });
149  BuildArmComputeTensor(m_OutputMul, outputMul_Info);
150  armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_OutputMul);
151 
152  // Element-wise multiply: m_OutputMul = indices * m_FlattenedCoeff (s32, WRAP / TO_ZERO, no fused activation)
153  m_MulLayer.configure(&indices,
154  &m_FlattenedCoeff,
155  &m_OutputMul,
156  1.0f,
157  arm_compute::ConvertPolicy::WRAP,
158  arm_compute::RoundingPolicy::TO_ZERO,
159  arm_compute::ActivationLayerInfo());
160 
161  // Reduce-sum m_OutputMul along axis 1 (the ND axis) to obtain the flattened 1-D indices { W }
162  const std::vector<unsigned int> armnnReduceAxes(1, 1);
163  arm_compute::Coordinates coords = BuildArmComputeReductionCoordinates(m_OutputMul.info()->num_dimensions(),
164  outputMul_Info.GetNumDimensions(),
165  armnnReduceAxes);
166  m_ReduceSumLayer.configure(&m_OutputMul,
167  &m_FlattenedIndices,
168  static_cast<unsigned int>(coords[0]),
169  arm_compute::ReductionOperation::SUM,
170  false);
171 
172  /// Call Gather with adequate shapes
173  // Reshape params into { K, C }
174  paramsInfo.SetShape({ keyIndices["K"], keyIndices["C"] });
175  input.info()->set_tensor_shape(BuildArmComputeTensorShape(paramsInfo.GetShape()));
176 
177  // Reshape output to have the shape given by gather { W, C }
178  // (the original outputInfo has the shape given by gatherNd)
179  armnn::TensorInfo outputGather_Info = outputInfo;
180  outputGather_Info.SetShape({ keyIndices["W"], keyIndices["C"] });
181  BuildArmComputeTensor(m_OutputGather, outputGather_Info);
182  armcomputetensorutils::InitialiseArmComputeTensorEmpty(m_OutputGather);
183 
184  m_GatherLayer.configure(&input, &m_FlattenedIndices, &m_OutputGather, ComputeAclAxis(0, paramsInfo));
185 
186  // Reshape output to the original output shape
187  m_ReshapeLayer.configure(&m_OutputGather, &output);
188 }

References armnn::CalculateGatherNdKeyIndices(), armnn::info, BaseWorkload< GatherNdQueueDescriptor >::m_Data, QueueDescriptor::m_Inputs, QueueDescriptor::m_Outputs, TensorInfo::SetShape(), and QueueDescriptor::ValidateInputsOutputs().

Member Function Documentation

◆ Execute()

void Execute ( ) const
overridevirtual

Implements IWorkload.

Definition at line 190 of file NeonGatherNdWorkload.cpp.

191 {
192  ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID("NeonGatherNdWorkload_Execute");
193  m_MulLayer.run();        // indices * m_FlattenedCoeff
194  m_ReduceSumLayer.run();  // reduce over the ND axis -> flattened 1-D indices
195  m_GatherLayer.run();     // gather { W, C } rows from the reshaped params
196  m_ReshapeLayer.run();    // reshape back to the original GatherNd output shape
197 }

References ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID.


The documentation for this class was generated from the following files: NeonGatherNdWorkload.hpp and NeonGatherNdWorkload.cpp.
armnn::QueueDescriptor::ValidateInputsOutputs
void ValidateInputsOutputs(const std::string &descName, unsigned int numExpectedIn, unsigned int numExpectedOut) const
Definition: WorkloadData.cpp:446
armnn::TensorInfo
Definition: Tensor.hpp:152
armnn::TensorInfo::GetNumDimensions
unsigned int GetNumDimensions() const
Definition: Tensor.hpp:197
ARMNN_ASSERT_MSG
#define ARMNN_ASSERT_MSG(COND, MSG)
Definition: Assert.hpp:15
armnn::Coordinates
std::array< unsigned int, MaxNumOfTensorDimensions > Coordinates
Definition: InternalTypes.hpp:15
armnn::CalculateGatherNdKeyIndices
std::map< std::string, unsigned int > CalculateGatherNdKeyIndices(TensorInfo inputInfo0, TensorInfo inputInfo1)
Calculates the key index values needed for GatherNd: N, ND, K, W, C (N is always 1)
Definition: WorkloadUtils.cpp:312
armnn::BoostLogSeverityMapping::info
@ info
armnn::QueueDescriptor::m_Outputs
std::vector< ITensorHandle * > m_Outputs
Definition: WorkloadData.hpp:27
armnn::DataType::Signed32
@ Signed32
armnn::BaseWorkload< GatherNdQueueDescriptor >::m_Data
GatherNdQueueDescriptor m_Data
Definition: Workload.hpp:89
armnn::TensorInfo::SetShape
void SetShape(const TensorShape &newShape)
Definition: Tensor.hpp:195
ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID
#define ARMNN_SCOPED_PROFILING_EVENT_NEON_NAME_GUID(label)
Creates a profiling event that uses GetGuid() and GetName() from the calling class.
Definition: NeonWorkloadUtils.hpp:32
armnn::ComputeAclAxis
int ComputeAclAxis(const int &armnnAxis, const armnn::TensorInfo &tensor)
Function to convert ArmNN axis (left to right) to ACL axis (right to left) ranging from [-rank,...
Definition: ArmComputeUtils.hpp:273
armnn::QueueDescriptor::m_Inputs
std::vector< ITensorHandle * > m_Inputs
Definition: WorkloadData.hpp:26