29 std::vector<ITensorHandle*> outputs)
const 35 std::unique_ptr<Decoder<float>> decoderPtr = MakeDecoder<float>(inputInfo, inputs[0]->Map());
38 std::unique_ptr<Encoder<float>> encoderPtr = MakeEncoder<float>(outputInfo, outputs[0]->Map());
41 auto getNumberOfElements = [](
const TensorShape& tensorShape,uint32_t startAxis, uint32_t lastAxis)
44 for (uint32_t i = startAxis; i < lastAxis; i++)
46 count *= tensorShape[i];
54 const uint32_t groupSize = tensorShape[channelsAxis] / numGroups;
56 uint32_t outerSize = getNumberOfElements(tensorShape, 0, channelsAxis);
57 uint32_t innerSize = getNumberOfElements(tensorShape, channelsAxis + 1, tensorShape.
GetNumDimensions());
59 for (uint32_t outer = 0; outer < outerSize; ++outer)
61 for (uint32_t inner = 0; inner < innerSize; ++inner)
63 uint32_t decoderStep1 = outer * tensorShape[channelsAxis] * innerSize + inner;
64 decoder += decoderStep1;
65 uint32_t encoderStep1 = outer * tensorShape[channelsAxis] * innerSize + inner;
66 encoder += encoderStep1;
67 for (uint32_t i = 0; i < groupSize; i++)
69 for (uint32_t j = 0; j < numGroups; j++, encoder += innerSize, encoderStep1 += innerSize)
71 decoder += innerSize * (i + j * groupSize);
72 float decoded = decoder.Get();
74 decoder -= innerSize * (i + j * groupSize);
77 decoder -= decoderStep1;
78 encoder -= encoderStep1;
const TensorShape & GetShape() const
CPU Execution: Reference C++ kernels.
Copyright (c) 2021 ARM Limited and Contributors.
LayerDescriptor m_Parameters
#define ARMNN_SCOPED_PROFILING_EVENT(backendId, name)
std::vector< ITensorHandle * > m_Inputs
ChannelShuffleQueueDescriptor m_Data
uint32_t m_NumGroups
Number of groups for the channel shuffle operation.
std::vector< ITensorHandle * > m_Outputs
void Execute() const override
unsigned int GetNumDimensions() const
Function that returns the tensor rank.
std::vector< ITensorHandle * > m_Outputs
void ExecuteAsync(WorkingMemDescriptor &workingMemDescriptor) override
uint32_t m_Axis
Axis to apply channel shuffle operation on.
std::vector< ITensorHandle * > m_Inputs
const TensorInfo & GetTensorInfo(const ITensorHandle *tensorHandle)
float32 helpers