diff options
Diffstat (limited to 'src/backends/cl/workloads')
-rw-r--r-- | src/backends/cl/workloads/ClReduceWorkload.cpp | 51 |
1 files changed, 40 insertions, 11 deletions
diff --git a/src/backends/cl/workloads/ClReduceWorkload.cpp b/src/backends/cl/workloads/ClReduceWorkload.cpp index 6f594ff7a9..0ad6259cc2 100644 --- a/src/backends/cl/workloads/ClReduceWorkload.cpp +++ b/src/backends/cl/workloads/ClReduceWorkload.cpp @@ -20,23 +20,52 @@ arm_compute::Status ClReduceWorkloadValidate(const TensorInfo& input, const ReduceDescriptor& desc) { const arm_compute::TensorInfo aclInputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(input); - const arm_compute::TensorInfo aclOutputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(output); - if (!desc.m_vAxis.empty() && desc.m_vAxis.size() > 1) - { - return arm_compute::Status(arm_compute::ErrorCode::RUNTIME_ERROR, - "ClReduceWorkload: Reduction is supported only on 1 axis."); - } arm_compute::Coordinates coords = BuildArmComputeReductionCoordinates(aclInputInfo.num_dimensions(), input.GetNumDimensions(), desc.m_vAxis); + // As ACL only support one axis, validate the layer for each axis if more than one is present. + if (!desc.m_vAxis.empty() && desc.m_vAxis.size() > 1) + { + arm_compute::Status status; + + for (unsigned int i = 0; i != desc.m_vAxis.size(); ++i) + { + TensorInfo inputToModify = input; + std::vector<uint32_t> singleAxis(1, desc.m_vAxis[i]); - return arm_compute::CLReductionOperation::validate(&aclInputInfo, - &aclOutputInfo, - static_cast<unsigned int>(coords[0]), - ConvertReductionOperationToAcl(desc), - desc.m_KeepDims); + // Calculate the output shape using the input shape for a single axis. + // Currently the output TensorInfo inferred will be reduced upon multiple axis + // which will fail validation as only one axis is supported. + const TensorShape& reducedShape = ComputeReductionTensorShape(inputToModify, singleAxis, desc.m_KeepDims); + inputToModify.SetShape(reducedShape); + + const arm_compute::TensorInfo aclOutputInfoModified = + armcomputetensorutils::BuildArmComputeTensorInfo(inputToModify); + + status = arm_compute::CLReductionOperation::validate(&aclInputInfo, + &aclOutputInfoModified, + static_cast<unsigned int>(coords[i]), + ConvertReductionOperationToAcl(desc), + desc.m_KeepDims); + if (!status) + { + break; + } + } + return status; + } + else + { + const arm_compute::TensorInfo aclOutputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(output); + + return arm_compute::CLReductionOperation::validate(&aclInputInfo, + &aclOutputInfo, + static_cast<unsigned int>(coords[0]), + ConvertReductionOperationToAcl(desc), + desc.m_KeepDims); + } } ClReduceWorkload::ClReduceWorkload(const ReduceQueueDescriptor& descriptor, const WorkloadInfo& info) |