aboutsummaryrefslogtreecommitdiff
path: root/src/backends/neon/workloads/NeonMeanWorkload.cpp
diff options
context:
space:
mode:
author: Keith Davis <keith.davis@arm.com> 2021-08-05 11:35:00 +0100
committer: KeithARM <keith.davis@arm.com> 2021-08-10 11:53:19 +0000
commit: 2d0679f33f75c43e7169fe0f0ee2d15d0620e091 (patch)
tree: 9f259a41e3208aa37a19330b63e0aabac607cacf /src/backends/neon/workloads/NeonMeanWorkload.cpp
parent: d218d9804723e78da9bbd36e6211b3310426852b (diff)
download: armnn-2d0679f33f75c43e7169fe0f0ee2d15d0620e091.tar.gz
IVGCVSW-6249 Add ProfilingDetails Macros to all workloads in Neon
Signed-off-by: Keith Davis <keith.davis@arm.com>
Change-Id: I7be77712a9f790928219ce91222d46cc766ab9dd
Diffstat (limited to 'src/backends/neon/workloads/NeonMeanWorkload.cpp')
-rw-r--r-- src/backends/neon/workloads/NeonMeanWorkload.cpp 14
1 files changed, 10 insertions, 4 deletions
diff --git a/src/backends/neon/workloads/NeonMeanWorkload.cpp b/src/backends/neon/workloads/NeonMeanWorkload.cpp
index bb0870d9ef..5d8d1c43a1 100644
--- a/src/backends/neon/workloads/NeonMeanWorkload.cpp
+++ b/src/backends/neon/workloads/NeonMeanWorkload.cpp
@@ -17,21 +17,27 @@ using namespace armcomputetensorutils;
arm_compute::Status NeonMeanWorkloadValidate(const TensorInfo& input,
const TensorInfo& output,
- const MeanDescriptor& desc)
+ const MeanDescriptor& descriptor)
{
const arm_compute::TensorInfo aclInputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(input);
const arm_compute::TensorInfo aclOutputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(output);
arm_compute::Coordinates coords = BuildArmComputeReductionCoordinates(aclInputInfo.num_dimensions(),
input.GetNumDimensions(),
- desc.m_Axis);
+ descriptor.m_Axis);
- return arm_compute::NEReduceMean::validate(&aclInputInfo, coords, desc.m_KeepDims, &aclOutputInfo);
+ return arm_compute::NEReduceMean::validate(&aclInputInfo, coords, descriptor.m_KeepDims, &aclOutputInfo);
}
NeonMeanWorkload::NeonMeanWorkload(const MeanQueueDescriptor& descriptor, const WorkloadInfo& info)
: BaseWorkload<MeanQueueDescriptor>(descriptor, info)
{
+ // Report Profiling Details
+ ARMNN_REPORT_PROFILING_WORKLOAD_DESC("NeonMeanWorkload_Construct",
+ descriptor.m_Parameters,
+ info,
+ this->GetGuid());
+
m_Data.ValidateInputsOutputs("NeonMeanWorkload", 1, 1);
arm_compute::ITensor& input = static_cast<IAclTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
@@ -46,7 +52,7 @@ NeonMeanWorkload::NeonMeanWorkload(const MeanQueueDescriptor& descriptor, const
void NeonMeanWorkload::Execute() const
{
- ARMNN_SCOPED_PROFILING_EVENT_NEON("NeonMeanWorkload_Execute");
+ ARMNN_SCOPED_PROFILING_EVENT_NEON_GUID("NeonMeanWorkload_Execute", this->GetGuid());
m_Layer.run();
}