about | summary | refs | log | tree | commit | diff
path: root/src/backends/cl/workloads/ClMeanWorkload.cpp
diff options
context:
space:
mode:
author: Keith Davis <keith.davis@arm.com> 2021-08-05 14:20:33 +0100
committer: Matthew Sloyan <matthew.sloyan@arm.com> 2021-08-10 13:51:31 +0000
commit: bcd860a30eba22bb2ba0943ad705734ce0ec5b23 (patch)
tree: a54dc121df65036f1604389684c76cdd2c988a4a /src/backends/cl/workloads/ClMeanWorkload.cpp
parent: 2d0679f33f75c43e7169fe0f0ee2d15d0620e091 (diff)
download: armnn-bcd860a30eba22bb2ba0943ad705734ce0ec5b23.tar.gz
IVGCVSW-6249 Add ProfilingDetails Macros to all workloads in CL
Signed-off-by: Keith Davis <keith.davis@arm.com>
Change-Id: I92dd410da7ad633a46d025fdc2b26093041c439b
Diffstat (limited to 'src/backends/cl/workloads/ClMeanWorkload.cpp')
-rw-r--r-- src/backends/cl/workloads/ClMeanWorkload.cpp | 13
1 file changed, 9 insertions, 4 deletions
diff --git a/src/backends/cl/workloads/ClMeanWorkload.cpp b/src/backends/cl/workloads/ClMeanWorkload.cpp
index 4cc0f7c1c2..cd79d04612 100644
--- a/src/backends/cl/workloads/ClMeanWorkload.cpp
+++ b/src/backends/cl/workloads/ClMeanWorkload.cpp
@@ -16,16 +16,16 @@ using namespace armcomputetensorutils;
arm_compute::Status ClMeanValidate(const TensorInfo& input,
const TensorInfo& output,
- const MeanDescriptor& desc)
+ const MeanDescriptor& descriptor)
{
const arm_compute::TensorInfo aclInputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(input);
const arm_compute::TensorInfo aclOutputInfo = armcomputetensorutils::BuildArmComputeTensorInfo(output);
arm_compute::Coordinates coords = BuildArmComputeReductionCoordinates(aclInputInfo.num_dimensions(),
input.GetNumDimensions(),
- desc.m_Axis);
+ descriptor.m_Axis);
- return arm_compute::CLReduceMean::validate(&aclInputInfo, coords, desc.m_KeepDims, &aclOutputInfo);
+ return arm_compute::CLReduceMean::validate(&aclInputInfo, coords, descriptor.m_KeepDims, &aclOutputInfo);
}
ClMeanWorkload::ClMeanWorkload(const MeanQueueDescriptor& descriptor,
@@ -33,6 +33,11 @@ ClMeanWorkload::ClMeanWorkload(const MeanQueueDescriptor& descriptor,
const arm_compute::CLCompileContext& clCompileContext)
: BaseWorkload<MeanQueueDescriptor>(descriptor, info)
{
+ // Report Profiling Details
+ ARMNN_REPORT_PROFILING_WORKLOAD_DESC("ClMeanWorkload_Construct",
+ descriptor.m_Parameters,
+ info,
+ this->GetGuid());
m_Data.ValidateInputsOutputs("ClMeanWorkload", 1, 1);
arm_compute::ICLTensor& input = static_cast<IClTensorHandle*>(m_Data.m_Inputs[0])->GetTensor();
@@ -47,7 +52,7 @@ ClMeanWorkload::ClMeanWorkload(const MeanQueueDescriptor& descriptor,
void ClMeanWorkload::Execute() const
{
- ARMNN_SCOPED_PROFILING_EVENT_CL("ClMeanWorkload_Execute");
+ ARMNN_SCOPED_PROFILING_EVENT_CL_GUID("ClMeanWorkload_Execute", this->GetGuid());
m_Layer.run();
}