diff options
author | Mike Kelly <mike.kelly@arm.com> | 2023-07-25 17:37:33 +0100 |
---|---|---|
committer | mike.kelly <mike.kelly@arm.com> | 2023-07-31 15:34:06 +0000 |
commit | 7cbe78140a274cec783049051df7c7298b974f13 (patch) | |
tree | d39f19b35e120b59d9dbd7f0c7eb27ef97621ebe /src/backends/cl/workloads/ClTransposeWorkload.cpp | |
parent | 21e399974e3cdd8db00bd76af813aa0485395b60 (diff) | |
download | armnn-7cbe78140a274cec783049051df7c7298b974f13.tar.gz |
MLCE-1092 Add Names to Workloads
* Added names to Workloads.
* Workloads will be given the name of the Layer that created them.
* Added new profiling macros to CL, Neon and Ref that add the
workload name to the event label.
* Updated workloads to use new macros.
* Added missing profiling to Rank Workloads.
* Fixed issue where ClConvolution2dWorkload was being reported as
Undefined rather than GpuAcc.
Signed-off-by: Mike Kelly <mike.kelly@arm.com>
Change-Id: I0a55eab6c2f455b73943aca8e99a247c3cb2a906
Diffstat (limited to 'src/backends/cl/workloads/ClTransposeWorkload.cpp')
-rw-r--r-- | src/backends/cl/workloads/ClTransposeWorkload.cpp | 6 |
1 files changed, 3 insertions, 3 deletions
diff --git a/src/backends/cl/workloads/ClTransposeWorkload.cpp b/src/backends/cl/workloads/ClTransposeWorkload.cpp index 383f5f1faf..8f3ccdbe99 100644 --- a/src/backends/cl/workloads/ClTransposeWorkload.cpp +++ b/src/backends/cl/workloads/ClTransposeWorkload.cpp @@ -1,5 +1,5 @@ // -// Copyright © 2020 Arm Ltd and Contributors. All rights reserved. +// Copyright © 2020-2023 Arm Ltd and Contributors. All rights reserved. // SPDX-License-Identifier: MIT // @@ -43,7 +43,7 @@ ClTransposeWorkload::ClTransposeWorkload(const TransposeQueueDescriptor& descrip arm_compute::ICLTensor& output = static_cast<IClTensorHandle*>(m_Data.m_Outputs[0])->GetTensor(); const armnn::PermutationVector& mappings = m_Data.m_Parameters.m_DimMappings; { - ARMNN_SCOPED_PROFILING_EVENT(Compute::Undefined, "ClTransposeWorkload_configure"); + ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID("ClTransposeWorkload_configure"); // Run the layer. m_PermuteFunction.configure(clCompileContext, &input, @@ -54,7 +54,7 @@ ClTransposeWorkload::ClTransposeWorkload(const TransposeQueueDescriptor& descrip void ClTransposeWorkload::Execute() const { - ARMNN_SCOPED_PROFILING_EVENT_CL_GUID(GetName() + "_Execute", this->GetGuid()); + ARMNN_SCOPED_PROFILING_EVENT_CL_NAME_GUID("ClTransposeWorkload_Execute"); RunClFunction(m_PermuteFunction, CHECK_LOCATION()); } |