aboutsummaryrefslogtreecommitdiff
path: root/src/cpu/kernels/CpuAddKernel.h
diff options
context:
space:
mode:
author Gunes Bayir <gunes.bayir@arm.com> 2022-07-28 17:44:00 +0100
committer Gunes Bayir <gunes.bayir@arm.com> 2022-08-01 20:13:56 +0000
commit 9b921be1ff7283050eb39d9ce1b10b5c8bfc1300 (patch)
tree 0cb274a6c529717b8ef987aa3e270647927e9d89 /src/cpu/kernels/CpuAddKernel.h
parent 385dad2bffecbf395aa9aad257809de81c727ac7 (diff)
download ComputeLibrary-9b921be1ff7283050eb39d9ce1b10b5c8bfc1300.tar.gz
Optimize add layer by considering the input tensors as 1D array
Resolves: COMPMID-5108
Change-Id: I544f8160fbe5b4ffbef348d1fbd3dd626a6e1bdb
Signed-off-by: Gunes Bayir <gunes.bayir@arm.com>
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/8002
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Benchmark: Arm Jenkins <bsgcomp@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/cpu/kernels/CpuAddKernel.h')
-rw-r--r-- src/cpu/kernels/CpuAddKernel.h 12
1 files changed, 9 insertions, 3 deletions
diff --git a/src/cpu/kernels/CpuAddKernel.h b/src/cpu/kernels/CpuAddKernel.h
index 6638135580..1afbc1a4d0 100644
--- a/src/cpu/kernels/CpuAddKernel.h
+++ b/src/cpu/kernels/CpuAddKernel.h
@@ -42,9 +42,9 @@ private:
public:
struct AddKernel
{
- const char *name;
- const DataTypeISASelectorPtr is_selected;
- AddKernelPtr ukernel;
+ const char *name;
+ const CpuAddKernelDataTypeISASelectorDataPtr is_selected;
+ AddKernelPtr ukernel;
};
CpuAddKernel() = default;
@@ -91,10 +91,16 @@ public:
static const std::vector<AddKernel> &get_available_kernels();
+ bool get_can_interpret_inputs_as_1d_array()
+ {
+ return _can_interpret_inputs_as_1d_array;
+ }
+
private:
ConvertPolicy _policy{};
AddKernelPtr _run_method{ nullptr };
std::string _name{};
+ bool _can_interpret_inputs_as_1d_array{ false };
};
} // namespace kernels
} // namespace cpu