diff options
author | Sheri Zhang <sheri.zhang@arm.com> | 2021-06-29 17:34:06 +0100 |
---|---|---|
committer | Sheri Zhang <sheri.zhang@arm.com> | 2021-07-13 15:36:03 +0000 |
commit | a387e271b1e02ffd5c2993702b9a21c1ed5c95fa (patch) | |
tree | f53416756c70c85d962218168ad3cd3359d9f5c8 /src/graph/mutators | |
parent | 6fc7d528382716de9e417c9dcf0fddf109446e9f (diff) | |
download | ComputeLibrary-a387e271b1e02ffd5c2993702b9a21c1ed5c95fa.tar.gz |
Add in-place calculation support for CL elementwise arithmetic kernels
- Add in-place calculation support in ClArithmeticKernel, ClSaturatedArithmeticKernel and ClMulKernel
- Add in-place test cases
Resolves: COMPMID-4431
Signed-off-by: Sheri Zhang <sheri.zhang@arm.com>
Change-Id: Id484bdb76b74478a33fedb471ae0c7f799c599f6
Reviewed-on: https://review.mlplatform.org/c/ml/ComputeLibrary/+/5885
Comments-Addressed: Arm Jenkins <bsgcomp@arm.com>
Reviewed-by: SiCong Li <sicong.li@arm.com>
Tested-by: Arm Jenkins <bsgcomp@arm.com>
Diffstat (limited to 'src/graph/mutators')
-rw-r--r-- | src/graph/mutators/InPlaceOperationMutator.cpp | 8 |
1 files changed, 5 insertions, 3 deletions
diff --git a/src/graph/mutators/InPlaceOperationMutator.cpp b/src/graph/mutators/InPlaceOperationMutator.cpp index 86236e8854..d3ea940895 100644 --- a/src/graph/mutators/InPlaceOperationMutator.cpp +++ b/src/graph/mutators/InPlaceOperationMutator.cpp @@ -180,9 +180,11 @@ void try_in_place_elementwise(std::unique_ptr<INode> &node) ARM_COMPUTE_ERROR_ON(current_output_tensor == nullptr); const auto qinfo_out = current_output_tensor->desc().quant_info; - // Can do in place, if the input has same shape as output, has same quntisation info as output, and input doesn't have accessor. - bool input0_can_in_place = !arm_compute::detail::have_different_dimensions(out_shape, shape0, 0) && (qinfo0 == qinfo_out) && (input0_tensor->accessor() == nullptr); - bool input1_can_in_place = !arm_compute::detail::have_different_dimensions(out_shape, shape1, 0) && (qinfo1 == qinfo_out) && (input1_tensor->accessor() == nullptr); + // Can do in place, if the input has same shape as output, has same quntisation info as output, has same data type as output and input doesn't have accessor. + bool input0_can_in_place = !arm_compute::detail::have_different_dimensions(out_shape, shape0, 0) && (qinfo0 == qinfo_out) + && (input0_tensor->desc().data_type == current_output_tensor->desc().data_type) && (input0_tensor->accessor() == nullptr); + bool input1_can_in_place = !arm_compute::detail::have_different_dimensions(out_shape, shape1, 0) && (qinfo1 == qinfo_out) + && (input1_tensor->desc().data_type == current_output_tensor->desc().data_type) && (input1_tensor->accessor() == nullptr); if(input0_can_in_place) { |