diff options
author | Chunosov <N.Chunosov@yandex.ru> | 2017-11-06 22:09:45 +0700 |
---|---|---|
committer | Anthony Barbier <anthony.barbier@arm.com> | 2018-11-02 16:35:24 +0000 |
commit | d6afedc775220f17317f1835a4d18b72a54525de (patch) | |
tree | 54aed8322a4a286ba376d74bbee61c85a588cc9b /src/core/CL/cl_kernels/fixed_point.h | |
parent | 6ff12a0f7765f62b8d0fa8554021e1cac2789f19 (diff) | |
download | ComputeLibrary-d6afedc775220f17317f1835a4d18b72a54525de.tar.gz |
COMPMID-661: softmax-fp32 optimisation (#14)
Change-Id: I2007af1ed9dcf68065cf412aa50f73a2025b31a6
Reviewed-on: http://mpd-gerrit.cambridge.arm.com/94605
Reviewed-by: Gian Marco Iodice <gianmarco.iodice@arm.com>
Tested-by: Kaizen <jeremy.johnson+kaizengerrit@arm.com>
Diffstat (limited to 'src/core/CL/cl_kernels/fixed_point.h')
-rw-r--r-- | src/core/CL/cl_kernels/fixed_point.h | 5 |
1 files changed, 5 insertions, 0 deletions
diff --git a/src/core/CL/cl_kernels/fixed_point.h b/src/core/CL/cl_kernels/fixed_point.h
index 5476a6e070..b329118f14 100644
--- a/src/core/CL/cl_kernels/fixed_point.h
+++ b/src/core/CL/cl_kernels/fixed_point.h
@@ -359,7 +359,12 @@ DIVQ_SAT_IMPL(qs16, qs16, qs32)
     return select((type)stype##_MAX, select(sum << dec_m, sum >> -dec_m, dec_m < (type)0), clz(sum) > dec_m); /* Saturate result if needed */ \
 }
 
+EXPQ_IMPL(qs8, qs8x2, 2)
+EXPQ_IMPL(qs8, qs8x4, 4)
+EXPQ_IMPL(qs8, qs8x8, 8)
 EXPQ_IMPL(qs8, qs8x16, 16)
+EXPQ_IMPL(qs16, qs16x2, 2)
+EXPQ_IMPL(qs16, qs16x4, 4)
 EXPQ_IMPL(qs16, qs16x8, 8)
 EXPQ_IMPL(qs16, qs16x16, 16)
 