/* * Copyright (c) 2016-2018 ARM Limited. * * SPDX-License-Identifier: MIT * * Permission is hereby granted, free of charge, to any person obtaining a copy * of this software and associated documentation files (the "Software"), to * deal in the Software without restriction, including without limitation the * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or * sell copies of the Software, and to permit persons to whom the Software is * furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice shall be included in all * copies or substantial portions of the Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE * SOFTWARE. */ #ifndef __ARM_COMPUTE_CLHELPERS_H__ #define __ARM_COMPUTE_CLHELPERS_H__ #include "arm_compute/core/CL/OpenCL.h" #include "arm_compute/core/Helpers.h" #include "support/ToolchainSupport.h" #include namespace arm_compute { enum class DataType; enum class GPUTarget; /** Enable operation operations on GPUTarget enumerations */ template <> struct enable_bitwise_ops { static constexpr bool value = true; }; /** Max vector width of an OpenCL vector */ static constexpr unsigned int max_cl_vector_width = 16; /** Translates a tensor data type to the appropriate OpenCL type. * * @param[in] dt @ref DataType to be translated to OpenCL type. * * @return The string specifying the OpenCL type to be used. */ std::string get_cl_type_from_data_type(const DataType &dt); /** Get the size of a data type in number of bits. * * @param[in] dt @ref DataType. * * @return Number of bits in the data type specified. */ std::string get_data_size_from_data_type(const DataType &dt); /** Translates fixed point tensor data type to the underlying OpenCL type. * * @param[in] dt @ref DataType to be translated to OpenCL type. * * @return The string specifying the underlying OpenCL type to be used. */ std::string get_underlying_cl_type_from_data_type(const DataType &dt); /** Translates a given gpu device target to string. * * @param[in] target Given gpu target. * * @return The string describing the target. */ const std::string &string_from_target(GPUTarget target); /** Helper function to create and return a unique_ptr pointed to a CL kernel object * It also calls the kernel's configuration. * * @param[in] args All the arguments that need pass to kernel's configuration. * * @return A unique pointer pointed to a CL kernel object */ template std::unique_ptr create_configure_kernel(T &&... args) { std::unique_ptr k = arm_compute::support::cpp14::make_unique(); k->configure(std::forward(args)...); return k; } /** Helper function to create and return a unique_ptr pointed to a CL kernel object * * @return A unique pointer pointed to a CL kernel object */ template std::unique_ptr create_kernel() { std::unique_ptr k = arm_compute::support::cpp14::make_unique(); return k; } /** Helper function to get the GPU target from a device name * * @param[in] device_name A device name * * @return the GPU target */ GPUTarget get_target_from_name(const std::string &device_name); /** Helper function to get the GPU target from CL device * * @param[in] device A CL device * * @return the GPU target */ GPUTarget get_target_from_device(cl::Device &device); /** Helper function to get the GPU arch * * @param[in] target GPU target * * @return the GPU target which shows the arch */ GPUTarget get_arch_from_target(GPUTarget target); /** Helper function to get the highest OpenCL version supported * * @param[in] device A CL device * * @return the highest OpenCL version supported */ CLVersion get_cl_version(const cl::Device &device); /** Helper function to check whether the cl_khr_fp16 extension is supported * * @param[in] device A CL device * * @return True if the extension is supported */ bool fp16_support(const cl::Device &device); /** Helper function to check whether the arm_non_uniform_work_group_size extension is supported * * @param[in] device A CL device * * @return True if the extension is supported */ bool non_uniform_workgroup_support(const cl::Device &device); /** Helper function to check whether a gpu target is equal to the provided targets * * @param[in] target_to_check gpu target to check * @param[in] target First target to compare against * @param[in] targets (Optional) Additional targets to compare with * * @return True if the target is equal with at least one of the targets. */ template bool gpu_target_is_in(GPUTarget target_to_check, GPUTarget target, Args... targets) { return (target_to_check == target) | gpu_target_is_in(target_to_check, targets...); } /** Variant of gpu_target_is_in for comparing two targets */ inline bool gpu_target_is_in(GPUTarget target_to_check, GPUTarget target) { return target_to_check == target; } } #endif /* __ARM_COMPUTE_CLHELPERS_H__ */