aboutsummaryrefslogtreecommitdiff
path: root/compute_kernel_writer/src/cl
diff options
context:
space:
mode:
Diffstat (limited to 'compute_kernel_writer/src/cl')
-rw-r--r--compute_kernel_writer/src/cl/CLHelpers.cpp26
-rw-r--r--compute_kernel_writer/src/cl/CLHelpers.h10
-rw-r--r--compute_kernel_writer/src/cl/CLTensorArgument.cpp247
-rw-r--r--compute_kernel_writer/src/cl/CLTensorArgument.h70
4 files changed, 350 insertions, 3 deletions
diff --git a/compute_kernel_writer/src/cl/CLHelpers.cpp b/compute_kernel_writer/src/cl/CLHelpers.cpp
index 5a3d0fab81..af8a8a07ac 100644
--- a/compute_kernel_writer/src/cl/CLHelpers.cpp
+++ b/compute_kernel_writer/src/cl/CLHelpers.cpp
@@ -21,10 +21,10 @@
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
+#include "src/cl/CLHelpers.h"
#include "ckw/Error.h"
#include "ckw/types/DataType.h"
-
-#include "src/cl/CLHelpers.h"
+#include "ckw/types/TensorStorageType.h"
namespace ckw
{
@@ -120,4 +120,26 @@ int32_t width_to_cl_vector_size(int32_t width)
return 0;
}
}
+
+std::string cl_get_variable_storagetype_as_string(TensorStorageType storage)
+{
+ std::string res;
+ switch(storage)
+ {
+ case TensorStorageType::BufferUint8Ptr:
+ res += "__global uchar*";
+ break;
+ case TensorStorageType::Texture2dReadOnly:
+ res += "__read_only image2d_t";
+ break;
+ case TensorStorageType::Texture2dWriteOnly:
+ res += "__write_only image2d_t";
+ break;
+ default:
+ COMPUTE_KERNEL_WRITER_ERROR_ON_MSG("Unsupported storage type");
+ }
+
+ return res;
+}
+
} // namespace ckw
diff --git a/compute_kernel_writer/src/cl/CLHelpers.h b/compute_kernel_writer/src/cl/CLHelpers.h
index a9a84e2187..d0ca488617 100644
--- a/compute_kernel_writer/src/cl/CLHelpers.h
+++ b/compute_kernel_writer/src/cl/CLHelpers.h
@@ -24,14 +24,15 @@
#ifndef CKW_SRC_CL_CLHELPERS_H
#define CKW_SRC_CL_CLHELPERS_H
-#include <string>
#include <cstdint>
+#include <string>
/** OpenCL specific helper functions */
namespace ckw
{
// Forward declarations
enum class DataType;
+enum class TensorStorageType : uint32_t;
/** Helper function to validate the vector length of OpenCL vector data types
*
@@ -58,6 +59,13 @@ std::string cl_get_variable_datatype_as_string(DataType dt, int32_t len);
*/
int32_t width_to_cl_vector_size(int32_t width);
+/** Helper function to return the OpenCL storage type as a string from a @ref TensorStorage
+ *
+ * @param[in] storage Storage type
+ *
+ * @return the OpenCL storage type as a string
+ */
+std::string cl_get_variable_storagetype_as_string(TensorStorageType storage);
} // namespace ckw
#endif /* COMPUTE_KERNEL_WRITER_SRC_CL_CLHELPERS_H */
diff --git a/compute_kernel_writer/src/cl/CLTensorArgument.cpp b/compute_kernel_writer/src/cl/CLTensorArgument.cpp
new file mode 100644
index 0000000000..ed1c5bd687
--- /dev/null
+++ b/compute_kernel_writer/src/cl/CLTensorArgument.cpp
@@ -0,0 +1,247 @@
+/*
+ * Copyright (c) 2023 Arm Limited.
+ *
+ * SPDX-License-Identifier: MIT
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to
+ * deal in the Software without restriction, including without limitation the
+ * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
+ * sell copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in all
+ * copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+
+#include "src/cl/CLTensorArgument.h"
+#include "ckw/Error.h"
+#include "src/cl/CLHelpers.h"
+#include "src/types/TensorComponentType.h"
+
+#include <algorithm>
+#include <vector>
+
+namespace ckw
+{
+CLTensorArgument::CLTensorArgument(const std::string &name, const TensorInfo &info, bool return_dims_by_value)
+{
+ _return_dims_by_value = return_dims_by_value;
+ _basename = name;
+ _info = info;
+}
+
+TileVariable CLTensorArgument::component(TensorComponentType x)
+{
+ if(_return_dims_by_value)
+ {
+ uint32_t component_type = static_cast<uint32_t>(x);
+
+ const bool is_dimension = (component_type & static_cast<uint32_t>(TensorComponentBitmask::Dimension)) != 0;
+ const bool is_folded_dimensions = (component_type & static_cast<uint32_t>(TensorComponentBitmask::FoldedDimensions)) != 0;
+
+ constexpr auto bitmask_all = static_cast<uint32_t>(TensorComponentIndexBitmask::All);
+ constexpr auto bitmask_index_0 = static_cast<uint32_t>(TensorComponentIndexBitmask::Index0);
+#ifdef COMPUTE_KERNEL_WRITER_ASSERTS_ENABLED
+ constexpr auto bitmask_index_1 = static_cast<uint32_t>(TensorComponentIndexBitmask::Index1);
+ constexpr auto bitmask_index_2 = static_cast<uint32_t>(TensorComponentIndexBitmask::Index2);
+ constexpr auto bitmask_index_3 = static_cast<uint32_t>(TensorComponentIndexBitmask::Index3);
+#endif // COMPUTE_KERNEL_WRITER_ASSERTS_ENABLED
+
+ // Make sure that the encoding of component type hasn't changed and each nibble is 4 bits apart.
+ CKW_ASSERT(bitmask_all == (bitmask_index_0 | bitmask_index_1 | bitmask_index_2 | bitmask_index_3));
+ CKW_ASSERT(bitmask_index_0 == bitmask_index_1 >> 4);
+ CKW_ASSERT(bitmask_index_1 == bitmask_index_2 >> 4);
+ CKW_ASSERT(bitmask_index_2 == bitmask_index_3 >> 4);
+
+ // If we have a dimension or folded dimensions, we can return the corresponding value if it is not dynamic (not equal to -1)
+ if(is_dimension == true || is_folded_dimensions == true)
+ {
+ component_type = component_type & bitmask_all;
+
+ int32_t idx = 1;
+ for(int32_t i = 0; i < tensor_component_index_max_count; ++i)
+ {
+ uint32_t dim_idx = component_type & bitmask_index_0;
+
+ if(dim_idx == 0)
+ {
+ // Stop at the first nibble containing 0
+ break;
+ }
+
+ // Subtract - 1. Please refer to the TensorComponentIndexBitmask documentation
+ dim_idx -= 1;
+
+ // Get the dimension value
+ const int32_t dim_val = _info.shape()[dim_idx];
+
+ if(dim_val == kDynamicTensorDimensionValue)
+ {
+ // We cannot return the dimension by value if it is dynamic.
+ // Therefore, force the idx variable to kDynamicTensorDimensionValue and break the loop.
+ idx = kDynamicTensorDimensionValue;
+ break;
+ }
+
+ idx *= dim_val;
+
+ // Go to the next nibble
+ component_type >>= 4;
+ }
+
+ if(idx != kDynamicTensorDimensionValue)
+ {
+ TileVariable t;
+ t.str = std::to_string(idx);
+ t.desc.dt = DataType::Uint32;
+ t.desc.len = 1;
+ return t;
+ }
+ }
+ }
+
+ auto it = std::find(_components_used.begin(), _components_used.end(), x);
+
+ // Add to the list of used components if not present yet
+ if(it == _components_used.end())
+ {
+ _components_used.push_back(x);
+ }
+
+ TileVariable t;
+ t.str = create_component_name(x);
+ t.desc.dt = DataType::Int32;
+ t.desc.len = 1;
+ return t;
+}
+
+TensorStorageVariable CLTensorArgument::storage(TensorStorageType x)
+{
+ if(std::find(_storages_used.begin(), _storages_used.end(), x) == _storages_used.end())
+ {
+ _storages_used.push_back(x);
+ }
+
+ TensorStorageVariable t;
+ t.val = create_storage_name(x);
+ t.type = cl_get_variable_storagetype_as_string(x);
+
+ return t;
+}
+
+std::string CLTensorArgument::create_storage_name(TensorStorageType x) const
+{
+ std::string var_name = _basename;
+
+ switch(x)
+ {
+ case TensorStorageType::BufferUint8Ptr:
+ var_name += "_ptr";
+ break;
+ case TensorStorageType::Texture2dReadOnly:
+ case TensorStorageType::Texture2dWriteOnly:
+ var_name += "_img2d";
+ break;
+ default:
+ CKW_ASSERT_FAILED_MSG("Unsupported tensor storage");
+ return "";
+ }
+
+ return var_name;
+}
+
+std::string CLTensorArgument::create_component_name(TensorComponentType x) const
+{
+ std::string var_name = _basename;
+
+ switch(x)
+ {
+ case TensorComponentType::OffsetFirstElement:
+ var_name += "_offset_first_element";
+ break;
+ case TensorComponentType::Stride0:
+ var_name += "_stride0";
+ break;
+ case TensorComponentType::Stride1:
+ var_name += "_stride1";
+ break;
+ case TensorComponentType::Stride2:
+ var_name += "_stride2";
+ break;
+ case TensorComponentType::Stride3:
+ var_name += "_stride3";
+ break;
+ case TensorComponentType::Stride4:
+ var_name += "_stride4";
+ break;
+ case TensorComponentType::Dim0:
+ var_name += "_dim0";
+ break;
+ case TensorComponentType::Dim1:
+ var_name += "_dim1";
+ break;
+ case TensorComponentType::Dim2:
+ var_name += "_dim2";
+ break;
+ case TensorComponentType::Dim3:
+ var_name += "_dim3";
+ break;
+ case TensorComponentType::Dim4:
+ var_name += "_dim4";
+ break;
+ case TensorComponentType::Dim1xDim2:
+ var_name += "_dim1xdim2";
+ break;
+ case TensorComponentType::Dim2xDim3:
+ var_name += "_dim2xdim3";
+ break;
+ case TensorComponentType::Dim1xDim2xDim3:
+ var_name += "_dim1xdim2xdim3";
+ break;
+ default:
+ COMPUTE_KERNEL_WRITER_ERROR_ON_MSG("Unsupported tensor component");
+ return "";
+ }
+
+ return var_name;
+}
+
+std::vector<TensorStorageVariable> CLTensorArgument::storages() const
+{
+ std::vector<TensorStorageVariable> storages;
+ for(auto &val : _storages_used)
+ {
+ TensorStorageVariable t;
+ t.val = create_storage_name(val);
+ t.type = cl_get_variable_storagetype_as_string(val);
+ storages.push_back(t);
+ }
+
+ return storages;
+}
+
+std::vector<TileVariable> CLTensorArgument::components() const
+{
+ std::vector<TileVariable> components;
+
+ for(auto &val : _components_used)
+ {
+ TileVariable t;
+ t.str = create_component_name(val);
+ t.desc.dt = DataType::Int32;
+ t.desc.len = 1;
+ components.push_back(t);
+ }
+
+ return components;
+}
+} // namespace ckw
diff --git a/compute_kernel_writer/src/cl/CLTensorArgument.h b/compute_kernel_writer/src/cl/CLTensorArgument.h
new file mode 100644
index 0000000000..cd924846c5
--- /dev/null
+++ b/compute_kernel_writer/src/cl/CLTensorArgument.h
@@ -0,0 +1,70 @@
+/*
+ * Copyright (c) 2023 Arm Limited.
+ *
+ * SPDX-License-Identifier: MIT
+ *
+ * Permission is hereby granted, free of charge, to any person obtaining a copy
+ * of this software and associated documentation files (the "Software"), to
+ * deal in the Software without restriction, including without limitation the
+ * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
+ * sell copies of the Software, and to permit persons to whom the Software is
+ * furnished to do so, subject to the following conditions:
+ *
+ * The above copyright notice and this permission notice shall be included in all
+ * copies or substantial portions of the Software.
+ *
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
+ * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
+ * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
+ * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
+ * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
+ * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
+ * SOFTWARE.
+ */
+#ifndef CKW_SRC_CL_CLTENSORARGUMENT_H
+#define CKW_SRC_CL_CLTENSORARGUMENT_H
+
+#include "src/ITensorArgument.h"
+
+#include <string>
+#include <vector>
+
+namespace ckw
+{
+// Forward declarations
+class TensorInfo;
+
+/** OpenCL specific tensor argument
+ * Internally, the object keeps track of the components and storages used to minimize the number
+ * of kernel arguments required. Therefore, if we create this object but we do not access any components
+ * or storages, the storages() and components() method will return an empty list.
+*/
+class CLTensorArgument : public ITensorArgument, ITensorStorageArgument, ITensorComponentArgument
+{
+public:
+ /** Constructor
+ *
+ * @param[in] name Tensor name
+ * @param[in] info Tensor info
+ * @param[in] return_dims_by_value Flag to return the dimensions by value whenever it is possible.
+ * True, if the dimensions should be returned as value instead as variable.
+ */
+ CLTensorArgument(const std::string &name, const TensorInfo &info, bool return_dims_by_value);
+
+ // Inherited method overridden
+ TensorStorageVariable storage(TensorStorageType x);
+ TileVariable component(TensorComponentType x);
+ std::vector<TensorStorageVariable> storages() const;
+ std::vector<TileVariable> components() const;
+
+private:
+ std::string create_storage_name(TensorStorageType x) const;
+ std::string create_component_name(TensorComponentType x) const;
+
+ bool _return_dims_by_value{ false };
+ std::vector<TensorStorageType> _storages_used{};
+ std::vector<TensorComponentType> _components_used{};
+};
+} // namespace ckw
+
+#endif // CKW_SRC_CL_CLTENSORARGUMENT_H