diff options
Diffstat (limited to 'src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp')
-rw-r--r-- | src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp | 9 |
1 files changed, 4 insertions, 5 deletions
diff --git a/src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp b/src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp index 26399c50a9..c6e14f90c5 100644 --- a/src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp +++ b/src/dynamic_fusion/sketch/gpu/template_writer/cl/ClTemplateDirectConv2d.cpp @@ -86,7 +86,6 @@ std::string ClTemplateDirectConv2d::get_component_code(const ComponentGroup &com code += R"_( // OUT(dst, accum) {{dst}} -TILE({{ACC_DATA_TYPE}}, M0, N0, {{dst}}); TILE(uint, M0, 1, g_dst_indirect_y); { @@ -227,30 +226,30 @@ code += R"_( void ClTemplateDirectConv2d::declare_variables(GpuKernelVariableTable &vtable, const ComponentGroup &comp_group) const { vtable.declare_variable( + comp_group, _src, GpuKernelArgumentInfo(GpuKernelArgumentInfo::Type::Tensor_4D_t_Buffer), - comp_group.is_intermediate_tensor(_src), "src"); const GpuKernelArgumentInfo::Type weight_type = _settings.export_to_cl_image() ? GpuKernelArgumentInfo::Type::Tensor_4D_t_Image : GpuKernelArgumentInfo::Type::Tensor_4D_t_Buffer; vtable.declare_variable( + comp_group, _weight, GpuKernelArgumentInfo(weight_type), - comp_group.is_intermediate_tensor(_weight), "weight"); if(_bias && _bias->has_valid_id()) // optional bias { vtable.declare_variable( + comp_group, _bias, GpuKernelArgumentInfo(GpuKernelArgumentInfo::Type::Vector), - comp_group.is_intermediate_tensor(_bias), "bias"); } vtable.declare_variable( + comp_group, _dst, GpuKernelArgumentInfo(common_tensor_type), - comp_group.is_intermediate_tensor(_dst), "dst"); } |