//
// This confidential and proprietary software may be used only as
// authorised by a licensing agreement from ARM Limited
// (C) COPYRIGHT 2020-2024 ARM Limited
// ALL RIGHTS RESERVED
// The entire notice above must be reproduced on all authorised
// copies and copies may only be made to the extent permitted
// by a licensing agreement from ARM Limited.

// Operator pseudocode: checks the arguments, seeds every output element with
// its bias, then accumulates each (input - input_zp) * (weight - weight_zp)
// product into the output position it maps to. The scatter pattern and the
// output-size equations have the shape of a 2D transposed convolution.
//
// Tensor shapes as used below:
//   input  [N,IH,IW,IC]
//   weight [OC,KH,KW,IC]
//   output [N,OH,OW,OC]
//   bias   BC entries (BC == OC, or BC == 1 for a single shared value)
//
// NOTE(review): the static_cast target types are written as out_t to match
// the out_t variables they initialise or are combined with. The helper calls
// (tensor_read, tensor_write, apply_*_s) carry no explicit type arguments in
// this text - confirm whether they require them.

// ---- Argument checks -------------------------------------------------------
ERROR_IF(in_t != i8_t && input_zp != 0); // Zero point only allowed for int8_t
ERROR_IF(weight_t != i8_t && weight_zp != 0);
// Negative output padding is accepted only while its magnitude stays below
// the kernel extent in that dimension.
ERROR_IF(out_pad_top <= -KH || out_pad_bottom <= -KH);
ERROR_IF(out_pad_left <= -KW || out_pad_right <= -KW);
ERROR_IF(stride_y < 1 || stride_x < 1);
// The output extent must match the size implied by input extent, stride,
// output padding and kernel extent exactly.
ERROR_IF(OH != (IH - 1) * stride_y + out_pad_top + out_pad_bottom + KH);
ERROR_IF(OW != (IW - 1) * stride_x + out_pad_left + out_pad_right + KW);
ERROR_IF(BC != OC && BC != 1);

// ---- Initialise the output with the bias -----------------------------------
for_each(index in [N, OH, OW, OC]) {
    // index[3] is the output channel; a single-entry bias is shared by all channels.
    tensor_write(output, [N,OH,OW,OC], index, bias[(BC == 1) ? 0 : index[3]]);
}

// ---- Accumulate every input element through every kernel tap ---------------
for_each(0 <= n < N, 0 <= iy < IH, 0 <= ix < IW, 0 <= oc < OC,
         0 <= ic < IC, 0 <= ky < KH, 0 <= kx < KW) {
    // Output coordinate that input element (iy, ix) reaches through tap (ky, kx).
    index_t oy = iy * stride_y + out_pad_top + ky;
    index_t ox = ix * stride_x + out_pad_left + kx;
    // With negative output padding some taps fall outside the output; skip them.
    if (oy >= 0 && oy < OH && ox >= 0 && ox < OW) {
        out_t acc = static_cast<out_t>(tensor_read(output, [N,OH,OW,OC], [n,oy,ox,oc]));
        out_t value = static_cast<out_t>(tensor_read(input, [N,IH,IW,IC], [n,iy,ix,ic]));
        // Named weight_value so the local does not hide the weight tensor
        // that its own initialiser reads from.
        out_t weight_value = static_cast<out_t>(tensor_read(weight, [OC,KH,KW,IC], [oc,ky,kx,ic]));
        // Apply the zero points via apply_sub_s before the multiply-accumulate.
        value = apply_sub_s(value, static_cast<out_t>(input_zp));
        weight_value = apply_sub_s(weight_value, static_cast<out_t>(weight_zp));
        acc = apply_add_s(acc, apply_mul_s(value, weight_value));
        tensor_write(output, [N,OH,OW,OC], [n,oy,ox,oc], acc);
    }
}