| /* |
| * Copyright (C) 2010-2018 Arm Limited or its affiliates. All rights reserved. |
| * |
| * SPDX-License-Identifier: Apache-2.0 |
| * |
| * Licensed under the Apache License, Version 2.0 (the License); you may |
| * not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an AS IS BASIS, WITHOUT |
| * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #include "ref_functions.h" |
| |
/**
 * @brief Reference Q7 average pooling over a square image in HWC layout.
 *
 * For every channel and every output position, sums the input samples covered
 * by a dim_kernel x dim_kernel window whose top-left corner is at
 * (out * stride - padding) and divides by the number of samples that were
 * actually inside the image. Positions that fall into the padding region are
 * excluded from both the sum and the divisor. The quotient uses C integer
 * division, i.e. it truncates toward zero.
 *
 * Elements are addressed as channel + ch_im_in * (x + y * dim), for both the
 * input (dim = dim_im_in) and the output (dim = dim_im_out).
 *
 * @param[in]  Im_in       input image
 * @param[in]  dim_im_in   input image dimension (used for both width and height)
 * @param[in]  ch_im_in    number of input image channels
 * @param[in]  dim_kernel  window kernel size
 * @param[in]  padding     padding size
 * @param[in]  stride      stride
 * @param[in]  dim_im_out  output image dimension (used for both width and height)
 * @param[in]  bufferA     a buffer for local storage; not used by this reference version
 * @param[out] Im_out      output image; a window that covers no input sample yields 0
 */
void arm_avepool_q7_HWC_ref(const q7_t * Im_in,
                            const uint16_t dim_im_in,
                            const uint16_t ch_im_in,
                            const uint16_t dim_kernel,
                            const uint16_t padding,
                            const uint16_t stride,
                            const uint16_t dim_im_out,
                            q7_t * bufferA,
                            q7_t * Im_out)
{
    (void) bufferA;             /* kept only for signature compatibility */

    /*
     * Counters are plain int: the bounds are uint16_t, so 16-bit signed
     * counters would wrap negative once a bound exceeds 32767.
     */
    for (int ch = 0; ch < ch_im_in; ch++)
    {
        for (int out_y = 0; out_y < dim_im_out; out_y++)
        {
            const int win_y = out_y * stride - padding;

            for (int out_x = 0; out_x < dim_im_out; out_x++)
            {
                const int win_x = out_x * stride - padding;
                int       sum = 0;
                int       count = 0;

                for (int k_y = win_y; k_y < win_y + dim_kernel; k_y++)
                {
                    if (k_y < 0 || k_y >= dim_im_in)
                    {
                        continue;       /* row lies in the padding */
                    }
                    for (int k_x = win_x; k_x < win_x + dim_kernel; k_x++)
                    {
                        if (k_x < 0 || k_x >= dim_im_in)
                        {
                            continue;   /* column lies in the padding */
                        }
                        sum += Im_in[ch + ch_im_in * (k_x + k_y * dim_im_in)];
                        count++;
                    }
                }

                /* A window entirely inside the padding has no samples; avoid dividing by zero. */
                Im_out[ch + ch_im_in * (out_x + out_y * dim_im_out)] =
                    (q7_t) (count > 0 ? sum / count : 0);
            }
        }
    }
}
| |
/**
 * @brief Reference Q7 max pooling over a square image in HWC layout.
 *
 * For every channel and every output position, takes the largest input sample
 * covered by a dim_kernel x dim_kernel window whose top-left corner is at
 * (out * stride - padding). Positions that fall into the padding region are
 * ignored.
 *
 * Elements are addressed as channel + ch_im_in * (x + y * dim), for both the
 * input (dim = dim_im_in) and the output (dim = dim_im_out).
 *
 * @param[in]  Im_in       input image
 * @param[in]  dim_im_in   input image dimension (used for both width and height)
 * @param[in]  ch_im_in    number of input image channels
 * @param[in]  dim_kernel  window kernel size
 * @param[in]  padding     padding size
 * @param[in]  stride      stride
 * @param[in]  dim_im_out  output image dimension (used for both width and height)
 * @param[in]  bufferA     a buffer for local storage; not used by this reference version
 * @param[out] Im_out      output image; a window that covers no input sample yields -128
 */
void arm_maxpool_q7_HWC_ref(const q7_t * Im_in,
                            const uint16_t dim_im_in,
                            const uint16_t ch_im_in,
                            const uint16_t dim_kernel,
                            const uint16_t padding,
                            const uint16_t stride,
                            const uint16_t dim_im_out,
                            q7_t * bufferA,
                            q7_t * Im_out)
{
    (void) bufferA;             /* kept only for signature compatibility */

    /*
     * Counters are plain int: the bounds are uint16_t, so 16-bit signed
     * counters would wrap negative once a bound exceeds 32767.
     */
    for (int ch = 0; ch < ch_im_in; ch++)
    {
        for (int out_y = 0; out_y < dim_im_out; out_y++)
        {
            const int win_y = out_y * stride - padding;

            for (int out_x = 0; out_x < dim_im_out; out_x++)
            {
                const int win_x = out_x * stride - padding;

                /*
                 * Start from the smallest Q7 value rather than an out-of-range
                 * sentinel, so the final store always fits in q7_t even when
                 * the window covers no input sample.
                 */
                int       best = -128;

                for (int k_y = win_y; k_y < win_y + dim_kernel; k_y++)
                {
                    if (k_y < 0 || k_y >= dim_im_in)
                    {
                        continue;       /* row lies in the padding */
                    }
                    for (int k_x = win_x; k_x < win_x + dim_kernel; k_x++)
                    {
                        if (k_x < 0 || k_x >= dim_im_in)
                        {
                            continue;   /* column lies in the padding */
                        }
                        const int sample = Im_in[ch + ch_im_in * (k_x + k_y * dim_im_in)];
                        if (sample > best)
                        {
                            best = sample;
                        }
                    }
                }

                Im_out[ch + ch_im_in * (out_x + out_y * dim_im_out)] = (q7_t) best;
            }
        }
    }
}