| /* |
| * Copyright (C) 2010-2018 Arm Limited or its affiliates. All rights reserved. |
| * |
| * SPDX-License-Identifier: Apache-2.0 |
| * |
| * Licensed under the Apache License, Version 2.0 (the License); you may |
| * not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an AS IS BASIS, WITHOUT |
| * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #ifndef _REF_FUNCTIONS_H_ |
| #define _REF_FUNCTIONS_H_ |
| |
| #include "arm_math.h" |
| #include "arm_nnfunctions.h" |
| //#include "arm_nnsupportfunctions.h" |
| #include "fully_connected_testing_weights.h" |
| |
| #ifdef __cplusplus |
| extern "C" |
| { |
| #endif |
| |
| /* |
| * |
| * Convolution reference implementation |
| * |
| */ |
| |
| /* Reference q7 HWC convolution; takes a single size each for image, kernel, padding and stride. */ void arm_convolve_HWC_q7_ref(const q7_t * Im_in, // input image |
| const uint16_t dim_im_in, // input image dimension |
| const uint16_t ch_im_in, // number of input image channels |
| const q7_t * wt, // kernel weights |
| const uint16_t ch_im_out, // number of filters, i.e., output image channels |
| const uint16_t dim_kernel, // filter kernel size |
| const uint16_t padding, // padding size |
| const uint16_t stride, // stride |
| const q7_t * bias, // bias |
| const uint16_t bias_shift, /* amount of left-shift for bias */ const uint16_t out_shift, /* amount of right-shift for output */ q7_t * Im_out, // output image |
| const uint16_t dim_im_out, // output image dimension |
| q15_t * bufferA, // buffer space for input |
| q7_t * bufferB // buffer space for output |
| ); |
| |
| /* Reference q7 HWC convolution with separate x and y sizes for image, kernel, padding and stride. */ void arm_convolve_HWC_q7_ref_nonsquare(const q7_t * Im_in, // input image |
| const uint16_t dim_im_in_x, // input image dimension x |
| const uint16_t dim_im_in_y, // input image dimension y |
| const uint16_t ch_im_in, // number of input image channels |
| const q7_t * wt, // kernel weights |
| const uint16_t ch_im_out, // number of filters, i.e., output image channels |
| const uint16_t dim_kernel_x, // filter kernel size x |
| const uint16_t dim_kernel_y, // filter kernel size y |
| const uint16_t padding_x, // padding size x |
| const uint16_t padding_y, // padding size y |
| const uint16_t stride_x, // stride x |
| const uint16_t stride_y, // stride y |
| const q7_t * bias, // bias |
| const uint16_t bias_shift, /* amount of left-shift for bias */ const uint16_t out_shift, /* amount of right-shift for output */ q7_t * Im_out, // output image |
| const uint16_t dim_im_out_x, // output image dimension x |
| const uint16_t dim_im_out_y, // output image dimension y |
| q15_t * bufferA, // buffer space for input |
| q7_t * bufferB // buffer space for output |
| ); |
| |
| /* Reference q15 HWC convolution; takes a single size each for image, kernel, padding and stride. */ void arm_convolve_HWC_q15_ref(const q15_t * Im_in, // input image |
| const uint16_t dim_im_in, // input image dimension |
| const uint16_t ch_im_in, // number of input image channels |
| const q15_t * wt, // kernel weights |
| const uint16_t ch_im_out, // number of filters, i.e., output image channels |
| const uint16_t dim_kernel, // filter kernel size |
| const uint16_t padding, // padding size |
| const uint16_t stride, // stride |
| const q15_t * bias, // bias |
| const uint16_t bias_shift, /* amount of left-shift for bias */ const uint16_t out_shift, /* amount of right-shift for output */ q15_t * Im_out, // output image |
| const uint16_t dim_im_out, // output image dimension |
| q15_t * bufferA, // buffer space for input |
| q7_t * bufferB // buffer space for output; note it is declared q7_t * even in this q15 variant |
| ); |
| /* Reference q15 HWC convolution with separate x and y sizes for image, kernel, padding and stride. */ void arm_convolve_HWC_q15_nonsquare_ref(const q15_t * Im_in, /* input image */ |
| const uint16_t dim_im_in_x, /* input image dimension x */ |
| const uint16_t dim_im_in_y, /* input image dimension y */ |
| const uint16_t ch_im_in, /* number of input image channels */ |
| const q15_t * wt, /* kernel weights */ |
| const uint16_t ch_im_out, /* number of filters, i.e., output image channels */ |
| const uint16_t dim_kernel_x, /* filter kernel size x */ |
| const uint16_t dim_kernel_y, /* filter kernel size y */ |
| const uint16_t padding_x, /* padding size x */ |
| const uint16_t padding_y, /* padding size y */ |
| const uint16_t stride_x, /* stride x */ |
| const uint16_t stride_y, /* stride y */ |
| const q15_t * bias, /* bias */ |
| const uint16_t bias_shift, /* amount of left-shift for bias */ |
| const uint16_t out_shift, /* amount of right-shift for output */ |
| q15_t * Im_out, /* output image */ |
| const uint16_t dim_im_out_x, /* output image dimension x */ |
| const uint16_t dim_im_out_y, /* output image dimension y */ |
| q15_t * bufferA, /* buffer space for input */ |
| q7_t * bufferB); /* buffer space for output; note it is declared q7_t * even in this q15 variant */ |
| |
| /* Reference q7 HWC depthwise separable convolution; takes a single size each for image, kernel, padding and stride. */ void arm_depthwise_separable_conv_HWC_q7_ref(const q7_t * Im_in, // input image |
| const uint16_t dim_im_in, // input image dimension |
| const uint16_t ch_im_in, // number of input image channels |
| const q7_t * wt, // kernel weights |
| const uint16_t ch_im_out, // number of filters, i.e., output image channels |
| const uint16_t dim_kernel, // filter kernel size |
| const uint16_t padding, // padding size |
| const uint16_t stride, // stride |
| const q7_t * bias, // bias |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| q7_t * Im_out, // output image |
| const uint16_t dim_im_out, // output image dimension |
| q15_t * bufferA, // buffer space for input |
| q7_t * bufferB // buffer space for output |
| ); |
| /* Reference q7 HWC depthwise separable convolution with separate x and y sizes for image, kernel, padding and stride. */ void arm_depthwise_separable_conv_HWC_q7_ref_nonsquare(const q7_t * Im_in, // input image |
| const uint16_t dim_im_in_x, // input image dimension x |
| const uint16_t dim_im_in_y, // input image dimension y |
| const uint16_t ch_im_in, // number of input image channels |
| const q7_t * wt, // kernel weights |
| const uint16_t ch_im_out, // number of filters, i.e., output image channels |
| const uint16_t dim_kernel_x, // filter kernel size x |
| const uint16_t dim_kernel_y, // filter kernel size y |
| const uint16_t padding_x, // padding size x |
| const uint16_t padding_y, // padding size y |
| const uint16_t stride_x, // stride x |
| const uint16_t stride_y, // stride y |
| const q7_t * bias, // bias |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| q7_t * Im_out, // output image |
| const uint16_t dim_im_out_x, // output image dimension x |
| const uint16_t dim_im_out_y, // output image dimension y |
| q15_t * bufferA, // buffer space for input |
| q7_t * bufferB // buffer space for output |
| ); |
| |
| /* |
| * |
| * Fully-connected reference implementation |
| * |
| */ |
| |
| /* Reference q7 fully-connected layer: q7 vector, q7 matrix, q7 bias and q7 output. */ void arm_fully_connected_q7_ref(const q7_t * pV, // pointer to vector |
| const q7_t * pM, // pointer to matrix |
| const uint16_t dim_vec, // length of the vector |
| const uint16_t num_of_rows, // number of rows of the matrix |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| const q7_t * bias, /* bias */ q7_t * pOut, // output operand |
| q15_t * vec_buffer); /* caller-supplied working buffer; its usage is not visible from this declaration */ |
| |
| /* Reference q15 fully-connected layer: q15 vector, q15 matrix, q15 bias and q15 output. */ void arm_fully_connected_q15_ref(const q15_t * pV, // pointer to vector |
| const q15_t * pM, // pointer to matrix |
| const uint16_t dim_vec, // length of the vector |
| const uint16_t num_of_rows, // number of rows of the matrix |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| const q15_t * bias, /* bias */ q15_t * pOut, // output operand |
| q15_t * vec_buffer); /* caller-supplied working buffer; its usage is not visible from this declaration */ |
| |
| /* Reference mixed-precision fully-connected layer: q15 vector, q7 matrix, q7 bias and q15 output. */ void arm_fully_connected_mat_q7_vec_q15_ref(const q15_t * pV, // pointer to vector |
| const q7_t * pM, // pointer to matrix |
| const uint16_t dim_vec, // length of the vector |
| const uint16_t num_of_rows, // number of rows of the matrix |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| const q7_t * bias, /* bias */ q15_t * pOut, // output operand |
| q15_t * vec_buffer); /* caller-supplied working buffer; its usage is not visible from this declaration */ |
| |
| /* Reference for the q7 "opt" fully-connected variant; same parameter list as arm_fully_connected_q7_ref. NOTE(review): presumably pM must use the weight layout expected by the opt kernel - confirm against the definition. */ void arm_fully_connected_q7_opt_ref(const q7_t * pV, // pointer to vector |
| const q7_t * pM, // pointer to matrix |
| const uint16_t dim_vec, // length of the vector |
| const uint16_t num_of_rows, // number of rows of the matrix |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| const q7_t * bias, /* bias */ q7_t * pOut, // output operand |
| q15_t * vec_buffer); /* caller-supplied working buffer; its usage is not visible from this declaration */ |
| |
| /* Reference for the q15 "opt" fully-connected variant; same parameter list as arm_fully_connected_q15_ref. NOTE(review): presumably pM must use the weight layout expected by the opt kernel - confirm against the definition. */ void arm_fully_connected_q15_opt_ref(const q15_t * pV, // pointer to vector |
| const q15_t * pM, // pointer to matrix |
| const uint16_t dim_vec, // length of the vector |
| const uint16_t num_of_rows, // number of rows of the matrix |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| const q15_t * bias, /* bias */ q15_t * pOut, // output operand |
| q15_t * vec_buffer); /* caller-supplied working buffer; its usage is not visible from this declaration */ |
| |
| /* Reference for the mixed-precision "opt" fully-connected variant (q15 vector, q7 matrix); same parameter list as arm_fully_connected_mat_q7_vec_q15_ref. NOTE(review): presumably pM must use the weight layout expected by the opt kernel - confirm against the definition. */ void arm_fully_connected_mat_q7_vec_q15_opt_ref(const q15_t * pV, // pointer to vector |
| const q7_t * pM, // pointer to matrix |
| const uint16_t dim_vec, // length of the vector |
| const uint16_t num_of_rows, // number of rows of the matrix |
| const uint16_t bias_shift, // amount of left-shift for bias |
| const uint16_t out_shift, // amount of right-shift for output |
| const q7_t * bias, /* bias */ q15_t * pOut, // output operand |
| q15_t * vec_buffer); /* caller-supplied working buffer; its usage is not visible from this declaration */ |
| |
| /* |
| * |
| * Pooling reference implementation |
| * |
| */ |
| |
| /* Reference q7 HWC average pooling; takes a single size each for image, window, padding and stride. */ void arm_avepool_q7_HWC_ref(const q7_t * Im_in, // input image |
| const uint16_t dim_im_in, // input image dimension |
| const uint16_t ch_im_in, // number of input image channels |
| const uint16_t dim_kernel, // pooling window size |
| const uint16_t padding, // padding size |
| const uint16_t stride, // stride |
| const uint16_t dim_im_out, // output image dimension |
| q7_t * bufferA, // a buffer for local storage |
| q7_t * Im_out); /* output image */ |
| |
| /* Reference q7 HWC max pooling; takes a single size each for image, window, padding and stride. */ void arm_maxpool_q7_HWC_ref(const q7_t * Im_in, // input image |
| const uint16_t dim_im_in, // input image dimension |
| const uint16_t ch_im_in, // number of input image channels |
| const uint16_t dim_kernel, // pooling window size |
| const uint16_t padding, // padding size |
| const uint16_t stride, // stride |
| const uint16_t dim_im_out, // output image dimension |
| q7_t * bufferA, // a buffer for local storage |
| q7_t * Im_out); /* output image */ |
| |
| /* |
| * |
| * Other reference implementation |
| * |
| */ |
| |
| /* Reference q7 ReLU over size elements of data. NOTE(review): presumably applied in place, since data is non-const and there is no separate output parameter - confirm against the definition. */ void arm_relu_q7_ref(q7_t * data, uint16_t size); |
| |
| /* Reference q15 ReLU over size elements of data. NOTE(review): presumably applied in place, since data is non-const and there is no separate output parameter - confirm against the definition. */ void arm_relu_q15_ref(q15_t * data, uint16_t size); |
| |
| /* Reference q7 multiply: sources pSrcA and pSrcB, destination pDst, blockSize elements. NOTE(review): presumably element-wise with out_shift as a right-shift on each product - confirm against the definition. */ void arm_nn_mult_q7_ref(q7_t * pSrcA, q7_t * pSrcB, q7_t * pDst, const uint16_t out_shift, uint32_t blockSize); |
| |
| /* Reference q15 multiply: sources pSrcA and pSrcB, destination pDst, blockSize elements. NOTE(review): presumably element-wise with out_shift as a right-shift on each product - confirm against the definition. */ void arm_nn_mult_q15_ref(q15_t * pSrcA, q15_t * pSrcB, q15_t * pDst, const uint16_t out_shift, uint32_t blockSize); |
| |
| #ifdef __cplusplus |
| } |
| #endif |
| |
| #endif |