/* NN/NN_Lib_Tests/nn_test/Ref_Implementations/ref_functions.h - third_party/github/STMicroelectronics/cmsis_core.git - Git at Google */

 /*
  * Copyright (C) 2010-2018 Arm Limited or its affiliates. All rights reserved.
  *
  * SPDX-License-Identifier: Apache-2.0
  *
  * Licensed under the Apache License, Version 2.0 (the License); you may
  * not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  * www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an AS IS BASIS, WITHOUT
  * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 #ifndef _REF_FUNCTIONS_H_
 #define _REF_FUNCTIONS_H_

 #include "arm_math.h"
 #include "arm_nnfunctions.h"
 //#include "arm_nnsupportfunctions.h"
 #include "fully_connected_testing_weights.h"

 #ifdef __cplusplus
 extern    "C"
 {
 #endif

 /*
  *
  * Convolution reference implementation
  *
  */

     /**
      * Reference convolution prototype (HWC, q7).
      *
      * @param Im_in       input image
      * @param dim_im_in   input image dimension
      * @param ch_im_in    number of input image channels
      * @param wt          kernel weights
      * @param ch_im_out   number of filters, i.e., output image channels
      * @param dim_kernel  filter kernel size
      * @param padding     padding sizes
      * @param stride      stride
      * @param bias        bias
      * @param bias_shift  bias shift amount
      * @param out_shift   output shift amount
      * @param Im_out      output image
      * @param dim_im_out  output image dimension
      * @param bufferA     buffer space for input
      * @param bufferB     buffer space for output
      */
     void arm_convolve_HWC_q7_ref(
         const q7_t *Im_in,
         const uint16_t dim_im_in,
         const uint16_t ch_im_in,
         const q7_t *wt,
         const uint16_t ch_im_out,
         const uint16_t dim_kernel,
         const uint16_t padding,
         const uint16_t stride,
         const q7_t *bias,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         q7_t *Im_out,
         const uint16_t dim_im_out,
         q15_t *bufferA,
         q7_t *bufferB);

     /**
      * Reference convolution prototype (HWC, q7) with separate x/y sizes.
      *
      * @param Im_in         input image
      * @param dim_im_in_x   input image dimension x
      * @param dim_im_in_y   input image dimension y
      * @param ch_im_in      number of input image channels
      * @param wt            kernel weights
      * @param ch_im_out     number of filters, i.e., output image channels
      * @param dim_kernel_x  filter kernel size x
      * @param dim_kernel_y  filter kernel size y
      * @param padding_x     padding sizes x
      * @param padding_y     padding sizes y
      * @param stride_x      stride x
      * @param stride_y      stride y
      * @param bias          bias
      * @param bias_shift    bias shift amount
      * @param out_shift     output shift amount
      * @param Im_out        output image
      * @param dim_im_out_x  output image dimension x
      * @param dim_im_out_y  output image dimension y
      * @param bufferA       buffer space for input
      * @param bufferB       buffer space for output
      */
     void arm_convolve_HWC_q7_ref_nonsquare(
         const q7_t *Im_in,
         const uint16_t dim_im_in_x,
         const uint16_t dim_im_in_y,
         const uint16_t ch_im_in,
         const q7_t *wt,
         const uint16_t ch_im_out,
         const uint16_t dim_kernel_x,
         const uint16_t dim_kernel_y,
         const uint16_t padding_x,
         const uint16_t padding_y,
         const uint16_t stride_x,
         const uint16_t stride_y,
         const q7_t *bias,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         q7_t *Im_out,
         const uint16_t dim_im_out_x,
         const uint16_t dim_im_out_y,
         q15_t *bufferA,
         q7_t *bufferB);

     /**
      * Reference convolution prototype (HWC, q15).
      *
      * @param Im_in       input image
      * @param dim_im_in   input image dimension
      * @param ch_im_in    number of input image channels
      * @param wt          kernel weights
      * @param ch_im_out   number of filters, i.e., output image channels
      * @param dim_kernel  filter kernel size
      * @param padding     padding sizes
      * @param stride      stride
      * @param bias        bias
      * @param bias_shift  bias shift amount
      * @param out_shift   output shift amount
      * @param Im_out      output image
      * @param dim_im_out  output image dimension
      * @param bufferA     buffer space for input
      * @param bufferB     buffer space for output
      */
     void arm_convolve_HWC_q15_ref(
         const q15_t *Im_in,
         const uint16_t dim_im_in,
         const uint16_t ch_im_in,
         const q15_t *wt,
         const uint16_t ch_im_out,
         const uint16_t dim_kernel,
         const uint16_t padding,
         const uint16_t stride,
         const q15_t *bias,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         q15_t *Im_out,
         const uint16_t dim_im_out,
         q15_t *bufferA,
         q7_t *bufferB);
     /**
      * Reference convolution prototype (HWC, q15) with separate x/y sizes.
      *
      * Parameter notes below are derived from the parameter names only;
      * confirm against the implementation file.
      *
      * @param Im_in         input image
      * @param dim_im_in_x   input image dimension x
      * @param dim_im_in_y   input image dimension y
      * @param ch_im_in      number of input image channels
      * @param wt            kernel weights
      * @param ch_im_out     number of output image channels
      * @param dim_kernel_x  kernel size x
      * @param dim_kernel_y  kernel size y
      * @param padding_x     padding x
      * @param padding_y     padding y
      * @param stride_x      stride x
      * @param stride_y      stride y
      * @param bias          bias
      * @param bias_shift    bias shift amount
      * @param out_shift     output shift amount
      * @param Im_out        output image
      * @param dim_im_out_x  output image dimension x
      * @param dim_im_out_y  output image dimension y
      * @param bufferA       first work buffer
      * @param bufferB       second work buffer
      */
     void arm_convolve_HWC_q15_nonsquare_ref(
         const q15_t *Im_in,
         const uint16_t dim_im_in_x,
         const uint16_t dim_im_in_y,
         const uint16_t ch_im_in,
         const q15_t *wt,
         const uint16_t ch_im_out,
         const uint16_t dim_kernel_x,
         const uint16_t dim_kernel_y,
         const uint16_t padding_x,
         const uint16_t padding_y,
         const uint16_t stride_x,
         const uint16_t stride_y,
         const q15_t *bias,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         q15_t *Im_out,
         const uint16_t dim_im_out_x,
         const uint16_t dim_im_out_y,
         q15_t *bufferA,
         q7_t *bufferB);

     /**
      * Reference depthwise separable convolution prototype (HWC, q7).
      *
      * @param Im_in       input image
      * @param dim_im_in   input image dimension
      * @param ch_im_in    number of input image channels
      * @param wt          kernel weights
      * @param ch_im_out   number of filters, i.e., output image channels
      * @param dim_kernel  filter kernel size
      * @param padding     padding sizes
      * @param stride      stride
      * @param bias        bias
      * @param bias_shift  amount of left-shift for bias
      * @param out_shift   amount of right-shift for output
      * @param Im_out      output image
      * @param dim_im_out  output image dimension
      * @param bufferA     buffer space for input
      * @param bufferB     buffer space for output
      */
     void arm_depthwise_separable_conv_HWC_q7_ref(
         const q7_t *Im_in,
         const uint16_t dim_im_in,
         const uint16_t ch_im_in,
         const q7_t *wt,
         const uint16_t ch_im_out,
         const uint16_t dim_kernel,
         const uint16_t padding,
         const uint16_t stride,
         const q7_t *bias,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         q7_t *Im_out,
         const uint16_t dim_im_out,
         q15_t *bufferA,
         q7_t *bufferB);
     /**
      * Reference depthwise separable convolution prototype (HWC, q7)
      * with separate x/y sizes.
      *
      * @param Im_in         input image
      * @param dim_im_in_x   input image dimension x
      * @param dim_im_in_y   input image dimension y
      * @param ch_im_in      number of input image channels
      * @param wt            kernel weights
      * @param ch_im_out     number of filters, i.e., output image channels
      * @param dim_kernel_x  filter kernel size x
      * @param dim_kernel_y  filter kernel size y
      * @param padding_x     padding sizes x
      * @param padding_y     padding sizes y
      * @param stride_x      stride x
      * @param stride_y      stride y
      * @param bias          bias
      * @param bias_shift    amount of left-shift for bias
      * @param out_shift     amount of right-shift for output
      * @param Im_out        output image
      * @param dim_im_out_x  output image dimension x
      * @param dim_im_out_y  output image dimension y
      * @param bufferA       buffer space for input
      * @param bufferB       buffer space for output
      */
     void arm_depthwise_separable_conv_HWC_q7_ref_nonsquare(
         const q7_t *Im_in,
         const uint16_t dim_im_in_x,
         const uint16_t dim_im_in_y,
         const uint16_t ch_im_in,
         const q7_t *wt,
         const uint16_t ch_im_out,
         const uint16_t dim_kernel_x,
         const uint16_t dim_kernel_y,
         const uint16_t padding_x,
         const uint16_t padding_y,
         const uint16_t stride_x,
         const uint16_t stride_y,
         const q7_t *bias,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         q7_t *Im_out,
         const uint16_t dim_im_out_x,
         const uint16_t dim_im_out_y,
         q15_t *bufferA,
         q7_t *bufferB);

 /*
  *
  * Fully-connected reference implementation
  *
  */

     /**
      * Reference fully-connected prototype (q7).
      *
      * @param pV           pointer to vector
      * @param pM           pointer to matrix
      * @param dim_vec      length of the vector
      * @param num_of_rows  number of rows (original note: "numCol of A")
      * @param bias_shift   amount of left-shift for bias
      * @param out_shift    amount of right-shift for output
      * @param bias         bias
      * @param pOut         output operand
      * @param vec_buffer   vector buffer (usage defined by the implementation)
      */
     void arm_fully_connected_q7_ref(
         const q7_t *pV,
         const q7_t *pM,
         const uint16_t dim_vec,
         const uint16_t num_of_rows,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         const q7_t *bias,
         q7_t *pOut,
         q15_t *vec_buffer);

     /**
      * Reference fully-connected prototype (q15).
      *
      * @param pV           pointer to vector
      * @param pM           pointer to matrix
      * @param dim_vec      length of the vector
      * @param num_of_rows  number of rows (original note: "numCol of A")
      * @param bias_shift   amount of left-shift for bias
      * @param out_shift    amount of right-shift for output
      * @param bias         bias
      * @param pOut         output operand
      * @param vec_buffer   vector buffer (usage defined by the implementation)
      */
     void arm_fully_connected_q15_ref(
         const q15_t *pV,
         const q15_t *pM,
         const uint16_t dim_vec,
         const uint16_t num_of_rows,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         const q15_t *bias,
         q15_t *pOut,
         q15_t *vec_buffer);

     /**
      * Reference fully-connected prototype (q7 matrix, q15 vector).
      *
      * @param pV           pointer to vector
      * @param pM           pointer to matrix
      * @param dim_vec      length of the vector
      * @param num_of_rows  number of rows (original note: "numCol of A")
      * @param bias_shift   amount of left-shift for bias
      * @param out_shift    amount of right-shift for output
      * @param bias         bias
      * @param pOut         output operand
      * @param vec_buffer   vector buffer (usage defined by the implementation)
      */
     void arm_fully_connected_mat_q7_vec_q15_ref(
         const q15_t *pV,
         const q7_t *pM,
         const uint16_t dim_vec,
         const uint16_t num_of_rows,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         const q7_t *bias,
         q15_t *pOut,
         q15_t *vec_buffer);

     /**
      * Reference fully-connected prototype (q7, "opt" variant).
      *
      * @param pV           pointer to vector
      * @param pM           pointer to matrix
      * @param dim_vec      length of the vector
      * @param num_of_rows  number of rows (original note: "numCol of A")
      * @param bias_shift   amount of left-shift for bias
      * @param out_shift    amount of right-shift for output
      * @param bias         bias
      * @param pOut         output operand
      * @param vec_buffer   vector buffer (usage defined by the implementation)
      */
     void arm_fully_connected_q7_opt_ref(
         const q7_t *pV,
         const q7_t *pM,
         const uint16_t dim_vec,
         const uint16_t num_of_rows,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         const q7_t *bias,
         q7_t *pOut,
         q15_t *vec_buffer);

     /**
      * Reference fully-connected prototype (q15, "opt" variant).
      *
      * @param pV           pointer to vector
      * @param pM           pointer to matrix
      * @param dim_vec      length of the vector
      * @param num_of_rows  number of rows (original note: "numCol of A")
      * @param bias_shift   amount of left-shift for bias
      * @param out_shift    amount of right-shift for output
      * @param bias         bias
      * @param pOut         output operand
      * @param vec_buffer   vector buffer (usage defined by the implementation)
      */
     void arm_fully_connected_q15_opt_ref(
         const q15_t *pV,
         const q15_t *pM,
         const uint16_t dim_vec,
         const uint16_t num_of_rows,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         const q15_t *bias,
         q15_t *pOut,
         q15_t *vec_buffer);

     /**
      * Reference fully-connected prototype (q7 matrix, q15 vector,
      * "opt" variant).
      *
      * @param pV           pointer to vector
      * @param pM           pointer to matrix
      * @param dim_vec      length of the vector
      * @param num_of_rows  number of rows (original note: "numCol of A")
      * @param bias_shift   amount of left-shift for bias
      * @param out_shift    amount of right-shift for output
      * @param bias         bias
      * @param pOut         output operand
      * @param vec_buffer   vector buffer (usage defined by the implementation)
      */
     void arm_fully_connected_mat_q7_vec_q15_opt_ref(
         const q15_t *pV,
         const q7_t *pM,
         const uint16_t dim_vec,
         const uint16_t num_of_rows,
         const uint16_t bias_shift,
         const uint16_t out_shift,
         const q7_t *bias,
         q15_t *pOut,
         q15_t *vec_buffer);

 /*
  *
  * Pooling reference implementation
  *
  */

     /**
      * Reference average-pooling prototype (q7, HWC).
      *
      * @param Im_in       input image
      * @param dim_im_in   input image dimension
      * @param ch_im_in    number of input image channels
      * @param dim_kernel  window kernel size
      * @param padding     padding sizes
      * @param stride      stride
      * @param dim_im_out  output image dimension
      * @param bufferA     a buffer for local storage
      * @param Im_out      output image
      */
     void arm_avepool_q7_HWC_ref(
         const q7_t *Im_in,
         const uint16_t dim_im_in,
         const uint16_t ch_im_in,
         const uint16_t dim_kernel,
         const uint16_t padding,
         const uint16_t stride,
         const uint16_t dim_im_out,
         q7_t *bufferA,
         q7_t *Im_out);

     /**
      * Reference max-pooling prototype (q7, HWC).
      *
      * @param Im_in       input image
      * @param dim_im_in   input image dimension
      * @param ch_im_in    number of input image channels
      * @param dim_kernel  window kernel size
      * @param padding     padding sizes
      * @param stride      stride
      * @param dim_im_out  output image dimension
      * @param bufferA     a buffer for local storage
      * @param Im_out      output image
      */
     void arm_maxpool_q7_HWC_ref(
         const q7_t *Im_in,
         const uint16_t dim_im_in,
         const uint16_t ch_im_in,
         const uint16_t dim_kernel,
         const uint16_t padding,
         const uint16_t stride,
         const uint16_t dim_im_out,
         q7_t *bufferA,
         q7_t *Im_out);

 /*
  *
  * Other reference implementation
  *
  */

     /**
      * Reference ReLU prototype (q7).
      *
      * @param data  data buffer (non-const; presumably updated in place - confirm)
      * @param size  presumably the number of elements in data - confirm
      */
     void arm_relu_q7_ref(q7_t *data,
                          uint16_t size);

     /**
      * Reference ReLU prototype (q15).
      *
      * @param data  data buffer (non-const; presumably updated in place - confirm)
      * @param size  presumably the number of elements in data - confirm
      */
     void arm_relu_q15_ref(q15_t *data,
                           uint16_t size);

     /**
      * Reference multiply prototype (q7).
      *
      * @param pSrcA      first source operand
      * @param pSrcB      second source operand
      * @param pDst       destination
      * @param out_shift  output shift amount
      * @param blockSize  presumably the number of elements to process - confirm
      */
     void arm_nn_mult_q7_ref(q7_t *pSrcA,
                             q7_t *pSrcB,
                             q7_t *pDst,
                             const uint16_t out_shift,
                             uint32_t blockSize);

     /**
      * Reference multiply prototype (q15).
      *
      * @param pSrcA      first source operand
      * @param pSrcB      second source operand
      * @param pDst       destination
      * @param out_shift  output shift amount
      * @param blockSize  presumably the number of elements to process - confirm
      */
     void arm_nn_mult_q15_ref(q15_t *pSrcA,
                              q15_t *pSrcB,
                              q15_t *pDst,
                              const uint16_t out_shift,
                              uint32_t blockSize);

 #ifdef __cplusplus
 }
 #endif

 #endif
	/*
	* Copyright (C) 2010-2018 Arm Limited or its affiliates. All rights reserved.
	*
	* SPDX-License-Identifier: Apache-2.0
	*
	* Licensed under the Apache License, Version 2.0 (the License); you may
	* not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an AS IS BASIS, WITHOUT
	* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	#ifndef _REF_FUNCTIONS_H_
	#define _REF_FUNCTIONS_H_

	#include "arm_math.h"
	#include "arm_nnfunctions.h"
	//#include "arm_nnsupportfunctions.h"
	#include "fully_connected_testing_weights.h"

	#ifdef __cplusplus
	extern "C"
	{
	#endif

	/*
	*
	* Convolution reference implementation
	*
	*/

	/**
	 * Reference convolution prototype (HWC, q7).
	 *
	 * @param Im_in       input image
	 * @param dim_im_in   input image dimension
	 * @param ch_im_in    number of input image channels
	 * @param wt          kernel weights
	 * @param ch_im_out   number of filters, i.e., output image channels
	 * @param dim_kernel  filter kernel size
	 * @param padding     padding sizes
	 * @param stride      stride
	 * @param bias        bias
	 * @param bias_shift  bias shift amount
	 * @param out_shift   output shift amount
	 * @param Im_out      output image
	 * @param dim_im_out  output image dimension
	 * @param bufferA     buffer space for input
	 * @param bufferB     buffer space for output
	 */
	void arm_convolve_HWC_q7_ref(
		const q7_t *Im_in,
		const uint16_t dim_im_in,
		const uint16_t ch_im_in,
		const q7_t *wt,
		const uint16_t ch_im_out,
		const uint16_t dim_kernel,
		const uint16_t padding,
		const uint16_t stride,
		const q7_t *bias,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		q7_t *Im_out,
		const uint16_t dim_im_out,
		q15_t *bufferA,
		q7_t *bufferB);

	/**
	 * Reference convolution prototype (HWC, q7) with separate x/y sizes.
	 *
	 * @param Im_in         input image
	 * @param dim_im_in_x   input image dimension x
	 * @param dim_im_in_y   input image dimension y
	 * @param ch_im_in      number of input image channels
	 * @param wt            kernel weights
	 * @param ch_im_out     number of filters, i.e., output image channels
	 * @param dim_kernel_x  filter kernel size x
	 * @param dim_kernel_y  filter kernel size y
	 * @param padding_x     padding sizes x
	 * @param padding_y     padding sizes y
	 * @param stride_x      stride x
	 * @param stride_y      stride y
	 * @param bias          bias
	 * @param bias_shift    bias shift amount
	 * @param out_shift     output shift amount
	 * @param Im_out        output image
	 * @param dim_im_out_x  output image dimension x
	 * @param dim_im_out_y  output image dimension y
	 * @param bufferA       buffer space for input
	 * @param bufferB       buffer space for output
	 */
	void arm_convolve_HWC_q7_ref_nonsquare(
		const q7_t *Im_in,
		const uint16_t dim_im_in_x,
		const uint16_t dim_im_in_y,
		const uint16_t ch_im_in,
		const q7_t *wt,
		const uint16_t ch_im_out,
		const uint16_t dim_kernel_x,
		const uint16_t dim_kernel_y,
		const uint16_t padding_x,
		const uint16_t padding_y,
		const uint16_t stride_x,
		const uint16_t stride_y,
		const q7_t *bias,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		q7_t *Im_out,
		const uint16_t dim_im_out_x,
		const uint16_t dim_im_out_y,
		q15_t *bufferA,
		q7_t *bufferB);

	/**
	 * Reference convolution prototype (HWC, q15).
	 *
	 * @param Im_in       input image
	 * @param dim_im_in   input image dimension
	 * @param ch_im_in    number of input image channels
	 * @param wt          kernel weights
	 * @param ch_im_out   number of filters, i.e., output image channels
	 * @param dim_kernel  filter kernel size
	 * @param padding     padding sizes
	 * @param stride      stride
	 * @param bias        bias
	 * @param bias_shift  bias shift amount
	 * @param out_shift   output shift amount
	 * @param Im_out      output image
	 * @param dim_im_out  output image dimension
	 * @param bufferA     buffer space for input
	 * @param bufferB     buffer space for output
	 */
	void arm_convolve_HWC_q15_ref(
		const q15_t *Im_in,
		const uint16_t dim_im_in,
		const uint16_t ch_im_in,
		const q15_t *wt,
		const uint16_t ch_im_out,
		const uint16_t dim_kernel,
		const uint16_t padding,
		const uint16_t stride,
		const q15_t *bias,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		q15_t *Im_out,
		const uint16_t dim_im_out,
		q15_t *bufferA,
		q7_t *bufferB);
	/**
	 * Reference convolution prototype (HWC, q15) with separate x/y sizes.
	 *
	 * Parameter notes below are derived from the parameter names only;
	 * confirm against the implementation file.
	 *
	 * @param Im_in         input image
	 * @param dim_im_in_x   input image dimension x
	 * @param dim_im_in_y   input image dimension y
	 * @param ch_im_in      number of input image channels
	 * @param wt            kernel weights
	 * @param ch_im_out     number of output image channels
	 * @param dim_kernel_x  kernel size x
	 * @param dim_kernel_y  kernel size y
	 * @param padding_x     padding x
	 * @param padding_y     padding y
	 * @param stride_x      stride x
	 * @param stride_y      stride y
	 * @param bias          bias
	 * @param bias_shift    bias shift amount
	 * @param out_shift     output shift amount
	 * @param Im_out        output image
	 * @param dim_im_out_x  output image dimension x
	 * @param dim_im_out_y  output image dimension y
	 * @param bufferA       first work buffer
	 * @param bufferB       second work buffer
	 */
	void arm_convolve_HWC_q15_nonsquare_ref(
		const q15_t *Im_in,
		const uint16_t dim_im_in_x,
		const uint16_t dim_im_in_y,
		const uint16_t ch_im_in,
		const q15_t *wt,
		const uint16_t ch_im_out,
		const uint16_t dim_kernel_x,
		const uint16_t dim_kernel_y,
		const uint16_t padding_x,
		const uint16_t padding_y,
		const uint16_t stride_x,
		const uint16_t stride_y,
		const q15_t *bias,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		q15_t *Im_out,
		const uint16_t dim_im_out_x,
		const uint16_t dim_im_out_y,
		q15_t *bufferA,
		q7_t *bufferB);

	/**
	 * Reference depthwise separable convolution prototype (HWC, q7).
	 *
	 * @param Im_in       input image
	 * @param dim_im_in   input image dimension
	 * @param ch_im_in    number of input image channels
	 * @param wt          kernel weights
	 * @param ch_im_out   number of filters, i.e., output image channels
	 * @param dim_kernel  filter kernel size
	 * @param padding     padding sizes
	 * @param stride      stride
	 * @param bias        bias
	 * @param bias_shift  amount of left-shift for bias
	 * @param out_shift   amount of right-shift for output
	 * @param Im_out      output image
	 * @param dim_im_out  output image dimension
	 * @param bufferA     buffer space for input
	 * @param bufferB     buffer space for output
	 */
	void arm_depthwise_separable_conv_HWC_q7_ref(
		const q7_t *Im_in,
		const uint16_t dim_im_in,
		const uint16_t ch_im_in,
		const q7_t *wt,
		const uint16_t ch_im_out,
		const uint16_t dim_kernel,
		const uint16_t padding,
		const uint16_t stride,
		const q7_t *bias,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		q7_t *Im_out,
		const uint16_t dim_im_out,
		q15_t *bufferA,
		q7_t *bufferB);
	/**
	 * Reference depthwise separable convolution prototype (HWC, q7)
	 * with separate x/y sizes.
	 *
	 * @param Im_in         input image
	 * @param dim_im_in_x   input image dimension x
	 * @param dim_im_in_y   input image dimension y
	 * @param ch_im_in      number of input image channels
	 * @param wt            kernel weights
	 * @param ch_im_out     number of filters, i.e., output image channels
	 * @param dim_kernel_x  filter kernel size x
	 * @param dim_kernel_y  filter kernel size y
	 * @param padding_x     padding sizes x
	 * @param padding_y     padding sizes y
	 * @param stride_x      stride x
	 * @param stride_y      stride y
	 * @param bias          bias
	 * @param bias_shift    amount of left-shift for bias
	 * @param out_shift     amount of right-shift for output
	 * @param Im_out        output image
	 * @param dim_im_out_x  output image dimension x
	 * @param dim_im_out_y  output image dimension y
	 * @param bufferA       buffer space for input
	 * @param bufferB       buffer space for output
	 */
	void arm_depthwise_separable_conv_HWC_q7_ref_nonsquare(
		const q7_t *Im_in,
		const uint16_t dim_im_in_x,
		const uint16_t dim_im_in_y,
		const uint16_t ch_im_in,
		const q7_t *wt,
		const uint16_t ch_im_out,
		const uint16_t dim_kernel_x,
		const uint16_t dim_kernel_y,
		const uint16_t padding_x,
		const uint16_t padding_y,
		const uint16_t stride_x,
		const uint16_t stride_y,
		const q7_t *bias,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		q7_t *Im_out,
		const uint16_t dim_im_out_x,
		const uint16_t dim_im_out_y,
		q15_t *bufferA,
		q7_t *bufferB);

	/*
	*
	* Fully-connected reference implementation
	*
	*/

	/**
	 * Reference fully-connected prototype (q7).
	 *
	 * @param pV           pointer to vector
	 * @param pM           pointer to matrix
	 * @param dim_vec      length of the vector
	 * @param num_of_rows  number of rows (original note: "numCol of A")
	 * @param bias_shift   amount of left-shift for bias
	 * @param out_shift    amount of right-shift for output
	 * @param bias         bias
	 * @param pOut         output operand
	 * @param vec_buffer   vector buffer (usage defined by the implementation)
	 */
	void arm_fully_connected_q7_ref(
		const q7_t *pV,
		const q7_t *pM,
		const uint16_t dim_vec,
		const uint16_t num_of_rows,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		const q7_t *bias,
		q7_t *pOut,
		q15_t *vec_buffer);

	/**
	 * Reference fully-connected prototype (q15).
	 *
	 * @param pV           pointer to vector
	 * @param pM           pointer to matrix
	 * @param dim_vec      length of the vector
	 * @param num_of_rows  number of rows (original note: "numCol of A")
	 * @param bias_shift   amount of left-shift for bias
	 * @param out_shift    amount of right-shift for output
	 * @param bias         bias
	 * @param pOut         output operand
	 * @param vec_buffer   vector buffer (usage defined by the implementation)
	 */
	void arm_fully_connected_q15_ref(
		const q15_t *pV,
		const q15_t *pM,
		const uint16_t dim_vec,
		const uint16_t num_of_rows,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		const q15_t *bias,
		q15_t *pOut,
		q15_t *vec_buffer);

	/**
	 * Reference fully-connected prototype (q7 matrix, q15 vector).
	 *
	 * @param pV           pointer to vector
	 * @param pM           pointer to matrix
	 * @param dim_vec      length of the vector
	 * @param num_of_rows  number of rows (original note: "numCol of A")
	 * @param bias_shift   amount of left-shift for bias
	 * @param out_shift    amount of right-shift for output
	 * @param bias         bias
	 * @param pOut         output operand
	 * @param vec_buffer   vector buffer (usage defined by the implementation)
	 */
	void arm_fully_connected_mat_q7_vec_q15_ref(
		const q15_t *pV,
		const q7_t *pM,
		const uint16_t dim_vec,
		const uint16_t num_of_rows,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		const q7_t *bias,
		q15_t *pOut,
		q15_t *vec_buffer);

	/**
	 * Reference fully-connected prototype (q7, "opt" variant).
	 *
	 * @param pV           pointer to vector
	 * @param pM           pointer to matrix
	 * @param dim_vec      length of the vector
	 * @param num_of_rows  number of rows (original note: "numCol of A")
	 * @param bias_shift   amount of left-shift for bias
	 * @param out_shift    amount of right-shift for output
	 * @param bias         bias
	 * @param pOut         output operand
	 * @param vec_buffer   vector buffer (usage defined by the implementation)
	 */
	void arm_fully_connected_q7_opt_ref(
		const q7_t *pV,
		const q7_t *pM,
		const uint16_t dim_vec,
		const uint16_t num_of_rows,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		const q7_t *bias,
		q7_t *pOut,
		q15_t *vec_buffer);

	/**
	 * Reference fully-connected prototype (q15, "opt" variant).
	 *
	 * @param pV           pointer to vector
	 * @param pM           pointer to matrix
	 * @param dim_vec      length of the vector
	 * @param num_of_rows  number of rows (original note: "numCol of A")
	 * @param bias_shift   amount of left-shift for bias
	 * @param out_shift    amount of right-shift for output
	 * @param bias         bias
	 * @param pOut         output operand
	 * @param vec_buffer   vector buffer (usage defined by the implementation)
	 */
	void arm_fully_connected_q15_opt_ref(
		const q15_t *pV,
		const q15_t *pM,
		const uint16_t dim_vec,
		const uint16_t num_of_rows,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		const q15_t *bias,
		q15_t *pOut,
		q15_t *vec_buffer);

	/**
	 * Reference fully-connected prototype (q7 matrix, q15 vector,
	 * "opt" variant).
	 *
	 * @param pV           pointer to vector
	 * @param pM           pointer to matrix
	 * @param dim_vec      length of the vector
	 * @param num_of_rows  number of rows (original note: "numCol of A")
	 * @param bias_shift   amount of left-shift for bias
	 * @param out_shift    amount of right-shift for output
	 * @param bias         bias
	 * @param pOut         output operand
	 * @param vec_buffer   vector buffer (usage defined by the implementation)
	 */
	void arm_fully_connected_mat_q7_vec_q15_opt_ref(
		const q15_t *pV,
		const q7_t *pM,
		const uint16_t dim_vec,
		const uint16_t num_of_rows,
		const uint16_t bias_shift,
		const uint16_t out_shift,
		const q7_t *bias,
		q15_t *pOut,
		q15_t *vec_buffer);

	/*
	*
	* Pooling reference implementation
	*
	*/

	/**
	 * Reference average-pooling prototype (q7, HWC).
	 *
	 * @param Im_in       input image
	 * @param dim_im_in   input image dimension
	 * @param ch_im_in    number of input image channels
	 * @param dim_kernel  window kernel size
	 * @param padding     padding sizes
	 * @param stride      stride
	 * @param dim_im_out  output image dimension
	 * @param bufferA     a buffer for local storage
	 * @param Im_out      output image
	 */
	void arm_avepool_q7_HWC_ref(
		const q7_t *Im_in,
		const uint16_t dim_im_in,
		const uint16_t ch_im_in,
		const uint16_t dim_kernel,
		const uint16_t padding,
		const uint16_t stride,
		const uint16_t dim_im_out,
		q7_t *bufferA,
		q7_t *Im_out);

	/**
	 * Reference max-pooling prototype (q7, HWC).
	 *
	 * @param Im_in       input image
	 * @param dim_im_in   input image dimension
	 * @param ch_im_in    number of input image channels
	 * @param dim_kernel  window kernel size
	 * @param padding     padding sizes
	 * @param stride      stride
	 * @param dim_im_out  output image dimension
	 * @param bufferA     a buffer for local storage
	 * @param Im_out      output image
	 */
	void arm_maxpool_q7_HWC_ref(
		const q7_t *Im_in,
		const uint16_t dim_im_in,
		const uint16_t ch_im_in,
		const uint16_t dim_kernel,
		const uint16_t padding,
		const uint16_t stride,
		const uint16_t dim_im_out,
		q7_t *bufferA,
		q7_t *Im_out);

	/*
	*
	* Other reference implementation
	*
	*/

	/**
	 * Reference ReLU prototype (q7).
	 *
	 * @param data  data buffer (non-const; presumably updated in place - confirm)
	 * @param size  presumably the number of elements in data - confirm
	 */
	void arm_relu_q7_ref(q7_t *data,
	                     uint16_t size);

	/**
	 * Reference ReLU prototype (q15).
	 *
	 * @param data  data buffer (non-const; presumably updated in place - confirm)
	 * @param size  presumably the number of elements in data - confirm
	 */
	void arm_relu_q15_ref(q15_t *data,
	                      uint16_t size);

	/**
	 * Reference multiply prototype (q7).
	 *
	 * @param pSrcA      first source operand
	 * @param pSrcB      second source operand
	 * @param pDst       destination
	 * @param out_shift  output shift amount
	 * @param blockSize  presumably the number of elements to process - confirm
	 */
	void arm_nn_mult_q7_ref(q7_t *pSrcA,
	                        q7_t *pSrcB,
	                        q7_t *pDst,
	                        const uint16_t out_shift,
	                        uint32_t blockSize);

	/**
	 * Reference multiply prototype (q15).
	 *
	 * @param pSrcA      first source operand
	 * @param pSrcB      second source operand
	 * @param pDst       destination
	 * @param out_shift  output shift amount
	 * @param blockSize  presumably the number of elements to process - confirm
	 */
	void arm_nn_mult_q15_ref(q15_t *pSrcA,
	                         q15_t *pSrcB,
	                         q15_t *pDst,
	                         const uint16_t out_shift,
	                         uint32_t blockSize);

	#ifdef __cplusplus
	}
	#endif

	#endif