/*
|
* Copyright (C) 2010-2018 Arm Limited or its affiliates. All rights reserved.
|
*
|
* SPDX-License-Identifier: Apache-2.0
|
*
|
* Licensed under the Apache License, Version 2.0 (the License); you may
|
* not use this file except in compliance with the License.
|
* You may obtain a copy of the License at
|
*
|
* www.apache.org/licenses/LICENSE-2.0
|
*
|
* Unless required by applicable law or agreed to in writing, software
|
* distributed under the License is distributed on an AS IS BASIS, WITHOUT
|
* WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
* See the License for the specific language governing permissions and
|
* limitations under the License.
|
*/
|
|
#ifndef _REF_FUNCTIONS_H_
|
#define _REF_FUNCTIONS_H_
|
|
#include "arm_math.h"
|
#include "arm_nnfunctions.h"
|
//#include "arm_nnsupportfunctions.h"
|
#include "fully_connected_testing_weights.h"
|
|
#ifdef __cplusplus
|
extern "C"
|
{
|
#endif
|
|
/*
|
*
|
* Convolution reference implementation
|
*
|
*/
|
|
void arm_convolve_HWC_q7_ref(const q7_t * Im_in, // input image
|
const uint16_t dim_im_in, // input image dimention
|
const uint16_t ch_im_in, // number of input image channels
|
const q7_t * wt, // kernel weights
|
const uint16_t ch_im_out, // number of filters, i.e., output image channels
|
const uint16_t dim_kernel, // filter kernel size
|
const uint16_t padding, // padding sizes
|
const uint16_t stride, // stride
|
const q7_t * bias, // bias
|
const uint16_t bias_shift, const uint16_t out_shift, q7_t * Im_out, // output image
|
const uint16_t dim_im_out, // output image dimension
|
q15_t * bufferA, //buffer space for input
|
q7_t * bufferB //buffer space for output
|
);
|
|
void arm_convolve_HWC_q7_ref_nonsquare(const q7_t * Im_in, // input image
|
const uint16_t dim_im_in_x, // input image dimention x
|
const uint16_t dim_im_in_y, // input image dimention y
|
const uint16_t ch_im_in, // number of input image channels
|
const q7_t * wt, // kernel weights
|
const uint16_t ch_im_out, // number of filters, i.e., output image channels
|
const uint16_t dim_kernel_x, // filter kernel size x
|
const uint16_t dim_kernel_y, // filter kernel size y
|
const uint16_t padding_x, // padding sizes x
|
const uint16_t padding_y, // padding sizes y
|
const uint16_t stride_x, // stride x
|
const uint16_t stride_y, // stride y
|
const q7_t * bias, // bias
|
const uint16_t bias_shift, const uint16_t out_shift, q7_t * Im_out, // output image
|
const uint16_t dim_im_out_x, // output image dimension x
|
const uint16_t dim_im_out_y, // output image dimension y
|
q15_t * bufferA, //buffer space for input
|
q7_t * bufferB //buffer space for output
|
);
|
|
void arm_convolve_HWC_q15_ref(const q15_t * Im_in, // input image
|
const uint16_t dim_im_in, // input image dimention
|
const uint16_t ch_im_in, // number of input image channels
|
const q15_t * wt, // kernel weights
|
const uint16_t ch_im_out, // number of filters, i.e., output image channels
|
const uint16_t dim_kernel, // filter kernel size
|
const uint16_t padding, // padding sizes
|
const uint16_t stride, // stride
|
const q15_t * bias, // bias
|
const uint16_t bias_shift, const uint16_t out_shift, q15_t * Im_out, // output image
|
const uint16_t dim_im_out, // output image dimension
|
q15_t * bufferA, //buffer space for input
|
q7_t * bufferB //buffer space for output
|
);
|
void arm_convolve_HWC_q15_nonsquare_ref(const q15_t * Im_in,
|
const uint16_t dim_im_in_x,
|
const uint16_t dim_im_in_y,
|
const uint16_t ch_im_in,
|
const q15_t * wt,
|
const uint16_t ch_im_out,
|
const uint16_t dim_kernel_x,
|
const uint16_t dim_kernel_y,
|
const uint16_t padding_x,
|
const uint16_t padding_y,
|
const uint16_t stride_x,
|
const uint16_t stride_y,
|
const q15_t * bias,
|
const uint16_t bias_shift,
|
const uint16_t out_shift,
|
q15_t * Im_out,
|
const uint16_t dim_im_out_x,
|
const uint16_t dim_im_out_y,
|
q15_t * bufferA,
|
q7_t * bufferB);
|
|
void arm_depthwise_separable_conv_HWC_q7_ref(const q7_t * Im_in, // input image
|
const uint16_t dim_im_in, // input image dimention
|
const uint16_t ch_im_in, // number of input image channels
|
const q7_t * wt, // kernel weights
|
const uint16_t ch_im_out, // number of filters, i.e., output image channels
|
const uint16_t dim_kernel, // filter kernel size
|
const uint16_t padding, // padding sizes
|
const uint16_t stride, // stride
|
const q7_t * bias, // bias
|
const uint16_t bias_shift, // amount of left-shift for bias
|
const uint16_t out_shift, // amount of right-shift for output
|
q7_t * Im_out, // output image
|
const uint16_t dim_im_out, // output image dimension
|
q15_t * bufferA, //buffer space for input
|
q7_t * bufferB //buffer space for output
|
);
|
void arm_depthwise_separable_conv_HWC_q7_ref_nonsquare(const q7_t * Im_in, // input image
|
const uint16_t dim_im_in_x, // input image dimention x
|
const uint16_t dim_im_in_y, // input image dimention y
|
const uint16_t ch_im_in, // number of input image channels
|
const q7_t * wt, // kernel weights
|
const uint16_t ch_im_out, // number of filters, i.e., output image channels
|
const uint16_t dim_kernel_x, // filter kernel size x
|
const uint16_t dim_kernel_y, // filter kernel size y
|
const uint16_t padding_x, // padding sizes x
|
const uint16_t padding_y, // padding sizes y
|
const uint16_t stride_x, // stride x
|
const uint16_t stride_y, // stride y
|
const q7_t * bias, // bias
|
const uint16_t bias_shift, // amount of left-shift for bias
|
const uint16_t out_shift, // amount of right-shift for output
|
q7_t * Im_out, // output image
|
const uint16_t dim_im_out_x, // output image dimension x
|
const uint16_t dim_im_out_y, // output image dimension y
|
q15_t * bufferA, //buffer space for input
|
q7_t * bufferB //buffer space for output
|
);
|
|
/*
|
*
|
* Fully-connected reference implementation
|
*
|
*/
|
|
void arm_fully_connected_q7_ref(const q7_t * pV, // pointer to vector
|
const q7_t * pM, // pointer to matrix
|
const uint16_t dim_vec, // length of the vector
|
const uint16_t num_of_rows, // numCol of A
|
const uint16_t bias_shift, // amount of left-shift for bias
|
const uint16_t out_shift, // amount of right-shift for output
|
const q7_t * bias, q7_t * pOut, // output operand
|
q15_t * vec_buffer);
|
|
/*
 * Reference implementation of the q15 fully-connected layer
 * (q15 vector, q15 matrix, q15 bias, q15 output).
 */
void arm_fully_connected_q15_ref(
    const q15_t * pV,            // pointer to vector
    const q15_t * pM,            // pointer to matrix
    const uint16_t dim_vec,      // length of the vector
    const uint16_t num_of_rows,  // number of matrix rows, per the name (old note said "numCol of A" - TODO confirm)
    const uint16_t bias_shift,   // amount of left-shift for bias
    const uint16_t out_shift,    // amount of right-shift for output
    const q15_t * bias,          // bias
    q15_t * pOut,                // output operand
    q15_t * vec_buffer           // working buffer; its use is not visible from this header
);
|
|
void arm_fully_connected_mat_q7_vec_q15_ref(const q15_t * pV, // pointer to vector
|
const q7_t * pM, // pointer to matrix
|
const uint16_t dim_vec, // length of the vector
|
const uint16_t num_of_rows, // numCol of A
|
const uint16_t bias_shift, // amount of left-shift for bias
|
const uint16_t out_shift, // amount of right-shift for output
|
const q7_t * bias, q15_t * pOut, // output operand
|
q15_t * vec_buffer);
|
|
void arm_fully_connected_q7_opt_ref(const q7_t * pV, // pointer to vector
|
const q7_t * pM, // pointer to matrix
|
const uint16_t dim_vec, // length of the vector
|
const uint16_t num_of_rows, // numCol of A
|
const uint16_t bias_shift, // amount of left-shift for bias
|
const uint16_t out_shift, // amount of right-shift for output
|
const q7_t * bias, q7_t * pOut, // output operand
|
q15_t * vec_buffer);
|
|
/*
 * Reference counterpart for the q15 "_opt" fully-connected variant.
 * The parameter list is identical to arm_fully_connected_q15_ref.
 * NOTE(review): any difference in the expected matrix layout is not visible
 * from this header; confirm against the implementation.
 */
void arm_fully_connected_q15_opt_ref(
    const q15_t * pV,            // pointer to vector
    const q15_t * pM,            // pointer to matrix
    const uint16_t dim_vec,      // length of the vector
    const uint16_t num_of_rows,  // number of matrix rows, per the name (old note said "numCol of A" - TODO confirm)
    const uint16_t bias_shift,   // amount of left-shift for bias
    const uint16_t out_shift,    // amount of right-shift for output
    const q15_t * bias,          // bias
    q15_t * pOut,                // output operand
    q15_t * vec_buffer           // working buffer; its use is not visible from this header
);
|
|
void arm_fully_connected_mat_q7_vec_q15_opt_ref(const q15_t * pV, // pointer to vector
|
const q7_t * pM, // pointer to matrix
|
const uint16_t dim_vec, // length of the vector
|
const uint16_t num_of_rows, // numCol of A
|
const uint16_t bias_shift, // amount of left-shift for bias
|
const uint16_t out_shift, // amount of right-shift for output
|
const q7_t * bias, q15_t * pOut, // output operand
|
q15_t * vec_buffer);
|
|
/*
|
*
|
* Pooling reference implementation
|
*
|
*/
|
|
/*
 * Reference implementation of q7 HWC average pooling.
 */
void arm_avepool_q7_HWC_ref(
    const q7_t * Im_in,         // input image
    const uint16_t dim_im_in,   // input image dimension
    const uint16_t ch_im_in,    // number of input image channels
    const uint16_t dim_kernel,  // window kernel size
    const uint16_t padding,     // padding sizes
    const uint16_t stride,      // stride
    const uint16_t dim_im_out,  // output image dimension
    q7_t * bufferA,             // a buffer for local storage
    q7_t * Im_out               // output image
);
|
|
/*
 * Reference implementation of q7 HWC max pooling.
 */
void arm_maxpool_q7_HWC_ref(
    const q7_t * Im_in,         // input image
    const uint16_t dim_im_in,   // input image dimension
    const uint16_t ch_im_in,    // number of input image channels
    const uint16_t dim_kernel,  // window kernel size
    const uint16_t padding,     // padding sizes
    const uint16_t stride,      // stride
    const uint16_t dim_im_out,  // output image dimension
    q7_t * bufferA,             // a buffer for local storage
    q7_t * Im_out               // output image
);
|
|
/*
|
*
|
* Other reference implementation
|
*
|
*/
|
|
/*
 * Reference implementation of the q7 ReLU.
 * NOTE(review): data is a non-const pointer, so the buffer is presumably
 * modified in place, and size is presumably its element count; confirm
 * against the implementation.
 */
void arm_relu_q7_ref(
    q7_t * data,
    uint16_t size
);
|
|
/*
 * Reference implementation of the q15 ReLU.
 * NOTE(review): data is a non-const pointer, so the buffer is presumably
 * modified in place, and size is presumably its element count; confirm
 * against the implementation.
 */
void arm_relu_q15_ref(
    q15_t * data,
    uint16_t size
);
|
|
/*
 * Reference implementation of the q7 multiplication helper.
 * NOTE(review): presumably multiplies pSrcA by pSrcB element-wise over
 * blockSize elements, applies out_shift, and stores to pDst; confirm
 * against the implementation.
 */
void arm_nn_mult_q7_ref(
    q7_t * pSrcA,
    q7_t * pSrcB,
    q7_t * pDst,
    const uint16_t out_shift,
    uint32_t blockSize
);
|
|
/*
 * Reference implementation of the q15 multiplication helper.
 * NOTE(review): presumably multiplies pSrcA by pSrcB element-wise over
 * blockSize elements, applies out_shift, and stores to pDst; confirm
 * against the implementation.
 */
void arm_nn_mult_q15_ref(
    q15_t * pSrcA,
    q15_t * pSrcB,
    q15_t * pDst,
    const uint16_t out_shift,
    uint32_t blockSize
);
|
|
#ifdef __cplusplus
|
}
|
#endif
|
|
#endif
|