/*
 * Copyright (C) 2010-2018 Arm Limited or its affiliates. All rights reserved.
 *
 * SPDX-License-Identifier: Apache-2.0
 *
 * Licensed under the Apache License, Version 2.0 (the License); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an AS IS BASIS, WITHOUT
 * WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
|
|
#include "ref_functions.h"
|
|
/**
 * Reference (non-optimized) average pooling for q7 data in HWC layout.
 *
 * For each channel and each output position (i_x, i_y), a square window of
 * dim_kernel x dim_kernel samples is placed with its top-left corner at
 * (i_x * stride - padding, i_y * stride - padding). Window positions that
 * fall outside the dim_im_in x dim_im_in input are skipped, so the divisor
 * is the number of in-bounds samples, not dim_kernel * dim_kernel. The
 * average uses C integer division and therefore truncates toward zero.
 *
 * A window with no in-bounds sample at all produces 0 instead of dividing
 * by zero.
 *
 * @param Im_in       input image, indexed as channel + ch_im_in * (x + y * dim_im_in)
 * @param dim_im_in   input image width and height
 * @param ch_im_in    number of channels (shared by input and output)
 * @param dim_kernel  pooling window width and height
 * @param padding     offset subtracted from the window origin in both x and y
 * @param stride      step between consecutive windows in both x and y
 * @param dim_im_out  output image width and height
 * @param bufferA     not used by this reference implementation
 * @param Im_out      output image, indexed as channel + ch_im_in * (x + y * dim_im_out)
 */
void arm_avepool_q7_HWC_ref(const q7_t * Im_in,
                            const uint16_t dim_im_in,
                            const uint16_t ch_im_in,
                            const uint16_t dim_kernel,
                            const uint16_t padding,
                            const uint16_t stride,
                            const uint16_t dim_im_out,
                            q7_t * bufferA,
                            q7_t * Im_out)
{
    /* Plain int indices: the bounds are uint16_t, so 16-bit signed counters
     * could not represent the upper half of their range. */
    int       i_ch_in, i_x, i_y;
    int       k_x, k_y;

    (void)bufferA;

    for (i_ch_in = 0; i_ch_in < ch_im_in; i_ch_in++)
    {
        for (i_y = 0; i_y < dim_im_out; i_y++)
        {
            /* First window row; negative while inside the top padding. */
            const int y_start = i_y * stride - padding;

            for (i_x = 0; i_x < dim_im_out; i_x++)
            {
                /* First window column; negative while inside the left padding. */
                const int x_start = i_x * stride - padding;
                int       sum = 0;
                int       count = 0;

                for (k_y = y_start; k_y < y_start + dim_kernel; k_y++)
                {
                    for (k_x = x_start; k_x < x_start + dim_kernel; k_x++)
                    {
                        /* Only samples that lie inside the input contribute. */
                        if (k_y >= 0 && k_x >= 0 && k_y < dim_im_in && k_x < dim_im_in)
                        {
                            sum += Im_in[i_ch_in + ch_im_in * (k_x + k_y * dim_im_in)];
                            count++;
                        }
                    }
                }

                /* count is 0 when the whole window sits in the padding area;
                 * dividing then would be undefined behaviour. */
                Im_out[i_ch_in + ch_im_in * (i_x + i_y * dim_im_out)] =
                    (count > 0) ? (q7_t)(sum / count) : (q7_t)0;
            }
        }
    }
}
|
|
/**
 * Reference (non-optimized) max pooling for q7 data in HWC layout.
 *
 * For each channel and each output position (i_x, i_y), a square window of
 * dim_kernel x dim_kernel samples is placed with its top-left corner at
 * (i_x * stride - padding, i_y * stride - padding). Window positions that
 * fall outside the dim_im_in x dim_im_in input are skipped; the output is
 * the largest in-bounds sample.
 *
 * A window with no in-bounds sample at all produces -128, the smallest q7
 * value, rather than an out-of-range sentinel narrowed into q7_t.
 *
 * @param Im_in       input image, indexed as channel + ch_im_in * (x + y * dim_im_in)
 * @param dim_im_in   input image width and height
 * @param ch_im_in    number of channels (shared by input and output)
 * @param dim_kernel  pooling window width and height
 * @param padding     offset subtracted from the window origin in both x and y
 * @param stride      step between consecutive windows in both x and y
 * @param dim_im_out  output image width and height
 * @param bufferA     not used by this reference implementation
 * @param Im_out      output image, indexed as channel + ch_im_in * (x + y * dim_im_out)
 */
void arm_maxpool_q7_HWC_ref(const q7_t * Im_in,
                            const uint16_t dim_im_in,
                            const uint16_t ch_im_in,
                            const uint16_t dim_kernel,
                            const uint16_t padding,
                            const uint16_t stride,
                            const uint16_t dim_im_out,
                            q7_t * bufferA,
                            q7_t * Im_out)
{
    /* Plain int indices: the bounds are uint16_t, so 16-bit signed counters
     * could not represent the upper half of their range. */
    int       i_ch_in, i_x, i_y;
    int       k_x, k_y;

    (void)bufferA;

    for (i_ch_in = 0; i_ch_in < ch_im_in; i_ch_in++)
    {
        for (i_y = 0; i_y < dim_im_out; i_y++)
        {
            /* First window row; negative while inside the top padding. */
            const int y_start = i_y * stride - padding;

            for (i_x = 0; i_x < dim_im_out; i_x++)
            {
                /* First window column; negative while inside the left padding. */
                const int x_start = i_x * stride - padding;

                /* Start from the smallest q7 value (q7_t is an 8-bit signed
                 * type in CMSIS): every sample is >= it, so the result is
                 * unchanged for non-empty windows and stays representable
                 * when the window is empty. */
                int       max = -128;

                for (k_y = y_start; k_y < y_start + dim_kernel; k_y++)
                {
                    for (k_x = x_start; k_x < x_start + dim_kernel; k_x++)
                    {
                        /* Only samples that lie inside the input are compared. */
                        if (k_y >= 0 && k_x >= 0 && k_y < dim_im_in && k_x < dim_im_in)
                        {
                            const int sample = Im_in[i_ch_in + ch_im_in * (k_x + k_y * dim_im_in)];

                            if (sample > max)
                            {
                                max = sample;
                            }
                        }
                    }
                }

                Im_out[i_ch_in + ch_im_in * (i_x + i_y * dim_im_out)] = (q7_t)max;
            }
        }
    }
}
|