/* ----------------------------------------------------------------------
|
* Copyright (C) 2010-2012 ARM Limited. All rights reserved.
|
*
|
* $Date: 17. January 2013
|
* $Revision: V1.4.0
|
*
|
* Project: CMSIS DSP Library
|
* Title: arm_dotproduct_example_f32.c
|
*
|
* Description: Example code computing dot product of two vectors.
|
*
|
* Target Processor: Cortex-M4/Cortex-M3
|
*
|
* Redistribution and use in source and binary forms, with or without
|
* modification, are permitted provided that the following conditions
|
* are met:
|
* - Redistributions of source code must retain the above copyright
|
* notice, this list of conditions and the following disclaimer.
|
* - Redistributions in binary form must reproduce the above copyright
|
* notice, this list of conditions and the following disclaimer in
|
* the documentation and/or other materials provided with the
|
* distribution.
|
* - Neither the name of ARM LIMITED nor the names of its contributors
|
* may be used to endorse or promote products derived from this
|
* software without specific prior written permission.
|
*
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
|
* FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
|
* COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
|
* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
|
* BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
|
* LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
* CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
|
* LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
|
* ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
* POSSIBILITY OF SUCH DAMAGE.
|
* -------------------------------------------------------------------- */
|
|
/**
|
* @ingroup groupExamples
|
*/
|
|
/**
|
* @defgroup DotproductExample Dot Product Example
|
*
|
* \par Description:
|
* \par
|
* Demonstrates the use of the Multiply and Add functions to perform the dot product.
|
* The dot product of two vectors is obtained by multiplying corresponding elements
|
* and summing the products.
|
|
* \par Algorithm:
|
* \par
|
* The two input vectors \c A and \c B with length \c n, are multiplied element-by-element
|
* and then added to obtain dot product.
|
* \par
|
* This is denoted by the following equation:
|
* <pre> dotProduct = A[0] * B[0] + A[1] * B[1] + ... + A[n-1] * B[n-1]</pre>
|
*
|
* \par Block Diagram:
|
* \par
|
* \image html dotProduct.gif
|
*
|
* \par Variables Description:
|
* \par
|
* \li \c srcA_buf_f32 points to first input vector
|
* \li \c srcB_buf_f32 points to second input vector
|
* \li \c testOutput stores dot product of the two input vectors.
|
*
|
* \par CMSIS DSP Software Library Functions Used:
|
* \par
|
* - arm_mult_f32()
|
* - arm_add_f32()
|
*
|
* <b> Refer </b>
|
* \link arm_dotproduct_example_f32.c \endlink
|
*
|
*/
|
|
|
/** \example arm_dotproduct_example_f32.c
|
*/
|
|
#include <math.h>
|
#include "arm_math.h"
|
|
/* ----------------------------------------------------------------------
|
* Defines each of the tests performed
|
* ------------------------------------------------------------------- */
|
#define MAX_BLOCKSIZE 32
|
#define DELTA (0.000001f)
|
|
/* ----------------------------------------------------------------------
|
* Test input data for Floating point Dot Product example for 32-blockSize
|
* Generated by the MATLAB randn() function
|
* ------------------------------------------------------------------- */
|
/* ----------------------------------------------------------------------
|
** Test input data of srcA for blockSize 32
|
** ------------------------------------------------------------------- */
|
float32_t srcA_buf_f32[MAX_BLOCKSIZE] =
|
{
|
-0.4325648115282207, -1.6655843782380970, 0.1253323064748307,
|
0.2876764203585489, -1.1464713506814637, 1.1909154656429988,
|
1.1891642016521031, -0.0376332765933176, 0.3272923614086541,
|
0.1746391428209245, -0.1867085776814394, 0.7257905482933027,
|
-0.5883165430141887, 2.1831858181971011, -0.1363958830865957,
|
0.1139313135208096, 1.0667682113591888, 0.0592814605236053,
|
-0.0956484054836690, -0.8323494636500225, 0.2944108163926404,
|
-1.3361818579378040, 0.7143245518189522, 1.6235620644462707,
|
-0.6917757017022868, 0.8579966728282626, 1.2540014216025324,
|
-1.5937295764474768, -1.4409644319010200, 0.5711476236581780,
|
-0.3998855777153632, 0.6899973754643451
|
};
|
|
/* ----------------------------------------------------------------------
|
** Test input data of srcB for blockSize 32
|
** ------------------------------------------------------------------- */
|
float32_t srcB_buf_f32[MAX_BLOCKSIZE] =
|
{
|
1.7491401329284098, 0.1325982188803279, 0.3252281811989881,
|
-0.7938091410349637, 0.3149236145048914, -0.5272704888029532,
|
0.9322666565031119, 1.1646643544607362, -2.0456694357357357,
|
-0.6443728590041911, 1.7410657940825480, 0.4867684246821860,
|
1.0488288293660140, 1.4885752747099299, 1.2705014969484090,
|
-1.8561241921210170, 2.1343209047321410, 1.4358467535865909,
|
-0.9173023332875400, -1.1060770780029008, 0.8105708062681296,
|
0.6985430696369063, -0.4015827425012831, 1.2687512030669628,
|
-0.7836083053674872, 0.2132664971465569, 0.7878984786088954,
|
0.8966819356782295, -0.1869172943544062, 1.0131816724341454,
|
0.2484350696132857, 0.0596083377937976
|
};
|
|
/* Reference dot product output */
|
float32_t refDotProdOut = 5.9273644806352142;
|
|
/* ----------------------------------------------------------------------
|
* Declare Global variables
|
* ------------------------------------------------------------------- */
|
float32_t multOutput[MAX_BLOCKSIZE]; /* Intermediate output */
|
float32_t testOutput; /* Final ouput */
|
|
arm_status status; /* Status of the example */
|
|
int32_t main(void)
|
{
|
uint32_t i; /* Loop counter */
|
float32_t diff; /* Difference between reference and test outputs */
|
|
/* Multiplication of two input buffers */
|
arm_mult_f32(srcA_buf_f32, srcB_buf_f32, multOutput, MAX_BLOCKSIZE);
|
|
/* Accumulate the multiplication output values to
|
get the dot product of the two inputs */
|
for(i=0; i< MAX_BLOCKSIZE; i++)
|
{
|
arm_add_f32(&testOutput, &multOutput[i], &testOutput, 1);
|
}
|
|
/* absolute value of difference between ref and test */
|
diff = fabsf(refDotProdOut - testOutput);
|
|
/* Comparison of dot product value with reference */
|
if (diff > DELTA)
|
{
|
status = ARM_MATH_TEST_FAILURE;
|
}
|
|
if ( status == ARM_MATH_TEST_FAILURE)
|
{
|
while (1);
|
}
|
|
while (1); /* main function does not return */
|
}
|
|
/** \endlink */
|