1 /* ----------------------------------------------------------------------
2 * Copyright (C) 2010-2012 ARM Limited. All rights reserved.
3 *
4 * $Date: 17. January 2013
5 * $Revision: V1.4.0
6 *
7 * Project: CMSIS DSP Library
8 * Title: arm_dotproduct_example_f32.c
9 *
10 * Description: Example code computing dot product of two vectors.
11 *
12 * Target Processor: Cortex-M4/Cortex-M3
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions
16 * are met:
17 * - Redistributions of source code must retain the above copyright
18 * notice, this list of conditions and the following disclaimer.
19 * - Redistributions in binary form must reproduce the above copyright
20 * notice, this list of conditions and the following disclaimer in
21 * the documentation and/or other materials provided with the
22 * distribution.
23 * - Neither the name of ARM LIMITED nor the names of its contributors
24 * may be used to endorse or promote products derived from this
25 * software without specific prior written permission.
26 *
27 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
28 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
29 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
30 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
31 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
32 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
33 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
34 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
35 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
36 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
37 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
38 * POSSIBILITY OF SUCH DAMAGE.
39 * -------------------------------------------------------------------- */
40
41 /**
42 * @addtogroup groupExamples
43 * @{
44 *
45 * @defgroup DotproductExample Dot Product Example
46 *
47 * \par Description:
48 * \par
49 * Demonstrates the use of the Multiply and Add functions to perform the dot product.
50 * The dot product of two vectors is obtained by multiplying corresponding elements
51 * and summing the products.
52
53 * \par Algorithm:
54 * \par
55 * The two input vectors \c A and \c B with length \c n, are multiplied element-by-element
56 * and then added to obtain dot product.
57 * \par
58 * This is denoted by the following equation:
59 * <pre> dotProduct = A[0] * B[0] + A[1] * B[1] + ... + A[n-1] * B[n-1]</pre>
60 *
61 * \par Block Diagram:
62 * \par
63 * \image html dotProduct.gif
64 *
65 * \par Variables Description:
66 * \par
67 * \li \c srcA_buf_f32 points to first input vector
68 * \li \c srcB_buf_f32 points to second input vector
69 * \li \c testOutput stores dot product of the two input vectors.
70 *
71 * \par CMSIS DSP Software Library Functions Used:
72 * \par
73 * - arm_mult_f32()
74 * - arm_add_f32()
75 *
76 * <b> Refer </b>
77 * \link arm_dotproduct_example_f32.c \endlink
78 *
79 * \example arm_dotproduct_example_f32.c
80 *
81 * @} */
82
83 #include <math.h>
84 #include "arm_math.h"
85
86 #if defined(SEMIHOSTING)
87 #include <stdio.h>
88 #endif
89
90 /* ----------------------------------------------------------------------
91 * Defines each of the tests performed
92 * ------------------------------------------------------------------- */
93 #define MAX_BLOCKSIZE 32
94 #define DELTA (0.000001f)
95
96 /* ----------------------------------------------------------------------
97 * Test input data for Floating point Dot Product example for 32-blockSize
98 * Generated by the MATLAB randn() function
99 * ------------------------------------------------------------------- */
100 /* ----------------------------------------------------------------------
101 ** Test input data of srcA for blockSize 32
102 ** ------------------------------------------------------------------- */
103 float32_t srcA_buf_f32[MAX_BLOCKSIZE] =
104 {
105 -0.4325648115282207, -1.6655843782380970, 0.1253323064748307,
106 0.2876764203585489, -1.1464713506814637, 1.1909154656429988,
107 1.1891642016521031, -0.0376332765933176, 0.3272923614086541,
108 0.1746391428209245, -0.1867085776814394, 0.7257905482933027,
109 -0.5883165430141887, 2.1831858181971011, -0.1363958830865957,
110 0.1139313135208096, 1.0667682113591888, 0.0592814605236053,
111 -0.0956484054836690, -0.8323494636500225, 0.2944108163926404,
112 -1.3361818579378040, 0.7143245518189522, 1.6235620644462707,
113 -0.6917757017022868, 0.8579966728282626, 1.2540014216025324,
114 -1.5937295764474768, -1.4409644319010200, 0.5711476236581780,
115 -0.3998855777153632, 0.6899973754643451
116 };
117
118 /* ----------------------------------------------------------------------
119 ** Test input data of srcB for blockSize 32
120 ** ------------------------------------------------------------------- */
121 float32_t srcB_buf_f32[MAX_BLOCKSIZE] =
122 {
123 1.7491401329284098, 0.1325982188803279, 0.3252281811989881,
124 -0.7938091410349637, 0.3149236145048914, -0.5272704888029532,
125 0.9322666565031119, 1.1646643544607362, -2.0456694357357357,
126 -0.6443728590041911, 1.7410657940825480, 0.4867684246821860,
127 1.0488288293660140, 1.4885752747099299, 1.2705014969484090,
128 -1.8561241921210170, 2.1343209047321410, 1.4358467535865909,
129 -0.9173023332875400, -1.1060770780029008, 0.8105708062681296,
130 0.6985430696369063, -0.4015827425012831, 1.2687512030669628,
131 -0.7836083053674872, 0.2132664971465569, 0.7878984786088954,
132 0.8966819356782295, -0.1869172943544062, 1.0131816724341454,
133 0.2484350696132857, 0.0596083377937976
134 };
135
136 /* Reference dot product output */
137 float32_t refDotProdOut = 5.9273644806352142;
138
139 /* ----------------------------------------------------------------------
140 * Declare Global variables
141 * ------------------------------------------------------------------- */
142 float32_t multOutput[MAX_BLOCKSIZE]; /* Intermediate output */
143 float32_t testOutput; /* Final ouput */
144
145 arm_status status; /* Status of the example */
146
main(void)147 int32_t main(void)
148 {
149 uint32_t i; /* Loop counter */
150 float32_t diff; /* Difference between reference and test outputs */
151
152 /* Multiplication of two input buffers */
153 arm_mult_f32(srcA_buf_f32, srcB_buf_f32, multOutput, MAX_BLOCKSIZE);
154
155 /* Accumulate the multiplication output values to
156 get the dot product of the two inputs */
157 for(i=0; i< MAX_BLOCKSIZE; i++)
158 {
159 arm_add_f32(&testOutput, &multOutput[i], &testOutput, 1);
160 }
161
162 /* absolute value of difference between ref and test */
163 diff = fabsf(refDotProdOut - testOutput);
164
165 /* Comparison of dot product value with reference */
166 status = (diff > DELTA) ? ARM_MATH_TEST_FAILURE : ARM_MATH_SUCCESS;
167
168 if (status != ARM_MATH_SUCCESS)
169 {
170 #if defined (SEMIHOSTING)
171 printf("FAILURE\n");
172 #else
173 while (1); /* main function does not return */
174 #endif
175 }
176 else
177 {
178 #if defined (SEMIHOSTING)
179 printf("SUCCESS\n");
180 #else
181 while (1); /* main function does not return */
182 #endif
183 }
184 }
185
186 /** \endlink */
187