comparison Common/Drivers/CMSIS/Include/arm_math.h @ 128:c78bcbd5deda FlipDisplay

Added current STM32 standandard libraries in version independend folder structure
author Ideenmodellierer
date Sun, 17 Feb 2019 21:12:22 +0100
parents
children
comparison
equal deleted inserted replaced
127:1369f8660eaa 128:c78bcbd5deda
1 /* ----------------------------------------------------------------------
2 * Copyright (C) 2010-2015 ARM Limited. All rights reserved.
3 *
4 * $Date: 20. October 2015
5 * $Revision: V1.4.5 b
6 *
7 * Project: CMSIS DSP Library
8 * Title: arm_math.h
9 *
10 * Description: Public header file for CMSIS DSP Library
11 *
12 * Target Processor: Cortex-M7/Cortex-M4/Cortex-M3/Cortex-M0
13 *
14 * Redistribution and use in source and binary forms, with or without
15 * modification, are permitted provided that the following conditions
16 * are met:
17 * - Redistributions of source code must retain the above copyright
18 * notice, this list of conditions and the following disclaimer.
19 * - Redistributions in binary form must reproduce the above copyright
20 * notice, this list of conditions and the following disclaimer in
21 * the documentation and/or other materials provided with the
22 * distribution.
23 * - Neither the name of ARM LIMITED nor the names of its contributors
24 * may be used to endorse or promote products derived from this
25 * software without specific prior written permission.
26 *
27 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
28 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
29 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
30 * FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
31 * COPYRIGHT OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
32 * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
33 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
34 * LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
35 * CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
36 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
37 * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
38 * POSSIBILITY OF SUCH DAMAGE.
39 * -------------------------------------------------------------------- */
40
41 /**
42 \mainpage CMSIS DSP Software Library
43 *
44 * Introduction
45 * ------------
46 *
47 * This user manual describes the CMSIS DSP software library,
48 * a suite of common signal processing functions for use on Cortex-M processor based devices.
49 *
50 * The library is divided into a number of functions each covering a specific category:
51 * - Basic math functions
52 * - Fast math functions
53 * - Complex math functions
54 * - Filters
55 * - Matrix functions
56 * - Transforms
57 * - Motor control functions
58 * - Statistical functions
59 * - Support functions
60 * - Interpolation functions
61 *
62 * The library has separate functions for operating on 8-bit integers, 16-bit integers,
63 * 32-bit integer and 32-bit floating-point values.
64 *
65 * Using the Library
66 * ------------
67 *
68 * The library installer contains prebuilt versions of the libraries in the <code>Lib</code> folder.
69 * - arm_cortexM7lfdp_math.lib (Little endian and Double Precision Floating Point Unit on Cortex-M7)
70 * - arm_cortexM7bfdp_math.lib (Big endian and Double Precision Floating Point Unit on Cortex-M7)
71 * - arm_cortexM7lfsp_math.lib (Little endian and Single Precision Floating Point Unit on Cortex-M7)
72 * - arm_cortexM7bfsp_math.lib (Big endian and Single Precision Floating Point Unit on Cortex-M7)
73 * - arm_cortexM7l_math.lib (Little endian on Cortex-M7)
74 * - arm_cortexM7b_math.lib (Big endian on Cortex-M7)
75 * - arm_cortexM4lf_math.lib (Little endian and Floating Point Unit on Cortex-M4)
76 * - arm_cortexM4bf_math.lib (Big endian and Floating Point Unit on Cortex-M4)
77 * - arm_cortexM4l_math.lib (Little endian on Cortex-M4)
78 * - arm_cortexM4b_math.lib (Big endian on Cortex-M4)
79 * - arm_cortexM3l_math.lib (Little endian on Cortex-M3)
80 * - arm_cortexM3b_math.lib (Big endian on Cortex-M3)
81 * - arm_cortexM0l_math.lib (Little endian on Cortex-M0 / CortexM0+)
82 * - arm_cortexM0b_math.lib (Big endian on Cortex-M0 / CortexM0+)
83 *
84 * The library functions are declared in the public file <code>arm_math.h</code> which is placed in the <code>Include</code> folder.
85 * Simply include this file and link the appropriate library in the application and begin calling the library functions. The Library supports single
86 * public header file <code> arm_math.h</code> for Cortex-M7/M4/M3/M0/M0+ with little endian and big endian. Same header file will be used for floating point unit(FPU) variants.
87 * Define the appropriate pre processor MACRO ARM_MATH_CM7 or ARM_MATH_CM4 or ARM_MATH_CM3 or
88 * ARM_MATH_CM0 or ARM_MATH_CM0PLUS depending on the target processor in the application.
89 *
90 * Examples
91 * --------
92 *
93 * The library ships with a number of examples which demonstrate how to use the library functions.
94 *
95 * Toolchain Support
96 * ------------
97 *
98 * The library has been developed and tested with MDK-ARM version 5.14.0.0
99 * The library is being tested in GCC and IAR toolchains and updates on this activity will be made available shortly.
100 *
101 * Building the Library
102 * ------------
103 *
104 * The library installer contains a project file to re build libraries on MDK-ARM Tool chain in the <code>CMSIS\\DSP_Lib\\Source\\ARM</code> folder.
105 * - arm_cortexM_math.uvprojx
106 *
107 *
108 * The libraries can be built by opening the arm_cortexM_math.uvprojx project in MDK-ARM, selecting a specific target, and defining the optional pre processor MACROs detailed above.
109 *
110 * Pre-processor Macros
111 * ------------
112 *
113 * Each library project have differant pre-processor macros.
114 *
115 * - UNALIGNED_SUPPORT_DISABLE:
116 *
117 * Define macro UNALIGNED_SUPPORT_DISABLE, If the silicon does not support unaligned memory access
118 *
119 * - ARM_MATH_BIG_ENDIAN:
120 *
121 * Define macro ARM_MATH_BIG_ENDIAN to build the library for big endian targets. By default library builds for little endian targets.
122 *
123 * - ARM_MATH_MATRIX_CHECK:
124 *
125 * Define macro ARM_MATH_MATRIX_CHECK for checking on the input and output sizes of matrices
126 *
127 * - ARM_MATH_ROUNDING:
128 *
129 * Define macro ARM_MATH_ROUNDING for rounding on support functions
130 *
131 * - ARM_MATH_CMx:
132 *
133 * Define macro ARM_MATH_CM4 for building the library on Cortex-M4 target, ARM_MATH_CM3 for building library on Cortex-M3 target
134 * and ARM_MATH_CM0 for building library on Cortex-M0 target, ARM_MATH_CM0PLUS for building library on Cortex-M0+ target, and
135 * ARM_MATH_CM7 for building the library on cortex-M7.
136 *
137 * - __FPU_PRESENT:
138 *
139 * Initialize macro __FPU_PRESENT = 1 when building on FPU supported Targets. Enable this macro for M4bf and M4lf libraries
140 *
141 * <hr>
142 * CMSIS-DSP in ARM::CMSIS Pack
143 * -----------------------------
144 *
145 * The following files relevant to CMSIS-DSP are present in the <b>ARM::CMSIS</b> Pack directories:
146 * |File/Folder |Content |
147 * |------------------------------|------------------------------------------------------------------------|
148 * |\b CMSIS\\Documentation\\DSP | This documentation |
149 * |\b CMSIS\\DSP_Lib | Software license agreement (license.txt) |
150 * |\b CMSIS\\DSP_Lib\\Examples | Example projects demonstrating the usage of the library functions |
151 * |\b CMSIS\\DSP_Lib\\Source | Source files for rebuilding the library |
152 *
153 * <hr>
154 * Revision History of CMSIS-DSP
155 * ------------
156 * Please refer to \ref ChangeLog_pg.
157 *
158 * Copyright Notice
159 * ------------
160 *
161 * Copyright (C) 2010-2015 ARM Limited. All rights reserved.
162 */
163
164
165 /**
166 * @defgroup groupMath Basic Math Functions
167 */
168
169 /**
170 * @defgroup groupFastMath Fast Math Functions
171 * This set of functions provides a fast approximation to sine, cosine, and square root.
172 * As compared to most of the other functions in the CMSIS math library, the fast math functions
173 * operate on individual values and not arrays.
174 * There are separate functions for Q15, Q31, and floating-point data.
175 *
176 */
177
178 /**
179 * @defgroup groupCmplxMath Complex Math Functions
180 * This set of functions operates on complex data vectors.
181 * The data in the complex arrays is stored in an interleaved fashion
182 * (real, imag, real, imag, ...).
183 * In the API functions, the number of samples in a complex array refers
184 * to the number of complex values; the array contains twice this number of
185 * real values.
186 */
187
188 /**
189 * @defgroup groupFilters Filtering Functions
190 */
191
192 /**
193 * @defgroup groupMatrix Matrix Functions
194 *
195 * This set of functions provides basic matrix math operations.
196 * The functions operate on matrix data structures. For example,
197 * the type
198 * definition for the floating-point matrix structure is shown
199 * below:
200 * <pre>
201 * typedef struct
202 * {
203 * uint16_t numRows; // number of rows of the matrix.
204 * uint16_t numCols; // number of columns of the matrix.
205 * float32_t *pData; // points to the data of the matrix.
206 * } arm_matrix_instance_f32;
207 * </pre>
208 * There are similar definitions for Q15 and Q31 data types.
209 *
210 * The structure specifies the size of the matrix and then points to
211 * an array of data. The array is of size <code>numRows X numCols</code>
212 * and the values are arranged in row order. That is, the
213 * matrix element (i, j) is stored at:
214 * <pre>
215 * pData[i*numCols + j]
216 * </pre>
217 *
218 * \par Init Functions
219 * There is an associated initialization function for each type of matrix
220 * data structure.
221 * The initialization function sets the values of the internal structure fields.
222 * Refer to the function <code>arm_mat_init_f32()</code>, <code>arm_mat_init_q31()</code>
223 * and <code>arm_mat_init_q15()</code> for floating-point, Q31 and Q15 types, respectively.
224 *
225 * \par
226 * Use of the initialization function is optional. However, if initialization function is used
227 * then the instance structure cannot be placed into a const data section.
228 * To place the instance structure in a const data
229 * section, manually initialize the data structure. For example:
230 * <pre>
231 * <code>arm_matrix_instance_f32 S = {nRows, nColumns, pData};</code>
232 * <code>arm_matrix_instance_q31 S = {nRows, nColumns, pData};</code>
233 * <code>arm_matrix_instance_q15 S = {nRows, nColumns, pData};</code>
234 * </pre>
235 * where <code>nRows</code> specifies the number of rows, <code>nColumns</code>
236 * specifies the number of columns, and <code>pData</code> points to the
237 * data array.
238 *
239 * \par Size Checking
240 * By default all of the matrix functions perform size checking on the input and
241 * output matrices. For example, the matrix addition function verifies that the
242 * two input matrices and the output matrix all have the same number of rows and
243 * columns. If the size check fails the functions return:
244 * <pre>
245 * ARM_MATH_SIZE_MISMATCH
246 * </pre>
247 * Otherwise the functions return
248 * <pre>
249 * ARM_MATH_SUCCESS
250 * </pre>
251 * There is some overhead associated with this matrix size checking.
252 * The matrix size checking is enabled via the \#define
253 * <pre>
254 * ARM_MATH_MATRIX_CHECK
255 * </pre>
256 * within the library project settings. By default this macro is defined
257 * and size checking is enabled. By changing the project settings and
258 * undefining this macro size checking is eliminated and the functions
259 * run a bit faster. With size checking disabled the functions always
260 * return <code>ARM_MATH_SUCCESS</code>.
261 */
262
263 /**
264 * @defgroup groupTransforms Transform Functions
265 */
266
267 /**
268 * @defgroup groupController Controller Functions
269 */
270
271 /**
272 * @defgroup groupStats Statistics Functions
273 */
274 /**
275 * @defgroup groupSupport Support Functions
276 */
277
278 /**
279 * @defgroup groupInterpolation Interpolation Functions
280 * These functions perform 1- and 2-dimensional interpolation of data.
281 * Linear interpolation is used for 1-dimensional data and
282 * bilinear interpolation is used for 2-dimensional data.
283 */
284
285 /**
286 * @defgroup groupExamples Examples
287 */
288 #ifndef _ARM_MATH_H
289 #define _ARM_MATH_H
290
291 /* ignore some GCC warnings */
292 #if defined ( __GNUC__ )
293 #pragma GCC diagnostic push
294 #pragma GCC diagnostic ignored "-Wsign-conversion"
295 #pragma GCC diagnostic ignored "-Wconversion"
296 #pragma GCC diagnostic ignored "-Wunused-parameter"
297 #endif
298
299 #define __CMSIS_GENERIC /* disable NVIC and Systick functions */
300
301 #if defined(ARM_MATH_CM7)
302 #include "core_cm7.h"
303 #elif defined (ARM_MATH_CM4)
304 #include "core_cm4.h"
305 #elif defined (ARM_MATH_CM3)
306 #include "core_cm3.h"
307 #elif defined (ARM_MATH_CM0)
308 #include "core_cm0.h"
309 #define ARM_MATH_CM0_FAMILY
310 #elif defined (ARM_MATH_CM0PLUS)
311 #include "core_cm0plus.h"
312 #define ARM_MATH_CM0_FAMILY
313 #else
314 #error "Define according the used Cortex core ARM_MATH_CM7, ARM_MATH_CM4, ARM_MATH_CM3, ARM_MATH_CM0PLUS or ARM_MATH_CM0"
315 #endif
316
317 #undef __CMSIS_GENERIC /* enable NVIC and Systick functions */
318 #include "string.h"
319 #include "math.h"
320 #ifdef __cplusplus
321 extern "C"
322 {
323 #endif
324
325
326 /**
327 * @brief Macros required for reciprocal calculation in Normalized LMS
328 */
329
330 #define DELTA_Q31 (0x100)
331 #define DELTA_Q15 0x5
332 #define INDEX_MASK 0x0000003F
333 #ifndef PI
334 #define PI 3.14159265358979f
335 #endif
336
337 /**
338 * @brief Macros required for SINE and COSINE Fast math approximations
339 */
340
341 #define FAST_MATH_TABLE_SIZE 512
342 #define FAST_MATH_Q31_SHIFT (32 - 10)
343 #define FAST_MATH_Q15_SHIFT (16 - 10)
344 #define CONTROLLER_Q31_SHIFT (32 - 9)
345 #define TABLE_SIZE 256
346 #define TABLE_SPACING_Q31 0x400000
347 #define TABLE_SPACING_Q15 0x80
348
349 /**
350 * @brief Macros required for SINE and COSINE Controller functions
351 */
352 /* 1.31(q31) Fixed value of 2/360 */
353 /* -1 to +1 is divided into 360 values so total spacing is (2/360) */
354 #define INPUT_SPACING 0xB60B61
355
356 /**
357 * @brief Macro for Unaligned Support
358 */
359 #ifndef UNALIGNED_SUPPORT_DISABLE
360 #define ALIGN4
361 #else
362 #if defined (__GNUC__)
363 #define ALIGN4 __attribute__((aligned(4)))
364 #else
365 #define ALIGN4 __align(4)
366 #endif
367 #endif /* #ifndef UNALIGNED_SUPPORT_DISABLE */
368
369 /**
370 * @brief Error status returned by some functions in the library.
371 */
372
373 typedef enum
374 {
375 ARM_MATH_SUCCESS = 0, /**< No error */
376 ARM_MATH_ARGUMENT_ERROR = -1, /**< One or more arguments are incorrect */
377 ARM_MATH_LENGTH_ERROR = -2, /**< Length of data buffer is incorrect */
378 ARM_MATH_SIZE_MISMATCH = -3, /**< Size of matrices is not compatible with the operation. */
379 ARM_MATH_NANINF = -4, /**< Not-a-number (NaN) or infinity is generated */
380 ARM_MATH_SINGULAR = -5, /**< Generated by matrix inversion if the input matrix is singular and cannot be inverted. */
381 ARM_MATH_TEST_FAILURE = -6 /**< Test Failed */
382 } arm_status;
383
384 /**
385 * @brief 8-bit fractional data type in 1.7 format.
386 */
387 typedef int8_t q7_t;
388
389 /**
390 * @brief 16-bit fractional data type in 1.15 format.
391 */
392 typedef int16_t q15_t;
393
394 /**
395 * @brief 32-bit fractional data type in 1.31 format.
396 */
397 typedef int32_t q31_t;
398
399 /**
400 * @brief 64-bit fractional data type in 1.63 format.
401 */
402 typedef int64_t q63_t;
403
404 /**
405 * @brief 32-bit floating-point type definition.
406 */
407 typedef float float32_t;
408
409 /**
410 * @brief 64-bit floating-point type definition.
411 */
412 typedef double float64_t;
413
414 /**
415 * @brief definition to read/write two 16 bit values.
416 */
417 #if defined __CC_ARM
418 #define __SIMD32_TYPE int32_t __packed
419 #define CMSIS_UNUSED __attribute__((unused))
420
421 #elif defined(__ARMCC_VERSION) && (__ARMCC_VERSION >= 6010050)
422 #define __SIMD32_TYPE int32_t
423 #define CMSIS_UNUSED __attribute__((unused))
424
425 #elif defined __GNUC__
426 #define __SIMD32_TYPE int32_t
427 #define CMSIS_UNUSED __attribute__((unused))
428
429 #elif defined __ICCARM__
430 #define __SIMD32_TYPE int32_t __packed
431 #define CMSIS_UNUSED
432
433 #elif defined __CSMC__
434 #define __SIMD32_TYPE int32_t
435 #define CMSIS_UNUSED
436
437 #elif defined __TASKING__
438 #define __SIMD32_TYPE __unaligned int32_t
439 #define CMSIS_UNUSED
440
441 #else
442 #error Unknown compiler
443 #endif
444
445 #define __SIMD32(addr) (*(__SIMD32_TYPE **) & (addr))
446 #define __SIMD32_CONST(addr) ((__SIMD32_TYPE *)(addr))
447 #define _SIMD32_OFFSET(addr) (*(__SIMD32_TYPE *) (addr))
448 #define __SIMD64(addr) (*(int64_t **) & (addr))
449
450 #if defined (ARM_MATH_CM3) || defined (ARM_MATH_CM0_FAMILY)
451 /**
452 * @brief definition to pack two 16 bit values.
453 */
454 #define __PKHBT(ARG1, ARG2, ARG3) ( (((int32_t)(ARG1) << 0) & (int32_t)0x0000FFFF) | \
455 (((int32_t)(ARG2) << ARG3) & (int32_t)0xFFFF0000) )
456 #define __PKHTB(ARG1, ARG2, ARG3) ( (((int32_t)(ARG1) << 0) & (int32_t)0xFFFF0000) | \
457 (((int32_t)(ARG2) >> ARG3) & (int32_t)0x0000FFFF) )
458
459 #endif
460
461
462 /**
463 * @brief definition to pack four 8 bit values.
464 */
465 #ifndef ARM_MATH_BIG_ENDIAN
466
467 #define __PACKq7(v0,v1,v2,v3) ( (((int32_t)(v0) << 0) & (int32_t)0x000000FF) | \
468 (((int32_t)(v1) << 8) & (int32_t)0x0000FF00) | \
469 (((int32_t)(v2) << 16) & (int32_t)0x00FF0000) | \
470 (((int32_t)(v3) << 24) & (int32_t)0xFF000000) )
471 #else
472
473 #define __PACKq7(v0,v1,v2,v3) ( (((int32_t)(v3) << 0) & (int32_t)0x000000FF) | \
474 (((int32_t)(v2) << 8) & (int32_t)0x0000FF00) | \
475 (((int32_t)(v1) << 16) & (int32_t)0x00FF0000) | \
476 (((int32_t)(v0) << 24) & (int32_t)0xFF000000) )
477
478 #endif
479
480
481 /**
482 * @brief Clips Q63 to Q31 values.
483 */
484 static __INLINE q31_t clip_q63_to_q31(
485 q63_t x)
486 {
487 return ((q31_t) (x >> 32) != ((q31_t) x >> 31)) ?
488 ((0x7FFFFFFF ^ ((q31_t) (x >> 63)))) : (q31_t) x;
489 }
490
491 /**
492 * @brief Clips Q63 to Q15 values.
493 */
494 static __INLINE q15_t clip_q63_to_q15(
495 q63_t x)
496 {
497 return ((q31_t) (x >> 32) != ((q31_t) x >> 31)) ?
498 ((0x7FFF ^ ((q15_t) (x >> 63)))) : (q15_t) (x >> 15);
499 }
500
501 /**
502 * @brief Clips Q31 to Q7 values.
503 */
504 static __INLINE q7_t clip_q31_to_q7(
505 q31_t x)
506 {
507 return ((q31_t) (x >> 24) != ((q31_t) x >> 23)) ?
508 ((0x7F ^ ((q7_t) (x >> 31)))) : (q7_t) x;
509 }
510
511 /**
512 * @brief Clips Q31 to Q15 values.
513 */
514 static __INLINE q15_t clip_q31_to_q15(
515 q31_t x)
516 {
517 return ((q31_t) (x >> 16) != ((q31_t) x >> 15)) ?
518 ((0x7FFF ^ ((q15_t) (x >> 31)))) : (q15_t) x;
519 }
520
521 /**
522 * @brief Multiplies 32 X 64 and returns 32 bit result in 2.30 format.
523 */
524
525 static __INLINE q63_t mult32x64(
526 q63_t x,
527 q31_t y)
528 {
529 return ((((q63_t) (x & 0x00000000FFFFFFFF) * y) >> 32) +
530 (((q63_t) (x >> 32) * y)));
531 }
532
533 /*
534 #if defined (ARM_MATH_CM0_FAMILY) && defined ( __CC_ARM )
535 #define __CLZ __clz
536 #endif
537 */
538 /* note: function can be removed when all toolchain support __CLZ for Cortex-M0 */
539 #if defined (ARM_MATH_CM0_FAMILY) && ((defined (__ICCARM__)) )
540 static __INLINE uint32_t __CLZ(
541 q31_t data);
542
543 static __INLINE uint32_t __CLZ(
544 q31_t data)
545 {
546 uint32_t count = 0;
547 uint32_t mask = 0x80000000;
548
549 while((data & mask) == 0)
550 {
551 count += 1u;
552 mask = mask >> 1u;
553 }
554
555 return (count);
556 }
557 #endif
558
559 /**
560 * @brief Function to Calculates 1/in (reciprocal) value of Q31 Data type.
561 */
562
563 static __INLINE uint32_t arm_recip_q31(
564 q31_t in,
565 q31_t * dst,
566 q31_t * pRecipTable)
567 {
568 q31_t out;
569 uint32_t tempVal;
570 uint32_t index, i;
571 uint32_t signBits;
572
573 if(in > 0)
574 {
575 signBits = ((uint32_t) (__CLZ( in) - 1));
576 }
577 else
578 {
579 signBits = ((uint32_t) (__CLZ(-in) - 1));
580 }
581
582 /* Convert input sample to 1.31 format */
583 in = (in << signBits);
584
585 /* calculation of index for initial approximated Val */
586 index = (uint32_t)(in >> 24);
587 index = (index & INDEX_MASK);
588
589 /* 1.31 with exp 1 */
590 out = pRecipTable[index];
591
592 /* calculation of reciprocal value */
593 /* running approximation for two iterations */
594 for (i = 0u; i < 2u; i++)
595 {
596 tempVal = (uint32_t) (((q63_t) in * out) >> 31);
597 tempVal = 0x7FFFFFFFu - tempVal;
598 /* 1.31 with exp 1 */
599 /* out = (q31_t) (((q63_t) out * tempVal) >> 30); */
600 out = clip_q63_to_q31(((q63_t) out * tempVal) >> 30);
601 }
602
603 /* write output */
604 *dst = out;
605
606 /* return num of signbits of out = 1/in value */
607 return (signBits + 1u);
608 }
609
610
611 /**
612 * @brief Function to Calculates 1/in (reciprocal) value of Q15 Data type.
613 */
614 static __INLINE uint32_t arm_recip_q15(
615 q15_t in,
616 q15_t * dst,
617 q15_t * pRecipTable)
618 {
619 q15_t out = 0;
620 uint32_t tempVal = 0;
621 uint32_t index = 0, i = 0;
622 uint32_t signBits = 0;
623
624 if(in > 0)
625 {
626 signBits = ((uint32_t)(__CLZ( in) - 17));
627 }
628 else
629 {
630 signBits = ((uint32_t)(__CLZ(-in) - 17));
631 }
632
633 /* Convert input sample to 1.15 format */
634 in = (in << signBits);
635
636 /* calculation of index for initial approximated Val */
637 index = (uint32_t)(in >> 8);
638 index = (index & INDEX_MASK);
639
640 /* 1.15 with exp 1 */
641 out = pRecipTable[index];
642
643 /* calculation of reciprocal value */
644 /* running approximation for two iterations */
645 for (i = 0u; i < 2u; i++)
646 {
647 tempVal = (uint32_t) (((q31_t) in * out) >> 15);
648 tempVal = 0x7FFFu - tempVal;
649 /* 1.15 with exp 1 */
650 out = (q15_t) (((q31_t) out * tempVal) >> 14);
651 /* out = clip_q31_to_q15(((q31_t) out * tempVal) >> 14); */
652 }
653
654 /* write output */
655 *dst = out;
656
657 /* return num of signbits of out = 1/in value */
658 return (signBits + 1);
659 }
660
661
662 /*
663 * @brief C custom defined intrinisic function for only M0 processors
664 */
665 #if defined(ARM_MATH_CM0_FAMILY)
666 static __INLINE q31_t __SSAT(
667 q31_t x,
668 uint32_t y)
669 {
670 int32_t posMax, negMin;
671 uint32_t i;
672
673 posMax = 1;
674 for (i = 0; i < (y - 1); i++)
675 {
676 posMax = posMax * 2;
677 }
678
679 if(x > 0)
680 {
681 posMax = (posMax - 1);
682
683 if(x > posMax)
684 {
685 x = posMax;
686 }
687 }
688 else
689 {
690 negMin = -posMax;
691
692 if(x < negMin)
693 {
694 x = negMin;
695 }
696 }
697 return (x);
698 }
699 #endif /* end of ARM_MATH_CM0_FAMILY */
700
701
702 /*
703 * @brief C custom defined intrinsic function for M3 and M0 processors
704 */
705 #if defined (ARM_MATH_CM3) || defined (ARM_MATH_CM0_FAMILY)
706
707 /*
708 * @brief C custom defined QADD8 for M3 and M0 processors
709 */
710 static __INLINE uint32_t __QADD8(
711 uint32_t x,
712 uint32_t y)
713 {
714 q31_t r, s, t, u;
715
716 r = __SSAT(((((q31_t)x << 24) >> 24) + (((q31_t)y << 24) >> 24)), 8) & (int32_t)0x000000FF;
717 s = __SSAT(((((q31_t)x << 16) >> 24) + (((q31_t)y << 16) >> 24)), 8) & (int32_t)0x000000FF;
718 t = __SSAT(((((q31_t)x << 8) >> 24) + (((q31_t)y << 8) >> 24)), 8) & (int32_t)0x000000FF;
719 u = __SSAT(((((q31_t)x ) >> 24) + (((q31_t)y ) >> 24)), 8) & (int32_t)0x000000FF;
720
721 return ((uint32_t)((u << 24) | (t << 16) | (s << 8) | (r )));
722 }
723
724
725 /*
726 * @brief C custom defined QSUB8 for M3 and M0 processors
727 */
728 static __INLINE uint32_t __QSUB8(
729 uint32_t x,
730 uint32_t y)
731 {
732 q31_t r, s, t, u;
733
734 r = __SSAT(((((q31_t)x << 24) >> 24) - (((q31_t)y << 24) >> 24)), 8) & (int32_t)0x000000FF;
735 s = __SSAT(((((q31_t)x << 16) >> 24) - (((q31_t)y << 16) >> 24)), 8) & (int32_t)0x000000FF;
736 t = __SSAT(((((q31_t)x << 8) >> 24) - (((q31_t)y << 8) >> 24)), 8) & (int32_t)0x000000FF;
737 u = __SSAT(((((q31_t)x ) >> 24) - (((q31_t)y ) >> 24)), 8) & (int32_t)0x000000FF;
738
739 return ((uint32_t)((u << 24) | (t << 16) | (s << 8) | (r )));
740 }
741
742
743 /*
744 * @brief C custom defined QADD16 for M3 and M0 processors
745 */
746 static __INLINE uint32_t __QADD16(
747 uint32_t x,
748 uint32_t y)
749 {
750 /* q31_t r, s; without initialisation 'arm_offset_q15 test' fails but 'intrinsic' tests pass! for armCC */
751 q31_t r = 0, s = 0;
752
753 r = __SSAT(((((q31_t)x << 16) >> 16) + (((q31_t)y << 16) >> 16)), 16) & (int32_t)0x0000FFFF;
754 s = __SSAT(((((q31_t)x ) >> 16) + (((q31_t)y ) >> 16)), 16) & (int32_t)0x0000FFFF;
755
756 return ((uint32_t)((s << 16) | (r )));
757 }
758
759
760 /*
761 * @brief C custom defined SHADD16 for M3 and M0 processors
762 */
763 static __INLINE uint32_t __SHADD16(
764 uint32_t x,
765 uint32_t y)
766 {
767 q31_t r, s;
768
769 r = (((((q31_t)x << 16) >> 16) + (((q31_t)y << 16) >> 16)) >> 1) & (int32_t)0x0000FFFF;
770 s = (((((q31_t)x ) >> 16) + (((q31_t)y ) >> 16)) >> 1) & (int32_t)0x0000FFFF;
771
772 return ((uint32_t)((s << 16) | (r )));
773 }
774
775
776 /*
777 * @brief C custom defined QSUB16 for M3 and M0 processors
778 */
779 static __INLINE uint32_t __QSUB16(
780 uint32_t x,
781 uint32_t y)
782 {
783 q31_t r, s;
784
785 r = __SSAT(((((q31_t)x << 16) >> 16) - (((q31_t)y << 16) >> 16)), 16) & (int32_t)0x0000FFFF;
786 s = __SSAT(((((q31_t)x ) >> 16) - (((q31_t)y ) >> 16)), 16) & (int32_t)0x0000FFFF;
787
788 return ((uint32_t)((s << 16) | (r )));
789 }
790
791
792 /*
793 * @brief C custom defined SHSUB16 for M3 and M0 processors
794 */
795 static __INLINE uint32_t __SHSUB16(
796 uint32_t x,
797 uint32_t y)
798 {
799 q31_t r, s;
800
801 r = (((((q31_t)x << 16) >> 16) - (((q31_t)y << 16) >> 16)) >> 1) & (int32_t)0x0000FFFF;
802 s = (((((q31_t)x ) >> 16) - (((q31_t)y ) >> 16)) >> 1) & (int32_t)0x0000FFFF;
803
804 return ((uint32_t)((s << 16) | (r )));
805 }
806
807
808 /*
809 * @brief C custom defined QASX for M3 and M0 processors
810 */
811 static __INLINE uint32_t __QASX(
812 uint32_t x,
813 uint32_t y)
814 {
815 q31_t r, s;
816
817 r = __SSAT(((((q31_t)x << 16) >> 16) - (((q31_t)y ) >> 16)), 16) & (int32_t)0x0000FFFF;
818 s = __SSAT(((((q31_t)x ) >> 16) + (((q31_t)y << 16) >> 16)), 16) & (int32_t)0x0000FFFF;
819
820 return ((uint32_t)((s << 16) | (r )));
821 }
822
823
824 /*
825 * @brief C custom defined SHASX for M3 and M0 processors
826 */
827 static __INLINE uint32_t __SHASX(
828 uint32_t x,
829 uint32_t y)
830 {
831 q31_t r, s;
832
833 r = (((((q31_t)x << 16) >> 16) - (((q31_t)y ) >> 16)) >> 1) & (int32_t)0x0000FFFF;
834 s = (((((q31_t)x ) >> 16) + (((q31_t)y << 16) >> 16)) >> 1) & (int32_t)0x0000FFFF;
835
836 return ((uint32_t)((s << 16) | (r )));
837 }
838
839
840 /*
841 * @brief C custom defined QSAX for M3 and M0 processors
842 */
843 static __INLINE uint32_t __QSAX(
844 uint32_t x,
845 uint32_t y)
846 {
847 q31_t r, s;
848
849 r = __SSAT(((((q31_t)x << 16) >> 16) + (((q31_t)y ) >> 16)), 16) & (int32_t)0x0000FFFF;
850 s = __SSAT(((((q31_t)x ) >> 16) - (((q31_t)y << 16) >> 16)), 16) & (int32_t)0x0000FFFF;
851
852 return ((uint32_t)((s << 16) | (r )));
853 }
854
855
856 /*
857 * @brief C custom defined SHSAX for M3 and M0 processors
858 */
859 static __INLINE uint32_t __SHSAX(
860 uint32_t x,
861 uint32_t y)
862 {
863 q31_t r, s;
864
865 r = (((((q31_t)x << 16) >> 16) + (((q31_t)y ) >> 16)) >> 1) & (int32_t)0x0000FFFF;
866 s = (((((q31_t)x ) >> 16) - (((q31_t)y << 16) >> 16)) >> 1) & (int32_t)0x0000FFFF;
867
868 return ((uint32_t)((s << 16) | (r )));
869 }
870
871
872 /*
873 * @brief C custom defined SMUSDX for M3 and M0 processors
874 */
875 static __INLINE uint32_t __SMUSDX(
876 uint32_t x,
877 uint32_t y)
878 {
879 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y ) >> 16)) -
880 ((((q31_t)x ) >> 16) * (((q31_t)y << 16) >> 16)) ));
881 }
882
883 /*
884 * @brief C custom defined SMUADX for M3 and M0 processors
885 */
886 static __INLINE uint32_t __SMUADX(
887 uint32_t x,
888 uint32_t y)
889 {
890 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y ) >> 16)) +
891 ((((q31_t)x ) >> 16) * (((q31_t)y << 16) >> 16)) ));
892 }
893
894
895 /*
896 * @brief C custom defined QADD for M3 and M0 processors
897 */
898 static __INLINE int32_t __QADD(
899 int32_t x,
900 int32_t y)
901 {
902 return ((int32_t)(clip_q63_to_q31((q63_t)x + (q31_t)y)));
903 }
904
905
906 /*
907 * @brief C custom defined QSUB for M3 and M0 processors
908 */
909 static __INLINE int32_t __QSUB(
910 int32_t x,
911 int32_t y)
912 {
913 return ((int32_t)(clip_q63_to_q31((q63_t)x - (q31_t)y)));
914 }
915
916
917 /*
918 * @brief C custom defined SMLAD for M3 and M0 processors
919 */
920 static __INLINE uint32_t __SMLAD(
921 uint32_t x,
922 uint32_t y,
923 uint32_t sum)
924 {
925 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y << 16) >> 16)) +
926 ((((q31_t)x ) >> 16) * (((q31_t)y ) >> 16)) +
927 ( ((q31_t)sum ) ) ));
928 }
929
930
931 /*
932 * @brief C custom defined SMLADX for M3 and M0 processors
933 */
934 static __INLINE uint32_t __SMLADX(
935 uint32_t x,
936 uint32_t y,
937 uint32_t sum)
938 {
939 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y ) >> 16)) +
940 ((((q31_t)x ) >> 16) * (((q31_t)y << 16) >> 16)) +
941 ( ((q31_t)sum ) ) ));
942 }
943
944
945 /*
946 * @brief C custom defined SMLSDX for M3 and M0 processors
947 */
948 static __INLINE uint32_t __SMLSDX(
949 uint32_t x,
950 uint32_t y,
951 uint32_t sum)
952 {
953 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y ) >> 16)) -
954 ((((q31_t)x ) >> 16) * (((q31_t)y << 16) >> 16)) +
955 ( ((q31_t)sum ) ) ));
956 }
957
958
959 /*
960 * @brief C custom defined SMLALD for M3 and M0 processors
961 */
962 static __INLINE uint64_t __SMLALD(
963 uint32_t x,
964 uint32_t y,
965 uint64_t sum)
966 {
967 /* return (sum + ((q15_t) (x >> 16) * (q15_t) (y >> 16)) + ((q15_t) x * (q15_t) y)); */
968 return ((uint64_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y << 16) >> 16)) +
969 ((((q31_t)x ) >> 16) * (((q31_t)y ) >> 16)) +
970 ( ((q63_t)sum ) ) ));
971 }
972
973
974 /*
975 * @brief C custom defined SMLALDX for M3 and M0 processors
976 */
977 static __INLINE uint64_t __SMLALDX(
978 uint32_t x,
979 uint32_t y,
980 uint64_t sum)
981 {
982 /* return (sum + ((q15_t) (x >> 16) * (q15_t) y)) + ((q15_t) x * (q15_t) (y >> 16)); */
983 return ((uint64_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y ) >> 16)) +
984 ((((q31_t)x ) >> 16) * (((q31_t)y << 16) >> 16)) +
985 ( ((q63_t)sum ) ) ));
986 }
987
988
989 /*
990 * @brief C custom defined SMUAD for M3 and M0 processors
991 */
992 static __INLINE uint32_t __SMUAD(
993 uint32_t x,
994 uint32_t y)
995 {
996 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y << 16) >> 16)) +
997 ((((q31_t)x ) >> 16) * (((q31_t)y ) >> 16)) ));
998 }
999
1000
1001 /*
1002 * @brief C custom defined SMUSD for M3 and M0 processors
1003 */
1004 static __INLINE uint32_t __SMUSD(
1005 uint32_t x,
1006 uint32_t y)
1007 {
1008 return ((uint32_t)(((((q31_t)x << 16) >> 16) * (((q31_t)y << 16) >> 16)) -
1009 ((((q31_t)x ) >> 16) * (((q31_t)y ) >> 16)) ));
1010 }
1011
1012
1013 /*
1014 * @brief C custom defined SXTB16 for M3 and M0 processors
1015 */
1016 static __INLINE uint32_t __SXTB16(
1017 uint32_t x)
1018 {
1019 return ((uint32_t)(((((q31_t)x << 24) >> 24) & (q31_t)0x0000FFFF) |
1020 ((((q31_t)x << 8) >> 8) & (q31_t)0xFFFF0000) ));
1021 }
1022
1023 #endif /* defined (ARM_MATH_CM3) || defined (ARM_MATH_CM0_FAMILY) */
1024
1025
1026 /**
1027 * @brief Instance structure for the Q7 FIR filter.
1028 */
1029 typedef struct
1030 {
1031 uint16_t numTaps; /**< number of filter coefficients in the filter. */
1032 q7_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
1033 q7_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
1034 } arm_fir_instance_q7;
1035
1036 /**
1037 * @brief Instance structure for the Q15 FIR filter.
1038 */
1039 typedef struct
1040 {
1041 uint16_t numTaps; /**< number of filter coefficients in the filter. */
1042 q15_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
1043 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
1044 } arm_fir_instance_q15;
1045
1046 /**
1047 * @brief Instance structure for the Q31 FIR filter.
1048 */
1049 typedef struct
1050 {
1051 uint16_t numTaps; /**< number of filter coefficients in the filter. */
1052 q31_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
1053 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
1054 } arm_fir_instance_q31;
1055
1056 /**
1057 * @brief Instance structure for the floating-point FIR filter.
1058 */
1059 typedef struct
1060 {
1061 uint16_t numTaps; /**< number of filter coefficients in the filter. */
1062 float32_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
1063 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
1064 } arm_fir_instance_f32;
1065
1066
1067 /**
1068 * @brief Processing function for the Q7 FIR filter.
1069 * @param[in] S points to an instance of the Q7 FIR filter structure.
1070 * @param[in] pSrc points to the block of input data.
1071 * @param[out] pDst points to the block of output data.
1072 * @param[in] blockSize number of samples to process.
1073 */
1074 void arm_fir_q7(
1075 const arm_fir_instance_q7 * S,
1076 q7_t * pSrc,
1077 q7_t * pDst,
1078 uint32_t blockSize);
1079
1080
1081 /**
1082 * @brief Initialization function for the Q7 FIR filter.
1083 * @param[in,out] S points to an instance of the Q7 FIR structure.
1084 * @param[in] numTaps Number of filter coefficients in the filter.
1085 * @param[in] pCoeffs points to the filter coefficients.
1086 * @param[in] pState points to the state buffer.
1087 * @param[in] blockSize number of samples that are processed.
1088 */
1089 void arm_fir_init_q7(
1090 arm_fir_instance_q7 * S,
1091 uint16_t numTaps,
1092 q7_t * pCoeffs,
1093 q7_t * pState,
1094 uint32_t blockSize);
1095
1096
1097 /**
1098 * @brief Processing function for the Q15 FIR filter.
1099 * @param[in] S points to an instance of the Q15 FIR structure.
1100 * @param[in] pSrc points to the block of input data.
1101 * @param[out] pDst points to the block of output data.
1102 * @param[in] blockSize number of samples to process.
1103 */
1104 void arm_fir_q15(
1105 const arm_fir_instance_q15 * S,
1106 q15_t * pSrc,
1107 q15_t * pDst,
1108 uint32_t blockSize);
1109
1110
1111 /**
1112 * @brief Processing function for the fast Q15 FIR filter for Cortex-M3 and Cortex-M4.
1113 * @param[in] S points to an instance of the Q15 FIR filter structure.
1114 * @param[in] pSrc points to the block of input data.
1115 * @param[out] pDst points to the block of output data.
1116 * @param[in] blockSize number of samples to process.
1117 */
1118 void arm_fir_fast_q15(
1119 const arm_fir_instance_q15 * S,
1120 q15_t * pSrc,
1121 q15_t * pDst,
1122 uint32_t blockSize);
1123
1124
1125 /**
1126 * @brief Initialization function for the Q15 FIR filter.
1127 * @param[in,out] S points to an instance of the Q15 FIR filter structure.
1128 * @param[in] numTaps Number of filter coefficients in the filter. Must be even and greater than or equal to 4.
1129 * @param[in] pCoeffs points to the filter coefficients.
1130 * @param[in] pState points to the state buffer.
1131 * @param[in] blockSize number of samples that are processed at a time.
1132 * @return The function returns ARM_MATH_SUCCESS if initialization was successful or ARM_MATH_ARGUMENT_ERROR if
1133 * <code>numTaps</code> is not a supported value.
1134 */
1135 arm_status arm_fir_init_q15(
1136 arm_fir_instance_q15 * S,
1137 uint16_t numTaps,
1138 q15_t * pCoeffs,
1139 q15_t * pState,
1140 uint32_t blockSize);
1141
1142
1143 /**
1144 * @brief Processing function for the Q31 FIR filter.
1145 * @param[in] S points to an instance of the Q31 FIR filter structure.
1146 * @param[in] pSrc points to the block of input data.
1147 * @param[out] pDst points to the block of output data.
1148 * @param[in] blockSize number of samples to process.
1149 */
1150 void arm_fir_q31(
1151 const arm_fir_instance_q31 * S,
1152 q31_t * pSrc,
1153 q31_t * pDst,
1154 uint32_t blockSize);
1155
1156
1157 /**
1158 * @brief Processing function for the fast Q31 FIR filter for Cortex-M3 and Cortex-M4.
1159 * @param[in] S points to an instance of the Q31 FIR structure.
1160 * @param[in] pSrc points to the block of input data.
1161 * @param[out] pDst points to the block of output data.
1162 * @param[in] blockSize number of samples to process.
1163 */
1164 void arm_fir_fast_q31(
1165 const arm_fir_instance_q31 * S,
1166 q31_t * pSrc,
1167 q31_t * pDst,
1168 uint32_t blockSize);
1169
1170
1171 /**
1172 * @brief Initialization function for the Q31 FIR filter.
1173 * @param[in,out] S points to an instance of the Q31 FIR structure.
1174 * @param[in] numTaps Number of filter coefficients in the filter.
1175 * @param[in] pCoeffs points to the filter coefficients.
1176 * @param[in] pState points to the state buffer.
1177 * @param[in] blockSize number of samples that are processed at a time.
1178 */
1179 void arm_fir_init_q31(
1180 arm_fir_instance_q31 * S,
1181 uint16_t numTaps,
1182 q31_t * pCoeffs,
1183 q31_t * pState,
1184 uint32_t blockSize);
1185
1186
1187 /**
1188 * @brief Processing function for the floating-point FIR filter.
1189 * @param[in] S points to an instance of the floating-point FIR structure.
1190 * @param[in] pSrc points to the block of input data.
1191 * @param[out] pDst points to the block of output data.
1192 * @param[in] blockSize number of samples to process.
1193 */
1194 void arm_fir_f32(
1195 const arm_fir_instance_f32 * S,
1196 float32_t * pSrc,
1197 float32_t * pDst,
1198 uint32_t blockSize);
1199
1200
1201 /**
1202 * @brief Initialization function for the floating-point FIR filter.
1203 * @param[in,out] S points to an instance of the floating-point FIR filter structure.
1204 * @param[in] numTaps Number of filter coefficients in the filter.
1205 * @param[in] pCoeffs points to the filter coefficients.
1206 * @param[in] pState points to the state buffer.
1207 * @param[in] blockSize number of samples that are processed at a time.
1208 */
1209 void arm_fir_init_f32(
1210 arm_fir_instance_f32 * S,
1211 uint16_t numTaps,
1212 float32_t * pCoeffs,
1213 float32_t * pState,
1214 uint32_t blockSize);
1215
1216
1217 /**
1218 * @brief Instance structure for the Q15 Biquad cascade filter.
1219 */
1220 typedef struct
1221 {
1222 int8_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
1223 q15_t *pState; /**< Points to the array of state coefficients. The array is of length 4*numStages. */
1224 q15_t *pCoeffs; /**< Points to the array of coefficients. The array is of length 5*numStages. */
1225 int8_t postShift; /**< Additional shift, in bits, applied to each output sample. */
1226 } arm_biquad_casd_df1_inst_q15;
1227
1228 /**
1229 * @brief Instance structure for the Q31 Biquad cascade filter.
1230 */
1231 typedef struct
1232 {
1233 uint32_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
1234 q31_t *pState; /**< Points to the array of state coefficients. The array is of length 4*numStages. */
1235 q31_t *pCoeffs; /**< Points to the array of coefficients. The array is of length 5*numStages. */
1236 uint8_t postShift; /**< Additional shift, in bits, applied to each output sample. */
1237 } arm_biquad_casd_df1_inst_q31;
1238
1239 /**
1240 * @brief Instance structure for the floating-point Biquad cascade filter.
1241 */
1242 typedef struct
1243 {
1244 uint32_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
1245 float32_t *pState; /**< Points to the array of state coefficients. The array is of length 4*numStages. */
1246 float32_t *pCoeffs; /**< Points to the array of coefficients. The array is of length 5*numStages. */
1247 } arm_biquad_casd_df1_inst_f32;
1248
1249
1250 /**
1251 * @brief Processing function for the Q15 Biquad cascade filter.
1252 * @param[in] S points to an instance of the Q15 Biquad cascade structure.
1253 * @param[in] pSrc points to the block of input data.
1254 * @param[out] pDst points to the block of output data.
1255 * @param[in] blockSize number of samples to process.
1256 */
1257 void arm_biquad_cascade_df1_q15(
1258 const arm_biquad_casd_df1_inst_q15 * S,
1259 q15_t * pSrc,
1260 q15_t * pDst,
1261 uint32_t blockSize);
1262
1263
1264 /**
1265 * @brief Initialization function for the Q15 Biquad cascade filter.
1266 * @param[in,out] S points to an instance of the Q15 Biquad cascade structure.
1267 * @param[in] numStages number of 2nd order stages in the filter.
1268 * @param[in] pCoeffs points to the filter coefficients.
1269 * @param[in] pState points to the state buffer.
1270 * @param[in] postShift Shift to be applied to the output. Varies according to the coefficients format
1271 */
1272 void arm_biquad_cascade_df1_init_q15(
1273 arm_biquad_casd_df1_inst_q15 * S,
1274 uint8_t numStages,
1275 q15_t * pCoeffs,
1276 q15_t * pState,
1277 int8_t postShift);
1278
1279
1280 /**
1281 * @brief Fast but less precise processing function for the Q15 Biquad cascade filter for Cortex-M3 and Cortex-M4.
1282 * @param[in] S points to an instance of the Q15 Biquad cascade structure.
1283 * @param[in] pSrc points to the block of input data.
1284 * @param[out] pDst points to the block of output data.
1285 * @param[in] blockSize number of samples to process.
1286 */
1287 void arm_biquad_cascade_df1_fast_q15(
1288 const arm_biquad_casd_df1_inst_q15 * S,
1289 q15_t * pSrc,
1290 q15_t * pDst,
1291 uint32_t blockSize);
1292
1293
1294 /**
1295 * @brief Processing function for the Q31 Biquad cascade filter
1296 * @param[in] S points to an instance of the Q31 Biquad cascade structure.
1297 * @param[in] pSrc points to the block of input data.
1298 * @param[out] pDst points to the block of output data.
1299 * @param[in] blockSize number of samples to process.
1300 */
1301 void arm_biquad_cascade_df1_q31(
1302 const arm_biquad_casd_df1_inst_q31 * S,
1303 q31_t * pSrc,
1304 q31_t * pDst,
1305 uint32_t blockSize);
1306
1307
1308 /**
1309 * @brief Fast but less precise processing function for the Q31 Biquad cascade filter for Cortex-M3 and Cortex-M4.
1310 * @param[in] S points to an instance of the Q31 Biquad cascade structure.
1311 * @param[in] pSrc points to the block of input data.
1312 * @param[out] pDst points to the block of output data.
1313 * @param[in] blockSize number of samples to process.
1314 */
1315 void arm_biquad_cascade_df1_fast_q31(
1316 const arm_biquad_casd_df1_inst_q31 * S,
1317 q31_t * pSrc,
1318 q31_t * pDst,
1319 uint32_t blockSize);
1320
1321
1322 /**
1323 * @brief Initialization function for the Q31 Biquad cascade filter.
1324 * @param[in,out] S points to an instance of the Q31 Biquad cascade structure.
1325 * @param[in] numStages number of 2nd order stages in the filter.
1326 * @param[in] pCoeffs points to the filter coefficients.
1327 * @param[in] pState points to the state buffer.
1328 * @param[in] postShift Shift to be applied to the output. Varies according to the coefficients format
1329 */
1330 void arm_biquad_cascade_df1_init_q31(
1331 arm_biquad_casd_df1_inst_q31 * S,
1332 uint8_t numStages,
1333 q31_t * pCoeffs,
1334 q31_t * pState,
1335 int8_t postShift);
1336
1337
1338 /**
1339 * @brief Processing function for the floating-point Biquad cascade filter.
1340 * @param[in] S points to an instance of the floating-point Biquad cascade structure.
1341 * @param[in] pSrc points to the block of input data.
1342 * @param[out] pDst points to the block of output data.
1343 * @param[in] blockSize number of samples to process.
1344 */
1345 void arm_biquad_cascade_df1_f32(
1346 const arm_biquad_casd_df1_inst_f32 * S,
1347 float32_t * pSrc,
1348 float32_t * pDst,
1349 uint32_t blockSize);
1350
1351
1352 /**
1353 * @brief Initialization function for the floating-point Biquad cascade filter.
1354 * @param[in,out] S points to an instance of the floating-point Biquad cascade structure.
1355 * @param[in] numStages number of 2nd order stages in the filter.
1356 * @param[in] pCoeffs points to the filter coefficients.
1357 * @param[in] pState points to the state buffer.
1358 */
1359 void arm_biquad_cascade_df1_init_f32(
1360 arm_biquad_casd_df1_inst_f32 * S,
1361 uint8_t numStages,
1362 float32_t * pCoeffs,
1363 float32_t * pState);
1364
1365
1366 /**
1367 * @brief Instance structure for the floating-point matrix structure.
1368 */
1369 typedef struct
1370 {
1371 uint16_t numRows; /**< number of rows of the matrix. */
1372 uint16_t numCols; /**< number of columns of the matrix. */
1373 float32_t *pData; /**< points to the data of the matrix. */
1374 } arm_matrix_instance_f32;
1375
1376
1377 /**
1378 * @brief Instance structure for the floating-point matrix structure.
1379 */
1380 typedef struct
1381 {
1382 uint16_t numRows; /**< number of rows of the matrix. */
1383 uint16_t numCols; /**< number of columns of the matrix. */
1384 float64_t *pData; /**< points to the data of the matrix. */
1385 } arm_matrix_instance_f64;
1386
1387 /**
1388 * @brief Instance structure for the Q15 matrix structure.
1389 */
1390 typedef struct
1391 {
1392 uint16_t numRows; /**< number of rows of the matrix. */
1393 uint16_t numCols; /**< number of columns of the matrix. */
1394 q15_t *pData; /**< points to the data of the matrix. */
1395 } arm_matrix_instance_q15;
1396
1397 /**
1398 * @brief Instance structure for the Q31 matrix structure.
1399 */
1400 typedef struct
1401 {
1402 uint16_t numRows; /**< number of rows of the matrix. */
1403 uint16_t numCols; /**< number of columns of the matrix. */
1404 q31_t *pData; /**< points to the data of the matrix. */
1405 } arm_matrix_instance_q31;
1406
1407
1408 /**
1409 * @brief Floating-point matrix addition.
1410 * @param[in] pSrcA points to the first input matrix structure
1411 * @param[in] pSrcB points to the second input matrix structure
1412 * @param[out] pDst points to output matrix structure
1413 * @return The function returns either
1414 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1415 */
1416 arm_status arm_mat_add_f32(
1417 const arm_matrix_instance_f32 * pSrcA,
1418 const arm_matrix_instance_f32 * pSrcB,
1419 arm_matrix_instance_f32 * pDst);
1420
1421
1422 /**
1423 * @brief Q15 matrix addition.
1424 * @param[in] pSrcA points to the first input matrix structure
1425 * @param[in] pSrcB points to the second input matrix structure
1426 * @param[out] pDst points to output matrix structure
1427 * @return The function returns either
1428 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1429 */
1430 arm_status arm_mat_add_q15(
1431 const arm_matrix_instance_q15 * pSrcA,
1432 const arm_matrix_instance_q15 * pSrcB,
1433 arm_matrix_instance_q15 * pDst);
1434
1435
1436 /**
1437 * @brief Q31 matrix addition.
1438 * @param[in] pSrcA points to the first input matrix structure
1439 * @param[in] pSrcB points to the second input matrix structure
1440 * @param[out] pDst points to output matrix structure
1441 * @return The function returns either
1442 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1443 */
1444 arm_status arm_mat_add_q31(
1445 const arm_matrix_instance_q31 * pSrcA,
1446 const arm_matrix_instance_q31 * pSrcB,
1447 arm_matrix_instance_q31 * pDst);
1448
1449
1450 /**
1451 * @brief Floating-point, complex, matrix multiplication.
1452 * @param[in] pSrcA points to the first input matrix structure
1453 * @param[in] pSrcB points to the second input matrix structure
1454 * @param[out] pDst points to output matrix structure
1455 * @return The function returns either
1456 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1457 */
1458 arm_status arm_mat_cmplx_mult_f32(
1459 const arm_matrix_instance_f32 * pSrcA,
1460 const arm_matrix_instance_f32 * pSrcB,
1461 arm_matrix_instance_f32 * pDst);
1462
1463
1464 /**
1465 * @brief Q15, complex, matrix multiplication.
1466 * @param[in] pSrcA points to the first input matrix structure
1467 * @param[in] pSrcB points to the second input matrix structure
1468 * @param[out] pDst points to output matrix structure
1469 * @return The function returns either
1470 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1471 */
1472 arm_status arm_mat_cmplx_mult_q15(
1473 const arm_matrix_instance_q15 * pSrcA,
1474 const arm_matrix_instance_q15 * pSrcB,
1475 arm_matrix_instance_q15 * pDst,
1476 q15_t * pScratch);
1477
1478
1479 /**
1480 * @brief Q31, complex, matrix multiplication.
1481 * @param[in] pSrcA points to the first input matrix structure
1482 * @param[in] pSrcB points to the second input matrix structure
1483 * @param[out] pDst points to output matrix structure
1484 * @return The function returns either
1485 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1486 */
1487 arm_status arm_mat_cmplx_mult_q31(
1488 const arm_matrix_instance_q31 * pSrcA,
1489 const arm_matrix_instance_q31 * pSrcB,
1490 arm_matrix_instance_q31 * pDst);
1491
1492
1493 /**
1494 * @brief Floating-point matrix transpose.
1495 * @param[in] pSrc points to the input matrix
1496 * @param[out] pDst points to the output matrix
1497 * @return The function returns either <code>ARM_MATH_SIZE_MISMATCH</code>
1498 * or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1499 */
1500 arm_status arm_mat_trans_f32(
1501 const arm_matrix_instance_f32 * pSrc,
1502 arm_matrix_instance_f32 * pDst);
1503
1504
1505 /**
1506 * @brief Q15 matrix transpose.
1507 * @param[in] pSrc points to the input matrix
1508 * @param[out] pDst points to the output matrix
1509 * @return The function returns either <code>ARM_MATH_SIZE_MISMATCH</code>
1510 * or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1511 */
1512 arm_status arm_mat_trans_q15(
1513 const arm_matrix_instance_q15 * pSrc,
1514 arm_matrix_instance_q15 * pDst);
1515
1516
1517 /**
1518 * @brief Q31 matrix transpose.
1519 * @param[in] pSrc points to the input matrix
1520 * @param[out] pDst points to the output matrix
1521 * @return The function returns either <code>ARM_MATH_SIZE_MISMATCH</code>
1522 * or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1523 */
1524 arm_status arm_mat_trans_q31(
1525 const arm_matrix_instance_q31 * pSrc,
1526 arm_matrix_instance_q31 * pDst);
1527
1528
1529 /**
1530 * @brief Floating-point matrix multiplication
1531 * @param[in] pSrcA points to the first input matrix structure
1532 * @param[in] pSrcB points to the second input matrix structure
1533 * @param[out] pDst points to output matrix structure
1534 * @return The function returns either
1535 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1536 */
1537 arm_status arm_mat_mult_f32(
1538 const arm_matrix_instance_f32 * pSrcA,
1539 const arm_matrix_instance_f32 * pSrcB,
1540 arm_matrix_instance_f32 * pDst);
1541
1542
1543 /**
1544 * @brief Q15 matrix multiplication
1545 * @param[in] pSrcA points to the first input matrix structure
1546 * @param[in] pSrcB points to the second input matrix structure
1547 * @param[out] pDst points to output matrix structure
1548 * @param[in] pState points to the array for storing intermediate results
1549 * @return The function returns either
1550 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1551 */
1552 arm_status arm_mat_mult_q15(
1553 const arm_matrix_instance_q15 * pSrcA,
1554 const arm_matrix_instance_q15 * pSrcB,
1555 arm_matrix_instance_q15 * pDst,
1556 q15_t * pState);
1557
1558
1559 /**
1560 * @brief Q15 matrix multiplication (fast variant) for Cortex-M3 and Cortex-M4
1561 * @param[in] pSrcA points to the first input matrix structure
1562 * @param[in] pSrcB points to the second input matrix structure
1563 * @param[out] pDst points to output matrix structure
1564 * @param[in] pState points to the array for storing intermediate results
1565 * @return The function returns either
1566 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1567 */
1568 arm_status arm_mat_mult_fast_q15(
1569 const arm_matrix_instance_q15 * pSrcA,
1570 const arm_matrix_instance_q15 * pSrcB,
1571 arm_matrix_instance_q15 * pDst,
1572 q15_t * pState);
1573
1574
1575 /**
1576 * @brief Q31 matrix multiplication
1577 * @param[in] pSrcA points to the first input matrix structure
1578 * @param[in] pSrcB points to the second input matrix structure
1579 * @param[out] pDst points to output matrix structure
1580 * @return The function returns either
1581 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1582 */
1583 arm_status arm_mat_mult_q31(
1584 const arm_matrix_instance_q31 * pSrcA,
1585 const arm_matrix_instance_q31 * pSrcB,
1586 arm_matrix_instance_q31 * pDst);
1587
1588
1589 /**
1590 * @brief Q31 matrix multiplication (fast variant) for Cortex-M3 and Cortex-M4
1591 * @param[in] pSrcA points to the first input matrix structure
1592 * @param[in] pSrcB points to the second input matrix structure
1593 * @param[out] pDst points to output matrix structure
1594 * @return The function returns either
1595 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1596 */
1597 arm_status arm_mat_mult_fast_q31(
1598 const arm_matrix_instance_q31 * pSrcA,
1599 const arm_matrix_instance_q31 * pSrcB,
1600 arm_matrix_instance_q31 * pDst);
1601
1602
1603 /**
1604 * @brief Floating-point matrix subtraction
1605 * @param[in] pSrcA points to the first input matrix structure
1606 * @param[in] pSrcB points to the second input matrix structure
1607 * @param[out] pDst points to output matrix structure
1608 * @return The function returns either
1609 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1610 */
1611 arm_status arm_mat_sub_f32(
1612 const arm_matrix_instance_f32 * pSrcA,
1613 const arm_matrix_instance_f32 * pSrcB,
1614 arm_matrix_instance_f32 * pDst);
1615
1616
1617 /**
1618 * @brief Q15 matrix subtraction
1619 * @param[in] pSrcA points to the first input matrix structure
1620 * @param[in] pSrcB points to the second input matrix structure
1621 * @param[out] pDst points to output matrix structure
1622 * @return The function returns either
1623 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1624 */
1625 arm_status arm_mat_sub_q15(
1626 const arm_matrix_instance_q15 * pSrcA,
1627 const arm_matrix_instance_q15 * pSrcB,
1628 arm_matrix_instance_q15 * pDst);
1629
1630
1631 /**
1632 * @brief Q31 matrix subtraction
1633 * @param[in] pSrcA points to the first input matrix structure
1634 * @param[in] pSrcB points to the second input matrix structure
1635 * @param[out] pDst points to output matrix structure
1636 * @return The function returns either
1637 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1638 */
1639 arm_status arm_mat_sub_q31(
1640 const arm_matrix_instance_q31 * pSrcA,
1641 const arm_matrix_instance_q31 * pSrcB,
1642 arm_matrix_instance_q31 * pDst);
1643
1644
1645 /**
1646 * @brief Floating-point matrix scaling.
1647 * @param[in] pSrc points to the input matrix
1648 * @param[in] scale scale factor
1649 * @param[out] pDst points to the output matrix
1650 * @return The function returns either
1651 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1652 */
1653 arm_status arm_mat_scale_f32(
1654 const arm_matrix_instance_f32 * pSrc,
1655 float32_t scale,
1656 arm_matrix_instance_f32 * pDst);
1657
1658
1659 /**
1660 * @brief Q15 matrix scaling.
1661 * @param[in] pSrc points to input matrix
1662 * @param[in] scaleFract fractional portion of the scale factor
1663 * @param[in] shift number of bits to shift the result by
1664 * @param[out] pDst points to output matrix
1665 * @return The function returns either
1666 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1667 */
1668 arm_status arm_mat_scale_q15(
1669 const arm_matrix_instance_q15 * pSrc,
1670 q15_t scaleFract,
1671 int32_t shift,
1672 arm_matrix_instance_q15 * pDst);
1673
1674
1675 /**
1676 * @brief Q31 matrix scaling.
1677 * @param[in] pSrc points to input matrix
1678 * @param[in] scaleFract fractional portion of the scale factor
1679 * @param[in] shift number of bits to shift the result by
1680 * @param[out] pDst points to output matrix structure
1681 * @return The function returns either
1682 * <code>ARM_MATH_SIZE_MISMATCH</code> or <code>ARM_MATH_SUCCESS</code> based on the outcome of size checking.
1683 */
1684 arm_status arm_mat_scale_q31(
1685 const arm_matrix_instance_q31 * pSrc,
1686 q31_t scaleFract,
1687 int32_t shift,
1688 arm_matrix_instance_q31 * pDst);
1689
1690
1691 /**
1692 * @brief Q31 matrix initialization.
1693 * @param[in,out] S points to an instance of the floating-point matrix structure.
1694 * @param[in] nRows number of rows in the matrix.
1695 * @param[in] nColumns number of columns in the matrix.
1696 * @param[in] pData points to the matrix data array.
1697 */
1698 void arm_mat_init_q31(
1699 arm_matrix_instance_q31 * S,
1700 uint16_t nRows,
1701 uint16_t nColumns,
1702 q31_t * pData);
1703
1704
1705 /**
1706 * @brief Q15 matrix initialization.
1707 * @param[in,out] S points to an instance of the floating-point matrix structure.
1708 * @param[in] nRows number of rows in the matrix.
1709 * @param[in] nColumns number of columns in the matrix.
1710 * @param[in] pData points to the matrix data array.
1711 */
1712 void arm_mat_init_q15(
1713 arm_matrix_instance_q15 * S,
1714 uint16_t nRows,
1715 uint16_t nColumns,
1716 q15_t * pData);
1717
1718
1719 /**
1720 * @brief Floating-point matrix initialization.
1721 * @param[in,out] S points to an instance of the floating-point matrix structure.
1722 * @param[in] nRows number of rows in the matrix.
1723 * @param[in] nColumns number of columns in the matrix.
1724 * @param[in] pData points to the matrix data array.
1725 */
1726 void arm_mat_init_f32(
1727 arm_matrix_instance_f32 * S,
1728 uint16_t nRows,
1729 uint16_t nColumns,
1730 float32_t * pData);
1731
1732
1733
1734 /**
1735 * @brief Instance structure for the Q15 PID Control.
1736 */
1737 typedef struct
1738 {
1739 q15_t A0; /**< The derived gain, A0 = Kp + Ki + Kd . */
1740 #ifdef ARM_MATH_CM0_FAMILY
1741 q15_t A1;
1742 q15_t A2;
1743 #else
1744 q31_t A1; /**< The derived gain A1 = -Kp - 2Kd | Kd.*/
1745 #endif
1746 q15_t state[3]; /**< The state array of length 3. */
1747 q15_t Kp; /**< The proportional gain. */
1748 q15_t Ki; /**< The integral gain. */
1749 q15_t Kd; /**< The derivative gain. */
1750 } arm_pid_instance_q15;
1751
1752 /**
1753 * @brief Instance structure for the Q31 PID Control.
1754 */
1755 typedef struct
1756 {
1757 q31_t A0; /**< The derived gain, A0 = Kp + Ki + Kd . */
1758 q31_t A1; /**< The derived gain, A1 = -Kp - 2Kd. */
1759 q31_t A2; /**< The derived gain, A2 = Kd . */
1760 q31_t state[3]; /**< The state array of length 3. */
1761 q31_t Kp; /**< The proportional gain. */
1762 q31_t Ki; /**< The integral gain. */
1763 q31_t Kd; /**< The derivative gain. */
1764 } arm_pid_instance_q31;
1765
1766 /**
1767 * @brief Instance structure for the floating-point PID Control.
1768 */
1769 typedef struct
1770 {
1771 float32_t A0; /**< The derived gain, A0 = Kp + Ki + Kd . */
1772 float32_t A1; /**< The derived gain, A1 = -Kp - 2Kd. */
1773 float32_t A2; /**< The derived gain, A2 = Kd . */
1774 float32_t state[3]; /**< The state array of length 3. */
1775 float32_t Kp; /**< The proportional gain. */
1776 float32_t Ki; /**< The integral gain. */
1777 float32_t Kd; /**< The derivative gain. */
1778 } arm_pid_instance_f32;
1779
1780
1781
1782 /**
1783 * @brief Initialization function for the floating-point PID Control.
1784 * @param[in,out] S points to an instance of the PID structure.
1785 * @param[in] resetStateFlag flag to reset the state. 0 = no change in state 1 = reset the state.
1786 */
1787 void arm_pid_init_f32(
1788 arm_pid_instance_f32 * S,
1789 int32_t resetStateFlag);
1790
1791
1792 /**
1793 * @brief Reset function for the floating-point PID Control.
1794 * @param[in,out] S is an instance of the floating-point PID Control structure
1795 */
1796 void arm_pid_reset_f32(
1797 arm_pid_instance_f32 * S);
1798
1799
1800 /**
1801 * @brief Initialization function for the Q31 PID Control.
1802 * @param[in,out] S points to an instance of the Q15 PID structure.
1803 * @param[in] resetStateFlag flag to reset the state. 0 = no change in state 1 = reset the state.
1804 */
1805 void arm_pid_init_q31(
1806 arm_pid_instance_q31 * S,
1807 int32_t resetStateFlag);
1808
1809
1810 /**
1811 * @brief Reset function for the Q31 PID Control.
1812 * @param[in,out] S points to an instance of the Q31 PID Control structure
1813 */
1814
1815 void arm_pid_reset_q31(
1816 arm_pid_instance_q31 * S);
1817
1818
1819 /**
1820 * @brief Initialization function for the Q15 PID Control.
1821 * @param[in,out] S points to an instance of the Q15 PID structure.
1822 * @param[in] resetStateFlag flag to reset the state. 0 = no change in state 1 = reset the state.
1823 */
1824 void arm_pid_init_q15(
1825 arm_pid_instance_q15 * S,
1826 int32_t resetStateFlag);
1827
1828
1829 /**
1830 * @brief Reset function for the Q15 PID Control.
1831 * @param[in,out] S points to an instance of the q15 PID Control structure
1832 */
1833 void arm_pid_reset_q15(
1834 arm_pid_instance_q15 * S);
1835
1836
1837 /**
1838 * @brief Instance structure for the floating-point Linear Interpolate function.
1839 */
1840 typedef struct
1841 {
1842 uint32_t nValues; /**< nValues */
1843 float32_t x1; /**< x1 */
1844 float32_t xSpacing; /**< xSpacing */
1845 float32_t *pYData; /**< pointer to the table of Y values */
1846 } arm_linear_interp_instance_f32;
1847
1848 /**
1849 * @brief Instance structure for the floating-point bilinear interpolation function.
1850 */
1851 typedef struct
1852 {
1853 uint16_t numRows; /**< number of rows in the data table. */
1854 uint16_t numCols; /**< number of columns in the data table. */
1855 float32_t *pData; /**< points to the data table. */
1856 } arm_bilinear_interp_instance_f32;
1857
1858 /**
1859 * @brief Instance structure for the Q31 bilinear interpolation function.
1860 */
1861 typedef struct
1862 {
1863 uint16_t numRows; /**< number of rows in the data table. */
1864 uint16_t numCols; /**< number of columns in the data table. */
1865 q31_t *pData; /**< points to the data table. */
1866 } arm_bilinear_interp_instance_q31;
1867
1868 /**
1869 * @brief Instance structure for the Q15 bilinear interpolation function.
1870 */
1871 typedef struct
1872 {
1873 uint16_t numRows; /**< number of rows in the data table. */
1874 uint16_t numCols; /**< number of columns in the data table. */
1875 q15_t *pData; /**< points to the data table. */
1876 } arm_bilinear_interp_instance_q15;
1877
1878 /**
1879 * @brief Instance structure for the Q15 bilinear interpolation function.
1880 */
1881 typedef struct
1882 {
1883 uint16_t numRows; /**< number of rows in the data table. */
1884 uint16_t numCols; /**< number of columns in the data table. */
1885 q7_t *pData; /**< points to the data table. */
1886 } arm_bilinear_interp_instance_q7;
1887
1888
1889 /**
1890 * @brief Q7 vector multiplication.
1891 * @param[in] pSrcA points to the first input vector
1892 * @param[in] pSrcB points to the second input vector
1893 * @param[out] pDst points to the output vector
1894 * @param[in] blockSize number of samples in each vector
1895 */
1896 void arm_mult_q7(
1897 q7_t * pSrcA,
1898 q7_t * pSrcB,
1899 q7_t * pDst,
1900 uint32_t blockSize);
1901
1902
1903 /**
1904 * @brief Q15 vector multiplication.
1905 * @param[in] pSrcA points to the first input vector
1906 * @param[in] pSrcB points to the second input vector
1907 * @param[out] pDst points to the output vector
1908 * @param[in] blockSize number of samples in each vector
1909 */
1910 void arm_mult_q15(
1911 q15_t * pSrcA,
1912 q15_t * pSrcB,
1913 q15_t * pDst,
1914 uint32_t blockSize);
1915
1916
1917 /**
1918 * @brief Q31 vector multiplication.
1919 * @param[in] pSrcA points to the first input vector
1920 * @param[in] pSrcB points to the second input vector
1921 * @param[out] pDst points to the output vector
1922 * @param[in] blockSize number of samples in each vector
1923 */
1924 void arm_mult_q31(
1925 q31_t * pSrcA,
1926 q31_t * pSrcB,
1927 q31_t * pDst,
1928 uint32_t blockSize);
1929
1930
1931 /**
1932 * @brief Floating-point vector multiplication.
1933 * @param[in] pSrcA points to the first input vector
1934 * @param[in] pSrcB points to the second input vector
1935 * @param[out] pDst points to the output vector
1936 * @param[in] blockSize number of samples in each vector
1937 */
1938 void arm_mult_f32(
1939 float32_t * pSrcA,
1940 float32_t * pSrcB,
1941 float32_t * pDst,
1942 uint32_t blockSize);
1943
1944
1945 /**
1946 * @brief Instance structure for the Q15 CFFT/CIFFT function.
1947 */
1948 typedef struct
1949 {
1950 uint16_t fftLen; /**< length of the FFT. */
1951 uint8_t ifftFlag; /**< flag that selects forward (ifftFlag=0) or inverse (ifftFlag=1) transform. */
1952 uint8_t bitReverseFlag; /**< flag that enables (bitReverseFlag=1) or disables (bitReverseFlag=0) bit reversal of output. */
1953 q15_t *pTwiddle; /**< points to the Sin twiddle factor table. */
1954 uint16_t *pBitRevTable; /**< points to the bit reversal table. */
1955 uint16_t twidCoefModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
1956 uint16_t bitRevFactor; /**< bit reversal modifier that supports different size FFTs with the same bit reversal table. */
1957 } arm_cfft_radix2_instance_q15;
1958
1959 /* Deprecated */
1960 arm_status arm_cfft_radix2_init_q15(
1961 arm_cfft_radix2_instance_q15 * S,
1962 uint16_t fftLen,
1963 uint8_t ifftFlag,
1964 uint8_t bitReverseFlag);
1965
1966 /* Deprecated */
1967 void arm_cfft_radix2_q15(
1968 const arm_cfft_radix2_instance_q15 * S,
1969 q15_t * pSrc);
1970
1971
1972 /**
1973 * @brief Instance structure for the Q15 CFFT/CIFFT function.
1974 */
1975 typedef struct
1976 {
1977 uint16_t fftLen; /**< length of the FFT. */
1978 uint8_t ifftFlag; /**< flag that selects forward (ifftFlag=0) or inverse (ifftFlag=1) transform. */
1979 uint8_t bitReverseFlag; /**< flag that enables (bitReverseFlag=1) or disables (bitReverseFlag=0) bit reversal of output. */
1980 q15_t *pTwiddle; /**< points to the twiddle factor table. */
1981 uint16_t *pBitRevTable; /**< points to the bit reversal table. */
1982 uint16_t twidCoefModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
1983 uint16_t bitRevFactor; /**< bit reversal modifier that supports different size FFTs with the same bit reversal table. */
1984 } arm_cfft_radix4_instance_q15;
1985
1986 /* Deprecated */
1987 arm_status arm_cfft_radix4_init_q15(
1988 arm_cfft_radix4_instance_q15 * S,
1989 uint16_t fftLen,
1990 uint8_t ifftFlag,
1991 uint8_t bitReverseFlag);
1992
1993 /* Deprecated */
1994 void arm_cfft_radix4_q15(
1995 const arm_cfft_radix4_instance_q15 * S,
1996 q15_t * pSrc);
1997
1998 /**
1999 * @brief Instance structure for the Radix-2 Q31 CFFT/CIFFT function.
2000 */
2001 typedef struct
2002 {
2003 uint16_t fftLen; /**< length of the FFT. */
2004 uint8_t ifftFlag; /**< flag that selects forward (ifftFlag=0) or inverse (ifftFlag=1) transform. */
2005 uint8_t bitReverseFlag; /**< flag that enables (bitReverseFlag=1) or disables (bitReverseFlag=0) bit reversal of output. */
2006 q31_t *pTwiddle; /**< points to the Twiddle factor table. */
2007 uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2008 uint16_t twidCoefModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2009 uint16_t bitRevFactor; /**< bit reversal modifier that supports different size FFTs with the same bit reversal table. */
2010 } arm_cfft_radix2_instance_q31;
2011
2012 /* Deprecated */
2013 arm_status arm_cfft_radix2_init_q31(
2014 arm_cfft_radix2_instance_q31 * S,
2015 uint16_t fftLen,
2016 uint8_t ifftFlag,
2017 uint8_t bitReverseFlag);
2018
2019 /* Deprecated */
2020 void arm_cfft_radix2_q31(
2021 const arm_cfft_radix2_instance_q31 * S,
2022 q31_t * pSrc);
2023
2024 /**
2025 * @brief Instance structure for the Q31 CFFT/CIFFT function.
2026 */
2027 typedef struct
2028 {
2029 uint16_t fftLen; /**< length of the FFT. */
2030 uint8_t ifftFlag; /**< flag that selects forward (ifftFlag=0) or inverse (ifftFlag=1) transform. */
2031 uint8_t bitReverseFlag; /**< flag that enables (bitReverseFlag=1) or disables (bitReverseFlag=0) bit reversal of output. */
2032 q31_t *pTwiddle; /**< points to the twiddle factor table. */
2033 uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2034 uint16_t twidCoefModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2035 uint16_t bitRevFactor; /**< bit reversal modifier that supports different size FFTs with the same bit reversal table. */
2036 } arm_cfft_radix4_instance_q31;
2037
2038 /* Deprecated */
2039 void arm_cfft_radix4_q31(
2040 const arm_cfft_radix4_instance_q31 * S,
2041 q31_t * pSrc);
2042
2043 /* Deprecated */
2044 arm_status arm_cfft_radix4_init_q31(
2045 arm_cfft_radix4_instance_q31 * S,
2046 uint16_t fftLen,
2047 uint8_t ifftFlag,
2048 uint8_t bitReverseFlag);
2049
2050 /**
2051 * @brief Instance structure for the floating-point CFFT/CIFFT function.
2052 */
2053 typedef struct
2054 {
2055 uint16_t fftLen; /**< length of the FFT. */
2056 uint8_t ifftFlag; /**< flag that selects forward (ifftFlag=0) or inverse (ifftFlag=1) transform. */
2057 uint8_t bitReverseFlag; /**< flag that enables (bitReverseFlag=1) or disables (bitReverseFlag=0) bit reversal of output. */
2058 float32_t *pTwiddle; /**< points to the Twiddle factor table. */
2059 uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2060 uint16_t twidCoefModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2061 uint16_t bitRevFactor; /**< bit reversal modifier that supports different size FFTs with the same bit reversal table. */
2062 float32_t onebyfftLen; /**< value of 1/fftLen. */
2063 } arm_cfft_radix2_instance_f32;
2064
2065 /* Deprecated */
2066 arm_status arm_cfft_radix2_init_f32(
2067 arm_cfft_radix2_instance_f32 * S,
2068 uint16_t fftLen,
2069 uint8_t ifftFlag,
2070 uint8_t bitReverseFlag);
2071
2072 /* Deprecated */
2073 void arm_cfft_radix2_f32(
2074 const arm_cfft_radix2_instance_f32 * S,
2075 float32_t * pSrc);
2076
2077 /**
2078 * @brief Instance structure for the floating-point CFFT/CIFFT function.
2079 */
2080 typedef struct
2081 {
2082 uint16_t fftLen; /**< length of the FFT. */
2083 uint8_t ifftFlag; /**< flag that selects forward (ifftFlag=0) or inverse (ifftFlag=1) transform. */
2084 uint8_t bitReverseFlag; /**< flag that enables (bitReverseFlag=1) or disables (bitReverseFlag=0) bit reversal of output. */
2085 float32_t *pTwiddle; /**< points to the Twiddle factor table. */
2086 uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2087 uint16_t twidCoefModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2088 uint16_t bitRevFactor; /**< bit reversal modifier that supports different size FFTs with the same bit reversal table. */
2089 float32_t onebyfftLen; /**< value of 1/fftLen. */
2090 } arm_cfft_radix4_instance_f32;
2091
2092 /* Deprecated */
2093 arm_status arm_cfft_radix4_init_f32(
2094 arm_cfft_radix4_instance_f32 * S,
2095 uint16_t fftLen,
2096 uint8_t ifftFlag,
2097 uint8_t bitReverseFlag);
2098
2099 /* Deprecated */
2100 void arm_cfft_radix4_f32(
2101 const arm_cfft_radix4_instance_f32 * S,
2102 float32_t * pSrc);
2103
2104 /**
2105 * @brief Instance structure for the fixed-point CFFT/CIFFT function.
2106 */
2107 typedef struct
2108 {
2109 uint16_t fftLen; /**< length of the FFT. */
2110 const q15_t *pTwiddle; /**< points to the Twiddle factor table. */
2111 const uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2112 uint16_t bitRevLength; /**< bit reversal table length. */
2113 } arm_cfft_instance_q15;
2114
2115 void arm_cfft_q15(
2116 const arm_cfft_instance_q15 * S,
2117 q15_t * p1,
2118 uint8_t ifftFlag,
2119 uint8_t bitReverseFlag);
2120
2121 /**
2122 * @brief Instance structure for the fixed-point CFFT/CIFFT function.
2123 */
2124 typedef struct
2125 {
2126 uint16_t fftLen; /**< length of the FFT. */
2127 const q31_t *pTwiddle; /**< points to the Twiddle factor table. */
2128 const uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2129 uint16_t bitRevLength; /**< bit reversal table length. */
2130 } arm_cfft_instance_q31;
2131
2132 void arm_cfft_q31(
2133 const arm_cfft_instance_q31 * S,
2134 q31_t * p1,
2135 uint8_t ifftFlag,
2136 uint8_t bitReverseFlag);
2137
2138 /**
2139 * @brief Instance structure for the floating-point CFFT/CIFFT function.
2140 */
2141 typedef struct
2142 {
2143 uint16_t fftLen; /**< length of the FFT. */
2144 const float32_t *pTwiddle; /**< points to the Twiddle factor table. */
2145 const uint16_t *pBitRevTable; /**< points to the bit reversal table. */
2146 uint16_t bitRevLength; /**< bit reversal table length. */
2147 } arm_cfft_instance_f32;
2148
2149 void arm_cfft_f32(
2150 const arm_cfft_instance_f32 * S,
2151 float32_t * p1,
2152 uint8_t ifftFlag,
2153 uint8_t bitReverseFlag);
2154
2155 /**
2156 * @brief Instance structure for the Q15 RFFT/RIFFT function.
2157 */
2158 typedef struct
2159 {
2160 uint32_t fftLenReal; /**< length of the real FFT. */
2161 uint8_t ifftFlagR; /**< flag that selects forward (ifftFlagR=0) or inverse (ifftFlagR=1) transform. */
2162 uint8_t bitReverseFlagR; /**< flag that enables (bitReverseFlagR=1) or disables (bitReverseFlagR=0) bit reversal of output. */
2163 uint32_t twidCoefRModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2164 q15_t *pTwiddleAReal; /**< points to the real twiddle factor table. */
2165 q15_t *pTwiddleBReal; /**< points to the imag twiddle factor table. */
2166 const arm_cfft_instance_q15 *pCfft; /**< points to the complex FFT instance. */
2167 } arm_rfft_instance_q15;
2168
2169 arm_status arm_rfft_init_q15(
2170 arm_rfft_instance_q15 * S,
2171 uint32_t fftLenReal,
2172 uint32_t ifftFlagR,
2173 uint32_t bitReverseFlag);
2174
2175 void arm_rfft_q15(
2176 const arm_rfft_instance_q15 * S,
2177 q15_t * pSrc,
2178 q15_t * pDst);
2179
2180 /**
2181 * @brief Instance structure for the Q31 RFFT/RIFFT function.
2182 */
2183 typedef struct
2184 {
2185 uint32_t fftLenReal; /**< length of the real FFT. */
2186 uint8_t ifftFlagR; /**< flag that selects forward (ifftFlagR=0) or inverse (ifftFlagR=1) transform. */
2187 uint8_t bitReverseFlagR; /**< flag that enables (bitReverseFlagR=1) or disables (bitReverseFlagR=0) bit reversal of output. */
2188 uint32_t twidCoefRModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2189 q31_t *pTwiddleAReal; /**< points to the real twiddle factor table. */
2190 q31_t *pTwiddleBReal; /**< points to the imag twiddle factor table. */
2191 const arm_cfft_instance_q31 *pCfft; /**< points to the complex FFT instance. */
2192 } arm_rfft_instance_q31;
2193
2194 arm_status arm_rfft_init_q31(
2195 arm_rfft_instance_q31 * S,
2196 uint32_t fftLenReal,
2197 uint32_t ifftFlagR,
2198 uint32_t bitReverseFlag);
2199
2200 void arm_rfft_q31(
2201 const arm_rfft_instance_q31 * S,
2202 q31_t * pSrc,
2203 q31_t * pDst);
2204
2205 /**
2206 * @brief Instance structure for the floating-point RFFT/RIFFT function.
2207 */
2208 typedef struct
2209 {
2210 uint32_t fftLenReal; /**< length of the real FFT. */
2211 uint16_t fftLenBy2; /**< length of the complex FFT. */
2212 uint8_t ifftFlagR; /**< flag that selects forward (ifftFlagR=0) or inverse (ifftFlagR=1) transform. */
2213 uint8_t bitReverseFlagR; /**< flag that enables (bitReverseFlagR=1) or disables (bitReverseFlagR=0) bit reversal of output. */
2214 uint32_t twidCoefRModifier; /**< twiddle coefficient modifier that supports different size FFTs with the same twiddle factor table. */
2215 float32_t *pTwiddleAReal; /**< points to the real twiddle factor table. */
2216 float32_t *pTwiddleBReal; /**< points to the imag twiddle factor table. */
2217 arm_cfft_radix4_instance_f32 *pCfft; /**< points to the complex FFT instance. */
2218 } arm_rfft_instance_f32;
2219
2220 arm_status arm_rfft_init_f32(
2221 arm_rfft_instance_f32 * S,
2222 arm_cfft_radix4_instance_f32 * S_CFFT,
2223 uint32_t fftLenReal,
2224 uint32_t ifftFlagR,
2225 uint32_t bitReverseFlag);
2226
2227 void arm_rfft_f32(
2228 const arm_rfft_instance_f32 * S,
2229 float32_t * pSrc,
2230 float32_t * pDst);
2231
2232 /**
2233 * @brief Instance structure for the floating-point RFFT/RIFFT function.
2234 */
2235 typedef struct
2236 {
2237 arm_cfft_instance_f32 Sint; /**< Internal CFFT structure. */
2238 uint16_t fftLenRFFT; /**< length of the real sequence */
2239 float32_t * pTwiddleRFFT; /**< Twiddle factors real stage */
2240 } arm_rfft_fast_instance_f32 ;
2241
2242 arm_status arm_rfft_fast_init_f32 (
2243 arm_rfft_fast_instance_f32 * S,
2244 uint16_t fftLen);
2245
2246 void arm_rfft_fast_f32(
2247 arm_rfft_fast_instance_f32 * S,
2248 float32_t * p, float32_t * pOut,
2249 uint8_t ifftFlag);
2250
2251 /**
2252 * @brief Instance structure for the floating-point DCT4/IDCT4 function.
2253 */
2254 typedef struct
2255 {
2256 uint16_t N; /**< length of the DCT4. */
2257 uint16_t Nby2; /**< half of the length of the DCT4. */
2258 float32_t normalize; /**< normalizing factor. */
2259 float32_t *pTwiddle; /**< points to the twiddle factor table. */
2260 float32_t *pCosFactor; /**< points to the cosFactor table. */
2261 arm_rfft_instance_f32 *pRfft; /**< points to the real FFT instance. */
2262 arm_cfft_radix4_instance_f32 *pCfft; /**< points to the complex FFT instance. */
2263 } arm_dct4_instance_f32;
2264
2265
2266 /**
2267 * @brief Initialization function for the floating-point DCT4/IDCT4.
2268 * @param[in,out] S points to an instance of floating-point DCT4/IDCT4 structure.
2269 * @param[in] S_RFFT points to an instance of floating-point RFFT/RIFFT structure.
2270 * @param[in] S_CFFT points to an instance of floating-point CFFT/CIFFT structure.
2271 * @param[in] N length of the DCT4.
2272 * @param[in] Nby2 half of the length of the DCT4.
2273 * @param[in] normalize normalizing factor.
2274 * @return arm_status function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_ARGUMENT_ERROR if <code>fftLenReal</code> is not a supported transform length.
2275 */
2276 arm_status arm_dct4_init_f32(
2277 arm_dct4_instance_f32 * S,
2278 arm_rfft_instance_f32 * S_RFFT,
2279 arm_cfft_radix4_instance_f32 * S_CFFT,
2280 uint16_t N,
2281 uint16_t Nby2,
2282 float32_t normalize);
2283
2284
2285 /**
2286 * @brief Processing function for the floating-point DCT4/IDCT4.
2287 * @param[in] S points to an instance of the floating-point DCT4/IDCT4 structure.
2288 * @param[in] pState points to state buffer.
2289 * @param[in,out] pInlineBuffer points to the in-place input and output buffer.
2290 */
2291 void arm_dct4_f32(
2292 const arm_dct4_instance_f32 * S,
2293 float32_t * pState,
2294 float32_t * pInlineBuffer);
2295
2296
2297 /**
2298 * @brief Instance structure for the Q31 DCT4/IDCT4 function.
2299 */
2300 typedef struct
2301 {
2302 uint16_t N; /**< length of the DCT4. */
2303 uint16_t Nby2; /**< half of the length of the DCT4. */
2304 q31_t normalize; /**< normalizing factor. */
2305 q31_t *pTwiddle; /**< points to the twiddle factor table. */
2306 q31_t *pCosFactor; /**< points to the cosFactor table. */
2307 arm_rfft_instance_q31 *pRfft; /**< points to the real FFT instance. */
2308 arm_cfft_radix4_instance_q31 *pCfft; /**< points to the complex FFT instance. */
2309 } arm_dct4_instance_q31;
2310
2311
2312 /**
2313 * @brief Initialization function for the Q31 DCT4/IDCT4.
2314 * @param[in,out] S points to an instance of Q31 DCT4/IDCT4 structure.
2315 * @param[in] S_RFFT points to an instance of Q31 RFFT/RIFFT structure
2316 * @param[in] S_CFFT points to an instance of Q31 CFFT/CIFFT structure
2317 * @param[in] N length of the DCT4.
2318 * @param[in] Nby2 half of the length of the DCT4.
2319 * @param[in] normalize normalizing factor.
2320 * @return arm_status function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_ARGUMENT_ERROR if <code>N</code> is not a supported transform length.
2321 */
2322 arm_status arm_dct4_init_q31(
2323 arm_dct4_instance_q31 * S,
2324 arm_rfft_instance_q31 * S_RFFT,
2325 arm_cfft_radix4_instance_q31 * S_CFFT,
2326 uint16_t N,
2327 uint16_t Nby2,
2328 q31_t normalize);
2329
2330
2331 /**
2332 * @brief Processing function for the Q31 DCT4/IDCT4.
2333 * @param[in] S points to an instance of the Q31 DCT4 structure.
2334 * @param[in] pState points to state buffer.
2335 * @param[in,out] pInlineBuffer points to the in-place input and output buffer.
2336 */
2337 void arm_dct4_q31(
2338 const arm_dct4_instance_q31 * S,
2339 q31_t * pState,
2340 q31_t * pInlineBuffer);
2341
2342
2343 /**
2344 * @brief Instance structure for the Q15 DCT4/IDCT4 function.
2345 */
2346 typedef struct
2347 {
2348 uint16_t N; /**< length of the DCT4. */
2349 uint16_t Nby2; /**< half of the length of the DCT4. */
2350 q15_t normalize; /**< normalizing factor. */
2351 q15_t *pTwiddle; /**< points to the twiddle factor table. */
2352 q15_t *pCosFactor; /**< points to the cosFactor table. */
2353 arm_rfft_instance_q15 *pRfft; /**< points to the real FFT instance. */
2354 arm_cfft_radix4_instance_q15 *pCfft; /**< points to the complex FFT instance. */
2355 } arm_dct4_instance_q15;
2356
2357
2358 /**
2359 * @brief Initialization function for the Q15 DCT4/IDCT4.
2360 * @param[in,out] S points to an instance of Q15 DCT4/IDCT4 structure.
2361 * @param[in] S_RFFT points to an instance of Q15 RFFT/RIFFT structure.
2362 * @param[in] S_CFFT points to an instance of Q15 CFFT/CIFFT structure.
2363 * @param[in] N length of the DCT4.
2364 * @param[in] Nby2 half of the length of the DCT4.
2365 * @param[in] normalize normalizing factor.
2366 * @return arm_status function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_ARGUMENT_ERROR if <code>N</code> is not a supported transform length.
2367 */
2368 arm_status arm_dct4_init_q15(
2369 arm_dct4_instance_q15 * S,
2370 arm_rfft_instance_q15 * S_RFFT,
2371 arm_cfft_radix4_instance_q15 * S_CFFT,
2372 uint16_t N,
2373 uint16_t Nby2,
2374 q15_t normalize);
2375
2376
2377 /**
2378 * @brief Processing function for the Q15 DCT4/IDCT4.
2379 * @param[in] S points to an instance of the Q15 DCT4 structure.
2380 * @param[in] pState points to state buffer.
2381 * @param[in,out] pInlineBuffer points to the in-place input and output buffer.
2382 */
2383 void arm_dct4_q15(
2384 const arm_dct4_instance_q15 * S,
2385 q15_t * pState,
2386 q15_t * pInlineBuffer);
2387
2388
2389 /**
2390 * @brief Floating-point vector addition.
2391 * @param[in] pSrcA points to the first input vector
2392 * @param[in] pSrcB points to the second input vector
2393 * @param[out] pDst points to the output vector
2394 * @param[in] blockSize number of samples in each vector
2395 */
2396 void arm_add_f32(
2397 float32_t * pSrcA,
2398 float32_t * pSrcB,
2399 float32_t * pDst,
2400 uint32_t blockSize);
2401
2402
2403 /**
2404 * @brief Q7 vector addition.
2405 * @param[in] pSrcA points to the first input vector
2406 * @param[in] pSrcB points to the second input vector
2407 * @param[out] pDst points to the output vector
2408 * @param[in] blockSize number of samples in each vector
2409 */
2410 void arm_add_q7(
2411 q7_t * pSrcA,
2412 q7_t * pSrcB,
2413 q7_t * pDst,
2414 uint32_t blockSize);
2415
2416
2417 /**
2418 * @brief Q15 vector addition.
2419 * @param[in] pSrcA points to the first input vector
2420 * @param[in] pSrcB points to the second input vector
2421 * @param[out] pDst points to the output vector
2422 * @param[in] blockSize number of samples in each vector
2423 */
2424 void arm_add_q15(
2425 q15_t * pSrcA,
2426 q15_t * pSrcB,
2427 q15_t * pDst,
2428 uint32_t blockSize);
2429
2430
2431 /**
2432 * @brief Q31 vector addition.
2433 * @param[in] pSrcA points to the first input vector
2434 * @param[in] pSrcB points to the second input vector
2435 * @param[out] pDst points to the output vector
2436 * @param[in] blockSize number of samples in each vector
2437 */
2438 void arm_add_q31(
2439 q31_t * pSrcA,
2440 q31_t * pSrcB,
2441 q31_t * pDst,
2442 uint32_t blockSize);
2443
2444
2445 /**
2446 * @brief Floating-point vector subtraction.
2447 * @param[in] pSrcA points to the first input vector
2448 * @param[in] pSrcB points to the second input vector
2449 * @param[out] pDst points to the output vector
2450 * @param[in] blockSize number of samples in each vector
2451 */
2452 void arm_sub_f32(
2453 float32_t * pSrcA,
2454 float32_t * pSrcB,
2455 float32_t * pDst,
2456 uint32_t blockSize);
2457
2458
2459 /**
2460 * @brief Q7 vector subtraction.
2461 * @param[in] pSrcA points to the first input vector
2462 * @param[in] pSrcB points to the second input vector
2463 * @param[out] pDst points to the output vector
2464 * @param[in] blockSize number of samples in each vector
2465 */
2466 void arm_sub_q7(
2467 q7_t * pSrcA,
2468 q7_t * pSrcB,
2469 q7_t * pDst,
2470 uint32_t blockSize);
2471
2472
2473 /**
2474 * @brief Q15 vector subtraction.
2475 * @param[in] pSrcA points to the first input vector
2476 * @param[in] pSrcB points to the second input vector
2477 * @param[out] pDst points to the output vector
2478 * @param[in] blockSize number of samples in each vector
2479 */
2480 void arm_sub_q15(
2481 q15_t * pSrcA,
2482 q15_t * pSrcB,
2483 q15_t * pDst,
2484 uint32_t blockSize);
2485
2486
2487 /**
2488 * @brief Q31 vector subtraction.
2489 * @param[in] pSrcA points to the first input vector
2490 * @param[in] pSrcB points to the second input vector
2491 * @param[out] pDst points to the output vector
2492 * @param[in] blockSize number of samples in each vector
2493 */
2494 void arm_sub_q31(
2495 q31_t * pSrcA,
2496 q31_t * pSrcB,
2497 q31_t * pDst,
2498 uint32_t blockSize);
2499
2500
2501 /**
2502 * @brief Multiplies a floating-point vector by a scalar.
2503 * @param[in] pSrc points to the input vector
2504 * @param[in] scale scale factor to be applied
2505 * @param[out] pDst points to the output vector
2506 * @param[in] blockSize number of samples in the vector
2507 */
2508 void arm_scale_f32(
2509 float32_t * pSrc,
2510 float32_t scale,
2511 float32_t * pDst,
2512 uint32_t blockSize);
2513
2514
2515 /**
2516 * @brief Multiplies a Q7 vector by a scalar.
2517 * @param[in] pSrc points to the input vector
2518 * @param[in] scaleFract fractional portion of the scale value
2519 * @param[in] shift number of bits to shift the result by
2520 * @param[out] pDst points to the output vector
2521 * @param[in] blockSize number of samples in the vector
2522 */
2523 void arm_scale_q7(
2524 q7_t * pSrc,
2525 q7_t scaleFract,
2526 int8_t shift,
2527 q7_t * pDst,
2528 uint32_t blockSize);
2529
2530
2531 /**
2532 * @brief Multiplies a Q15 vector by a scalar.
2533 * @param[in] pSrc points to the input vector
2534 * @param[in] scaleFract fractional portion of the scale value
2535 * @param[in] shift number of bits to shift the result by
2536 * @param[out] pDst points to the output vector
2537 * @param[in] blockSize number of samples in the vector
2538 */
2539 void arm_scale_q15(
2540 q15_t * pSrc,
2541 q15_t scaleFract,
2542 int8_t shift,
2543 q15_t * pDst,
2544 uint32_t blockSize);
2545
2546
2547 /**
2548 * @brief Multiplies a Q31 vector by a scalar.
2549 * @param[in] pSrc points to the input vector
2550 * @param[in] scaleFract fractional portion of the scale value
2551 * @param[in] shift number of bits to shift the result by
2552 * @param[out] pDst points to the output vector
2553 * @param[in] blockSize number of samples in the vector
2554 */
2555 void arm_scale_q31(
2556 q31_t * pSrc,
2557 q31_t scaleFract,
2558 int8_t shift,
2559 q31_t * pDst,
2560 uint32_t blockSize);
2561
2562
2563 /**
2564 * @brief Q7 vector absolute value.
2565 * @param[in] pSrc points to the input buffer
2566 * @param[out] pDst points to the output buffer
2567 * @param[in] blockSize number of samples in each vector
2568 */
2569 void arm_abs_q7(
2570 q7_t * pSrc,
2571 q7_t * pDst,
2572 uint32_t blockSize);
2573
2574
2575 /**
2576 * @brief Floating-point vector absolute value.
2577 * @param[in] pSrc points to the input buffer
2578 * @param[out] pDst points to the output buffer
2579 * @param[in] blockSize number of samples in each vector
2580 */
2581 void arm_abs_f32(
2582 float32_t * pSrc,
2583 float32_t * pDst,
2584 uint32_t blockSize);
2585
2586
2587 /**
2588 * @brief Q15 vector absolute value.
2589 * @param[in] pSrc points to the input buffer
2590 * @param[out] pDst points to the output buffer
2591 * @param[in] blockSize number of samples in each vector
2592 */
2593 void arm_abs_q15(
2594 q15_t * pSrc,
2595 q15_t * pDst,
2596 uint32_t blockSize);
2597
2598
2599 /**
2600 * @brief Q31 vector absolute value.
2601 * @param[in] pSrc points to the input buffer
2602 * @param[out] pDst points to the output buffer
2603 * @param[in] blockSize number of samples in each vector
2604 */
2605 void arm_abs_q31(
2606 q31_t * pSrc,
2607 q31_t * pDst,
2608 uint32_t blockSize);
2609
2610
2611 /**
2612 * @brief Dot product of floating-point vectors.
2613 * @param[in] pSrcA points to the first input vector
2614 * @param[in] pSrcB points to the second input vector
2615 * @param[in] blockSize number of samples in each vector
2616 * @param[out] result output result returned here
2617 */
2618 void arm_dot_prod_f32(
2619 float32_t * pSrcA,
2620 float32_t * pSrcB,
2621 uint32_t blockSize,
2622 float32_t * result);
2623
2624
2625 /**
2626 * @brief Dot product of Q7 vectors.
2627 * @param[in] pSrcA points to the first input vector
2628 * @param[in] pSrcB points to the second input vector
2629 * @param[in] blockSize number of samples in each vector
2630 * @param[out] result output result returned here
2631 */
2632 void arm_dot_prod_q7(
2633 q7_t * pSrcA,
2634 q7_t * pSrcB,
2635 uint32_t blockSize,
2636 q31_t * result);
2637
2638
2639 /**
2640 * @brief Dot product of Q15 vectors.
2641 * @param[in] pSrcA points to the first input vector
2642 * @param[in] pSrcB points to the second input vector
2643 * @param[in] blockSize number of samples in each vector
2644 * @param[out] result output result returned here
2645 */
2646 void arm_dot_prod_q15(
2647 q15_t * pSrcA,
2648 q15_t * pSrcB,
2649 uint32_t blockSize,
2650 q63_t * result);
2651
2652
2653 /**
2654 * @brief Dot product of Q31 vectors.
2655 * @param[in] pSrcA points to the first input vector
2656 * @param[in] pSrcB points to the second input vector
2657 * @param[in] blockSize number of samples in each vector
2658 * @param[out] result output result returned here
2659 */
2660 void arm_dot_prod_q31(
2661 q31_t * pSrcA,
2662 q31_t * pSrcB,
2663 uint32_t blockSize,
2664 q63_t * result);
2665
2666
2667 /**
2668 * @brief Shifts the elements of a Q7 vector a specified number of bits.
2669 * @param[in] pSrc points to the input vector
2670 * @param[in] shiftBits number of bits to shift. A positive value shifts left; a negative value shifts right.
2671 * @param[out] pDst points to the output vector
2672 * @param[in] blockSize number of samples in the vector
2673 */
2674 void arm_shift_q7(
2675 q7_t * pSrc,
2676 int8_t shiftBits,
2677 q7_t * pDst,
2678 uint32_t blockSize);
2679
2680
2681 /**
2682 * @brief Shifts the elements of a Q15 vector a specified number of bits.
2683 * @param[in] pSrc points to the input vector
2684 * @param[in] shiftBits number of bits to shift. A positive value shifts left; a negative value shifts right.
2685 * @param[out] pDst points to the output vector
2686 * @param[in] blockSize number of samples in the vector
2687 */
2688 void arm_shift_q15(
2689 q15_t * pSrc,
2690 int8_t shiftBits,
2691 q15_t * pDst,
2692 uint32_t blockSize);
2693
2694
2695 /**
2696 * @brief Shifts the elements of a Q31 vector a specified number of bits.
2697 * @param[in] pSrc points to the input vector
2698 * @param[in] shiftBits number of bits to shift. A positive value shifts left; a negative value shifts right.
2699 * @param[out] pDst points to the output vector
2700 * @param[in] blockSize number of samples in the vector
2701 */
2702 void arm_shift_q31(
2703 q31_t * pSrc,
2704 int8_t shiftBits,
2705 q31_t * pDst,
2706 uint32_t blockSize);
2707
2708
2709 /**
2710 * @brief Adds a constant offset to a floating-point vector.
2711 * @param[in] pSrc points to the input vector
2712 * @param[in] offset is the offset to be added
2713 * @param[out] pDst points to the output vector
2714 * @param[in] blockSize number of samples in the vector
2715 */
2716 void arm_offset_f32(
2717 float32_t * pSrc,
2718 float32_t offset,
2719 float32_t * pDst,
2720 uint32_t blockSize);
2721
2722
2723 /**
2724 * @brief Adds a constant offset to a Q7 vector.
2725 * @param[in] pSrc points to the input vector
2726 * @param[in] offset is the offset to be added
2727 * @param[out] pDst points to the output vector
2728 * @param[in] blockSize number of samples in the vector
2729 */
2730 void arm_offset_q7(
2731 q7_t * pSrc,
2732 q7_t offset,
2733 q7_t * pDst,
2734 uint32_t blockSize);
2735
2736
2737 /**
2738 * @brief Adds a constant offset to a Q15 vector.
2739 * @param[in] pSrc points to the input vector
2740 * @param[in] offset is the offset to be added
2741 * @param[out] pDst points to the output vector
2742 * @param[in] blockSize number of samples in the vector
2743 */
2744 void arm_offset_q15(
2745 q15_t * pSrc,
2746 q15_t offset,
2747 q15_t * pDst,
2748 uint32_t blockSize);
2749
2750
2751 /**
2752 * @brief Adds a constant offset to a Q31 vector.
2753 * @param[in] pSrc points to the input vector
2754 * @param[in] offset is the offset to be added
2755 * @param[out] pDst points to the output vector
2756 * @param[in] blockSize number of samples in the vector
2757 */
2758 void arm_offset_q31(
2759 q31_t * pSrc,
2760 q31_t offset,
2761 q31_t * pDst,
2762 uint32_t blockSize);
2763
2764
2765 /**
2766 * @brief Negates the elements of a floating-point vector.
2767 * @param[in] pSrc points to the input vector
2768 * @param[out] pDst points to the output vector
2769 * @param[in] blockSize number of samples in the vector
2770 */
2771 void arm_negate_f32(
2772 float32_t * pSrc,
2773 float32_t * pDst,
2774 uint32_t blockSize);
2775
2776
2777 /**
2778 * @brief Negates the elements of a Q7 vector.
2779 * @param[in] pSrc points to the input vector
2780 * @param[out] pDst points to the output vector
2781 * @param[in] blockSize number of samples in the vector
2782 */
2783 void arm_negate_q7(
2784 q7_t * pSrc,
2785 q7_t * pDst,
2786 uint32_t blockSize);
2787
2788
2789 /**
2790 * @brief Negates the elements of a Q15 vector.
2791 * @param[in] pSrc points to the input vector
2792 * @param[out] pDst points to the output vector
2793 * @param[in] blockSize number of samples in the vector
2794 */
2795 void arm_negate_q15(
2796 q15_t * pSrc,
2797 q15_t * pDst,
2798 uint32_t blockSize);
2799
2800
2801 /**
2802 * @brief Negates the elements of a Q31 vector.
2803 * @param[in] pSrc points to the input vector
2804 * @param[out] pDst points to the output vector
2805 * @param[in] blockSize number of samples in the vector
2806 */
2807 void arm_negate_q31(
2808 q31_t * pSrc,
2809 q31_t * pDst,
2810 uint32_t blockSize);
2811
2812
2813 /**
2814 * @brief Copies the elements of a floating-point vector.
2815 * @param[in] pSrc input pointer
2816 * @param[out] pDst output pointer
2817 * @param[in] blockSize number of samples to process
2818 */
2819 void arm_copy_f32(
2820 float32_t * pSrc,
2821 float32_t * pDst,
2822 uint32_t blockSize);
2823
2824
2825 /**
2826 * @brief Copies the elements of a Q7 vector.
2827 * @param[in] pSrc input pointer
2828 * @param[out] pDst output pointer
2829 * @param[in] blockSize number of samples to process
2830 */
2831 void arm_copy_q7(
2832 q7_t * pSrc,
2833 q7_t * pDst,
2834 uint32_t blockSize);
2835
2836
2837 /**
2838 * @brief Copies the elements of a Q15 vector.
2839 * @param[in] pSrc input pointer
2840 * @param[out] pDst output pointer
2841 * @param[in] blockSize number of samples to process
2842 */
2843 void arm_copy_q15(
2844 q15_t * pSrc,
2845 q15_t * pDst,
2846 uint32_t blockSize);
2847
2848
2849 /**
2850 * @brief Copies the elements of a Q31 vector.
2851 * @param[in] pSrc input pointer
2852 * @param[out] pDst output pointer
2853 * @param[in] blockSize number of samples to process
2854 */
2855 void arm_copy_q31(
2856 q31_t * pSrc,
2857 q31_t * pDst,
2858 uint32_t blockSize);
2859
2860
2861 /**
2862 * @brief Fills a constant value into a floating-point vector.
2863 * @param[in] value input value to be filled
2864 * @param[out] pDst output pointer
2865 * @param[in] blockSize number of samples to process
2866 */
2867 void arm_fill_f32(
2868 float32_t value,
2869 float32_t * pDst,
2870 uint32_t blockSize);
2871
2872
2873 /**
2874 * @brief Fills a constant value into a Q7 vector.
2875 * @param[in] value input value to be filled
2876 * @param[out] pDst output pointer
2877 * @param[in] blockSize number of samples to process
2878 */
2879 void arm_fill_q7(
2880 q7_t value,
2881 q7_t * pDst,
2882 uint32_t blockSize);
2883
2884
2885 /**
2886 * @brief Fills a constant value into a Q15 vector.
2887 * @param[in] value input value to be filled
2888 * @param[out] pDst output pointer
2889 * @param[in] blockSize number of samples to process
2890 */
2891 void arm_fill_q15(
2892 q15_t value,
2893 q15_t * pDst,
2894 uint32_t blockSize);
2895
2896
2897 /**
2898 * @brief Fills a constant value into a Q31 vector.
2899 * @param[in] value input value to be filled
2900 * @param[out] pDst output pointer
2901 * @param[in] blockSize number of samples to process
2902 */
2903 void arm_fill_q31(
2904 q31_t value,
2905 q31_t * pDst,
2906 uint32_t blockSize);
2907
2908
2909 /**
2910 * @brief Convolution of floating-point sequences.
2911 * @param[in] pSrcA points to the first input sequence.
2912 * @param[in] srcALen length of the first input sequence.
2913 * @param[in] pSrcB points to the second input sequence.
2914 * @param[in] srcBLen length of the second input sequence.
2915 * @param[out] pDst points to the location where the output result is written. Length srcALen+srcBLen-1.
2916 */
2917 void arm_conv_f32(
2918 float32_t * pSrcA,
2919 uint32_t srcALen,
2920 float32_t * pSrcB,
2921 uint32_t srcBLen,
2922 float32_t * pDst);
2923
2924
2925 /**
2926 * @brief Convolution of Q15 sequences.
2927 * @param[in] pSrcA points to the first input sequence.
2928 * @param[in] srcALen length of the first input sequence.
2929 * @param[in] pSrcB points to the second input sequence.
2930 * @param[in] srcBLen length of the second input sequence.
2931 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
2932 * @param[in] pScratch1 points to scratch buffer of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
2933 * @param[in] pScratch2 points to scratch buffer of size min(srcALen, srcBLen).
2934 */
2935 void arm_conv_opt_q15(
2936 q15_t * pSrcA,
2937 uint32_t srcALen,
2938 q15_t * pSrcB,
2939 uint32_t srcBLen,
2940 q15_t * pDst,
2941 q15_t * pScratch1,
2942 q15_t * pScratch2);
2943
2944
2945 /**
2946 * @brief Convolution of Q15 sequences.
2947 * @param[in] pSrcA points to the first input sequence.
2948 * @param[in] srcALen length of the first input sequence.
2949 * @param[in] pSrcB points to the second input sequence.
2950 * @param[in] srcBLen length of the second input sequence.
2951 * @param[out] pDst points to the location where the output result is written. Length srcALen+srcBLen-1.
2952 */
2953 void arm_conv_q15(
2954 q15_t * pSrcA,
2955 uint32_t srcALen,
2956 q15_t * pSrcB,
2957 uint32_t srcBLen,
2958 q15_t * pDst);
2959
2960
2961 /**
2962 * @brief Convolution of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4
2963 * @param[in] pSrcA points to the first input sequence.
2964 * @param[in] srcALen length of the first input sequence.
2965 * @param[in] pSrcB points to the second input sequence.
2966 * @param[in] srcBLen length of the second input sequence.
2967 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
2968 */
2969 void arm_conv_fast_q15(
2970 q15_t * pSrcA,
2971 uint32_t srcALen,
2972 q15_t * pSrcB,
2973 uint32_t srcBLen,
2974 q15_t * pDst);
2975
2976
2977 /**
2978 * @brief Convolution of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4
2979 * @param[in] pSrcA points to the first input sequence.
2980 * @param[in] srcALen length of the first input sequence.
2981 * @param[in] pSrcB points to the second input sequence.
2982 * @param[in] srcBLen length of the second input sequence.
2983 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
2984 * @param[in] pScratch1 points to scratch buffer of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
2985 * @param[in] pScratch2 points to scratch buffer of size min(srcALen, srcBLen).
2986 */
2987 void arm_conv_fast_opt_q15(
2988 q15_t * pSrcA,
2989 uint32_t srcALen,
2990 q15_t * pSrcB,
2991 uint32_t srcBLen,
2992 q15_t * pDst,
2993 q15_t * pScratch1,
2994 q15_t * pScratch2);
2995
2996
2997 /**
2998 * @brief Convolution of Q31 sequences.
2999 * @param[in] pSrcA points to the first input sequence.
3000 * @param[in] srcALen length of the first input sequence.
3001 * @param[in] pSrcB points to the second input sequence.
3002 * @param[in] srcBLen length of the second input sequence.
3003 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
3004 */
3005 void arm_conv_q31(
3006 q31_t * pSrcA,
3007 uint32_t srcALen,
3008 q31_t * pSrcB,
3009 uint32_t srcBLen,
3010 q31_t * pDst);
3011
3012
3013 /**
3014 * @brief Convolution of Q31 sequences (fast version) for Cortex-M3 and Cortex-M4
3015 * @param[in] pSrcA points to the first input sequence.
3016 * @param[in] srcALen length of the first input sequence.
3017 * @param[in] pSrcB points to the second input sequence.
3018 * @param[in] srcBLen length of the second input sequence.
3019 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
3020 */
3021 void arm_conv_fast_q31(
3022 q31_t * pSrcA,
3023 uint32_t srcALen,
3024 q31_t * pSrcB,
3025 uint32_t srcBLen,
3026 q31_t * pDst);
3027
3028
3029 /**
3030 * @brief Convolution of Q7 sequences.
3031 * @param[in] pSrcA points to the first input sequence.
3032 * @param[in] srcALen length of the first input sequence.
3033 * @param[in] pSrcB points to the second input sequence.
3034 * @param[in] srcBLen length of the second input sequence.
3035 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
3036 * @param[in] pScratch1 points to scratch buffer(of type q15_t) of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
3037 * @param[in] pScratch2 points to scratch buffer (of type q15_t) of size min(srcALen, srcBLen).
3038 */
3039 void arm_conv_opt_q7(
3040 q7_t * pSrcA,
3041 uint32_t srcALen,
3042 q7_t * pSrcB,
3043 uint32_t srcBLen,
3044 q7_t * pDst,
3045 q15_t * pScratch1,
3046 q15_t * pScratch2);
3047
3048
3049 /**
3050 * @brief Convolution of Q7 sequences.
3051 * @param[in] pSrcA points to the first input sequence.
3052 * @param[in] srcALen length of the first input sequence.
3053 * @param[in] pSrcB points to the second input sequence.
3054 * @param[in] srcBLen length of the second input sequence.
3055 * @param[out] pDst points to the block of output data Length srcALen+srcBLen-1.
3056 */
3057 void arm_conv_q7(
3058 q7_t * pSrcA,
3059 uint32_t srcALen,
3060 q7_t * pSrcB,
3061 uint32_t srcBLen,
3062 q7_t * pDst);
3063
3064
3065 /**
3066 * @brief Partial convolution of floating-point sequences.
3067 * @param[in] pSrcA points to the first input sequence.
3068 * @param[in] srcALen length of the first input sequence.
3069 * @param[in] pSrcB points to the second input sequence.
3070 * @param[in] srcBLen length of the second input sequence.
3071 * @param[out] pDst points to the block of output data
3072 * @param[in] firstIndex is the first output sample to start with.
3073 * @param[in] numPoints is the number of output points to be computed.
3074 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3075 */
3076 arm_status arm_conv_partial_f32(
3077 float32_t * pSrcA,
3078 uint32_t srcALen,
3079 float32_t * pSrcB,
3080 uint32_t srcBLen,
3081 float32_t * pDst,
3082 uint32_t firstIndex,
3083 uint32_t numPoints);
3084
3085
3086 /**
3087 * @brief Partial convolution of Q15 sequences.
3088 * @param[in] pSrcA points to the first input sequence.
3089 * @param[in] srcALen length of the first input sequence.
3090 * @param[in] pSrcB points to the second input sequence.
3091 * @param[in] srcBLen length of the second input sequence.
3092 * @param[out] pDst points to the block of output data
3093 * @param[in] firstIndex is the first output sample to start with.
3094 * @param[in] numPoints is the number of output points to be computed.
3095 * @param[in] pScratch1 points to scratch buffer of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
3096 * @param[in] pScratch2 points to scratch buffer of size min(srcALen, srcBLen).
3097 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3098 */
3099 arm_status arm_conv_partial_opt_q15(
3100 q15_t * pSrcA,
3101 uint32_t srcALen,
3102 q15_t * pSrcB,
3103 uint32_t srcBLen,
3104 q15_t * pDst,
3105 uint32_t firstIndex,
3106 uint32_t numPoints,
3107 q15_t * pScratch1,
3108 q15_t * pScratch2);
3109
3110
3111 /**
3112 * @brief Partial convolution of Q15 sequences.
3113 * @param[in] pSrcA points to the first input sequence.
3114 * @param[in] srcALen length of the first input sequence.
3115 * @param[in] pSrcB points to the second input sequence.
3116 * @param[in] srcBLen length of the second input sequence.
3117 * @param[out] pDst points to the block of output data
3118 * @param[in] firstIndex is the first output sample to start with.
3119 * @param[in] numPoints is the number of output points to be computed.
3120 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3121 */
3122 arm_status arm_conv_partial_q15(
3123 q15_t * pSrcA,
3124 uint32_t srcALen,
3125 q15_t * pSrcB,
3126 uint32_t srcBLen,
3127 q15_t * pDst,
3128 uint32_t firstIndex,
3129 uint32_t numPoints);
3130
3131
3132 /**
3133 * @brief Partial convolution of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4
3134 * @param[in] pSrcA points to the first input sequence.
3135 * @param[in] srcALen length of the first input sequence.
3136 * @param[in] pSrcB points to the second input sequence.
3137 * @param[in] srcBLen length of the second input sequence.
3138 * @param[out] pDst points to the block of output data
3139 * @param[in] firstIndex is the first output sample to start with.
3140 * @param[in] numPoints is the number of output points to be computed.
3141 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3142 */
3143 arm_status arm_conv_partial_fast_q15(
3144 q15_t * pSrcA,
3145 uint32_t srcALen,
3146 q15_t * pSrcB,
3147 uint32_t srcBLen,
3148 q15_t * pDst,
3149 uint32_t firstIndex,
3150 uint32_t numPoints);
3151
3152
3153 /**
3154 * @brief Partial convolution of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4
3155 * @param[in] pSrcA points to the first input sequence.
3156 * @param[in] srcALen length of the first input sequence.
3157 * @param[in] pSrcB points to the second input sequence.
3158 * @param[in] srcBLen length of the second input sequence.
3159 * @param[out] pDst points to the block of output data
3160 * @param[in] firstIndex is the first output sample to start with.
3161 * @param[in] numPoints is the number of output points to be computed.
3162 * @param[in] pScratch1 points to scratch buffer of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
3163 * @param[in] pScratch2 points to scratch buffer of size min(srcALen, srcBLen).
3164 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3165 */
3166 arm_status arm_conv_partial_fast_opt_q15(
3167 q15_t * pSrcA,
3168 uint32_t srcALen,
3169 q15_t * pSrcB,
3170 uint32_t srcBLen,
3171 q15_t * pDst,
3172 uint32_t firstIndex,
3173 uint32_t numPoints,
3174 q15_t * pScratch1,
3175 q15_t * pScratch2);
3176
3177
3178 /**
3179 * @brief Partial convolution of Q31 sequences.
3180 * @param[in] pSrcA points to the first input sequence.
3181 * @param[in] srcALen length of the first input sequence.
3182 * @param[in] pSrcB points to the second input sequence.
3183 * @param[in] srcBLen length of the second input sequence.
3184 * @param[out] pDst points to the block of output data
3185 * @param[in] firstIndex is the first output sample to start with.
3186 * @param[in] numPoints is the number of output points to be computed.
3187 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3188 */
3189 arm_status arm_conv_partial_q31(
3190 q31_t * pSrcA,
3191 uint32_t srcALen,
3192 q31_t * pSrcB,
3193 uint32_t srcBLen,
3194 q31_t * pDst,
3195 uint32_t firstIndex,
3196 uint32_t numPoints);
3197
3198
3199 /**
3200 * @brief Partial convolution of Q31 sequences (fast version) for Cortex-M3 and Cortex-M4
3201 * @param[in] pSrcA points to the first input sequence.
3202 * @param[in] srcALen length of the first input sequence.
3203 * @param[in] pSrcB points to the second input sequence.
3204 * @param[in] srcBLen length of the second input sequence.
3205 * @param[out] pDst points to the block of output data
3206 * @param[in] firstIndex is the first output sample to start with.
3207 * @param[in] numPoints is the number of output points to be computed.
3208 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3209 */
3210 arm_status arm_conv_partial_fast_q31(
3211 q31_t * pSrcA,
3212 uint32_t srcALen,
3213 q31_t * pSrcB,
3214 uint32_t srcBLen,
3215 q31_t * pDst,
3216 uint32_t firstIndex,
3217 uint32_t numPoints);
3218
3219
3220 /**
3221 * @brief Partial convolution of Q7 sequences
3222 * @param[in] pSrcA points to the first input sequence.
3223 * @param[in] srcALen length of the first input sequence.
3224 * @param[in] pSrcB points to the second input sequence.
3225 * @param[in] srcBLen length of the second input sequence.
3226 * @param[out] pDst points to the block of output data
3227 * @param[in] firstIndex is the first output sample to start with.
3228 * @param[in] numPoints is the number of output points to be computed.
3229 * @param[in] pScratch1 points to scratch buffer(of type q15_t) of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
3230 * @param[in] pScratch2 points to scratch buffer (of type q15_t) of size min(srcALen, srcBLen).
3231 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3232 */
3233 arm_status arm_conv_partial_opt_q7(
3234 q7_t * pSrcA,
3235 uint32_t srcALen,
3236 q7_t * pSrcB,
3237 uint32_t srcBLen,
3238 q7_t * pDst,
3239 uint32_t firstIndex,
3240 uint32_t numPoints,
3241 q15_t * pScratch1,
3242 q15_t * pScratch2);
3243
3244
3245 /**
3246 * @brief Partial convolution of Q7 sequences.
3247 * @param[in] pSrcA points to the first input sequence.
3248 * @param[in] srcALen length of the first input sequence.
3249 * @param[in] pSrcB points to the second input sequence.
3250 * @param[in] srcBLen length of the second input sequence.
3251 * @param[out] pDst points to the block of output data
3252 * @param[in] firstIndex is the first output sample to start with.
3253 * @param[in] numPoints is the number of output points to be computed.
3254 * @return Returns either ARM_MATH_SUCCESS if the function completed correctly or ARM_MATH_ARGUMENT_ERROR if the requested subset is not in the range [0 srcALen+srcBLen-2].
3255 */
3256 arm_status arm_conv_partial_q7(
3257 q7_t * pSrcA,
3258 uint32_t srcALen,
3259 q7_t * pSrcB,
3260 uint32_t srcBLen,
3261 q7_t * pDst,
3262 uint32_t firstIndex,
3263 uint32_t numPoints);
3264
3265
3266 /**
3267 * @brief Instance structure for the Q15 FIR decimator.
3268 */
3269 typedef struct
3270 {
3271 uint8_t M; /**< decimation factor. */
3272 uint16_t numTaps; /**< number of coefficients in the filter. */
3273 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
3274 q15_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
3275 } arm_fir_decimate_instance_q15;
3276
3277 /**
3278 * @brief Instance structure for the Q31 FIR decimator.
3279 */
3280 typedef struct
3281 {
3282 uint8_t M; /**< decimation factor. */
3283 uint16_t numTaps; /**< number of coefficients in the filter. */
3284 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
3285 q31_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
3286 } arm_fir_decimate_instance_q31;
3287
3288 /**
3289 * @brief Instance structure for the floating-point FIR decimator.
3290 */
3291 typedef struct
3292 {
3293 uint8_t M; /**< decimation factor. */
3294 uint16_t numTaps; /**< number of coefficients in the filter. */
3295 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
3296 float32_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
3297 } arm_fir_decimate_instance_f32;
3298
3299
3300 /**
3301 * @brief Processing function for the floating-point FIR decimator.
3302 * @param[in] S points to an instance of the floating-point FIR decimator structure.
3303 * @param[in] pSrc points to the block of input data.
3304 * @param[out] pDst points to the block of output data
3305 * @param[in] blockSize number of input samples to process per call.
3306 */
3307 void arm_fir_decimate_f32(
3308 const arm_fir_decimate_instance_f32 * S,
3309 float32_t * pSrc,
3310 float32_t * pDst,
3311 uint32_t blockSize);
3312
3313
3314 /**
3315 * @brief Initialization function for the floating-point FIR decimator.
3316 * @param[in,out] S points to an instance of the floating-point FIR decimator structure.
3317 * @param[in] numTaps number of coefficients in the filter.
3318 * @param[in] M decimation factor.
3319 * @param[in] pCoeffs points to the filter coefficients.
3320 * @param[in] pState points to the state buffer.
3321 * @param[in] blockSize number of input samples to process per call.
3322 * @return The function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_LENGTH_ERROR if
3323 * <code>blockSize</code> is not a multiple of <code>M</code>.
3324 */
3325 arm_status arm_fir_decimate_init_f32(
3326 arm_fir_decimate_instance_f32 * S,
3327 uint16_t numTaps,
3328 uint8_t M,
3329 float32_t * pCoeffs,
3330 float32_t * pState,
3331 uint32_t blockSize);
3332
3333
3334 /**
3335 * @brief Processing function for the Q15 FIR decimator.
3336 * @param[in] S points to an instance of the Q15 FIR decimator structure.
3337 * @param[in] pSrc points to the block of input data.
3338 * @param[out] pDst points to the block of output data
3339 * @param[in] blockSize number of input samples to process per call.
3340 */
3341 void arm_fir_decimate_q15(
3342 const arm_fir_decimate_instance_q15 * S,
3343 q15_t * pSrc,
3344 q15_t * pDst,
3345 uint32_t blockSize);
3346
3347
3348 /**
3349 * @brief Processing function for the Q15 FIR decimator (fast variant) for Cortex-M3 and Cortex-M4.
3350 * @param[in] S points to an instance of the Q15 FIR decimator structure.
3351 * @param[in] pSrc points to the block of input data.
3352 * @param[out] pDst points to the block of output data
3353 * @param[in] blockSize number of input samples to process per call.
3354 */
3355 void arm_fir_decimate_fast_q15(
3356 const arm_fir_decimate_instance_q15 * S,
3357 q15_t * pSrc,
3358 q15_t * pDst,
3359 uint32_t blockSize);
3360
3361
3362 /**
3363 * @brief Initialization function for the Q15 FIR decimator.
3364 * @param[in,out] S points to an instance of the Q15 FIR decimator structure.
3365 * @param[in] numTaps number of coefficients in the filter.
3366 * @param[in] M decimation factor.
3367 * @param[in] pCoeffs points to the filter coefficients.
3368 * @param[in] pState points to the state buffer.
3369 * @param[in] blockSize number of input samples to process per call.
3370 * @return The function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_LENGTH_ERROR if
3371 * <code>blockSize</code> is not a multiple of <code>M</code>.
3372 */
3373 arm_status arm_fir_decimate_init_q15(
3374 arm_fir_decimate_instance_q15 * S,
3375 uint16_t numTaps,
3376 uint8_t M,
3377 q15_t * pCoeffs,
3378 q15_t * pState,
3379 uint32_t blockSize);
3380
3381
3382 /**
3383 * @brief Processing function for the Q31 FIR decimator.
3384 * @param[in] S points to an instance of the Q31 FIR decimator structure.
3385 * @param[in] pSrc points to the block of input data.
3386 * @param[out] pDst points to the block of output data
3387 * @param[in] blockSize number of input samples to process per call.
3388 */
3389 void arm_fir_decimate_q31(
3390 const arm_fir_decimate_instance_q31 * S,
3391 q31_t * pSrc,
3392 q31_t * pDst,
3393 uint32_t blockSize);
3394
3395 /**
3396 * @brief Processing function for the Q31 FIR decimator (fast variant) for Cortex-M3 and Cortex-M4.
3397 * @param[in] S points to an instance of the Q31 FIR decimator structure.
3398 * @param[in] pSrc points to the block of input data.
3399 * @param[out] pDst points to the block of output data
3400 * @param[in] blockSize number of input samples to process per call.
3401 */
3402 void arm_fir_decimate_fast_q31(
3403 arm_fir_decimate_instance_q31 * S,
3404 q31_t * pSrc,
3405 q31_t * pDst,
3406 uint32_t blockSize);
3407
3408
3409 /**
3410 * @brief Initialization function for the Q31 FIR decimator.
3411 * @param[in,out] S points to an instance of the Q31 FIR decimator structure.
3412 * @param[in] numTaps number of coefficients in the filter.
3413 * @param[in] M decimation factor.
3414 * @param[in] pCoeffs points to the filter coefficients.
3415 * @param[in] pState points to the state buffer.
3416 * @param[in] blockSize number of input samples to process per call.
3417 * @return The function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_LENGTH_ERROR if
3418 * <code>blockSize</code> is not a multiple of <code>M</code>.
3419 */
3420 arm_status arm_fir_decimate_init_q31(
3421 arm_fir_decimate_instance_q31 * S,
3422 uint16_t numTaps,
3423 uint8_t M,
3424 q31_t * pCoeffs,
3425 q31_t * pState,
3426 uint32_t blockSize);
3427
3428
3429 /**
3430 * @brief Instance structure for the Q15 FIR interpolator.
3431 */
3432 typedef struct
3433 {
3434 uint8_t L; /**< upsample factor. */
3435 uint16_t phaseLength; /**< length of each polyphase filter component. */
3436 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length L*phaseLength. */
3437 q15_t *pState; /**< points to the state variable array. The array is of length blockSize+phaseLength-1. */
3438 } arm_fir_interpolate_instance_q15;
3439
3440 /**
3441 * @brief Instance structure for the Q31 FIR interpolator.
3442 */
3443 typedef struct
3444 {
3445 uint8_t L; /**< upsample factor. */
3446 uint16_t phaseLength; /**< length of each polyphase filter component. */
3447 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length L*phaseLength. */
3448 q31_t *pState; /**< points to the state variable array. The array is of length blockSize+phaseLength-1. */
3449 } arm_fir_interpolate_instance_q31;
3450
3451 /**
3452 * @brief Instance structure for the floating-point FIR interpolator.
3453 */
3454 typedef struct
3455 {
3456 uint8_t L; /**< upsample factor. */
3457 uint16_t phaseLength; /**< length of each polyphase filter component. */
3458 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length L*phaseLength. */
3459 float32_t *pState; /**< points to the state variable array. The array is of length phaseLength+numTaps-1. */
3460 } arm_fir_interpolate_instance_f32;
3461
3462
3463 /**
3464 * @brief Processing function for the Q15 FIR interpolator.
3465 * @param[in] S points to an instance of the Q15 FIR interpolator structure.
3466 * @param[in] pSrc points to the block of input data.
3467 * @param[out] pDst points to the block of output data.
3468 * @param[in] blockSize number of input samples to process per call.
3469 */
3470 void arm_fir_interpolate_q15(
3471 const arm_fir_interpolate_instance_q15 * S,
3472 q15_t * pSrc,
3473 q15_t * pDst,
3474 uint32_t blockSize);
3475
3476
3477 /**
3478 * @brief Initialization function for the Q15 FIR interpolator.
3479 * @param[in,out] S points to an instance of the Q15 FIR interpolator structure.
3480 * @param[in] L upsample factor.
3481 * @param[in] numTaps number of filter coefficients in the filter.
3482 * @param[in] pCoeffs points to the filter coefficient buffer.
3483 * @param[in] pState points to the state buffer.
3484 * @param[in] blockSize number of input samples to process per call.
3485 * @return The function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_LENGTH_ERROR if
3486 * the filter length <code>numTaps</code> is not a multiple of the interpolation factor <code>L</code>.
3487 */
3488 arm_status arm_fir_interpolate_init_q15(
3489 arm_fir_interpolate_instance_q15 * S,
3490 uint8_t L,
3491 uint16_t numTaps,
3492 q15_t * pCoeffs,
3493 q15_t * pState,
3494 uint32_t blockSize);
3495
3496
3497 /**
3498 * @brief Processing function for the Q31 FIR interpolator.
3499 * @param[in] S points to an instance of the Q15 FIR interpolator structure.
3500 * @param[in] pSrc points to the block of input data.
3501 * @param[out] pDst points to the block of output data.
3502 * @param[in] blockSize number of input samples to process per call.
3503 */
3504 void arm_fir_interpolate_q31(
3505 const arm_fir_interpolate_instance_q31 * S,
3506 q31_t * pSrc,
3507 q31_t * pDst,
3508 uint32_t blockSize);
3509
3510
3511 /**
3512 * @brief Initialization function for the Q31 FIR interpolator.
3513 * @param[in,out] S points to an instance of the Q31 FIR interpolator structure.
3514 * @param[in] L upsample factor.
3515 * @param[in] numTaps number of filter coefficients in the filter.
3516 * @param[in] pCoeffs points to the filter coefficient buffer.
3517 * @param[in] pState points to the state buffer.
3518 * @param[in] blockSize number of input samples to process per call.
3519 * @return The function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_LENGTH_ERROR if
3520 * the filter length <code>numTaps</code> is not a multiple of the interpolation factor <code>L</code>.
3521 */
3522 arm_status arm_fir_interpolate_init_q31(
3523 arm_fir_interpolate_instance_q31 * S,
3524 uint8_t L,
3525 uint16_t numTaps,
3526 q31_t * pCoeffs,
3527 q31_t * pState,
3528 uint32_t blockSize);
3529
3530
3531 /**
3532 * @brief Processing function for the floating-point FIR interpolator.
3533 * @param[in] S points to an instance of the floating-point FIR interpolator structure.
3534 * @param[in] pSrc points to the block of input data.
3535 * @param[out] pDst points to the block of output data.
3536 * @param[in] blockSize number of input samples to process per call.
3537 */
3538 void arm_fir_interpolate_f32(
3539 const arm_fir_interpolate_instance_f32 * S,
3540 float32_t * pSrc,
3541 float32_t * pDst,
3542 uint32_t blockSize);
3543
3544
3545 /**
3546 * @brief Initialization function for the floating-point FIR interpolator.
3547 * @param[in,out] S points to an instance of the floating-point FIR interpolator structure.
3548 * @param[in] L upsample factor.
3549 * @param[in] numTaps number of filter coefficients in the filter.
3550 * @param[in] pCoeffs points to the filter coefficient buffer.
3551 * @param[in] pState points to the state buffer.
3552 * @param[in] blockSize number of input samples to process per call.
3553 * @return The function returns ARM_MATH_SUCCESS if initialization is successful or ARM_MATH_LENGTH_ERROR if
3554 * the filter length <code>numTaps</code> is not a multiple of the interpolation factor <code>L</code>.
3555 */
3556 arm_status arm_fir_interpolate_init_f32(
3557 arm_fir_interpolate_instance_f32 * S,
3558 uint8_t L,
3559 uint16_t numTaps,
3560 float32_t * pCoeffs,
3561 float32_t * pState,
3562 uint32_t blockSize);
3563
3564
3565 /**
3566 * @brief Instance structure for the high precision Q31 Biquad cascade filter.
3567 */
3568 typedef struct
3569 {
3570 uint8_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
3571 q63_t *pState; /**< points to the array of state coefficients. The array is of length 4*numStages. */
3572 q31_t *pCoeffs; /**< points to the array of coefficients. The array is of length 5*numStages. */
3573 uint8_t postShift; /**< additional shift, in bits, applied to each output sample. */
3574 } arm_biquad_cas_df1_32x64_ins_q31;
3575
3576
3577 /**
3578 * @param[in] S points to an instance of the high precision Q31 Biquad cascade filter structure.
3579 * @param[in] pSrc points to the block of input data.
3580 * @param[out] pDst points to the block of output data
3581 * @param[in] blockSize number of samples to process.
3582 */
3583 void arm_biquad_cas_df1_32x64_q31(
3584 const arm_biquad_cas_df1_32x64_ins_q31 * S,
3585 q31_t * pSrc,
3586 q31_t * pDst,
3587 uint32_t blockSize);
3588
3589
3590 /**
3591 * @param[in,out] S points to an instance of the high precision Q31 Biquad cascade filter structure.
3592 * @param[in] numStages number of 2nd order stages in the filter.
3593 * @param[in] pCoeffs points to the filter coefficients.
3594 * @param[in] pState points to the state buffer.
3595 * @param[in] postShift shift to be applied to the output. Varies according to the coefficients format
3596 */
3597 void arm_biquad_cas_df1_32x64_init_q31(
3598 arm_biquad_cas_df1_32x64_ins_q31 * S,
3599 uint8_t numStages,
3600 q31_t * pCoeffs,
3601 q63_t * pState,
3602 uint8_t postShift);
3603
3604
3605 /**
3606 * @brief Instance structure for the floating-point transposed direct form II Biquad cascade filter.
3607 */
3608 typedef struct
3609 {
3610 uint8_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
3611 float32_t *pState; /**< points to the array of state coefficients. The array is of length 2*numStages. */
3612 float32_t *pCoeffs; /**< points to the array of coefficients. The array is of length 5*numStages. */
3613 } arm_biquad_cascade_df2T_instance_f32;
3614
3615 /**
3616 * @brief Instance structure for the floating-point transposed direct form II Biquad cascade filter.
3617 */
3618 typedef struct
3619 {
3620 uint8_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
3621 float32_t *pState; /**< points to the array of state coefficients. The array is of length 4*numStages. */
3622 float32_t *pCoeffs; /**< points to the array of coefficients. The array is of length 5*numStages. */
3623 } arm_biquad_cascade_stereo_df2T_instance_f32;
3624
3625 /**
3626 * @brief Instance structure for the floating-point transposed direct form II Biquad cascade filter.
3627 */
3628 typedef struct
3629 {
3630 uint8_t numStages; /**< number of 2nd order stages in the filter. Overall order is 2*numStages. */
3631 float64_t *pState; /**< points to the array of state coefficients. The array is of length 2*numStages. */
3632 float64_t *pCoeffs; /**< points to the array of coefficients. The array is of length 5*numStages. */
3633 } arm_biquad_cascade_df2T_instance_f64;
3634
3635
3636 /**
3637 * @brief Processing function for the floating-point transposed direct form II Biquad cascade filter.
3638 * @param[in] S points to an instance of the filter data structure.
3639 * @param[in] pSrc points to the block of input data.
3640 * @param[out] pDst points to the block of output data
3641 * @param[in] blockSize number of samples to process.
3642 */
3643 void arm_biquad_cascade_df2T_f32(
3644 const arm_biquad_cascade_df2T_instance_f32 * S,
3645 float32_t * pSrc,
3646 float32_t * pDst,
3647 uint32_t blockSize);
3648
3649
3650 /**
3651 * @brief Processing function for the floating-point transposed direct form II Biquad cascade filter. 2 channels
3652 * @param[in] S points to an instance of the filter data structure.
3653 * @param[in] pSrc points to the block of input data.
3654 * @param[out] pDst points to the block of output data
3655 * @param[in] blockSize number of samples to process.
3656 */
3657 void arm_biquad_cascade_stereo_df2T_f32(
3658 const arm_biquad_cascade_stereo_df2T_instance_f32 * S,
3659 float32_t * pSrc,
3660 float32_t * pDst,
3661 uint32_t blockSize);
3662
3663
3664 /**
3665 * @brief Processing function for the floating-point transposed direct form II Biquad cascade filter.
3666 * @param[in] S points to an instance of the filter data structure.
3667 * @param[in] pSrc points to the block of input data.
3668 * @param[out] pDst points to the block of output data
3669 * @param[in] blockSize number of samples to process.
3670 */
3671 void arm_biquad_cascade_df2T_f64(
3672 const arm_biquad_cascade_df2T_instance_f64 * S,
3673 float64_t * pSrc,
3674 float64_t * pDst,
3675 uint32_t blockSize);
3676
3677
3678 /**
3679 * @brief Initialization function for the floating-point transposed direct form II Biquad cascade filter.
3680 * @param[in,out] S points to an instance of the filter data structure.
3681 * @param[in] numStages number of 2nd order stages in the filter.
3682 * @param[in] pCoeffs points to the filter coefficients.
3683 * @param[in] pState points to the state buffer.
3684 */
3685 void arm_biquad_cascade_df2T_init_f32(
3686 arm_biquad_cascade_df2T_instance_f32 * S,
3687 uint8_t numStages,
3688 float32_t * pCoeffs,
3689 float32_t * pState);
3690
3691
3692 /**
3693 * @brief Initialization function for the floating-point transposed direct form II Biquad cascade filter.
3694 * @param[in,out] S points to an instance of the filter data structure.
3695 * @param[in] numStages number of 2nd order stages in the filter.
3696 * @param[in] pCoeffs points to the filter coefficients.
3697 * @param[in] pState points to the state buffer.
3698 */
3699 void arm_biquad_cascade_stereo_df2T_init_f32(
3700 arm_biquad_cascade_stereo_df2T_instance_f32 * S,
3701 uint8_t numStages,
3702 float32_t * pCoeffs,
3703 float32_t * pState);
3704
3705
3706 /**
3707 * @brief Initialization function for the floating-point transposed direct form II Biquad cascade filter.
3708 * @param[in,out] S points to an instance of the filter data structure.
3709 * @param[in] numStages number of 2nd order stages in the filter.
3710 * @param[in] pCoeffs points to the filter coefficients.
3711 * @param[in] pState points to the state buffer.
3712 */
3713 void arm_biquad_cascade_df2T_init_f64(
3714 arm_biquad_cascade_df2T_instance_f64 * S,
3715 uint8_t numStages,
3716 float64_t * pCoeffs,
3717 float64_t * pState);
3718
3719
3720 /**
3721 * @brief Instance structure for the Q15 FIR lattice filter.
3722 */
3723 typedef struct
3724 {
3725 uint16_t numStages; /**< number of filter stages. */
3726 q15_t *pState; /**< points to the state variable array. The array is of length numStages. */
3727 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length numStages. */
3728 } arm_fir_lattice_instance_q15;
3729
3730 /**
3731 * @brief Instance structure for the Q31 FIR lattice filter.
3732 */
3733 typedef struct
3734 {
3735 uint16_t numStages; /**< number of filter stages. */
3736 q31_t *pState; /**< points to the state variable array. The array is of length numStages. */
3737 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length numStages. */
3738 } arm_fir_lattice_instance_q31;
3739
3740 /**
3741 * @brief Instance structure for the floating-point FIR lattice filter.
3742 */
3743 typedef struct
3744 {
3745 uint16_t numStages; /**< number of filter stages. */
3746 float32_t *pState; /**< points to the state variable array. The array is of length numStages. */
3747 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length numStages. */
3748 } arm_fir_lattice_instance_f32;
3749
3750
3751 /**
3752 * @brief Initialization function for the Q15 FIR lattice filter.
3753 * @param[in] S points to an instance of the Q15 FIR lattice structure.
3754 * @param[in] numStages number of filter stages.
3755 * @param[in] pCoeffs points to the coefficient buffer. The array is of length numStages.
3756 * @param[in] pState points to the state buffer. The array is of length numStages.
3757 */
3758 void arm_fir_lattice_init_q15(
3759 arm_fir_lattice_instance_q15 * S,
3760 uint16_t numStages,
3761 q15_t * pCoeffs,
3762 q15_t * pState);
3763
3764
3765 /**
3766 * @brief Processing function for the Q15 FIR lattice filter.
3767 * @param[in] S points to an instance of the Q15 FIR lattice structure.
3768 * @param[in] pSrc points to the block of input data.
3769 * @param[out] pDst points to the block of output data.
3770 * @param[in] blockSize number of samples to process.
3771 */
3772 void arm_fir_lattice_q15(
3773 const arm_fir_lattice_instance_q15 * S,
3774 q15_t * pSrc,
3775 q15_t * pDst,
3776 uint32_t blockSize);
3777
3778
3779 /**
3780 * @brief Initialization function for the Q31 FIR lattice filter.
3781 * @param[in] S points to an instance of the Q31 FIR lattice structure.
3782 * @param[in] numStages number of filter stages.
3783 * @param[in] pCoeffs points to the coefficient buffer. The array is of length numStages.
3784 * @param[in] pState points to the state buffer. The array is of length numStages.
3785 */
3786 void arm_fir_lattice_init_q31(
3787 arm_fir_lattice_instance_q31 * S,
3788 uint16_t numStages,
3789 q31_t * pCoeffs,
3790 q31_t * pState);
3791
3792
3793 /**
3794 * @brief Processing function for the Q31 FIR lattice filter.
3795 * @param[in] S points to an instance of the Q31 FIR lattice structure.
3796 * @param[in] pSrc points to the block of input data.
3797 * @param[out] pDst points to the block of output data
3798 * @param[in] blockSize number of samples to process.
3799 */
3800 void arm_fir_lattice_q31(
3801 const arm_fir_lattice_instance_q31 * S,
3802 q31_t * pSrc,
3803 q31_t * pDst,
3804 uint32_t blockSize);
3805
3806
3807 /**
3808 * @brief Initialization function for the floating-point FIR lattice filter.
3809 * @param[in] S points to an instance of the floating-point FIR lattice structure.
3810 * @param[in] numStages number of filter stages.
3811 * @param[in] pCoeffs points to the coefficient buffer. The array is of length numStages.
3812 * @param[in] pState points to the state buffer. The array is of length numStages.
3813 */
3814 void arm_fir_lattice_init_f32(
3815 arm_fir_lattice_instance_f32 * S,
3816 uint16_t numStages,
3817 float32_t * pCoeffs,
3818 float32_t * pState);
3819
3820
3821 /**
3822 * @brief Processing function for the floating-point FIR lattice filter.
3823 * @param[in] S points to an instance of the floating-point FIR lattice structure.
3824 * @param[in] pSrc points to the block of input data.
3825 * @param[out] pDst points to the block of output data
3826 * @param[in] blockSize number of samples to process.
3827 */
3828 void arm_fir_lattice_f32(
3829 const arm_fir_lattice_instance_f32 * S,
3830 float32_t * pSrc,
3831 float32_t * pDst,
3832 uint32_t blockSize);
3833
3834
3835 /**
3836 * @brief Instance structure for the Q15 IIR lattice filter.
3837 */
3838 typedef struct
3839 {
3840 uint16_t numStages; /**< number of stages in the filter. */
3841 q15_t *pState; /**< points to the state variable array. The array is of length numStages+blockSize. */
3842 q15_t *pkCoeffs; /**< points to the reflection coefficient array. The array is of length numStages. */
3843 q15_t *pvCoeffs; /**< points to the ladder coefficient array. The array is of length numStages+1. */
3844 } arm_iir_lattice_instance_q15;
3845
3846 /**
3847 * @brief Instance structure for the Q31 IIR lattice filter.
3848 */
3849 typedef struct
3850 {
3851 uint16_t numStages; /**< number of stages in the filter. */
3852 q31_t *pState; /**< points to the state variable array. The array is of length numStages+blockSize. */
3853 q31_t *pkCoeffs; /**< points to the reflection coefficient array. The array is of length numStages. */
3854 q31_t *pvCoeffs; /**< points to the ladder coefficient array. The array is of length numStages+1. */
3855 } arm_iir_lattice_instance_q31;
3856
3857 /**
3858 * @brief Instance structure for the floating-point IIR lattice filter.
3859 */
3860 typedef struct
3861 {
3862 uint16_t numStages; /**< number of stages in the filter. */
3863 float32_t *pState; /**< points to the state variable array. The array is of length numStages+blockSize. */
3864 float32_t *pkCoeffs; /**< points to the reflection coefficient array. The array is of length numStages. */
3865 float32_t *pvCoeffs; /**< points to the ladder coefficient array. The array is of length numStages+1. */
3866 } arm_iir_lattice_instance_f32;
3867
3868
3869 /**
3870 * @brief Processing function for the floating-point IIR lattice filter.
3871 * @param[in] S points to an instance of the floating-point IIR lattice structure.
3872 * @param[in] pSrc points to the block of input data.
3873 * @param[out] pDst points to the block of output data.
3874 * @param[in] blockSize number of samples to process.
3875 */
3876 void arm_iir_lattice_f32(
3877 const arm_iir_lattice_instance_f32 * S,
3878 float32_t * pSrc,
3879 float32_t * pDst,
3880 uint32_t blockSize);
3881
3882
3883 /**
3884 * @brief Initialization function for the floating-point IIR lattice filter.
3885 * @param[in] S points to an instance of the floating-point IIR lattice structure.
3886 * @param[in] numStages number of stages in the filter.
3887 * @param[in] pkCoeffs points to the reflection coefficient buffer. The array is of length numStages.
3888 * @param[in] pvCoeffs points to the ladder coefficient buffer. The array is of length numStages+1.
3889 * @param[in] pState points to the state buffer. The array is of length numStages+blockSize-1.
3890 * @param[in] blockSize number of samples to process.
3891 */
3892 void arm_iir_lattice_init_f32(
3893 arm_iir_lattice_instance_f32 * S,
3894 uint16_t numStages,
3895 float32_t * pkCoeffs,
3896 float32_t * pvCoeffs,
3897 float32_t * pState,
3898 uint32_t blockSize);
3899
3900
3901 /**
3902 * @brief Processing function for the Q31 IIR lattice filter.
3903 * @param[in] S points to an instance of the Q31 IIR lattice structure.
3904 * @param[in] pSrc points to the block of input data.
3905 * @param[out] pDst points to the block of output data.
3906 * @param[in] blockSize number of samples to process.
3907 */
3908 void arm_iir_lattice_q31(
3909 const arm_iir_lattice_instance_q31 * S,
3910 q31_t * pSrc,
3911 q31_t * pDst,
3912 uint32_t blockSize);
3913
3914
3915 /**
3916 * @brief Initialization function for the Q31 IIR lattice filter.
3917 * @param[in] S points to an instance of the Q31 IIR lattice structure.
3918 * @param[in] numStages number of stages in the filter.
3919 * @param[in] pkCoeffs points to the reflection coefficient buffer. The array is of length numStages.
3920 * @param[in] pvCoeffs points to the ladder coefficient buffer. The array is of length numStages+1.
3921 * @param[in] pState points to the state buffer. The array is of length numStages+blockSize.
3922 * @param[in] blockSize number of samples to process.
3923 */
3924 void arm_iir_lattice_init_q31(
3925 arm_iir_lattice_instance_q31 * S,
3926 uint16_t numStages,
3927 q31_t * pkCoeffs,
3928 q31_t * pvCoeffs,
3929 q31_t * pState,
3930 uint32_t blockSize);
3931
3932
3933 /**
3934 * @brief Processing function for the Q15 IIR lattice filter.
3935 * @param[in] S points to an instance of the Q15 IIR lattice structure.
3936 * @param[in] pSrc points to the block of input data.
3937 * @param[out] pDst points to the block of output data.
3938 * @param[in] blockSize number of samples to process.
3939 */
3940 void arm_iir_lattice_q15(
3941 const arm_iir_lattice_instance_q15 * S,
3942 q15_t * pSrc,
3943 q15_t * pDst,
3944 uint32_t blockSize);
3945
3946
3947 /**
3948 * @brief Initialization function for the Q15 IIR lattice filter.
3949 * @param[in] S points to an instance of the fixed-point Q15 IIR lattice structure.
3950 * @param[in] numStages number of stages in the filter.
3951 * @param[in] pkCoeffs points to reflection coefficient buffer. The array is of length numStages.
3952 * @param[in] pvCoeffs points to ladder coefficient buffer. The array is of length numStages+1.
3953 * @param[in] pState points to state buffer. The array is of length numStages+blockSize.
3954 * @param[in] blockSize number of samples to process per call.
3955 */
3956 void arm_iir_lattice_init_q15(
3957 arm_iir_lattice_instance_q15 * S,
3958 uint16_t numStages,
3959 q15_t * pkCoeffs,
3960 q15_t * pvCoeffs,
3961 q15_t * pState,
3962 uint32_t blockSize);
3963
3964
3965 /**
3966 * @brief Instance structure for the floating-point LMS filter.
3967 */
3968 typedef struct
3969 {
3970 uint16_t numTaps; /**< number of coefficients in the filter. */
3971 float32_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
3972 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
3973 float32_t mu; /**< step size that controls filter coefficient updates. */
3974 } arm_lms_instance_f32;
3975
3976
3977 /**
3978 * @brief Processing function for floating-point LMS filter.
3979 * @param[in] S points to an instance of the floating-point LMS filter structure.
3980 * @param[in] pSrc points to the block of input data.
3981 * @param[in] pRef points to the block of reference data.
3982 * @param[out] pOut points to the block of output data.
3983 * @param[out] pErr points to the block of error data.
3984 * @param[in] blockSize number of samples to process.
3985 */
3986 void arm_lms_f32(
3987 const arm_lms_instance_f32 * S,
3988 float32_t * pSrc,
3989 float32_t * pRef,
3990 float32_t * pOut,
3991 float32_t * pErr,
3992 uint32_t blockSize);
3993
3994
3995 /**
3996 * @brief Initialization function for floating-point LMS filter.
3997 * @param[in] S points to an instance of the floating-point LMS filter structure.
3998 * @param[in] numTaps number of filter coefficients.
3999 * @param[in] pCoeffs points to the coefficient buffer.
4000 * @param[in] pState points to state buffer.
4001 * @param[in] mu step size that controls filter coefficient updates.
4002 * @param[in] blockSize number of samples to process.
4003 */
4004 void arm_lms_init_f32(
4005 arm_lms_instance_f32 * S,
4006 uint16_t numTaps,
4007 float32_t * pCoeffs,
4008 float32_t * pState,
4009 float32_t mu,
4010 uint32_t blockSize);
4011
4012
4013 /**
4014 * @brief Instance structure for the Q15 LMS filter.
4015 */
4016 typedef struct
4017 {
4018 uint16_t numTaps; /**< number of coefficients in the filter. */
4019 q15_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
4020 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
4021 q15_t mu; /**< step size that controls filter coefficient updates. */
4022 uint32_t postShift; /**< bit shift applied to coefficients. */
4023 } arm_lms_instance_q15;
4024
4025
4026 /**
4027 * @brief Initialization function for the Q15 LMS filter.
4028 * @param[in] S points to an instance of the Q15 LMS filter structure.
4029 * @param[in] numTaps number of filter coefficients.
4030 * @param[in] pCoeffs points to the coefficient buffer.
4031 * @param[in] pState points to the state buffer.
4032 * @param[in] mu step size that controls filter coefficient updates.
4033 * @param[in] blockSize number of samples to process.
4034 * @param[in] postShift bit shift applied to coefficients.
4035 */
4036 void arm_lms_init_q15(
4037 arm_lms_instance_q15 * S,
4038 uint16_t numTaps,
4039 q15_t * pCoeffs,
4040 q15_t * pState,
4041 q15_t mu,
4042 uint32_t blockSize,
4043 uint32_t postShift);
4044
4045
4046 /**
4047 * @brief Processing function for Q15 LMS filter.
4048 * @param[in] S points to an instance of the Q15 LMS filter structure.
4049 * @param[in] pSrc points to the block of input data.
4050 * @param[in] pRef points to the block of reference data.
4051 * @param[out] pOut points to the block of output data.
4052 * @param[out] pErr points to the block of error data.
4053 * @param[in] blockSize number of samples to process.
4054 */
4055 void arm_lms_q15(
4056 const arm_lms_instance_q15 * S,
4057 q15_t * pSrc,
4058 q15_t * pRef,
4059 q15_t * pOut,
4060 q15_t * pErr,
4061 uint32_t blockSize);
4062
4063
4064 /**
4065 * @brief Instance structure for the Q31 LMS filter.
4066 */
4067 typedef struct
4068 {
4069 uint16_t numTaps; /**< number of coefficients in the filter. */
4070 q31_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
4071 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
4072 q31_t mu; /**< step size that controls filter coefficient updates. */
4073 uint32_t postShift; /**< bit shift applied to coefficients. */
4074 } arm_lms_instance_q31;
4075
4076
4077 /**
4078 * @brief Processing function for Q31 LMS filter.
4079 * @param[in] S points to an instance of the Q15 LMS filter structure.
4080 * @param[in] pSrc points to the block of input data.
4081 * @param[in] pRef points to the block of reference data.
4082 * @param[out] pOut points to the block of output data.
4083 * @param[out] pErr points to the block of error data.
4084 * @param[in] blockSize number of samples to process.
4085 */
4086 void arm_lms_q31(
4087 const arm_lms_instance_q31 * S,
4088 q31_t * pSrc,
4089 q31_t * pRef,
4090 q31_t * pOut,
4091 q31_t * pErr,
4092 uint32_t blockSize);
4093
4094
4095 /**
4096 * @brief Initialization function for Q31 LMS filter.
4097 * @param[in] S points to an instance of the Q31 LMS filter structure.
4098 * @param[in] numTaps number of filter coefficients.
4099 * @param[in] pCoeffs points to coefficient buffer.
4100 * @param[in] pState points to state buffer.
4101 * @param[in] mu step size that controls filter coefficient updates.
4102 * @param[in] blockSize number of samples to process.
4103 * @param[in] postShift bit shift applied to coefficients.
4104 */
4105 void arm_lms_init_q31(
4106 arm_lms_instance_q31 * S,
4107 uint16_t numTaps,
4108 q31_t * pCoeffs,
4109 q31_t * pState,
4110 q31_t mu,
4111 uint32_t blockSize,
4112 uint32_t postShift);
4113
4114
4115 /**
4116 * @brief Instance structure for the floating-point normalized LMS filter.
4117 */
4118 typedef struct
4119 {
4120 uint16_t numTaps; /**< number of coefficients in the filter. */
4121 float32_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
4122 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
4123 float32_t mu; /**< step size that control filter coefficient updates. */
4124 float32_t energy; /**< saves previous frame energy. */
4125 float32_t x0; /**< saves previous input sample. */
4126 } arm_lms_norm_instance_f32;
4127
4128
4129 /**
4130 * @brief Processing function for floating-point normalized LMS filter.
4131 * @param[in] S points to an instance of the floating-point normalized LMS filter structure.
4132 * @param[in] pSrc points to the block of input data.
4133 * @param[in] pRef points to the block of reference data.
4134 * @param[out] pOut points to the block of output data.
4135 * @param[out] pErr points to the block of error data.
4136 * @param[in] blockSize number of samples to process.
4137 */
4138 void arm_lms_norm_f32(
4139 arm_lms_norm_instance_f32 * S,
4140 float32_t * pSrc,
4141 float32_t * pRef,
4142 float32_t * pOut,
4143 float32_t * pErr,
4144 uint32_t blockSize);
4145
4146
4147 /**
4148 * @brief Initialization function for floating-point normalized LMS filter.
4149 * @param[in] S points to an instance of the floating-point LMS filter structure.
4150 * @param[in] numTaps number of filter coefficients.
4151 * @param[in] pCoeffs points to coefficient buffer.
4152 * @param[in] pState points to state buffer.
4153 * @param[in] mu step size that controls filter coefficient updates.
4154 * @param[in] blockSize number of samples to process.
4155 */
4156 void arm_lms_norm_init_f32(
4157 arm_lms_norm_instance_f32 * S,
4158 uint16_t numTaps,
4159 float32_t * pCoeffs,
4160 float32_t * pState,
4161 float32_t mu,
4162 uint32_t blockSize);
4163
4164
4165 /**
4166 * @brief Instance structure for the Q31 normalized LMS filter.
4167 */
4168 typedef struct
4169 {
4170 uint16_t numTaps; /**< number of coefficients in the filter. */
4171 q31_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
4172 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
4173 q31_t mu; /**< step size that controls filter coefficient updates. */
4174 uint8_t postShift; /**< bit shift applied to coefficients. */
4175 q31_t *recipTable; /**< points to the reciprocal initial value table. */
4176 q31_t energy; /**< saves previous frame energy. */
4177 q31_t x0; /**< saves previous input sample. */
4178 } arm_lms_norm_instance_q31;
4179
4180
4181 /**
4182 * @brief Processing function for Q31 normalized LMS filter.
4183 * @param[in] S points to an instance of the Q31 normalized LMS filter structure.
4184 * @param[in] pSrc points to the block of input data.
4185 * @param[in] pRef points to the block of reference data.
4186 * @param[out] pOut points to the block of output data.
4187 * @param[out] pErr points to the block of error data.
4188 * @param[in] blockSize number of samples to process.
4189 */
4190 void arm_lms_norm_q31(
4191 arm_lms_norm_instance_q31 * S,
4192 q31_t * pSrc,
4193 q31_t * pRef,
4194 q31_t * pOut,
4195 q31_t * pErr,
4196 uint32_t blockSize);
4197
4198
4199 /**
4200 * @brief Initialization function for Q31 normalized LMS filter.
4201 * @param[in] S points to an instance of the Q31 normalized LMS filter structure.
4202 * @param[in] numTaps number of filter coefficients.
4203 * @param[in] pCoeffs points to coefficient buffer.
4204 * @param[in] pState points to state buffer.
4205 * @param[in] mu step size that controls filter coefficient updates.
4206 * @param[in] blockSize number of samples to process.
4207 * @param[in] postShift bit shift applied to coefficients.
4208 */
4209 void arm_lms_norm_init_q31(
4210 arm_lms_norm_instance_q31 * S,
4211 uint16_t numTaps,
4212 q31_t * pCoeffs,
4213 q31_t * pState,
4214 q31_t mu,
4215 uint32_t blockSize,
4216 uint8_t postShift);
4217
4218
4219 /**
4220 * @brief Instance structure for the Q15 normalized LMS filter.
4221 */
4222 typedef struct
4223 {
4224 uint16_t numTaps; /**< Number of coefficients in the filter. */
4225 q15_t *pState; /**< points to the state variable array. The array is of length numTaps+blockSize-1. */
4226 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps. */
4227 q15_t mu; /**< step size that controls filter coefficient updates. */
4228 uint8_t postShift; /**< bit shift applied to coefficients. */
4229 q15_t *recipTable; /**< Points to the reciprocal initial value table. */
4230 q15_t energy; /**< saves previous frame energy. */
4231 q15_t x0; /**< saves previous input sample. */
4232 } arm_lms_norm_instance_q15;
4233
4234
4235 /**
4236 * @brief Processing function for Q15 normalized LMS filter.
4237 * @param[in] S points to an instance of the Q15 normalized LMS filter structure.
4238 * @param[in] pSrc points to the block of input data.
4239 * @param[in] pRef points to the block of reference data.
4240 * @param[out] pOut points to the block of output data.
4241 * @param[out] pErr points to the block of error data.
4242 * @param[in] blockSize number of samples to process.
4243 */
4244 void arm_lms_norm_q15(
4245 arm_lms_norm_instance_q15 * S,
4246 q15_t * pSrc,
4247 q15_t * pRef,
4248 q15_t * pOut,
4249 q15_t * pErr,
4250 uint32_t blockSize);
4251
4252
4253 /**
4254 * @brief Initialization function for Q15 normalized LMS filter.
4255 * @param[in] S points to an instance of the Q15 normalized LMS filter structure.
4256 * @param[in] numTaps number of filter coefficients.
4257 * @param[in] pCoeffs points to coefficient buffer.
4258 * @param[in] pState points to state buffer.
4259 * @param[in] mu step size that controls filter coefficient updates.
4260 * @param[in] blockSize number of samples to process.
4261 * @param[in] postShift bit shift applied to coefficients.
4262 */
4263 void arm_lms_norm_init_q15(
4264 arm_lms_norm_instance_q15 * S,
4265 uint16_t numTaps,
4266 q15_t * pCoeffs,
4267 q15_t * pState,
4268 q15_t mu,
4269 uint32_t blockSize,
4270 uint8_t postShift);
4271
4272
4273 /**
4274 * @brief Correlation of floating-point sequences.
4275 * @param[in] pSrcA points to the first input sequence.
4276 * @param[in] srcALen length of the first input sequence.
4277 * @param[in] pSrcB points to the second input sequence.
4278 * @param[in] srcBLen length of the second input sequence.
4279 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4280 */
4281 void arm_correlate_f32(
4282 float32_t * pSrcA,
4283 uint32_t srcALen,
4284 float32_t * pSrcB,
4285 uint32_t srcBLen,
4286 float32_t * pDst);
4287
4288
4289 /**
4290 * @brief Correlation of Q15 sequences
4291 * @param[in] pSrcA points to the first input sequence.
4292 * @param[in] srcALen length of the first input sequence.
4293 * @param[in] pSrcB points to the second input sequence.
4294 * @param[in] srcBLen length of the second input sequence.
4295 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4296 * @param[in] pScratch points to scratch buffer of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
4297 */
4298 void arm_correlate_opt_q15(
4299 q15_t * pSrcA,
4300 uint32_t srcALen,
4301 q15_t * pSrcB,
4302 uint32_t srcBLen,
4303 q15_t * pDst,
4304 q15_t * pScratch);
4305
4306
4307 /**
4308 * @brief Correlation of Q15 sequences.
4309 * @param[in] pSrcA points to the first input sequence.
4310 * @param[in] srcALen length of the first input sequence.
4311 * @param[in] pSrcB points to the second input sequence.
4312 * @param[in] srcBLen length of the second input sequence.
4313 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4314 */
4315
4316 void arm_correlate_q15(
4317 q15_t * pSrcA,
4318 uint32_t srcALen,
4319 q15_t * pSrcB,
4320 uint32_t srcBLen,
4321 q15_t * pDst);
4322
4323
4324 /**
4325 * @brief Correlation of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4.
4326 * @param[in] pSrcA points to the first input sequence.
4327 * @param[in] srcALen length of the first input sequence.
4328 * @param[in] pSrcB points to the second input sequence.
4329 * @param[in] srcBLen length of the second input sequence.
4330 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4331 */
4332
4333 void arm_correlate_fast_q15(
4334 q15_t * pSrcA,
4335 uint32_t srcALen,
4336 q15_t * pSrcB,
4337 uint32_t srcBLen,
4338 q15_t * pDst);
4339
4340
4341 /**
4342 * @brief Correlation of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4.
4343 * @param[in] pSrcA points to the first input sequence.
4344 * @param[in] srcALen length of the first input sequence.
4345 * @param[in] pSrcB points to the second input sequence.
4346 * @param[in] srcBLen length of the second input sequence.
4347 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4348 * @param[in] pScratch points to scratch buffer of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
4349 */
4350 void arm_correlate_fast_opt_q15(
4351 q15_t * pSrcA,
4352 uint32_t srcALen,
4353 q15_t * pSrcB,
4354 uint32_t srcBLen,
4355 q15_t * pDst,
4356 q15_t * pScratch);
4357
4358
4359 /**
4360 * @brief Correlation of Q31 sequences.
4361 * @param[in] pSrcA points to the first input sequence.
4362 * @param[in] srcALen length of the first input sequence.
4363 * @param[in] pSrcB points to the second input sequence.
4364 * @param[in] srcBLen length of the second input sequence.
4365 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4366 */
4367 void arm_correlate_q31(
4368 q31_t * pSrcA,
4369 uint32_t srcALen,
4370 q31_t * pSrcB,
4371 uint32_t srcBLen,
4372 q31_t * pDst);
4373
4374
4375 /**
4376 * @brief Correlation of Q31 sequences (fast version) for Cortex-M3 and Cortex-M4
4377 * @param[in] pSrcA points to the first input sequence.
4378 * @param[in] srcALen length of the first input sequence.
4379 * @param[in] pSrcB points to the second input sequence.
4380 * @param[in] srcBLen length of the second input sequence.
4381 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4382 */
4383 void arm_correlate_fast_q31(
4384 q31_t * pSrcA,
4385 uint32_t srcALen,
4386 q31_t * pSrcB,
4387 uint32_t srcBLen,
4388 q31_t * pDst);
4389
4390
4391 /**
4392 * @brief Correlation of Q7 sequences.
4393 * @param[in] pSrcA points to the first input sequence.
4394 * @param[in] srcALen length of the first input sequence.
4395 * @param[in] pSrcB points to the second input sequence.
4396 * @param[in] srcBLen length of the second input sequence.
4397 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4398 * @param[in] pScratch1 points to scratch buffer(of type q15_t) of size max(srcALen, srcBLen) + 2*min(srcALen, srcBLen) - 2.
4399 * @param[in] pScratch2 points to scratch buffer (of type q15_t) of size min(srcALen, srcBLen).
4400 */
4401 void arm_correlate_opt_q7(
4402 q7_t * pSrcA,
4403 uint32_t srcALen,
4404 q7_t * pSrcB,
4405 uint32_t srcBLen,
4406 q7_t * pDst,
4407 q15_t * pScratch1,
4408 q15_t * pScratch2);
4409
4410
4411 /**
4412 * @brief Correlation of Q7 sequences.
4413 * @param[in] pSrcA points to the first input sequence.
4414 * @param[in] srcALen length of the first input sequence.
4415 * @param[in] pSrcB points to the second input sequence.
4416 * @param[in] srcBLen length of the second input sequence.
4417 * @param[out] pDst points to the block of output data Length 2 * max(srcALen, srcBLen) - 1.
4418 */
4419 void arm_correlate_q7(
4420 q7_t * pSrcA,
4421 uint32_t srcALen,
4422 q7_t * pSrcB,
4423 uint32_t srcBLen,
4424 q7_t * pDst);
4425
4426
4427 /**
4428 * @brief Instance structure for the floating-point sparse FIR filter.
4429 */
4430 typedef struct
4431 {
4432 uint16_t numTaps; /**< number of coefficients in the filter. */
4433 uint16_t stateIndex; /**< state buffer index. Points to the oldest sample in the state buffer. */
4434 float32_t *pState; /**< points to the state buffer array. The array is of length maxDelay+blockSize-1. */
4435 float32_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
4436 uint16_t maxDelay; /**< maximum offset specified by the pTapDelay array. */
4437 int32_t *pTapDelay; /**< points to the array of delay values. The array is of length numTaps. */
4438 } arm_fir_sparse_instance_f32;
4439
4440 /**
4441 * @brief Instance structure for the Q31 sparse FIR filter.
4442 */
4443 typedef struct
4444 {
4445 uint16_t numTaps; /**< number of coefficients in the filter. */
4446 uint16_t stateIndex; /**< state buffer index. Points to the oldest sample in the state buffer. */
4447 q31_t *pState; /**< points to the state buffer array. The array is of length maxDelay+blockSize-1. */
4448 q31_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
4449 uint16_t maxDelay; /**< maximum offset specified by the pTapDelay array. */
4450 int32_t *pTapDelay; /**< points to the array of delay values. The array is of length numTaps. */
4451 } arm_fir_sparse_instance_q31;
4452
4453 /**
4454 * @brief Instance structure for the Q15 sparse FIR filter.
4455 */
4456 typedef struct
4457 {
4458 uint16_t numTaps; /**< number of coefficients in the filter. */
4459 uint16_t stateIndex; /**< state buffer index. Points to the oldest sample in the state buffer. */
4460 q15_t *pState; /**< points to the state buffer array. The array is of length maxDelay+blockSize-1. */
4461 q15_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
4462 uint16_t maxDelay; /**< maximum offset specified by the pTapDelay array. */
4463 int32_t *pTapDelay; /**< points to the array of delay values. The array is of length numTaps. */
4464 } arm_fir_sparse_instance_q15;
4465
4466 /**
4467 * @brief Instance structure for the Q7 sparse FIR filter.
4468 */
4469 typedef struct
4470 {
4471 uint16_t numTaps; /**< number of coefficients in the filter. */
4472 uint16_t stateIndex; /**< state buffer index. Points to the oldest sample in the state buffer. */
4473 q7_t *pState; /**< points to the state buffer array. The array is of length maxDelay+blockSize-1. */
4474 q7_t *pCoeffs; /**< points to the coefficient array. The array is of length numTaps.*/
4475 uint16_t maxDelay; /**< maximum offset specified by the pTapDelay array. */
4476 int32_t *pTapDelay; /**< points to the array of delay values. The array is of length numTaps. */
4477 } arm_fir_sparse_instance_q7;
4478
4479
4480 /**
4481 * @brief Processing function for the floating-point sparse FIR filter.
4482 * @param[in] S points to an instance of the floating-point sparse FIR structure.
4483 * @param[in] pSrc points to the block of input data.
4484 * @param[out] pDst points to the block of output data
4485 * @param[in] pScratchIn points to a temporary buffer of size blockSize.
4486 * @param[in] blockSize number of input samples to process per call.
4487 */
4488 void arm_fir_sparse_f32(
4489 arm_fir_sparse_instance_f32 * S,
4490 float32_t * pSrc,
4491 float32_t * pDst,
4492 float32_t * pScratchIn,
4493 uint32_t blockSize);
4494
4495
4496 /**
4497 * @brief Initialization function for the floating-point sparse FIR filter.
4498 * @param[in,out] S points to an instance of the floating-point sparse FIR structure.
4499 * @param[in] numTaps number of nonzero coefficients in the filter.
4500 * @param[in] pCoeffs points to the array of filter coefficients.
4501 * @param[in] pState points to the state buffer.
4502 * @param[in] pTapDelay points to the array of offset times.
4503 * @param[in] maxDelay maximum offset time supported.
4504 * @param[in] blockSize number of samples that will be processed per block.
4505 */
4506 void arm_fir_sparse_init_f32(
4507 arm_fir_sparse_instance_f32 * S,
4508 uint16_t numTaps,
4509 float32_t * pCoeffs,
4510 float32_t * pState,
4511 int32_t * pTapDelay,
4512 uint16_t maxDelay,
4513 uint32_t blockSize);
4514
4515
4516 /**
4517 * @brief Processing function for the Q31 sparse FIR filter.
4518 * @param[in] S points to an instance of the Q31 sparse FIR structure.
4519 * @param[in] pSrc points to the block of input data.
4520 * @param[out] pDst points to the block of output data
4521 * @param[in] pScratchIn points to a temporary buffer of size blockSize.
4522 * @param[in] blockSize number of input samples to process per call.
4523 */
4524 void arm_fir_sparse_q31(
4525 arm_fir_sparse_instance_q31 * S,
4526 q31_t * pSrc,
4527 q31_t * pDst,
4528 q31_t * pScratchIn,
4529 uint32_t blockSize);
4530
4531
4532 /**
4533 * @brief Initialization function for the Q31 sparse FIR filter.
4534 * @param[in,out] S points to an instance of the Q31 sparse FIR structure.
4535 * @param[in] numTaps number of nonzero coefficients in the filter.
4536 * @param[in] pCoeffs points to the array of filter coefficients.
4537 * @param[in] pState points to the state buffer.
4538 * @param[in] pTapDelay points to the array of offset times.
4539 * @param[in] maxDelay maximum offset time supported.
4540 * @param[in] blockSize number of samples that will be processed per block.
4541 */
4542 void arm_fir_sparse_init_q31(
4543 arm_fir_sparse_instance_q31 * S,
4544 uint16_t numTaps,
4545 q31_t * pCoeffs,
4546 q31_t * pState,
4547 int32_t * pTapDelay,
4548 uint16_t maxDelay,
4549 uint32_t blockSize);
4550
4551
4552 /**
4553 * @brief Processing function for the Q15 sparse FIR filter.
4554 * @param[in] S points to an instance of the Q15 sparse FIR structure.
4555 * @param[in] pSrc points to the block of input data.
4556 * @param[out] pDst points to the block of output data
4557 * @param[in] pScratchIn points to a temporary buffer of size blockSize.
4558 * @param[in] pScratchOut points to a temporary buffer of size blockSize.
4559 * @param[in] blockSize number of input samples to process per call.
4560 */
4561 void arm_fir_sparse_q15(
4562 arm_fir_sparse_instance_q15 * S,
4563 q15_t * pSrc,
4564 q15_t * pDst,
4565 q15_t * pScratchIn,
4566 q31_t * pScratchOut,
4567 uint32_t blockSize);
4568
4569
4570 /**
4571 * @brief Initialization function for the Q15 sparse FIR filter.
4572 * @param[in,out] S points to an instance of the Q15 sparse FIR structure.
4573 * @param[in] numTaps number of nonzero coefficients in the filter.
4574 * @param[in] pCoeffs points to the array of filter coefficients.
4575 * @param[in] pState points to the state buffer.
4576 * @param[in] pTapDelay points to the array of offset times.
4577 * @param[in] maxDelay maximum offset time supported.
4578 * @param[in] blockSize number of samples that will be processed per block.
4579 */
4580 void arm_fir_sparse_init_q15(
4581 arm_fir_sparse_instance_q15 * S,
4582 uint16_t numTaps,
4583 q15_t * pCoeffs,
4584 q15_t * pState,
4585 int32_t * pTapDelay,
4586 uint16_t maxDelay,
4587 uint32_t blockSize);
4588
4589
4590 /**
4591 * @brief Processing function for the Q7 sparse FIR filter.
4592 * @param[in] S points to an instance of the Q7 sparse FIR structure.
4593 * @param[in] pSrc points to the block of input data.
4594 * @param[out] pDst points to the block of output data
4595 * @param[in] pScratchIn points to a temporary buffer of size blockSize.
4596 * @param[in] pScratchOut points to a temporary buffer of size blockSize.
4597 * @param[in] blockSize number of input samples to process per call.
4598 */
4599 void arm_fir_sparse_q7(
4600 arm_fir_sparse_instance_q7 * S,
4601 q7_t * pSrc,
4602 q7_t * pDst,
4603 q7_t * pScratchIn,
4604 q31_t * pScratchOut,
4605 uint32_t blockSize);
4606
4607
4608 /**
4609 * @brief Initialization function for the Q7 sparse FIR filter.
4610 * @param[in,out] S points to an instance of the Q7 sparse FIR structure.
4611 * @param[in] numTaps number of nonzero coefficients in the filter.
4612 * @param[in] pCoeffs points to the array of filter coefficients.
4613 * @param[in] pState points to the state buffer.
4614 * @param[in] pTapDelay points to the array of offset times.
4615 * @param[in] maxDelay maximum offset time supported.
4616 * @param[in] blockSize number of samples that will be processed per block.
4617 */
4618 void arm_fir_sparse_init_q7(
4619 arm_fir_sparse_instance_q7 * S,
4620 uint16_t numTaps,
4621 q7_t * pCoeffs,
4622 q7_t * pState,
4623 int32_t * pTapDelay,
4624 uint16_t maxDelay,
4625 uint32_t blockSize);
4626
4627
4628 /**
4629 * @brief Floating-point sin_cos function.
4630 * @param[in] theta input value in degrees
4631 * @param[out] pSinVal points to the processed sine output.
4632 * @param[out] pCosVal points to the processed cos output.
4633 */
4634 void arm_sin_cos_f32(
4635 float32_t theta,
4636 float32_t * pSinVal,
4637 float32_t * pCosVal);
4638
4639
4640 /**
4641 * @brief Q31 sin_cos function.
4642 * @param[in] theta scaled input value in degrees
4643 * @param[out] pSinVal points to the processed sine output.
4644 * @param[out] pCosVal points to the processed cosine output.
4645 */
4646 void arm_sin_cos_q31(
4647 q31_t theta,
4648 q31_t * pSinVal,
4649 q31_t * pCosVal);
4650
4651
4652 /**
4653 * @brief Floating-point complex conjugate.
4654 * @param[in] pSrc points to the input vector
4655 * @param[out] pDst points to the output vector
4656 * @param[in] numSamples number of complex samples in each vector
4657 */
4658 void arm_cmplx_conj_f32(
4659 float32_t * pSrc,
4660 float32_t * pDst,
4661 uint32_t numSamples);
4662
4663 /**
4664 * @brief Q31 complex conjugate.
4665 * @param[in] pSrc points to the input vector
4666 * @param[out] pDst points to the output vector
4667 * @param[in] numSamples number of complex samples in each vector
4668 */
4669 void arm_cmplx_conj_q31(
4670 q31_t * pSrc,
4671 q31_t * pDst,
4672 uint32_t numSamples);
4673
4674
4675 /**
4676 * @brief Q15 complex conjugate.
4677 * @param[in] pSrc points to the input vector
4678 * @param[out] pDst points to the output vector
4679 * @param[in] numSamples number of complex samples in each vector
4680 */
4681 void arm_cmplx_conj_q15(
4682 q15_t * pSrc,
4683 q15_t * pDst,
4684 uint32_t numSamples);
4685
4686
4687 /**
4688 * @brief Floating-point complex magnitude squared
4689 * @param[in] pSrc points to the complex input vector
4690 * @param[out] pDst points to the real output vector
4691 * @param[in] numSamples number of complex samples in the input vector
4692 */
4693 void arm_cmplx_mag_squared_f32(
4694 float32_t * pSrc,
4695 float32_t * pDst,
4696 uint32_t numSamples);
4697
4698
4699 /**
4700 * @brief Q31 complex magnitude squared
4701 * @param[in] pSrc points to the complex input vector
4702 * @param[out] pDst points to the real output vector
4703 * @param[in] numSamples number of complex samples in the input vector
4704 */
4705 void arm_cmplx_mag_squared_q31(
4706 q31_t * pSrc,
4707 q31_t * pDst,
4708 uint32_t numSamples);
4709
4710
4711 /**
4712 * @brief Q15 complex magnitude squared
4713 * @param[in] pSrc points to the complex input vector
4714 * @param[out] pDst points to the real output vector
4715 * @param[in] numSamples number of complex samples in the input vector
4716 */
4717 void arm_cmplx_mag_squared_q15(
4718 q15_t * pSrc,
4719 q15_t * pDst,
4720 uint32_t numSamples);
4721
4722
4723 /**
4724 * @ingroup groupController
4725 */
4726
4727 /**
4728 * @defgroup PID PID Motor Control
4729 *
4730 * A Proportional Integral Derivative (PID) controller is a generic feedback control
4731 * loop mechanism widely used in industrial control systems.
4732 * A PID controller is the most commonly used type of feedback controller.
4733 *
4734 * This set of functions implements (PID) controllers
4735 * for Q15, Q31, and floating-point data types. The functions operate on a single sample
4736 * of data and each call to the function returns a single processed value.
4737 * <code>S</code> points to an instance of the PID control data structure. <code>in</code>
4738 * is the input sample value. The functions return the output value.
4739 *
4740 * \par Algorithm:
4741 * <pre>
4742 * y[n] = y[n-1] + A0 * x[n] + A1 * x[n-1] + A2 * x[n-2]
4743 * A0 = Kp + Ki + Kd
4744 * A1 = (-Kp ) - (2 * Kd )
4745 * A2 = Kd </pre>
4746 *
4747 * \par
4748 * where \c Kp is proportional constant, \c Ki is Integral constant and \c Kd is Derivative constant
4749 *
4750 * \par
4751 * \image html PID.gif "Proportional Integral Derivative Controller"
4752 *
4753 * \par
4754 * The PID controller calculates an "error" value as the difference between
4755 * the measured output and the reference input.
4756 * The controller attempts to minimize the error by adjusting the process control inputs.
4757 * The proportional value determines the reaction to the current error,
4758 * the integral value determines the reaction based on the sum of recent errors,
4759 * and the derivative value determines the reaction based on the rate at which the error has been changing.
4760 *
4761 * \par Instance Structure
4762 * The Gains A0, A1, A2 and state variables for a PID controller are stored together in an instance data structure.
4763 * A separate instance structure must be defined for each PID Controller.
4764 * There are separate instance structure declarations for each of the 3 supported data types.
4765 *
4766 * \par Reset Functions
4767 * There is also an associated reset function for each data type which clears the state array.
4768 *
4769 * \par Initialization Functions
4770 * There is also an associated initialization function for each data type.
4771 * The initialization function performs the following operations:
4772 * - Initializes the Gains A0, A1, A2 from Kp,Ki, Kd gains.
4773 * - Zeros out the values in the state buffer.
4774 *
4775 * \par
4776 * Instance structure cannot be placed into a const data section and it is recommended to use the initialization function.
4777 *
4778 * \par Fixed-Point Behavior
4779 * Care must be taken when using the fixed-point versions of the PID Controller functions.
4780 * In particular, the overflow and saturation behavior of the accumulator used in each function must be considered.
4781 * Refer to the function specific documentation below for usage guidelines.
4782 */
4783
4784 /**
4785 * @addtogroup PID
4786 * @{
4787 */
4788
4789 /**
4790 * @brief Process function for the floating-point PID Control.
4791 * @param[in,out] S is an instance of the floating-point PID Control structure
4792 * @param[in] in input sample to process
4793 * @return out processed output sample.
4794 */
4795 static __INLINE float32_t arm_pid_f32(
4796 arm_pid_instance_f32 * S,
4797 float32_t in)
4798 {
4799 float32_t out;
4800
4801 /* y[n] = y[n-1] + A0 * x[n] + A1 * x[n-1] + A2 * x[n-2] */
4802 out = (S->A0 * in) +
4803 (S->A1 * S->state[0]) + (S->A2 * S->state[1]) + (S->state[2]);
4804
4805 /* Update state */
4806 S->state[1] = S->state[0];
4807 S->state[0] = in;
4808 S->state[2] = out;
4809
4810 /* return to application */
4811 return (out);
4812
4813 }
4814
4815 /**
4816 * @brief Process function for the Q31 PID Control.
4817 * @param[in,out] S points to an instance of the Q31 PID Control structure
4818 * @param[in] in input sample to process
4819 * @return out processed output sample.
4820 *
4821 * <b>Scaling and Overflow Behavior:</b>
4822 * \par
4823 * The function is implemented using an internal 64-bit accumulator.
4824 * The accumulator has a 2.62 format and maintains full precision of the intermediate multiplication results but provides only a single guard bit.
4825 * Thus, if the accumulator result overflows it wraps around rather than clip.
4826 * In order to avoid overflows completely the input signal must be scaled down by 2 bits as there are four additions.
4827 * After all multiply-accumulates are performed, the 2.62 accumulator is truncated to 1.32 format and then saturated to 1.31 format.
4828 */
4829 static __INLINE q31_t arm_pid_q31(
4830 arm_pid_instance_q31 * S,
4831 q31_t in)
4832 {
4833 q63_t acc;
4834 q31_t out;
4835
4836 /* acc = A0 * x[n] */
4837 acc = (q63_t) S->A0 * in;
4838
4839 /* acc += A1 * x[n-1] */
4840 acc += (q63_t) S->A1 * S->state[0];
4841
4842 /* acc += A2 * x[n-2] */
4843 acc += (q63_t) S->A2 * S->state[1];
4844
4845 /* convert output to 1.31 format to add y[n-1] */
4846 out = (q31_t) (acc >> 31u);
4847
4848 /* out += y[n-1] */
4849 out += S->state[2];
4850
4851 /* Update state */
4852 S->state[1] = S->state[0];
4853 S->state[0] = in;
4854 S->state[2] = out;
4855
4856 /* return to application */
4857 return (out);
4858 }
4859
4860
4861 /**
4862 * @brief Process function for the Q15 PID Control.
4863 * @param[in,out] S points to an instance of the Q15 PID Control structure
4864 * @param[in] in input sample to process
4865 * @return out processed output sample.
4866 *
4867 * <b>Scaling and Overflow Behavior:</b>
4868 * \par
4869 * The function is implemented using a 64-bit internal accumulator.
4870 * Both Gains and state variables are represented in 1.15 format and multiplications yield a 2.30 result.
4871 * The 2.30 intermediate results are accumulated in a 64-bit accumulator in 34.30 format.
4872 * There is no risk of internal overflow with this approach and the full precision of intermediate multiplications is preserved.
4873 * After all additions have been performed, the accumulator is truncated to 34.15 format by discarding low 15 bits.
4874 * Lastly, the accumulator is saturated to yield a result in 1.15 format.
4875 */
4876 static __INLINE q15_t arm_pid_q15(
4877 arm_pid_instance_q15 * S,
4878 q15_t in)
4879 {
4880 q63_t acc;
4881 q15_t out;
4882
4883 #ifndef ARM_MATH_CM0_FAMILY
4884 __SIMD32_TYPE *vstate;
4885
4886 /* Implementation of PID controller */
4887
4888 /* acc = A0 * x[n] */
4889 acc = (q31_t) __SMUAD((uint32_t)S->A0, (uint32_t)in);
4890
4891 /* acc += A1 * x[n-1] + A2 * x[n-2] */
4892 vstate = __SIMD32_CONST(S->state);
4893 acc = (q63_t)__SMLALD((uint32_t)S->A1, (uint32_t)*vstate, (uint64_t)acc);
4894 #else
4895 /* acc = A0 * x[n] */
4896 acc = ((q31_t) S->A0) * in;
4897
4898 /* acc += A1 * x[n-1] + A2 * x[n-2] */
4899 acc += (q31_t) S->A1 * S->state[0];
4900 acc += (q31_t) S->A2 * S->state[1];
4901 #endif
4902
4903 /* acc += y[n-1] */
4904 acc += (q31_t) S->state[2] << 15;
4905
4906 /* saturate the output */
4907 out = (q15_t) (__SSAT((acc >> 15), 16));
4908
4909 /* Update state */
4910 S->state[1] = S->state[0];
4911 S->state[0] = in;
4912 S->state[2] = out;
4913
4914 /* return to application */
4915 return (out);
4916 }
4917
4918 /**
4919 * @} end of PID group
4920 */
4921
4922
4923 /**
4924 * @brief Floating-point matrix inverse.
4925 * @param[in] src points to the instance of the input floating-point matrix structure.
4926 * @param[out] dst points to the instance of the output floating-point matrix structure.
4927 * @return The function returns ARM_MATH_SIZE_MISMATCH, if the dimensions do not match.
4928 * If the input matrix is singular (does not have an inverse), then the algorithm terminates and returns error status ARM_MATH_SINGULAR.
4929 */
4930 arm_status arm_mat_inverse_f32(
4931 const arm_matrix_instance_f32 * src,
4932 arm_matrix_instance_f32 * dst);
4933
4934
4935 /**
4936 * @brief Floating-point matrix inverse.
4937 * @param[in] src points to the instance of the input floating-point matrix structure.
4938 * @param[out] dst points to the instance of the output floating-point matrix structure.
4939 * @return The function returns ARM_MATH_SIZE_MISMATCH, if the dimensions do not match.
4940 * If the input matrix is singular (does not have an inverse), then the algorithm terminates and returns error status ARM_MATH_SINGULAR.
4941 */
4942 arm_status arm_mat_inverse_f64(
4943 const arm_matrix_instance_f64 * src,
4944 arm_matrix_instance_f64 * dst);
4945
4946
4947
4948 /**
4949 * @ingroup groupController
4950 */
4951
4952 /**
4953 * @defgroup clarke Vector Clarke Transform
4954 * Forward Clarke transform converts the instantaneous stator phases into a two-coordinate time invariant vector.
4955 * Generally the Clarke transform uses three-phase currents <code>Ia, Ib and Ic</code> to calculate currents
4956 * in the two-phase orthogonal stator axis <code>Ialpha</code> and <code>Ibeta</code>.
4957 * When <code>Ialpha</code> is superposed with <code>Ia</code> as shown in the figure below
4958 * \image html clarke.gif Stator current space vector and its components in (a,b).
4959 * and <code>Ia + Ib + Ic = 0</code>, in this condition <code>Ialpha</code> and <code>Ibeta</code>
4960 * can be calculated using only <code>Ia</code> and <code>Ib</code>.
4961 *
4962 * The function operates on a single sample of data and each call to the function returns the processed output.
4963 * The library provides separate functions for Q31 and floating-point data types.
4964 * \par Algorithm
4965 * \image html clarkeFormula.gif
4966 * where <code>Ia</code> and <code>Ib</code> are the instantaneous stator phases and
4967 * <code>pIalpha</code> and <code>pIbeta</code> are the two coordinates of time invariant vector.
4968 * \par Fixed-Point Behavior
4969 * Care must be taken when using the Q31 version of the Clarke transform.
4970 * In particular, the overflow and saturation behavior of the accumulator used must be considered.
4971 * Refer to the function specific documentation below for usage guidelines.
4972 */
4973
4974 /**
4975 * @addtogroup clarke
4976 * @{
4977 */
4978
4979 /**
4980 *
4981 * @brief Floating-point Clarke transform
4982 * @param[in] Ia input three-phase coordinate <code>a</code>
4983 * @param[in] Ib input three-phase coordinate <code>b</code>
4984 * @param[out] pIalpha points to output two-phase orthogonal vector axis alpha
4985 * @param[out] pIbeta points to output two-phase orthogonal vector axis beta
4986 */
4987 static __INLINE void arm_clarke_f32(
4988 float32_t Ia,
4989 float32_t Ib,
4990 float32_t * pIalpha,
4991 float32_t * pIbeta)
4992 {
4993 /* Calculate pIalpha using the equation, pIalpha = Ia */
4994 *pIalpha = Ia;
4995
4996 /* Calculate pIbeta using the equation, pIbeta = (1/sqrt(3)) * Ia + (2/sqrt(3)) * Ib */
4997 *pIbeta = ((float32_t) 0.57735026919 * Ia + (float32_t) 1.15470053838 * Ib);
4998 }
4999
5000
5001 /**
5002 * @brief Clarke transform for Q31 version
5003 * @param[in] Ia input three-phase coordinate <code>a</code>
5004 * @param[in] Ib input three-phase coordinate <code>b</code>
5005 * @param[out] pIalpha points to output two-phase orthogonal vector axis alpha
5006 * @param[out] pIbeta points to output two-phase orthogonal vector axis beta
5007 *
5008 * <b>Scaling and Overflow Behavior:</b>
5009 * \par
5010 * The function is implemented using an internal 32-bit accumulator.
5011 * The accumulator maintains 1.31 format by truncating lower 31 bits of the intermediate multiplication in 2.62 format.
5012 * There is saturation on the addition, hence there is no risk of overflow.
5013 */
5014 static __INLINE void arm_clarke_q31(
5015 q31_t Ia,
5016 q31_t Ib,
5017 q31_t * pIalpha,
5018 q31_t * pIbeta)
5019 {
5020 q31_t product1, product2; /* Temporary variables used to store intermediate results */
5021
5022 /* Calculating pIalpha from Ia by equation pIalpha = Ia */
5023 *pIalpha = Ia;
5024
5025 /* Intermediate product is calculated by (1/(sqrt(3)) * Ia) */
5026 product1 = (q31_t) (((q63_t) Ia * 0x24F34E8B) >> 30);
5027
5028 /* Intermediate product is calculated by (2/sqrt(3) * Ib) */
5029 product2 = (q31_t) (((q63_t) Ib * 0x49E69D16) >> 30);
5030
5031 /* pIbeta is calculated by adding the intermediate products */
5032 *pIbeta = __QADD(product1, product2);
5033 }
5034
5035 /**
5036 * @} end of clarke group
5037 */
5038
5039 /**
5040 * @brief Converts the elements of the Q7 vector to Q31 vector.
5041 * @param[in] pSrc input pointer
5042 * @param[out] pDst output pointer
5043 * @param[in] blockSize number of samples to process
5044 */
5045 void arm_q7_to_q31(
5046 q7_t * pSrc,
5047 q31_t * pDst,
5048 uint32_t blockSize);
5049
5050
5051
5052 /**
5053 * @ingroup groupController
5054 */
5055
5056 /**
5057 * @defgroup inv_clarke Vector Inverse Clarke Transform
5058 * Inverse Clarke transform converts the two-coordinate time invariant vector into instantaneous stator phases.
5059 *
5060 * The function operates on a single sample of data and each call to the function returns the processed output.
5061 * The library provides separate functions for Q31 and floating-point data types.
5062 * \par Algorithm
5063 * \image html clarkeInvFormula.gif
5064 * where <code>pIa</code> and <code>pIb</code> are the instantaneous stator phases and
5065 * <code>Ialpha</code> and <code>Ibeta</code> are the two coordinates of time invariant vector.
5066 * \par Fixed-Point Behavior
5067 * Care must be taken when using the Q31 version of the Clarke transform.
5068 * In particular, the overflow and saturation behavior of the accumulator used must be considered.
5069 * Refer to the function specific documentation below for usage guidelines.
5070 */
5071
5072 /**
5073 * @addtogroup inv_clarke
5074 * @{
5075 */
5076
5077 /**
5078 * @brief Floating-point Inverse Clarke transform
5079 * @param[in] Ialpha input two-phase orthogonal vector axis alpha
5080 * @param[in] Ibeta input two-phase orthogonal vector axis beta
5081 * @param[out] pIa points to output three-phase coordinate <code>a</code>
5082 * @param[out] pIb points to output three-phase coordinate <code>b</code>
5083 */
5084 static __INLINE void arm_inv_clarke_f32(
5085 float32_t Ialpha,
5086 float32_t Ibeta,
5087 float32_t * pIa,
5088 float32_t * pIb)
5089 {
5090 /* Calculating pIa from Ialpha by equation pIa = Ialpha */
5091 *pIa = Ialpha;
5092
5093 /* Calculating pIb from Ialpha and Ibeta by equation pIb = -(1/2) * Ialpha + (sqrt(3)/2) * Ibeta */
5094 *pIb = -0.5f * Ialpha + 0.8660254039f * Ibeta;
5095 }
5096
5097
5098 /**
5099 * @brief Inverse Clarke transform for Q31 version
5100 * @param[in] Ialpha input two-phase orthogonal vector axis alpha
5101 * @param[in] Ibeta input two-phase orthogonal vector axis beta
5102 * @param[out] pIa points to output three-phase coordinate <code>a</code>
5103 * @param[out] pIb points to output three-phase coordinate <code>b</code>
5104 *
5105 * <b>Scaling and Overflow Behavior:</b>
5106 * \par
5107 * The function is implemented using an internal 32-bit accumulator.
5108 * The accumulator maintains 1.31 format by truncating lower 31 bits of the intermediate multiplication in 2.62 format.
5109 * There is saturation on the subtraction, hence there is no risk of overflow.
5110 */
5111 static __INLINE void arm_inv_clarke_q31(
5112 q31_t Ialpha,
5113 q31_t Ibeta,
5114 q31_t * pIa,
5115 q31_t * pIb)
5116 {
5117 q31_t product1, product2; /* Temporary variables used to store intermediate results */
5118
5119 /* Calculating pIa from Ialpha by equation pIa = Ialpha */
5120 *pIa = Ialpha;
5121
5122 /* Intermediate product is calculated by (1/(2*sqrt(3)) * Ia) */
5123 product1 = (q31_t) (((q63_t) (Ialpha) * (0x40000000)) >> 31);
5124
5125 /* Intermediate product is calculated by (1/sqrt(3) * pIb) */
5126 product2 = (q31_t) (((q63_t) (Ibeta) * (0x6ED9EBA1)) >> 31);
5127
5128 /* pIb is calculated by subtracting the products */
5129 *pIb = __QSUB(product2, product1);
5130 }
5131
5132 /**
5133 * @} end of inv_clarke group
5134 */
5135
5136 /**
5137 * @brief Converts the elements of the Q7 vector to Q15 vector.
5138 * @param[in] pSrc input pointer
5139 * @param[out] pDst output pointer
5140 * @param[in] blockSize number of samples to process
5141 */
5142 void arm_q7_to_q15(
5143 q7_t * pSrc,
5144 q15_t * pDst,
5145 uint32_t blockSize);
5146
5147
5148
5149 /**
5150 * @ingroup groupController
5151 */
5152
5153 /**
5154 * @defgroup park Vector Park Transform
5155 *
5156 * Forward Park transform converts the input two-coordinate vector to flux and torque components.
5157 * The Park transform can be used to realize the transformation of the <code>Ialpha</code> and the <code>Ibeta</code> currents
5158 * from the stationary to the moving reference frame and control the spatial relationship between
5159 * the stator vector current and rotor flux vector.
5160 * If we consider the d axis aligned with the rotor flux, the diagram below shows the
5161 * current vector and the relationship from the two reference frames:
5162 * \image html park.gif "Stator current space vector and its component in (a,b) and in the d,q rotating reference frame"
5163 *
5164 * The function operates on a single sample of data and each call to the function returns the processed output.
5165 * The library provides separate functions for Q31 and floating-point data types.
5166 * \par Algorithm
5167 * \image html parkFormula.gif
5168 * where <code>Ialpha</code> and <code>Ibeta</code> are the stator vector components,
5169 * <code>pId</code> and <code>pIq</code> are rotor vector components and <code>cosVal</code> and <code>sinVal</code> are the
5170 * cosine and sine values of theta (rotor flux position).
5171 * \par Fixed-Point Behavior
5172 * Care must be taken when using the Q31 version of the Park transform.
5173 * In particular, the overflow and saturation behavior of the accumulator used must be considered.
5174 * Refer to the function specific documentation below for usage guidelines.
5175 */
5176
5177 /**
5178 * @addtogroup park
5179 * @{
5180 */
5181
5182 /**
5183 * @brief Floating-point Park transform
5184 * @param[in] Ialpha input two-phase vector coordinate alpha
5185 * @param[in] Ibeta input two-phase vector coordinate beta
5186 * @param[out] pId points to output rotor reference frame d
5187 * @param[out] pIq points to output rotor reference frame q
5188 * @param[in] sinVal sine value of rotation angle theta
5189 * @param[in] cosVal cosine value of rotation angle theta
5190 *
5191 * The function implements the forward Park transform.
5192 *
5193 */
5194 static __INLINE void arm_park_f32(
5195 float32_t Ialpha,
5196 float32_t Ibeta,
5197 float32_t * pId,
5198 float32_t * pIq,
5199 float32_t sinVal,
5200 float32_t cosVal)
5201 {
5202 /* Calculate pId using the equation, pId = Ialpha * cosVal + Ibeta * sinVal */
5203 *pId = Ialpha * cosVal + Ibeta * sinVal;
5204
5205 /* Calculate pIq using the equation, pIq = - Ialpha * sinVal + Ibeta * cosVal */
5206 *pIq = -Ialpha * sinVal + Ibeta * cosVal;
5207 }
5208
5209
5210 /**
5211 * @brief Park transform for Q31 version
5212 * @param[in] Ialpha input two-phase vector coordinate alpha
5213 * @param[in] Ibeta input two-phase vector coordinate beta
5214 * @param[out] pId points to output rotor reference frame d
5215 * @param[out] pIq points to output rotor reference frame q
5216 * @param[in] sinVal sine value of rotation angle theta
5217 * @param[in] cosVal cosine value of rotation angle theta
5218 *
5219 * <b>Scaling and Overflow Behavior:</b>
5220 * \par
5221 * The function is implemented using an internal 32-bit accumulator.
5222 * The accumulator maintains 1.31 format by truncating lower 31 bits of the intermediate multiplication in 2.62 format.
5223 * There is saturation on the addition and subtraction, hence there is no risk of overflow.
5224 */
5225 static __INLINE void arm_park_q31(
5226 q31_t Ialpha,
5227 q31_t Ibeta,
5228 q31_t * pId,
5229 q31_t * pIq,
5230 q31_t sinVal,
5231 q31_t cosVal)
5232 {
5233 q31_t product1, product2; /* Temporary variables used to store intermediate results */
5234 q31_t product3, product4; /* Temporary variables used to store intermediate results */
5235
5236 /* Intermediate product is calculated by (Ialpha * cosVal) */
5237 product1 = (q31_t) (((q63_t) (Ialpha) * (cosVal)) >> 31);
5238
5239 /* Intermediate product is calculated by (Ibeta * sinVal) */
5240 product2 = (q31_t) (((q63_t) (Ibeta) * (sinVal)) >> 31);
5241
5242
5243 /* Intermediate product is calculated by (Ialpha * sinVal) */
5244 product3 = (q31_t) (((q63_t) (Ialpha) * (sinVal)) >> 31);
5245
5246 /* Intermediate product is calculated by (Ibeta * cosVal) */
5247 product4 = (q31_t) (((q63_t) (Ibeta) * (cosVal)) >> 31);
5248
5249 /* Calculate pId by adding the two intermediate products 1 and 2 */
5250 *pId = __QADD(product1, product2);
5251
5252 /* Calculate pIq by subtracting the two intermediate products 3 from 4 */
5253 *pIq = __QSUB(product4, product3);
5254 }
5255
5256 /**
5257 * @} end of park group
5258 */
5259
5260 /**
5261 * @brief Converts the elements of the Q7 vector to floating-point vector.
5262 * @param[in] pSrc is input pointer
5263 * @param[out] pDst is output pointer
5264 * @param[in] blockSize is the number of samples to process
5265 */
5266 void arm_q7_to_float(
5267 q7_t * pSrc,
5268 float32_t * pDst,
5269 uint32_t blockSize);
5270
5271
5272 /**
5273 * @ingroup groupController
5274 */
5275
5276 /**
5277 * @defgroup inv_park Vector Inverse Park transform
5278 * Inverse Park transform converts the input flux and torque components to two-coordinate vector.
5279 *
5280 * The function operates on a single sample of data and each call to the function returns the processed output.
5281 * The library provides separate functions for Q31 and floating-point data types.
5282 * \par Algorithm
5283 * \image html parkInvFormula.gif
5284 * where <code>pIalpha</code> and <code>pIbeta</code> are the stator vector components,
5285 * <code>Id</code> and <code>Iq</code> are rotor vector components and <code>cosVal</code> and <code>sinVal</code> are the
5286 * cosine and sine values of theta (rotor flux position).
5287 * \par Fixed-Point Behavior
5288 * Care must be taken when using the Q31 version of the Park transform.
5289 * In particular, the overflow and saturation behavior of the accumulator used must be considered.
5290 * Refer to the function specific documentation below for usage guidelines.
5291 */
5292
5293 /**
5294 * @addtogroup inv_park
5295 * @{
5296 */
5297
5298 /**
5299 * @brief Floating-point Inverse Park transform
5300 * @param[in] Id input coordinate of rotor reference frame d
5301 * @param[in] Iq input coordinate of rotor reference frame q
5302 * @param[out] pIalpha points to output two-phase orthogonal vector axis alpha
5303 * @param[out] pIbeta points to output two-phase orthogonal vector axis beta
5304 * @param[in] sinVal sine value of rotation angle theta
5305 * @param[in] cosVal cosine value of rotation angle theta
5306 */
5307 static __INLINE void arm_inv_park_f32(
5308 float32_t Id,
5309 float32_t Iq,
5310 float32_t * pIalpha,
5311 float32_t * pIbeta,
5312 float32_t sinVal,
5313 float32_t cosVal)
5314 {
5315 /* Calculate pIalpha using the equation, pIalpha = Id * cosVal - Iq * sinVal */
5316 *pIalpha = Id * cosVal - Iq * sinVal;
5317
5318 /* Calculate pIbeta using the equation, pIbeta = Id * sinVal + Iq * cosVal */
5319 *pIbeta = Id * sinVal + Iq * cosVal;
5320 }
5321
5322
5323 /**
5324 * @brief Inverse Park transform for Q31 version
5325 * @param[in] Id input coordinate of rotor reference frame d
5326 * @param[in] Iq input coordinate of rotor reference frame q
5327 * @param[out] pIalpha points to output two-phase orthogonal vector axis alpha
5328 * @param[out] pIbeta points to output two-phase orthogonal vector axis beta
5329 * @param[in] sinVal sine value of rotation angle theta
5330 * @param[in] cosVal cosine value of rotation angle theta
5331 *
5332 * <b>Scaling and Overflow Behavior:</b>
5333 * \par
5334 * The function is implemented using an internal 32-bit accumulator.
5335 * The accumulator maintains 1.31 format by truncating lower 31 bits of the intermediate multiplication in 2.62 format.
5336 * There is saturation on the addition, hence there is no risk of overflow.
5337 */
5338 static __INLINE void arm_inv_park_q31(
5339 q31_t Id,
5340 q31_t Iq,
5341 q31_t * pIalpha,
5342 q31_t * pIbeta,
5343 q31_t sinVal,
5344 q31_t cosVal)
5345 {
5346 q31_t product1, product2; /* Temporary variables used to store intermediate results */
5347 q31_t product3, product4; /* Temporary variables used to store intermediate results */
5348
5349 /* Intermediate product is calculated by (Id * cosVal) */
5350 product1 = (q31_t) (((q63_t) (Id) * (cosVal)) >> 31);
5351
5352 /* Intermediate product is calculated by (Iq * sinVal) */
5353 product2 = (q31_t) (((q63_t) (Iq) * (sinVal)) >> 31);
5354
5355
5356 /* Intermediate product is calculated by (Id * sinVal) */
5357 product3 = (q31_t) (((q63_t) (Id) * (sinVal)) >> 31);
5358
5359 /* Intermediate product is calculated by (Iq * cosVal) */
5360 product4 = (q31_t) (((q63_t) (Iq) * (cosVal)) >> 31);
5361
5362 /* Calculate pIalpha by using the two intermediate products 1 and 2 */
5363 *pIalpha = __QSUB(product1, product2);
5364
5365 /* Calculate pIbeta by using the two intermediate products 3 and 4 */
5366 *pIbeta = __QADD(product4, product3);
5367 }
5368
5369 /**
5370 * @} end of Inverse park group
5371 */
5372
5373
5374 /**
5375 * @brief Converts the elements of the Q31 vector to floating-point vector.
5376 * @param[in] pSrc is input pointer
5377 * @param[out] pDst is output pointer
5378 * @param[in] blockSize is the number of samples to process
5379 */
5380 void arm_q31_to_float(
5381 q31_t * pSrc,
5382 float32_t * pDst,
5383 uint32_t blockSize);
5384
5385 /**
5386 * @ingroup groupInterpolation
5387 */
5388
5389 /**
5390 * @defgroup LinearInterpolate Linear Interpolation
5391 *
5392 * Linear interpolation is a method of curve fitting using linear polynomials.
5393 * Linear interpolation works by effectively drawing a straight line between two neighboring samples and returning the appropriate point along that line
5394 *
5395 * \par
5396 * \image html LinearInterp.gif "Linear interpolation"
5397 *
5398 * \par
5399 * A Linear Interpolate function calculates an output value(y), for the input(x)
5400 * using linear interpolation of the input values x0, x1( nearest input values) and the output values y0 and y1(nearest output values)
5401 *
5402 * \par Algorithm:
5403 * <pre>
5404 * y = y0 + (x - x0) * ((y1 - y0)/(x1-x0))
5405 * where x0, x1 are nearest values of input x
5406 * y0, y1 are nearest values to output y
5407 * </pre>
5408 *
5409 * \par
5410 * This set of functions implements Linear interpolation process
5411 * for Q7, Q15, Q31, and floating-point data types. The functions operate on a single
5412 * sample of data and each call to the function returns a single processed value.
5413 * <code>S</code> points to an instance of the Linear Interpolate function data structure.
5414 * <code>x</code> is the input sample value. The functions returns the output value.
5415 *
5416 * \par
5417 * if x is outside of the table boundary, Linear interpolation returns first value of the table
5418 * if x is below input range and returns last value of table if x is above range.
5419 */
5420
5421 /**
5422 * @addtogroup LinearInterpolate
5423 * @{
5424 */
5425
5426 /**
5427 * @brief Process function for the floating-point Linear Interpolation Function.
5428 * @param[in,out] S is an instance of the floating-point Linear Interpolation structure
5429 * @param[in] x input sample to process
5430 * @return y processed output sample.
5431 *
5432 */
5433 static __INLINE float32_t arm_linear_interp_f32(
5434 arm_linear_interp_instance_f32 * S,
5435 float32_t x)
5436 {
5437 float32_t y;
5438 float32_t x0, x1; /* Nearest input values */
5439 float32_t y0, y1; /* Nearest output values */
5440 float32_t xSpacing = S->xSpacing; /* spacing between input values */
5441 int32_t i; /* Index variable */
5442 float32_t *pYData = S->pYData; /* pointer to output table */
5443
5444 /* Calculation of index */
5445 i = (int32_t) ((x - S->x1) / xSpacing);
5446
5447 if(i < 0)
5448 {
5449 /* Iniatilize output for below specified range as least output value of table */
5450 y = pYData[0];
5451 }
5452 else if((uint32_t)i >= S->nValues)
5453 {
5454 /* Iniatilize output for above specified range as last output value of table */
5455 y = pYData[S->nValues - 1];
5456 }
5457 else
5458 {
5459 /* Calculation of nearest input values */
5460 x0 = S->x1 + i * xSpacing;
5461 x1 = S->x1 + (i + 1) * xSpacing;
5462
5463 /* Read of nearest output values */
5464 y0 = pYData[i];
5465 y1 = pYData[i + 1];
5466
5467 /* Calculation of output */
5468 y = y0 + (x - x0) * ((y1 - y0) / (x1 - x0));
5469
5470 }
5471
5472 /* returns output value */
5473 return (y);
5474 }
5475
5476
5477 /**
5478 *
5479 * @brief Process function for the Q31 Linear Interpolation Function.
5480 * @param[in] pYData pointer to Q31 Linear Interpolation table
5481 * @param[in] x input sample to process
5482 * @param[in] nValues number of table values
5483 * @return y processed output sample.
5484 *
5485 * \par
5486 * Input sample <code>x</code> is in 12.20 format which contains 12 bits for table index and 20 bits for fractional part.
5487 * This function can support maximum of table size 2^12.
5488 *
5489 */
5490 static __INLINE q31_t arm_linear_interp_q31(
5491 q31_t * pYData,
5492 q31_t x,
5493 uint32_t nValues)
5494 {
5495 q31_t y; /* output */
5496 q31_t y0, y1; /* Nearest output values */
5497 q31_t fract; /* fractional part */
5498 int32_t index; /* Index to read nearest output values */
5499
5500 /* Input is in 12.20 format */
5501 /* 12 bits for the table index */
5502 /* Index value calculation */
5503 index = ((x & (q31_t)0xFFF00000) >> 20);
5504
5505 if(index >= (int32_t)(nValues - 1))
5506 {
5507 return (pYData[nValues - 1]);
5508 }
5509 else if(index < 0)
5510 {
5511 return (pYData[0]);
5512 }
5513 else
5514 {
5515 /* 20 bits for the fractional part */
5516 /* shift left by 11 to keep fract in 1.31 format */
5517 fract = (x & 0x000FFFFF) << 11;
5518
5519 /* Read two nearest output values from the index in 1.31(q31) format */
5520 y0 = pYData[index];
5521 y1 = pYData[index + 1];
5522
5523 /* Calculation of y0 * (1-fract) and y is in 2.30 format */
5524 y = ((q31_t) ((q63_t) y0 * (0x7FFFFFFF - fract) >> 32));
5525
5526 /* Calculation of y0 * (1-fract) + y1 *fract and y is in 2.30 format */
5527 y += ((q31_t) (((q63_t) y1 * fract) >> 32));
5528
5529 /* Convert y to 1.31 format */
5530 return (y << 1u);
5531 }
5532 }
5533
5534
5535 /**
5536 *
5537 * @brief Process function for the Q15 Linear Interpolation Function.
5538 * @param[in] pYData pointer to Q15 Linear Interpolation table
5539 * @param[in] x input sample to process
5540 * @param[in] nValues number of table values
5541 * @return y processed output sample.
5542 *
5543 * \par
5544 * Input sample <code>x</code> is in 12.20 format which contains 12 bits for table index and 20 bits for fractional part.
5545 * This function can support maximum of table size 2^12.
5546 *
5547 */
5548 static __INLINE q15_t arm_linear_interp_q15(
5549 q15_t * pYData,
5550 q31_t x,
5551 uint32_t nValues)
5552 {
5553 q63_t y; /* output */
5554 q15_t y0, y1; /* Nearest output values */
5555 q31_t fract; /* fractional part */
5556 int32_t index; /* Index to read nearest output values */
5557
5558 /* Input is in 12.20 format */
5559 /* 12 bits for the table index */
5560 /* Index value calculation */
5561 index = ((x & (int32_t)0xFFF00000) >> 20);
5562
5563 if(index >= (int32_t)(nValues - 1))
5564 {
5565 return (pYData[nValues - 1]);
5566 }
5567 else if(index < 0)
5568 {
5569 return (pYData[0]);
5570 }
5571 else
5572 {
5573 /* 20 bits for the fractional part */
5574 /* fract is in 12.20 format */
5575 fract = (x & 0x000FFFFF);
5576
5577 /* Read two nearest output values from the index */
5578 y0 = pYData[index];
5579 y1 = pYData[index + 1];
5580
5581 /* Calculation of y0 * (1-fract) and y is in 13.35 format */
5582 y = ((q63_t) y0 * (0xFFFFF - fract));
5583
5584 /* Calculation of (y0 * (1-fract) + y1 * fract) and y is in 13.35 format */
5585 y += ((q63_t) y1 * (fract));
5586
5587 /* convert y to 1.15 format */
5588 return (q15_t) (y >> 20);
5589 }
5590 }
5591
5592
5593 /**
5594 *
5595 * @brief Process function for the Q7 Linear Interpolation Function.
5596 * @param[in] pYData pointer to Q7 Linear Interpolation table
5597 * @param[in] x input sample to process
5598 * @param[in] nValues number of table values
5599 * @return y processed output sample.
5600 *
5601 * \par
5602 * Input sample <code>x</code> is in 12.20 format which contains 12 bits for table index and 20 bits for fractional part.
5603 * This function can support maximum of table size 2^12.
5604 */
5605 static __INLINE q7_t arm_linear_interp_q7(
5606 q7_t * pYData,
5607 q31_t x,
5608 uint32_t nValues)
5609 {
5610 q31_t y; /* output */
5611 q7_t y0, y1; /* Nearest output values */
5612 q31_t fract; /* fractional part */
5613 uint32_t index; /* Index to read nearest output values */
5614
5615 /* Input is in 12.20 format */
5616 /* 12 bits for the table index */
5617 /* Index value calculation */
5618 if (x < 0)
5619 {
5620 return (pYData[0]);
5621 }
5622 index = (x >> 20) & 0xfff;
5623
5624 if(index >= (nValues - 1))
5625 {
5626 return (pYData[nValues - 1]);
5627 }
5628 else
5629 {
5630 /* 20 bits for the fractional part */
5631 /* fract is in 12.20 format */
5632 fract = (x & 0x000FFFFF);
5633
5634 /* Read two nearest output values from the index and are in 1.7(q7) format */
5635 y0 = pYData[index];
5636 y1 = pYData[index + 1];
5637
5638 /* Calculation of y0 * (1-fract ) and y is in 13.27(q27) format */
5639 y = ((y0 * (0xFFFFF - fract)));
5640
5641 /* Calculation of y1 * fract + y0 * (1-fract) and y is in 13.27(q27) format */
5642 y += (y1 * fract);
5643
5644 /* convert y to 1.7(q7) format */
5645 return (q7_t) (y >> 20);
5646 }
5647 }
5648
5649 /**
5650 * @} end of LinearInterpolate group
5651 */
5652
5653 /**
5654 * @brief Fast approximation to the trigonometric sine function for floating-point data.
5655 * @param[in] x input value in radians.
5656 * @return sin(x).
5657 */
5658 float32_t arm_sin_f32(
5659 float32_t x);
5660
5661
5662 /**
5663 * @brief Fast approximation to the trigonometric sine function for Q31 data.
5664 * @param[in] x Scaled input value in radians.
5665 * @return sin(x).
5666 */
5667 q31_t arm_sin_q31(
5668 q31_t x);
5669
5670
5671 /**
5672 * @brief Fast approximation to the trigonometric sine function for Q15 data.
5673 * @param[in] x Scaled input value in radians.
5674 * @return sin(x).
5675 */
5676 q15_t arm_sin_q15(
5677 q15_t x);
5678
5679
5680 /**
5681 * @brief Fast approximation to the trigonometric cosine function for floating-point data.
5682 * @param[in] x input value in radians.
5683 * @return cos(x).
5684 */
5685 float32_t arm_cos_f32(
5686 float32_t x);
5687
5688
5689 /**
5690 * @brief Fast approximation to the trigonometric cosine function for Q31 data.
5691 * @param[in] x Scaled input value in radians.
5692 * @return cos(x).
5693 */
5694 q31_t arm_cos_q31(
5695 q31_t x);
5696
5697
5698 /**
5699 * @brief Fast approximation to the trigonometric cosine function for Q15 data.
5700 * @param[in] x Scaled input value in radians.
5701 * @return cos(x).
5702 */
5703 q15_t arm_cos_q15(
5704 q15_t x);
5705
5706
5707 /**
5708 * @ingroup groupFastMath
5709 */
5710
5711
5712 /**
5713 * @defgroup SQRT Square Root
5714 *
5715 * Computes the square root of a number.
5716 * There are separate functions for Q15, Q31, and floating-point data types.
5717 * The square root function is computed using the Newton-Raphson algorithm.
5718 * This is an iterative algorithm of the form:
5719 * <pre>
5720 * x1 = x0 - f(x0)/f'(x0)
5721 * </pre>
5722 * where <code>x1</code> is the current estimate,
5723 * <code>x0</code> is the previous estimate, and
5724 * <code>f'(x0)</code> is the derivative of <code>f()</code> evaluated at <code>x0</code>.
5725 * For the square root function, the algorithm reduces to:
5726 * <pre>
5727 * x0 = in/2 [initial guess]
5728 * x1 = 1/2 * ( x0 + in / x0) [each iteration]
5729 * </pre>
5730 */
5731
5732
5733 /**
5734 * @addtogroup SQRT
5735 * @{
5736 */
5737
5738 /**
5739 * @brief Floating-point square root function.
5740 * @param[in] in input value.
5741 * @param[out] pOut square root of input value.
5742 * @return The function returns ARM_MATH_SUCCESS if input value is positive value or ARM_MATH_ARGUMENT_ERROR if
5743 * <code>in</code> is negative value and returns zero output for negative values.
5744 */
5745 static __INLINE arm_status arm_sqrt_f32(
5746 float32_t in,
5747 float32_t * pOut)
5748 {
5749 if(in >= 0.0f)
5750 {
5751
5752 #if (__FPU_USED == 1) && defined ( __CC_ARM )
5753 *pOut = __sqrtf(in);
5754 #elif (__FPU_USED == 1) && (defined(__ARMCC_VERSION) && (__ARMCC_VERSION >= 6010050))
5755 *pOut = __builtin_sqrtf(in);
5756 #elif (__FPU_USED == 1) && defined(__GNUC__)
5757 *pOut = __builtin_sqrtf(in);
5758 #elif (__FPU_USED == 1) && defined ( __ICCARM__ ) && (__VER__ >= 6040000)
5759 __ASM("VSQRT.F32 %0,%1" : "=t"(*pOut) : "t"(in));
5760 #else
5761 *pOut = sqrtf(in);
5762 #endif
5763
5764 return (ARM_MATH_SUCCESS);
5765 }
5766 else
5767 {
5768 *pOut = 0.0f;
5769 return (ARM_MATH_ARGUMENT_ERROR);
5770 }
5771 }
5772
5773
5774 /**
5775 * @brief Q31 square root function.
5776 * @param[in] in input value. The range of the input value is [0 +1) or 0x00000000 to 0x7FFFFFFF.
5777 * @param[out] pOut square root of input value.
5778 * @return The function returns ARM_MATH_SUCCESS if input value is positive value or ARM_MATH_ARGUMENT_ERROR if
5779 * <code>in</code> is negative value and returns zero output for negative values.
5780 */
5781 arm_status arm_sqrt_q31(
5782 q31_t in,
5783 q31_t * pOut);
5784
5785
5786 /**
5787 * @brief Q15 square root function.
5788 * @param[in] in input value. The range of the input value is [0 +1) or 0x0000 to 0x7FFF.
5789 * @param[out] pOut square root of input value.
5790 * @return The function returns ARM_MATH_SUCCESS if input value is positive value or ARM_MATH_ARGUMENT_ERROR if
5791 * <code>in</code> is negative value and returns zero output for negative values.
5792 */
5793 arm_status arm_sqrt_q15(
5794 q15_t in,
5795 q15_t * pOut);
5796
5797 /**
5798 * @} end of SQRT group
5799 */
5800
5801
5802 /**
5803 * @brief floating-point Circular write function.
5804 */
5805 static __INLINE void arm_circularWrite_f32(
5806 int32_t * circBuffer,
5807 int32_t L,
5808 uint16_t * writeOffset,
5809 int32_t bufferInc,
5810 const int32_t * src,
5811 int32_t srcInc,
5812 uint32_t blockSize)
5813 {
5814 uint32_t i = 0u;
5815 int32_t wOffset;
5816
5817 /* Copy the value of Index pointer that points
5818 * to the current location where the input samples to be copied */
5819 wOffset = *writeOffset;
5820
5821 /* Loop over the blockSize */
5822 i = blockSize;
5823
5824 while(i > 0u)
5825 {
5826 /* copy the input sample to the circular buffer */
5827 circBuffer[wOffset] = *src;
5828
5829 /* Update the input pointer */
5830 src += srcInc;
5831
5832 /* Circularly update wOffset. Watch out for positive and negative value */
5833 wOffset += bufferInc;
5834 if(wOffset >= L)
5835 wOffset -= L;
5836
5837 /* Decrement the loop counter */
5838 i--;
5839 }
5840
5841 /* Update the index pointer */
5842 *writeOffset = (uint16_t)wOffset;
5843 }
5844
5845
5846
5847 /**
5848 * @brief floating-point Circular Read function.
5849 */
5850 static __INLINE void arm_circularRead_f32(
5851 int32_t * circBuffer,
5852 int32_t L,
5853 int32_t * readOffset,
5854 int32_t bufferInc,
5855 int32_t * dst,
5856 int32_t * dst_base,
5857 int32_t dst_length,
5858 int32_t dstInc,
5859 uint32_t blockSize)
5860 {
5861 uint32_t i = 0u;
5862 int32_t rOffset, dst_end;
5863
5864 /* Copy the value of Index pointer that points
5865 * to the current location from where the input samples to be read */
5866 rOffset = *readOffset;
5867 dst_end = (int32_t) (dst_base + dst_length);
5868
5869 /* Loop over the blockSize */
5870 i = blockSize;
5871
5872 while(i > 0u)
5873 {
5874 /* copy the sample from the circular buffer to the destination buffer */
5875 *dst = circBuffer[rOffset];
5876
5877 /* Update the input pointer */
5878 dst += dstInc;
5879
5880 if(dst == (int32_t *) dst_end)
5881 {
5882 dst = dst_base;
5883 }
5884
5885 /* Circularly update rOffset. Watch out for positive and negative value */
5886 rOffset += bufferInc;
5887
5888 if(rOffset >= L)
5889 {
5890 rOffset -= L;
5891 }
5892
5893 /* Decrement the loop counter */
5894 i--;
5895 }
5896
5897 /* Update the index pointer */
5898 *readOffset = rOffset;
5899 }
5900
5901
5902 /**
5903 * @brief Q15 Circular write function.
5904 */
5905 static __INLINE void arm_circularWrite_q15(
5906 q15_t * circBuffer,
5907 int32_t L,
5908 uint16_t * writeOffset,
5909 int32_t bufferInc,
5910 const q15_t * src,
5911 int32_t srcInc,
5912 uint32_t blockSize)
5913 {
5914 uint32_t i = 0u;
5915 int32_t wOffset;
5916
5917 /* Copy the value of Index pointer that points
5918 * to the current location where the input samples to be copied */
5919 wOffset = *writeOffset;
5920
5921 /* Loop over the blockSize */
5922 i = blockSize;
5923
5924 while(i > 0u)
5925 {
5926 /* copy the input sample to the circular buffer */
5927 circBuffer[wOffset] = *src;
5928
5929 /* Update the input pointer */
5930 src += srcInc;
5931
5932 /* Circularly update wOffset. Watch out for positive and negative value */
5933 wOffset += bufferInc;
5934 if(wOffset >= L)
5935 wOffset -= L;
5936
5937 /* Decrement the loop counter */
5938 i--;
5939 }
5940
5941 /* Update the index pointer */
5942 *writeOffset = (uint16_t)wOffset;
5943 }
5944
5945
5946 /**
5947 * @brief Q15 Circular Read function.
5948 */
5949 static __INLINE void arm_circularRead_q15(
5950 q15_t * circBuffer,
5951 int32_t L,
5952 int32_t * readOffset,
5953 int32_t bufferInc,
5954 q15_t * dst,
5955 q15_t * dst_base,
5956 int32_t dst_length,
5957 int32_t dstInc,
5958 uint32_t blockSize)
5959 {
5960 uint32_t i = 0;
5961 int32_t rOffset, dst_end;
5962
5963 /* Copy the value of Index pointer that points
5964 * to the current location from where the input samples to be read */
5965 rOffset = *readOffset;
5966
5967 dst_end = (int32_t) (dst_base + dst_length);
5968
5969 /* Loop over the blockSize */
5970 i = blockSize;
5971
5972 while(i > 0u)
5973 {
5974 /* copy the sample from the circular buffer to the destination buffer */
5975 *dst = circBuffer[rOffset];
5976
5977 /* Update the input pointer */
5978 dst += dstInc;
5979
5980 if(dst == (q15_t *) dst_end)
5981 {
5982 dst = dst_base;
5983 }
5984
5985 /* Circularly update wOffset. Watch out for positive and negative value */
5986 rOffset += bufferInc;
5987
5988 if(rOffset >= L)
5989 {
5990 rOffset -= L;
5991 }
5992
5993 /* Decrement the loop counter */
5994 i--;
5995 }
5996
5997 /* Update the index pointer */
5998 *readOffset = rOffset;
5999 }
6000
6001
6002 /**
6003 * @brief Q7 Circular write function.
6004 */
6005 static __INLINE void arm_circularWrite_q7(
6006 q7_t * circBuffer,
6007 int32_t L,
6008 uint16_t * writeOffset,
6009 int32_t bufferInc,
6010 const q7_t * src,
6011 int32_t srcInc,
6012 uint32_t blockSize)
6013 {
6014 uint32_t i = 0u;
6015 int32_t wOffset;
6016
6017 /* Copy the value of Index pointer that points
6018 * to the current location where the input samples to be copied */
6019 wOffset = *writeOffset;
6020
6021 /* Loop over the blockSize */
6022 i = blockSize;
6023
6024 while(i > 0u)
6025 {
6026 /* copy the input sample to the circular buffer */
6027 circBuffer[wOffset] = *src;
6028
6029 /* Update the input pointer */
6030 src += srcInc;
6031
6032 /* Circularly update wOffset. Watch out for positive and negative value */
6033 wOffset += bufferInc;
6034 if(wOffset >= L)
6035 wOffset -= L;
6036
6037 /* Decrement the loop counter */
6038 i--;
6039 }
6040
6041 /* Update the index pointer */
6042 *writeOffset = (uint16_t)wOffset;
6043 }
6044
6045
6046 /**
6047 * @brief Q7 Circular Read function.
6048 */
6049 static __INLINE void arm_circularRead_q7(
6050 q7_t * circBuffer,
6051 int32_t L,
6052 int32_t * readOffset,
6053 int32_t bufferInc,
6054 q7_t * dst,
6055 q7_t * dst_base,
6056 int32_t dst_length,
6057 int32_t dstInc,
6058 uint32_t blockSize)
6059 {
6060 uint32_t i = 0;
6061 int32_t rOffset, dst_end;
6062
6063 /* Copy the value of Index pointer that points
6064 * to the current location from where the input samples to be read */
6065 rOffset = *readOffset;
6066
6067 dst_end = (int32_t) (dst_base + dst_length);
6068
6069 /* Loop over the blockSize */
6070 i = blockSize;
6071
6072 while(i > 0u)
6073 {
6074 /* copy the sample from the circular buffer to the destination buffer */
6075 *dst = circBuffer[rOffset];
6076
6077 /* Update the input pointer */
6078 dst += dstInc;
6079
6080 if(dst == (q7_t *) dst_end)
6081 {
6082 dst = dst_base;
6083 }
6084
6085 /* Circularly update rOffset. Watch out for positive and negative value */
6086 rOffset += bufferInc;
6087
6088 if(rOffset >= L)
6089 {
6090 rOffset -= L;
6091 }
6092
6093 /* Decrement the loop counter */
6094 i--;
6095 }
6096
6097 /* Update the index pointer */
6098 *readOffset = rOffset;
6099 }
6100
6101
6102 /**
6103 * @brief Sum of the squares of the elements of a Q31 vector.
6104 * @param[in] pSrc is input pointer
6105 * @param[in] blockSize is the number of samples to process
6106 * @param[out] pResult is output value.
6107 */
6108 void arm_power_q31(
6109 q31_t * pSrc,
6110 uint32_t blockSize,
6111 q63_t * pResult);
6112
6113
6114 /**
6115 * @brief Sum of the squares of the elements of a floating-point vector.
6116 * @param[in] pSrc is input pointer
6117 * @param[in] blockSize is the number of samples to process
6118 * @param[out] pResult is output value.
6119 */
6120 void arm_power_f32(
6121 float32_t * pSrc,
6122 uint32_t blockSize,
6123 float32_t * pResult);
6124
6125
6126 /**
6127 * @brief Sum of the squares of the elements of a Q15 vector.
6128 * @param[in] pSrc is input pointer
6129 * @param[in] blockSize is the number of samples to process
6130 * @param[out] pResult is output value.
6131 */
6132 void arm_power_q15(
6133 q15_t * pSrc,
6134 uint32_t blockSize,
6135 q63_t * pResult);
6136
6137
6138 /**
6139 * @brief Sum of the squares of the elements of a Q7 vector.
6140 * @param[in] pSrc is input pointer
6141 * @param[in] blockSize is the number of samples to process
6142 * @param[out] pResult is output value.
6143 */
6144 void arm_power_q7(
6145 q7_t * pSrc,
6146 uint32_t blockSize,
6147 q31_t * pResult);
6148
6149
6150 /**
6151 * @brief Mean value of a Q7 vector.
6152 * @param[in] pSrc is input pointer
6153 * @param[in] blockSize is the number of samples to process
6154 * @param[out] pResult is output value.
6155 */
6156 void arm_mean_q7(
6157 q7_t * pSrc,
6158 uint32_t blockSize,
6159 q7_t * pResult);
6160
6161
6162 /**
6163 * @brief Mean value of a Q15 vector.
6164 * @param[in] pSrc is input pointer
6165 * @param[in] blockSize is the number of samples to process
6166 * @param[out] pResult is output value.
6167 */
6168 void arm_mean_q15(
6169 q15_t * pSrc,
6170 uint32_t blockSize,
6171 q15_t * pResult);
6172
6173
6174 /**
6175 * @brief Mean value of a Q31 vector.
6176 * @param[in] pSrc is input pointer
6177 * @param[in] blockSize is the number of samples to process
6178 * @param[out] pResult is output value.
6179 */
6180 void arm_mean_q31(
6181 q31_t * pSrc,
6182 uint32_t blockSize,
6183 q31_t * pResult);
6184
6185
6186 /**
6187 * @brief Mean value of a floating-point vector.
6188 * @param[in] pSrc is input pointer
6189 * @param[in] blockSize is the number of samples to process
6190 * @param[out] pResult is output value.
6191 */
6192 void arm_mean_f32(
6193 float32_t * pSrc,
6194 uint32_t blockSize,
6195 float32_t * pResult);
6196
6197
6198 /**
6199 * @brief Variance of the elements of a floating-point vector.
6200 * @param[in] pSrc is input pointer
6201 * @param[in] blockSize is the number of samples to process
6202 * @param[out] pResult is output value.
6203 */
6204 void arm_var_f32(
6205 float32_t * pSrc,
6206 uint32_t blockSize,
6207 float32_t * pResult);
6208
6209
6210 /**
6211 * @brief Variance of the elements of a Q31 vector.
6212 * @param[in] pSrc is input pointer
6213 * @param[in] blockSize is the number of samples to process
6214 * @param[out] pResult is output value.
6215 */
6216 void arm_var_q31(
6217 q31_t * pSrc,
6218 uint32_t blockSize,
6219 q31_t * pResult);
6220
6221
6222 /**
6223 * @brief Variance of the elements of a Q15 vector.
6224 * @param[in] pSrc is input pointer
6225 * @param[in] blockSize is the number of samples to process
6226 * @param[out] pResult is output value.
6227 */
6228 void arm_var_q15(
6229 q15_t * pSrc,
6230 uint32_t blockSize,
6231 q15_t * pResult);
6232
6233
6234 /**
6235 * @brief Root Mean Square of the elements of a floating-point vector.
6236 * @param[in] pSrc is input pointer
6237 * @param[in] blockSize is the number of samples to process
6238 * @param[out] pResult is output value.
6239 */
6240 void arm_rms_f32(
6241 float32_t * pSrc,
6242 uint32_t blockSize,
6243 float32_t * pResult);
6244
6245
6246 /**
6247 * @brief Root Mean Square of the elements of a Q31 vector.
6248 * @param[in] pSrc is input pointer
6249 * @param[in] blockSize is the number of samples to process
6250 * @param[out] pResult is output value.
6251 */
6252 void arm_rms_q31(
6253 q31_t * pSrc,
6254 uint32_t blockSize,
6255 q31_t * pResult);
6256
6257
6258 /**
6259 * @brief Root Mean Square of the elements of a Q15 vector.
6260 * @param[in] pSrc is input pointer
6261 * @param[in] blockSize is the number of samples to process
6262 * @param[out] pResult is output value.
6263 */
6264 void arm_rms_q15(
6265 q15_t * pSrc,
6266 uint32_t blockSize,
6267 q15_t * pResult);
6268
6269
6270 /**
6271 * @brief Standard deviation of the elements of a floating-point vector.
6272 * @param[in] pSrc is input pointer
6273 * @param[in] blockSize is the number of samples to process
6274 * @param[out] pResult is output value.
6275 */
6276 void arm_std_f32(
6277 float32_t * pSrc,
6278 uint32_t blockSize,
6279 float32_t * pResult);
6280
6281
6282 /**
6283 * @brief Standard deviation of the elements of a Q31 vector.
6284 * @param[in] pSrc is input pointer
6285 * @param[in] blockSize is the number of samples to process
6286 * @param[out] pResult is output value.
6287 */
6288 void arm_std_q31(
6289 q31_t * pSrc,
6290 uint32_t blockSize,
6291 q31_t * pResult);
6292
6293
6294 /**
6295 * @brief Standard deviation of the elements of a Q15 vector.
6296 * @param[in] pSrc is input pointer
6297 * @param[in] blockSize is the number of samples to process
6298 * @param[out] pResult is output value.
6299 */
6300 void arm_std_q15(
6301 q15_t * pSrc,
6302 uint32_t blockSize,
6303 q15_t * pResult);
6304
6305
6306 /**
6307 * @brief Floating-point complex magnitude
6308 * @param[in] pSrc points to the complex input vector
6309 * @param[out] pDst points to the real output vector
6310 * @param[in] numSamples number of complex samples in the input vector
6311 */
6312 void arm_cmplx_mag_f32(
6313 float32_t * pSrc,
6314 float32_t * pDst,
6315 uint32_t numSamples);
6316
6317
6318 /**
6319 * @brief Q31 complex magnitude
6320 * @param[in] pSrc points to the complex input vector
6321 * @param[out] pDst points to the real output vector
6322 * @param[in] numSamples number of complex samples in the input vector
6323 */
6324 void arm_cmplx_mag_q31(
6325 q31_t * pSrc,
6326 q31_t * pDst,
6327 uint32_t numSamples);
6328
6329
6330 /**
6331 * @brief Q15 complex magnitude
6332 * @param[in] pSrc points to the complex input vector
6333 * @param[out] pDst points to the real output vector
6334 * @param[in] numSamples number of complex samples in the input vector
6335 */
6336 void arm_cmplx_mag_q15(
6337 q15_t * pSrc,
6338 q15_t * pDst,
6339 uint32_t numSamples);
6340
6341
6342 /**
6343 * @brief Q15 complex dot product
6344 * @param[in] pSrcA points to the first input vector
6345 * @param[in] pSrcB points to the second input vector
6346 * @param[in] numSamples number of complex samples in each vector
6347 * @param[out] realResult real part of the result returned here
6348 * @param[out] imagResult imaginary part of the result returned here
6349 */
6350 void arm_cmplx_dot_prod_q15(
6351 q15_t * pSrcA,
6352 q15_t * pSrcB,
6353 uint32_t numSamples,
6354 q31_t * realResult,
6355 q31_t * imagResult);
6356
6357
6358 /**
6359 * @brief Q31 complex dot product
6360 * @param[in] pSrcA points to the first input vector
6361 * @param[in] pSrcB points to the second input vector
6362 * @param[in] numSamples number of complex samples in each vector
6363 * @param[out] realResult real part of the result returned here
6364 * @param[out] imagResult imaginary part of the result returned here
6365 */
6366 void arm_cmplx_dot_prod_q31(
6367 q31_t * pSrcA,
6368 q31_t * pSrcB,
6369 uint32_t numSamples,
6370 q63_t * realResult,
6371 q63_t * imagResult);
6372
6373
6374 /**
6375 * @brief Floating-point complex dot product
6376 * @param[in] pSrcA points to the first input vector
6377 * @param[in] pSrcB points to the second input vector
6378 * @param[in] numSamples number of complex samples in each vector
6379 * @param[out] realResult real part of the result returned here
6380 * @param[out] imagResult imaginary part of the result returned here
6381 */
6382 void arm_cmplx_dot_prod_f32(
6383 float32_t * pSrcA,
6384 float32_t * pSrcB,
6385 uint32_t numSamples,
6386 float32_t * realResult,
6387 float32_t * imagResult);
6388
6389
6390 /**
6391 * @brief Q15 complex-by-real multiplication
6392 * @param[in] pSrcCmplx points to the complex input vector
6393 * @param[in] pSrcReal points to the real input vector
6394 * @param[out] pCmplxDst points to the complex output vector
6395 * @param[in] numSamples number of samples in each vector
6396 */
6397 void arm_cmplx_mult_real_q15(
6398 q15_t * pSrcCmplx,
6399 q15_t * pSrcReal,
6400 q15_t * pCmplxDst,
6401 uint32_t numSamples);
6402
6403
6404 /**
6405 * @brief Q31 complex-by-real multiplication
6406 * @param[in] pSrcCmplx points to the complex input vector
6407 * @param[in] pSrcReal points to the real input vector
6408 * @param[out] pCmplxDst points to the complex output vector
6409 * @param[in] numSamples number of samples in each vector
6410 */
6411 void arm_cmplx_mult_real_q31(
6412 q31_t * pSrcCmplx,
6413 q31_t * pSrcReal,
6414 q31_t * pCmplxDst,
6415 uint32_t numSamples);
6416
6417
6418 /**
6419 * @brief Floating-point complex-by-real multiplication
6420 * @param[in] pSrcCmplx points to the complex input vector
6421 * @param[in] pSrcReal points to the real input vector
6422 * @param[out] pCmplxDst points to the complex output vector
6423 * @param[in] numSamples number of samples in each vector
6424 */
6425 void arm_cmplx_mult_real_f32(
6426 float32_t * pSrcCmplx,
6427 float32_t * pSrcReal,
6428 float32_t * pCmplxDst,
6429 uint32_t numSamples);
6430
6431
6432 /**
6433 * @brief Minimum value of a Q7 vector.
6434 * @param[in] pSrc is input pointer
6435 * @param[in] blockSize is the number of samples to process
6436 * @param[out] result is output pointer
6437 * @param[in] index is the array index of the minimum value in the input buffer.
6438 */
6439 void arm_min_q7(
6440 q7_t * pSrc,
6441 uint32_t blockSize,
6442 q7_t * result,
6443 uint32_t * index);
6444
6445
6446 /**
6447 * @brief Minimum value of a Q15 vector.
6448 * @param[in] pSrc is input pointer
6449 * @param[in] blockSize is the number of samples to process
6450 * @param[out] pResult is output pointer
6451 * @param[in] pIndex is the array index of the minimum value in the input buffer.
6452 */
6453 void arm_min_q15(
6454 q15_t * pSrc,
6455 uint32_t blockSize,
6456 q15_t * pResult,
6457 uint32_t * pIndex);
6458
6459
6460 /**
6461 * @brief Minimum value of a Q31 vector.
6462 * @param[in] pSrc is input pointer
6463 * @param[in] blockSize is the number of samples to process
6464 * @param[out] pResult is output pointer
6465 * @param[out] pIndex is the array index of the minimum value in the input buffer.
6466 */
6467 void arm_min_q31(
6468 q31_t * pSrc,
6469 uint32_t blockSize,
6470 q31_t * pResult,
6471 uint32_t * pIndex);
6472
6473
6474 /**
6475 * @brief Minimum value of a floating-point vector.
6476 * @param[in] pSrc is input pointer
6477 * @param[in] blockSize is the number of samples to process
6478 * @param[out] pResult is output pointer
6479 * @param[out] pIndex is the array index of the minimum value in the input buffer.
6480 */
6481 void arm_min_f32(
6482 float32_t * pSrc,
6483 uint32_t blockSize,
6484 float32_t * pResult,
6485 uint32_t * pIndex);
6486
6487
6488 /**
6489 * @brief Maximum value of a Q7 vector.
6490 * @param[in] pSrc points to the input buffer
6491 * @param[in] blockSize length of the input vector
6492 * @param[out] pResult maximum value returned here
6493 * @param[out] pIndex index of maximum value returned here
6494 */
6495 void arm_max_q7(
6496 q7_t * pSrc,
6497 uint32_t blockSize,
6498 q7_t * pResult,
6499 uint32_t * pIndex);
6500
6501
6502 /**
6503 * @brief Maximum value of a Q15 vector.
6504 * @param[in] pSrc points to the input buffer
6505 * @param[in] blockSize length of the input vector
6506 * @param[out] pResult maximum value returned here
6507 * @param[out] pIndex index of maximum value returned here
6508 */
6509 void arm_max_q15(
6510 q15_t * pSrc,
6511 uint32_t blockSize,
6512 q15_t * pResult,
6513 uint32_t * pIndex);
6514
6515
6516 /**
6517 * @brief Maximum value of a Q31 vector.
6518 * @param[in] pSrc points to the input buffer
6519 * @param[in] blockSize length of the input vector
6520 * @param[out] pResult maximum value returned here
6521 * @param[out] pIndex index of maximum value returned here
6522 */
6523 void arm_max_q31(
6524 q31_t * pSrc,
6525 uint32_t blockSize,
6526 q31_t * pResult,
6527 uint32_t * pIndex);
6528
6529
6530 /**
6531 * @brief Maximum value of a floating-point vector.
6532 * @param[in] pSrc points to the input buffer
6533 * @param[in] blockSize length of the input vector
6534 * @param[out] pResult maximum value returned here
6535 * @param[out] pIndex index of maximum value returned here
6536 */
6537 void arm_max_f32(
6538 float32_t * pSrc,
6539 uint32_t blockSize,
6540 float32_t * pResult,
6541 uint32_t * pIndex);
6542
6543
6544 /**
6545 * @brief Q15 complex-by-complex multiplication
6546 * @param[in] pSrcA points to the first input vector
6547 * @param[in] pSrcB points to the second input vector
6548 * @param[out] pDst points to the output vector
6549 * @param[in] numSamples number of complex samples in each vector
6550 */
6551 void arm_cmplx_mult_cmplx_q15(
6552 q15_t * pSrcA,
6553 q15_t * pSrcB,
6554 q15_t * pDst,
6555 uint32_t numSamples);
6556
6557
6558 /**
6559 * @brief Q31 complex-by-complex multiplication
6560 * @param[in] pSrcA points to the first input vector
6561 * @param[in] pSrcB points to the second input vector
6562 * @param[out] pDst points to the output vector
6563 * @param[in] numSamples number of complex samples in each vector
6564 */
6565 void arm_cmplx_mult_cmplx_q31(
6566 q31_t * pSrcA,
6567 q31_t * pSrcB,
6568 q31_t * pDst,
6569 uint32_t numSamples);
6570
6571
6572 /**
6573 * @brief Floating-point complex-by-complex multiplication
6574 * @param[in] pSrcA points to the first input vector
6575 * @param[in] pSrcB points to the second input vector
6576 * @param[out] pDst points to the output vector
6577 * @param[in] numSamples number of complex samples in each vector
6578 */
6579 void arm_cmplx_mult_cmplx_f32(
6580 float32_t * pSrcA,
6581 float32_t * pSrcB,
6582 float32_t * pDst,
6583 uint32_t numSamples);
6584
6585
6586 /**
6587 * @brief Converts the elements of the floating-point vector to Q31 vector.
6588 * @param[in] pSrc points to the floating-point input vector
6589 * @param[out] pDst points to the Q31 output vector
6590 * @param[in] blockSize length of the input vector
6591 */
6592 void arm_float_to_q31(
6593 float32_t * pSrc,
6594 q31_t * pDst,
6595 uint32_t blockSize);
6596
6597
6598 /**
6599 * @brief Converts the elements of the floating-point vector to Q15 vector.
6600 * @param[in] pSrc points to the floating-point input vector
6601 * @param[out] pDst points to the Q15 output vector
6602 * @param[in] blockSize length of the input vector
6603 */
6604 void arm_float_to_q15(
6605 float32_t * pSrc,
6606 q15_t * pDst,
6607 uint32_t blockSize);
6608
6609
6610 /**
6611 * @brief Converts the elements of the floating-point vector to Q7 vector.
6612 * @param[in] pSrc points to the floating-point input vector
6613 * @param[out] pDst points to the Q7 output vector
6614 * @param[in] blockSize length of the input vector
6615 */
6616 void arm_float_to_q7(
6617 float32_t * pSrc,
6618 q7_t * pDst,
6619 uint32_t blockSize);
6620
6621
6622 /**
6623 * @brief Converts the elements of the Q31 vector to Q15 vector.
6624 * @param[in] pSrc is input pointer
6625 * @param[out] pDst is output pointer
6626 * @param[in] blockSize is the number of samples to process
6627 */
6628 void arm_q31_to_q15(
6629 q31_t * pSrc,
6630 q15_t * pDst,
6631 uint32_t blockSize);
6632
6633
6634 /**
6635 * @brief Converts the elements of the Q31 vector to Q7 vector.
6636 * @param[in] pSrc is input pointer
6637 * @param[out] pDst is output pointer
6638 * @param[in] blockSize is the number of samples to process
6639 */
6640 void arm_q31_to_q7(
6641 q31_t * pSrc,
6642 q7_t * pDst,
6643 uint32_t blockSize);
6644
6645
6646 /**
6647 * @brief Converts the elements of the Q15 vector to floating-point vector.
6648 * @param[in] pSrc is input pointer
6649 * @param[out] pDst is output pointer
6650 * @param[in] blockSize is the number of samples to process
6651 */
6652 void arm_q15_to_float(
6653 q15_t * pSrc,
6654 float32_t * pDst,
6655 uint32_t blockSize);
6656
6657
6658 /**
6659 * @brief Converts the elements of the Q15 vector to Q31 vector.
6660 * @param[in] pSrc is input pointer
6661 * @param[out] pDst is output pointer
6662 * @param[in] blockSize is the number of samples to process
6663 */
6664 void arm_q15_to_q31(
6665 q15_t * pSrc,
6666 q31_t * pDst,
6667 uint32_t blockSize);
6668
6669
6670 /**
6671 * @brief Converts the elements of the Q15 vector to Q7 vector.
6672 * @param[in] pSrc is input pointer
6673 * @param[out] pDst is output pointer
6674 * @param[in] blockSize is the number of samples to process
6675 */
6676 void arm_q15_to_q7(
6677 q15_t * pSrc,
6678 q7_t * pDst,
6679 uint32_t blockSize);
6680
6681
6682 /**
6683 * @ingroup groupInterpolation
6684 */
6685
6686 /**
6687 * @defgroup BilinearInterpolate Bilinear Interpolation
6688 *
6689 * Bilinear interpolation is an extension of linear interpolation applied to a two dimensional grid.
6690 * The underlying function <code>f(x, y)</code> is sampled on a regular grid and the interpolation process
6691 * determines values between the grid points.
6692 * Bilinear interpolation is equivalent to two step linear interpolation, first in the x-dimension and then in the y-dimension.
6693 * Bilinear interpolation is often used in image processing to rescale images.
6694 * The CMSIS DSP library provides bilinear interpolation functions for Q7, Q15, Q31, and floating-point data types.
6695 *
6696 * <b>Algorithm</b>
6697 * \par
6698 * The instance structure used by the bilinear interpolation functions describes a two dimensional data table.
6699 * For floating-point, the instance structure is defined as:
6700 * <pre>
6701 * typedef struct
6702 * {
6703 * uint16_t numRows;
6704 * uint16_t numCols;
6705 * float32_t *pData;
6706 * } arm_bilinear_interp_instance_f32;
6707 * </pre>
6708 *
6709 * \par
6710 * where <code>numRows</code> specifies the number of rows in the table;
6711 * <code>numCols</code> specifies the number of columns in the table;
6712 * and <code>pData</code> points to an array of size <code>numRows*numCols</code> values.
6713 * The data table <code>pTable</code> is organized in row order and the supplied data values fall on integer indexes.
6714 * That is, table element (x,y) is located at <code>pTable[x + y*numCols]</code> where x and y are integers.
6715 *
6716 * \par
6717 * Let <code>(x, y)</code> specify the desired interpolation point. Then define:
6718 * <pre>
6719 * XF = floor(x)
6720 * YF = floor(y)
6721 * </pre>
6722 * \par
6723 * The interpolated output point is computed as:
6724 * <pre>
6725 * f(x, y) = f(XF, YF) * (1-(x-XF)) * (1-(y-YF))
6726 * + f(XF+1, YF) * (x-XF)*(1-(y-YF))
6727 * + f(XF, YF+1) * (1-(x-XF))*(y-YF)
6728 * + f(XF+1, YF+1) * (x-XF)*(y-YF)
6729 * </pre>
6730 * Note that the coordinates (x, y) contain integer and fractional components.
6731 * The integer components specify which portion of the table to use while the
6732 * fractional components control the interpolation processor.
6733 *
6734 * \par
6735 * if (x,y) are outside of the table boundary, Bilinear interpolation returns zero output.
6736 */
6737
6738 /**
6739 * @addtogroup BilinearInterpolate
6740 * @{
6741 */
6742
6743
6744 /**
6745 *
6746 * @brief Floating-point bilinear interpolation.
6747 * @param[in,out] S points to an instance of the interpolation structure.
6748 * @param[in] X interpolation coordinate.
6749 * @param[in] Y interpolation coordinate.
6750 * @return out interpolated value.
6751 */
6752 static __INLINE float32_t arm_bilinear_interp_f32(
6753 const arm_bilinear_interp_instance_f32 * S,
6754 float32_t X,
6755 float32_t Y)
6756 {
6757 float32_t out;
6758 float32_t f00, f01, f10, f11;
6759 float32_t *pData = S->pData;
6760 int32_t xIndex, yIndex, index;
6761 float32_t xdiff, ydiff;
6762 float32_t b1, b2, b3, b4;
6763
6764 xIndex = (int32_t) X;
6765 yIndex = (int32_t) Y;
6766
6767 /* Care taken for table outside boundary */
6768 /* Returns zero output when values are outside table boundary */
6769 if(xIndex < 0 || xIndex > (S->numRows - 1) || yIndex < 0 || yIndex > (S->numCols - 1))
6770 {
6771 return (0);
6772 }
6773
6774 /* Calculation of index for two nearest points in X-direction */
6775 index = (xIndex - 1) + (yIndex - 1) * S->numCols;
6776
6777
6778 /* Read two nearest points in X-direction */
6779 f00 = pData[index];
6780 f01 = pData[index + 1];
6781
6782 /* Calculation of index for two nearest points in Y-direction */
6783 index = (xIndex - 1) + (yIndex) * S->numCols;
6784
6785
6786 /* Read two nearest points in Y-direction */
6787 f10 = pData[index];
6788 f11 = pData[index + 1];
6789
6790 /* Calculation of intermediate values */
6791 b1 = f00;
6792 b2 = f01 - f00;
6793 b3 = f10 - f00;
6794 b4 = f00 - f01 - f10 + f11;
6795
6796 /* Calculation of fractional part in X */
6797 xdiff = X - xIndex;
6798
6799 /* Calculation of fractional part in Y */
6800 ydiff = Y - yIndex;
6801
6802 /* Calculation of bi-linear interpolated output */
6803 out = b1 + b2 * xdiff + b3 * ydiff + b4 * xdiff * ydiff;
6804
6805 /* return to application */
6806 return (out);
6807 }
6808
6809
6810 /**
6811 *
6812 * @brief Q31 bilinear interpolation.
6813 * @param[in,out] S points to an instance of the interpolation structure.
6814 * @param[in] X interpolation coordinate in 12.20 format.
6815 * @param[in] Y interpolation coordinate in 12.20 format.
6816 * @return out interpolated value.
6817 */
6818 static __INLINE q31_t arm_bilinear_interp_q31(
6819 arm_bilinear_interp_instance_q31 * S,
6820 q31_t X,
6821 q31_t Y)
6822 {
6823 q31_t out; /* Temporary output */
6824 q31_t acc = 0; /* output */
6825 q31_t xfract, yfract; /* X, Y fractional parts */
6826 q31_t x1, x2, y1, y2; /* Nearest output values */
6827 int32_t rI, cI; /* Row and column indices */
6828 q31_t *pYData = S->pData; /* pointer to output table values */
6829 uint32_t nCols = S->numCols; /* num of rows */
6830
6831 /* Input is in 12.20 format */
6832 /* 12 bits for the table index */
6833 /* Index value calculation */
6834 rI = ((X & (q31_t)0xFFF00000) >> 20);
6835
6836 /* Input is in 12.20 format */
6837 /* 12 bits for the table index */
6838 /* Index value calculation */
6839 cI = ((Y & (q31_t)0xFFF00000) >> 20);
6840
6841 /* Care taken for table outside boundary */
6842 /* Returns zero output when values are outside table boundary */
6843 if(rI < 0 || rI > (S->numRows - 1) || cI < 0 || cI > (S->numCols - 1))
6844 {
6845 return (0);
6846 }
6847
6848 /* 20 bits for the fractional part */
6849 /* shift left xfract by 11 to keep 1.31 format */
6850 xfract = (X & 0x000FFFFF) << 11u;
6851
6852 /* Read two nearest output values from the index */
6853 x1 = pYData[(rI) + (int32_t)nCols * (cI) ];
6854 x2 = pYData[(rI) + (int32_t)nCols * (cI) + 1];
6855
6856 /* 20 bits for the fractional part */
6857 /* shift left yfract by 11 to keep 1.31 format */
6858 yfract = (Y & 0x000FFFFF) << 11u;
6859
6860 /* Read two nearest output values from the index */
6861 y1 = pYData[(rI) + (int32_t)nCols * (cI + 1) ];
6862 y2 = pYData[(rI) + (int32_t)nCols * (cI + 1) + 1];
6863
6864 /* Calculation of x1 * (1-xfract ) * (1-yfract) and acc is in 3.29(q29) format */
6865 out = ((q31_t) (((q63_t) x1 * (0x7FFFFFFF - xfract)) >> 32));
6866 acc = ((q31_t) (((q63_t) out * (0x7FFFFFFF - yfract)) >> 32));
6867
6868 /* x2 * (xfract) * (1-yfract) in 3.29(q29) and adding to acc */
6869 out = ((q31_t) ((q63_t) x2 * (0x7FFFFFFF - yfract) >> 32));
6870 acc += ((q31_t) ((q63_t) out * (xfract) >> 32));
6871
6872 /* y1 * (1 - xfract) * (yfract) in 3.29(q29) and adding to acc */
6873 out = ((q31_t) ((q63_t) y1 * (0x7FFFFFFF - xfract) >> 32));
6874 acc += ((q31_t) ((q63_t) out * (yfract) >> 32));
6875
6876 /* y2 * (xfract) * (yfract) in 3.29(q29) and adding to acc */
6877 out = ((q31_t) ((q63_t) y2 * (xfract) >> 32));
6878 acc += ((q31_t) ((q63_t) out * (yfract) >> 32));
6879
6880 /* Convert acc to 1.31(q31) format */
6881 return ((q31_t)(acc << 2));
6882 }
6883
6884
6885 /**
6886 * @brief Q15 bilinear interpolation.
6887 * @param[in,out] S points to an instance of the interpolation structure.
6888 * @param[in] X interpolation coordinate in 12.20 format.
6889 * @param[in] Y interpolation coordinate in 12.20 format.
6890 * @return out interpolated value.
6891 */
6892 static __INLINE q15_t arm_bilinear_interp_q15(
6893 arm_bilinear_interp_instance_q15 * S,
6894 q31_t X,
6895 q31_t Y)
6896 {
6897 q63_t acc = 0; /* output */
6898 q31_t out; /* Temporary output */
6899 q15_t x1, x2, y1, y2; /* Nearest output values */
6900 q31_t xfract, yfract; /* X, Y fractional parts */
6901 int32_t rI, cI; /* Row and column indices */
6902 q15_t *pYData = S->pData; /* pointer to output table values */
6903 uint32_t nCols = S->numCols; /* num of rows */
6904
6905 /* Input is in 12.20 format */
6906 /* 12 bits for the table index */
6907 /* Index value calculation */
6908 rI = ((X & (q31_t)0xFFF00000) >> 20);
6909
6910 /* Input is in 12.20 format */
6911 /* 12 bits for the table index */
6912 /* Index value calculation */
6913 cI = ((Y & (q31_t)0xFFF00000) >> 20);
6914
6915 /* Care taken for table outside boundary */
6916 /* Returns zero output when values are outside table boundary */
6917 if(rI < 0 || rI > (S->numRows - 1) || cI < 0 || cI > (S->numCols - 1))
6918 {
6919 return (0);
6920 }
6921
6922 /* 20 bits for the fractional part */
6923 /* xfract should be in 12.20 format */
6924 xfract = (X & 0x000FFFFF);
6925
6926 /* Read two nearest output values from the index */
6927 x1 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI) ];
6928 x2 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI) + 1];
6929
6930 /* 20 bits for the fractional part */
6931 /* yfract should be in 12.20 format */
6932 yfract = (Y & 0x000FFFFF);
6933
6934 /* Read two nearest output values from the index */
6935 y1 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI + 1) ];
6936 y2 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI + 1) + 1];
6937
6938 /* Calculation of x1 * (1-xfract ) * (1-yfract) and acc is in 13.51 format */
6939
6940 /* x1 is in 1.15(q15), xfract in 12.20 format and out is in 13.35 format */
6941 /* convert 13.35 to 13.31 by right shifting and out is in 1.31 */
6942 out = (q31_t) (((q63_t) x1 * (0xFFFFF - xfract)) >> 4u);
6943 acc = ((q63_t) out * (0xFFFFF - yfract));
6944
6945 /* x2 * (xfract) * (1-yfract) in 1.51 and adding to acc */
6946 out = (q31_t) (((q63_t) x2 * (0xFFFFF - yfract)) >> 4u);
6947 acc += ((q63_t) out * (xfract));
6948
6949 /* y1 * (1 - xfract) * (yfract) in 1.51 and adding to acc */
6950 out = (q31_t) (((q63_t) y1 * (0xFFFFF - xfract)) >> 4u);
6951 acc += ((q63_t) out * (yfract));
6952
6953 /* y2 * (xfract) * (yfract) in 1.51 and adding to acc */
6954 out = (q31_t) (((q63_t) y2 * (xfract)) >> 4u);
6955 acc += ((q63_t) out * (yfract));
6956
6957 /* acc is in 13.51 format and down shift acc by 36 times */
6958 /* Convert out to 1.15 format */
6959 return ((q15_t)(acc >> 36));
6960 }
6961
6962
6963 /**
6964 * @brief Q7 bilinear interpolation.
6965 * @param[in,out] S points to an instance of the interpolation structure.
6966 * @param[in] X interpolation coordinate in 12.20 format.
6967 * @param[in] Y interpolation coordinate in 12.20 format.
6968 * @return out interpolated value.
6969 */
6970 static __INLINE q7_t arm_bilinear_interp_q7(
6971 arm_bilinear_interp_instance_q7 * S,
6972 q31_t X,
6973 q31_t Y)
6974 {
6975 q63_t acc = 0; /* output */
6976 q31_t out; /* Temporary output */
6977 q31_t xfract, yfract; /* X, Y fractional parts */
6978 q7_t x1, x2, y1, y2; /* Nearest output values */
6979 int32_t rI, cI; /* Row and column indices */
6980 q7_t *pYData = S->pData; /* pointer to output table values */
6981 uint32_t nCols = S->numCols; /* num of rows */
6982
6983 /* Input is in 12.20 format */
6984 /* 12 bits for the table index */
6985 /* Index value calculation */
6986 rI = ((X & (q31_t)0xFFF00000) >> 20);
6987
6988 /* Input is in 12.20 format */
6989 /* 12 bits for the table index */
6990 /* Index value calculation */
6991 cI = ((Y & (q31_t)0xFFF00000) >> 20);
6992
6993 /* Care taken for table outside boundary */
6994 /* Returns zero output when values are outside table boundary */
6995 if(rI < 0 || rI > (S->numRows - 1) || cI < 0 || cI > (S->numCols - 1))
6996 {
6997 return (0);
6998 }
6999
7000 /* 20 bits for the fractional part */
7001 /* xfract should be in 12.20 format */
7002 xfract = (X & (q31_t)0x000FFFFF);
7003
7004 /* Read two nearest output values from the index */
7005 x1 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI) ];
7006 x2 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI) + 1];
7007
7008 /* 20 bits for the fractional part */
7009 /* yfract should be in 12.20 format */
7010 yfract = (Y & (q31_t)0x000FFFFF);
7011
7012 /* Read two nearest output values from the index */
7013 y1 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI + 1) ];
7014 y2 = pYData[((uint32_t)rI) + nCols * ((uint32_t)cI + 1) + 1];
7015
7016 /* Calculation of x1 * (1-xfract ) * (1-yfract) and acc is in 16.47 format */
7017 out = ((x1 * (0xFFFFF - xfract)));
7018 acc = (((q63_t) out * (0xFFFFF - yfract)));
7019
7020 /* x2 * (xfract) * (1-yfract) in 2.22 and adding to acc */
7021 out = ((x2 * (0xFFFFF - yfract)));
7022 acc += (((q63_t) out * (xfract)));
7023
7024 /* y1 * (1 - xfract) * (yfract) in 2.22 and adding to acc */
7025 out = ((y1 * (0xFFFFF - xfract)));
7026 acc += (((q63_t) out * (yfract)));
7027
7028 /* y2 * (xfract) * (yfract) in 2.22 and adding to acc */
7029 out = ((y2 * (yfract)));
7030 acc += (((q63_t) out * (xfract)));
7031
7032 /* acc in 16.47 format and down shift by 40 to convert to 1.7 format */
7033 return ((q7_t)(acc >> 40));
7034 }
7035
7036 /**
7037 * @} end of BilinearInterpolate group
7038 */
7039
7040
7041 /* SMMLAR */
7042 #define multAcc_32x32_keep32_R(a, x, y) \
7043 a = (q31_t) (((((q63_t) a) << 32) + ((q63_t) x * y) + 0x80000000LL ) >> 32)
7044
7045 /* SMMLSR */
7046 #define multSub_32x32_keep32_R(a, x, y) \
7047 a = (q31_t) (((((q63_t) a) << 32) - ((q63_t) x * y) + 0x80000000LL ) >> 32)
7048
7049 /* SMMULR */
7050 #define mult_32x32_keep32_R(a, x, y) \
7051 a = (q31_t) (((q63_t) x * y + 0x80000000LL ) >> 32)
7052
7053 /* SMMLA */
7054 #define multAcc_32x32_keep32(a, x, y) \
7055 a += (q31_t) (((q63_t) x * y) >> 32)
7056
7057 /* SMMLS */
7058 #define multSub_32x32_keep32(a, x, y) \
7059 a -= (q31_t) (((q63_t) x * y) >> 32)
7060
7061 /* SMMUL */
7062 #define mult_32x32_keep32(a, x, y) \
7063 a = (q31_t) (((q63_t) x * y ) >> 32)
7064
7065
7066 #if defined ( __CC_ARM )
7067 /* Enter low optimization region - place directly above function definition */
7068 #if defined( ARM_MATH_CM4 ) || defined( ARM_MATH_CM7)
7069 #define LOW_OPTIMIZATION_ENTER \
7070 _Pragma ("push") \
7071 _Pragma ("O1")
7072 #else
7073 #define LOW_OPTIMIZATION_ENTER
7074 #endif
7075
7076 /* Exit low optimization region - place directly after end of function definition */
7077 #if defined( ARM_MATH_CM4 ) || defined( ARM_MATH_CM7)
7078 #define LOW_OPTIMIZATION_EXIT \
7079 _Pragma ("pop")
7080 #else
7081 #define LOW_OPTIMIZATION_EXIT
7082 #endif
7083
7084 /* Enter low optimization region - place directly above function definition */
7085 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER
7086
7087 /* Exit low optimization region - place directly after end of function definition */
7088 #define IAR_ONLY_LOW_OPTIMIZATION_EXIT
7089
7090 #elif defined(__ARMCC_VERSION) && (__ARMCC_VERSION >= 6010050)
7091 #define LOW_OPTIMIZATION_ENTER
7092 #define LOW_OPTIMIZATION_EXIT
7093 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER
7094 #define IAR_ONLY_LOW_OPTIMIZATION_EXIT
7095
7096 #elif defined(__GNUC__)
7097 #define LOW_OPTIMIZATION_ENTER __attribute__(( optimize("-O1") ))
7098 #define LOW_OPTIMIZATION_EXIT
7099 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER
7100 #define IAR_ONLY_LOW_OPTIMIZATION_EXIT
7101
7102 #elif defined(__ICCARM__)
7103 /* Enter low optimization region - place directly above function definition */
7104 #if defined( ARM_MATH_CM4 ) || defined( ARM_MATH_CM7)
7105 #define LOW_OPTIMIZATION_ENTER \
7106 _Pragma ("optimize=low")
7107 #else
7108 #define LOW_OPTIMIZATION_ENTER
7109 #endif
7110
7111 /* Exit low optimization region - place directly after end of function definition */
7112 #define LOW_OPTIMIZATION_EXIT
7113
7114 /* Enter low optimization region - place directly above function definition */
7115 #if defined( ARM_MATH_CM4 ) || defined( ARM_MATH_CM7)
7116 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER \
7117 _Pragma ("optimize=low")
7118 #else
7119 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER
7120 #endif
7121
7122 /* Exit low optimization region - place directly after end of function definition */
7123 #define IAR_ONLY_LOW_OPTIMIZATION_EXIT
7124
7125 #elif defined(__CSMC__)
7126 #define LOW_OPTIMIZATION_ENTER
7127 #define LOW_OPTIMIZATION_EXIT
7128 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER
7129 #define IAR_ONLY_LOW_OPTIMIZATION_EXIT
7130
7131 #elif defined(__TASKING__)
7132 #define LOW_OPTIMIZATION_ENTER
7133 #define LOW_OPTIMIZATION_EXIT
7134 #define IAR_ONLY_LOW_OPTIMIZATION_ENTER
7135 #define IAR_ONLY_LOW_OPTIMIZATION_EXIT
7136
7137 #endif
7138
7139
7140 #ifdef __cplusplus
7141 }
7142 #endif
7143
7144
7145 #if defined ( __GNUC__ )
7146 #pragma GCC diagnostic pop
7147 #endif
7148
7149 #endif /* _ARM_MATH_H */
7150
7151 /**
7152 *
7153 * End of file.
7154 */