Convolution is a mathematical operation that operates on two finite length vectors to generate a finite length output vector. Convolution is similar to correlation and is frequently used in filtering and data analysis. The CMSIS DSP library contains functions for convolving Q7, Q15, Q31, and floating-point data types. The library also provides fast versions of the Q15 and Q31 functions.

Algorithm

Let a[n] and b[n] be sequences of length srcALen and srcBLen samples respectively. Then the convolution

+    c[n] = a[n] * b[n]
+

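: is defined as

    c[n] = \sum_{k=0}^{srcALen-1} a[k] \, b[n-k]

: where b[n-k] is taken to be zero whenever n-k lies outside the range 0, 1, ..., srcBLen-1.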

: Note that c[n] is of length srcALen + srcBLen - 1 and is defined over the interval n=0, 1, 2, ..., srcALen + srcBLen - 2. pSrcA points to the first input vector of length srcALen and pSrcB points to the second input vector of length srcBLen. The output result is written to pDst and the calling function must allocate srcALen+srcBLen-1 words for the result.

: Conceptually, when two signals a[n] and b[n] are convolved, the signal b[n] slides over a[n]. For each offset n, the overlapping portions of a[n] and b[n] are multiplied and summed together.

: Note that convolution is a commutative operation:

-                  a[n] * b[n] = b[n] * a[n].
-

: This means that switching the A and B arguments to the convolution functions has no effect.

Fixed-Point Behavior

: Convolution requires summing up a large number of intermediate products. As such, the Q7, Q15, and Q31 functions run a risk of overflow and saturation. Refer to the function specific documentation below for further details of the particular algorithm used.

Fast Versions

: Fast versions are supported for Q31 and Q15. The fast versions take fewer cycles than the standard Q31 and Q15 convolution functions, but they require the input signals to be scaled down to avoid intermediate overflows.

Opt Versions

: Opt versions are supported for Q15 and Q7. The design uses an internal scratch buffer to achieve better optimisation. These versions take fewer cycles but consume more memory (scratch memory) than the standard Q15 and Q7 versions.

: Note that c[n] is of length srcALen + srcBLen - 1 and is defined over the interval n=0, 1, 2, ..., srcALen + srcBLen - 2. pSrcA points to the first input vector of length srcALen and pSrcB points to the second input vector of length srcBLen. The output result is written to pDst and the calling function must allocate srcALen+srcBLen-1 words for the result.

: Conceptually, when two signals a[n] and b[n] are convolved, the signal b[n] slides over a[n]. For each offset n, the overlapping portions of a[n] and b[n] are multiplied and summed together.

Note that convolution is a commutative operation:

+    a[n] * b[n] = b[n] * a[n].
+

: This means that switching the A and B arguments to the convolution functions has no effect.

Fixed-Point Behavior: Convolution requires summing up a large number of intermediate products. As such, the Q7, Q15, and Q31 functions run a risk of overflow and saturation. Refer to the function specific documentation below for further details of the particular algorithm used.

Fast Versions: Fast versions are supported for Q31 and Q15. The fast versions take fewer cycles than the standard Q31 and Q15 convolution functions, but they require the input signals to be scaled down to avoid intermediate overflows.

Opt Versions: Opt versions are supported for Q15 and Q7. The design uses an internal scratch buffer to achieve better optimisation. These versions take fewer cycles but consume more memory (scratch memory) than the standard Q15 and Q7 versions.

Function Documentation

- +

- + @@ -185,7 +182,7 @@ Functions - + @@ -209,28 +206,26 @@ Functions

Parameters

void arm_conv_f32	(	float32_t *	const float32_t *	pSrcA,
		float32_t *	const float32_t *	pSrcB,

- - - - - + + + + +

[in]	*pSrcA	points to the first input sequence.
[in]	srcALen	length of the first input sequence.
[in]	*pSrcB	points to the second input sequence.
[in]	srcBLen	length of the second input sequence.
[out]	*pDst	points to the location where the output result is written. Length srcALen+srcBLen-1.
[in]	pSrcA	points to the first input sequence
[in]	srcALen	length of the first input sequence
[in]	pSrcB	points to the second input sequence
[in]	srcBLen	length of the second input sequence
[out]	pDst	points to the location where the output result is written. Length srcALen+srcBLen-1.

Functions
void	arm_conv_f32 (float32_t *pSrcA, uint32_t srcALen, float32_t *pSrcB, uint32_t srcBLen, float32_t *pDst)
	Convolution of floating-point sequences. More...

void	arm_conv_fast_opt_q15 (q15_t *pSrcA, uint32_t srcALen, q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst, q15_t *pScratch1, q15_t *pScratch2)
	Convolution of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4. More...

void	arm_conv_fast_q15 (q15_t *pSrcA, uint32_t srcALen, q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst)
	Convolution of Q15 sequences (fast version) for Cortex-M3 and Cortex-M4. More...

void	arm_conv_fast_q31 (q31_t *pSrcA, uint32_t srcALen, q31_t *pSrcB, uint32_t srcBLen, q31_t *pDst)
	Convolution of Q31 sequences (fast version) for Cortex-M3 and Cortex-M4. More...

void	arm_conv_opt_q15 (q15_t *pSrcA, uint32_t srcALen, q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst, q15_t *pScratch1, q15_t *pScratch2)
	Convolution of Q15 sequences. More...

void	arm_conv_opt_q7 (q7_t *pSrcA, uint32_t srcALen, q7_t *pSrcB, uint32_t srcBLen, q7_t *pDst, q15_t *pScratch1, q15_t *pScratch2)
	Convolution of Q7 sequences. More...

void	arm_conv_q15 (q15_t *pSrcA, uint32_t srcALen, q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst)
	Convolution of Q15 sequences. More...

void	arm_conv_q31 (q31_t *pSrcA, uint32_t srcALen, q31_t *pSrcB, uint32_t srcBLen, q31_t *pDst)
	Convolution of Q31 sequences. More...

void	arm_conv_q7 (q7_t *pSrcA, uint32_t srcALen, q7_t *pSrcB, uint32_t srcBLen, q7_t *pDst)
	Convolution of Q7 sequences. More...

void	arm_conv_f32 (const float32_t *pSrcA, uint32_t srcALen, const float32_t *pSrcB, uint32_t srcBLen, float32_t *pDst)
	Convolution of floating-point sequences. More...

void	arm_conv_fast_opt_q15 (const q15_t *pSrcA, uint32_t srcALen, const q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst, q15_t *pScratch1, q15_t *pScratch2)
	Convolution of Q15 sequences (fast version). More...

void	arm_conv_fast_q15 (const q15_t *pSrcA, uint32_t srcALen, const q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst)
	Convolution of Q15 sequences (fast version). More...

void	arm_conv_fast_q31 (const q31_t *pSrcA, uint32_t srcALen, const q31_t *pSrcB, uint32_t srcBLen, q31_t *pDst)
	Convolution of Q31 sequences (fast version). More...

void	arm_conv_opt_q15 (const q15_t *pSrcA, uint32_t srcALen, const q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst, q15_t *pScratch1, q15_t *pScratch2)
	Convolution of Q15 sequences. More...

void	arm_conv_opt_q7 (const q7_t *pSrcA, uint32_t srcALen, const q7_t *pSrcB, uint32_t srcBLen, q7_t *pDst, q15_t *pScratch1, q15_t *pScratch2)
	Convolution of Q7 sequences. More...

void	arm_conv_q15 (const q15_t *pSrcA, uint32_t srcALen, const q15_t *pSrcB, uint32_t srcBLen, q15_t *pDst)
	Convolution of Q15 sequences. More...

void	arm_conv_q31 (const q31_t *pSrcA, uint32_t srcALen, const q31_t *pSrcB, uint32_t srcBLen, q31_t *pDst)
	Convolution of Q31 sequences. More...

void	arm_conv_q7 (const q7_t *pSrcA, uint32_t srcALen, const q7_t *pSrcB, uint32_t srcBLen, q7_t *pDst)
	Convolution of Q7 sequences. More...

void arm_conv_fast_opt_q15	(	q15_t *	const q15_t *	pSrcA,
		q15_t *	const q15_t *	pSrcB,

void arm_conv_fast_q15	(	q15_t *	const q15_t *	pSrcA,
		q15_t *	const q15_t *	pSrcB,

void arm_conv_fast_q31	(	q31_t *	const q31_t *	pSrcA,
		q31_t *	const q31_t *	pSrcB,

void arm_conv_opt_q15	(	q15_t *	const q15_t *	pSrcA,
		q15_t *	const q15_t *	pSrcB,

void arm_conv_opt_q7	(	q7_t *	const q7_t *	pSrcA,
		q7_t *	const q7_t *	pSrcB,

void arm_conv_q15	(	q15_t *	const q15_t *	pSrcA,
		q15_t *	const q15_t *	pSrcB,

void arm_conv_q31	(	q31_t *	const q31_t *	pSrcA,
		q31_t *	const q31_t *	pSrcB,

void arm_conv_q7	(	q7_t *	const q7_t *	pSrcA,
		q7_t *	const q7_t *	pSrcB,

Functions

Description

Function Documentation