Introduce an API mirroring the CMSIS-DSP's basicmath. If CMSIS_DSP is enabled, then it will by default be used as a backend. Developers may opt into a custom backend by setting CONFIG_DSP_BACKEND_CMSIS=n. If done, the application must provide `zdsp_backend/dsp.h` and optionally implement the functions in its own .c files. Signed-off-by: Yuval Peress <peress@google.com>
281 lines
8.4 KiB
C
281 lines
8.4 KiB
C
/* Copyright (c) 2022 Google LLC
|
|
* SPDX-License-Identifier: Apache-2.0
|
|
*/
|
|
|
|
#ifndef SUBSYS_MATH_CMSIS_BACKEND_PUBLIC_ZDSP_BACKEND_DSP_H_
|
|
#define SUBSYS_MATH_CMSIS_BACKEND_PUBLIC_ZDSP_BACKEND_DSP_H_
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
/* This include MUST be done before arm_math.h so we can let the arch specific
|
|
* logic set up the right #define values for arm_math.h
|
|
*/
|
|
#include <zephyr/kernel.h>
|
|
|
|
#include <arm_math.h>
|
|
|
|
static inline void zdsp_mult_q7(const q7_t *src_a, const q7_t *src_b, q7_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_mult_q7(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_mult_q15(const q15_t *src_a, const q15_t *src_b, q15_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_mult_q15(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_mult_q31(const q31_t *src_a, const q31_t *src_b, q31_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_mult_q31(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_mult_f32(const float32_t *src_a, const float32_t *src_b, float32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_mult_f32(src_a, src_b, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_add_q7(const q7_t *src_a, const q7_t *src_b, q7_t *dst, uint32_t block_size)
|
|
{
|
|
arm_add_q7(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_add_q15(const q15_t *src_a, const q15_t *src_b, q15_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_add_q15(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_add_q31(const q31_t *src_a, const q31_t *src_b, q31_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_add_q31(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_add_f32(const float32_t *src_a, const float32_t *src_b, float32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_add_f32(src_a, src_b, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_sub_q7(const q7_t *src_a, const q7_t *src_b, q7_t *dst, uint32_t block_size)
|
|
{
|
|
arm_sub_q7(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_sub_q15(const q15_t *src_a, const q15_t *src_b, q15_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_sub_q15(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_sub_q31(const q31_t *src_a, const q31_t *src_b, q31_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_sub_q31(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_sub_f32(const float32_t *src_a, const float32_t *src_b, float32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_sub_f32(src_a, src_b, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_scale_q7(const q7_t *src, q7_t scale_fract, int8_t shift, q7_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_scale_q7(src, scale_fract, shift, dst, block_size);
|
|
}
|
|
static inline void zdsp_scale_q15(const q15_t *src, q15_t scale_fract, int8_t shift, q15_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_scale_q15(src, scale_fract, shift, dst, block_size);
|
|
}
|
|
static inline void zdsp_scale_q31(const q31_t *src, q31_t scale_fract, int8_t shift, q31_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_scale_q31(src, scale_fract, shift, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_scale_f32(const float32_t *src, float32_t scale, float32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_scale_f32(src, scale, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_abs_q7(const q7_t *src, q7_t *dst, uint32_t block_size)
|
|
{
|
|
arm_abs_q7(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_abs_q15(const q15_t *src, q15_t *dst, uint32_t block_size)
|
|
{
|
|
arm_abs_q15(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_abs_q31(const q31_t *src, q31_t *dst, uint32_t block_size)
|
|
{
|
|
arm_abs_q31(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_abs_f32(const float32_t *src, float32_t *dst, uint32_t block_size)
|
|
{
|
|
arm_abs_f32(src, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_negate_q7(const q7_t *src, q7_t *dst, uint32_t block_size)
|
|
{
|
|
arm_negate_q7(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_negate_q15(const q15_t *src, q15_t *dst, uint32_t block_size)
|
|
{
|
|
arm_negate_q15(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_negate_q31(const q31_t *src, q31_t *dst, uint32_t block_size)
|
|
{
|
|
arm_negate_q31(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_negate_f32(const float32_t *src, float32_t *dst, uint32_t block_size)
|
|
{
|
|
arm_negate_f32(src, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_dot_prod_q7(const q7_t *src_a, const q7_t *src_b, uint32_t block_size,
|
|
q31_t *dst)
|
|
{
|
|
arm_dot_prod_q7(src_a, src_b, block_size, dst);
|
|
}
|
|
static inline void zdsp_dot_prod_q15(const q15_t *src_a, const q15_t *src_b, uint32_t block_size,
|
|
q63_t *dst)
|
|
{
|
|
arm_dot_prod_q15(src_a, src_b, block_size, dst);
|
|
}
|
|
static inline void zdsp_dot_prod_q31(const q31_t *src_a, const q31_t *src_b, uint32_t block_size,
|
|
q63_t *dst)
|
|
{
|
|
arm_dot_prod_q31(src_a, src_b, block_size, dst);
|
|
}
|
|
static inline void zdsp_dot_prod_f32(const float32_t *src_a, const float32_t *src_b,
|
|
uint32_t block_size, float32_t *dst)
|
|
{
|
|
arm_dot_prod_f32(src_a, src_b, block_size, dst);
|
|
}
|
|
|
|
static inline void zdsp_shift_q7(const q7_t *src, int8_t shift_bits, q7_t *dst, uint32_t block_size)
|
|
{
|
|
arm_shift_q7(src, shift_bits, dst, block_size);
|
|
}
|
|
static inline void zdsp_shift_q15(const q15_t *src, int8_t shift_bits, q15_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_shift_q15(src, shift_bits, dst, block_size);
|
|
}
|
|
static inline void zdsp_shift_q31(const q31_t *src, int8_t shift_bits, q31_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_shift_q31(src, shift_bits, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_offset_q7(const q7_t *src, q7_t offset, q7_t *dst, uint32_t block_size)
|
|
{
|
|
arm_offset_q7(src, offset, dst, block_size);
|
|
}
|
|
static inline void zdsp_offset_q15(const q15_t *src, q15_t offset, q15_t *dst, uint32_t block_size)
|
|
{
|
|
arm_offset_q15(src, offset, dst, block_size);
|
|
}
|
|
static inline void zdsp_offset_q31(const q31_t *src, q31_t offset, q31_t *dst, uint32_t block_size)
|
|
{
|
|
arm_offset_q31(src, offset, dst, block_size);
|
|
}
|
|
static inline void zdsp_offset_f32(const float32_t *src, float32_t offset, float32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_offset_f32(src, offset, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_clip_q7(const q7_t *src, q7_t *dst, q7_t low, q7_t high,
|
|
uint32_t num_samples)
|
|
{
|
|
arm_clip_q7(src, dst, low, high, num_samples);
|
|
}
|
|
static inline void zdsp_clip_q15(const q15_t *src, q15_t *dst, q15_t low, q15_t high,
|
|
uint32_t num_samples)
|
|
{
|
|
arm_clip_q15(src, dst, low, high, num_samples);
|
|
}
|
|
static inline void zdsp_clip_q31(const q31_t *src, q31_t *dst, q31_t low, q31_t high,
|
|
uint32_t num_samples)
|
|
{
|
|
arm_clip_q31(src, dst, low, high, num_samples);
|
|
}
|
|
static inline void zdsp_clip_f32(const float32_t *src, float32_t *dst, float32_t low,
|
|
float32_t high, uint32_t num_samples)
|
|
{
|
|
arm_clip_f32(src, dst, low, high, num_samples);
|
|
}
|
|
|
|
static inline void zdsp_and_u8(const uint8_t *src_a, const uint8_t *src_b, uint8_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_and_u8(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_and_u16(const uint16_t *src_a, const uint16_t *src_b, uint16_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_and_u16(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_and_u32(const uint32_t *src_a, const uint32_t *src_b, uint32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_and_u32(src_a, src_b, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_or_u8(const uint8_t *src_a, const uint8_t *src_b, uint8_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_or_u8(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_or_u16(const uint16_t *src_a, const uint16_t *src_b, uint16_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_or_u16(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_or_u32(const uint32_t *src_a, const uint32_t *src_b, uint32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_or_u32(src_a, src_b, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_xor_u8(const uint8_t *src_a, const uint8_t *src_b, uint8_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_xor_u8(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_xor_u16(const uint16_t *src_a, const uint16_t *src_b, uint16_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_xor_u16(src_a, src_b, dst, block_size);
|
|
}
|
|
static inline void zdsp_xor_u32(const uint32_t *src_a, const uint32_t *src_b, uint32_t *dst,
|
|
uint32_t block_size)
|
|
{
|
|
arm_xor_u32(src_a, src_b, dst, block_size);
|
|
}
|
|
|
|
static inline void zdsp_not_u8(const uint8_t *src, uint8_t *dst, uint32_t block_size)
|
|
{
|
|
arm_not_u8(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_not_u16(const uint16_t *src, uint16_t *dst, uint32_t block_size)
|
|
{
|
|
arm_not_u16(src, dst, block_size);
|
|
}
|
|
static inline void zdsp_not_u32(const uint32_t *src, uint32_t *dst, uint32_t block_size)
|
|
{
|
|
arm_not_u32(src, dst, block_size);
|
|
}
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#ifdef CONFIG_FP16
|
|
#include "zdsp_backend_f16.h"
|
|
#endif /* COIFNG_FP16 */
|
|
|
|
#endif /* SUBSYS_MATH_CMSIS_BACKEND_PUBLIC_ZDSP_BACKEND_DSP_H_ */
|