#include "dsp_err.h"
#include "dspm_mult_platform.h"

Include dependency graph for dspm_mult.h:

This graph shows which files directly or indirectly include this file:

Functions
esp_err_t	dspm_mult_3x3x1_f32_ae32 (const float *A, const float *B, float *C)
	Matrix multiplication A[3x3]xB[3x1].
esp_err_t	dspm_mult_3x3x3_f32_ae32 (const float *A, const float *B, float *C)
	Matrix multiplication A[3x3]xB[3x3].
esp_err_t	dspm_mult_4x4x1_f32_ae32 (const float *A, const float *B, float *C)
	Matrix multiplication A[4x4]xB[4x1].
esp_err_t	dspm_mult_4x4x4_f32_ae32 (const float *A, const float *B, float *C)
	Matrix multiplication A[4x4]xB[4x4].

esp_err_t	dspm_mult_f32_ansi (const float *A, const float *B, float *C, int m, int n, int k)
	Matrix multiplication.
esp_err_t	dspm_mult_f32_ae32 (const float *A, const float *B, float *C, int m, int n, int k)
esp_err_t	dspm_mult_f32_aes3 (const float *A, const float *B, float *C, int m, int n, int k)
esp_err_t	dspm_mult_f32_arp4 (const float *A, const float *B, float *C, int m, int n, int k)

esp_err_t	dspm_mult_s16_ansi (const int16_t *A, const int16_t *B, int16_t *C, int m, int n, int k, int shift)
	Matrix multiplication, 16-bit signed int.
esp_err_t	dspm_mult_s16_ae32 (const int16_t *A, const int16_t *B, int16_t *C, int m, int n, int k, int shift)
esp_err_t	dspm_mult_s16_aes3 (const int16_t *A, const int16_t *B, int16_t *C, int m, int n, int k, int shift)
esp_err_t	dspm_mult_s16_arp4 (const int16_t *A, const int16_t *B, int16_t *C, int m, int n, int k, int shift)
#define	dspm_mult_s16 dspm_mult_s16_ansi
#define	dspm_mult_f32 dspm_mult_f32_ansi
#define	dspm_mult_3x3x1_f32(A, B, C)
#define	dsps_sub_f32 dsps_sub_f32_ansi
#define	dsps_add_f32 dsps_add_f32_ansi
#define	dspm_mult_4x4x4_f32(A, B, C)
#define	dspm_mult_ex_f32 dspm_mult_ex_f32_ansi
#define	dspm_mult_3x3x3_f32(A, B, C)
#define	dspm_mult_4x4x1_f32(A, B, C)
esp_err_t	dspm_mult_ex_f32_ansi (const float *A, const float *B, float *C, int m, int n, int k, int A_padd, int B_padd, int C_padd)
	Matrix subset multiplication.
esp_err_t	dspm_mult_ex_f32_ae32 (const float *A, const float *B, float *C, int m, int n, int k, int A_padd, int B_padd, int C_padd)
esp_err_t	dspm_mult_ex_f32_aes3 (const float *A, const float *B, float *C, int m, int n, int k, int A_padd, int B_padd, int C_padd)
esp_err_t	dspm_mult_ex_f32_arp4 (const float *A, const float *B, float *C, int m, int n, int k, int A_padd, int B_padd, int C_padd)

Macro Definition Documentation

◆ dspm_mult_3x3x1_f32

#define dspm_mult_3x3x1_f32	(	A,
		B,
		C )

Value:

dspm_mult_f32(A,B,C, 3, 3, 1)

dspm_mult_f32

#define dspm_mult_f32

Definition dspm_mult.h:221

C

float C[4][16]

Definition test_mmult.c:22

B

float B[8][16]

Definition test_mmult.c:21

A

float A[4][8]

Definition test_mmult.c:20

Definition at line 222 of file dspm_mult.h.

◆ dspm_mult_3x3x3_f32

#define dspm_mult_3x3x3_f32	(	A,
		B,
		C )

Value:

dspm_mult_f32(A,B,C,3,3,3);

Definition at line 227 of file dspm_mult.h.

◆ dspm_mult_4x4x1_f32

#define dspm_mult_4x4x1_f32	(	A,
		B,
		C )

Value:

dspm_mult_f32(A,B,C, 4, 4, 1)

Definition at line 228 of file dspm_mult.h.

◆ dspm_mult_4x4x4_f32

#define dspm_mult_4x4x4_f32	(	A,
		B,
		C )

Value:

dspm_mult_f32(A,B,C, 4, 4, 4)

Definition at line 225 of file dspm_mult.h.

◆ dspm_mult_ex_f32

#define dspm_mult_ex_f32 dspm_mult_ex_f32_ansi

Definition at line 226 of file dspm_mult.h.

Referenced by dspm::operator*(), and dspm::Mat::operator*=().

◆ dspm_mult_f32

#define dspm_mult_f32 dspm_mult_f32_ansi

Definition at line 221 of file dspm_mult.h.

Referenced by dspm::operator*(), and dspm::Mat::operator*=().

◆ dspm_mult_s16

#define dspm_mult_s16 dspm_mult_s16_ansi

Definition at line 220 of file dspm_mult.h.

◆ dsps_add_f32

#define dsps_add_f32 dsps_add_f32_ansi

Definition at line 224 of file dspm_mult.h.

◆ dsps_sub_f32

#define dsps_sub_f32 dsps_sub_f32_ansi

Definition at line 223 of file dspm_mult.h.

Function Documentation

◆ dspm_mult_3x3x1_f32_ae32()

esp_err_t dspm_mult_3x3x1_f32_ae32	(	const float *	A,
		const float *	B,
		float *	C )

Matrix multiplication A[3x3]xB[3x1].

Matrix multiplication for two floating point matrices 3x3 and 3x1: C[3][1] = A[3][3] * B[3][1]. The implementation is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[3][3]
[in]	B	input matrix/vector B[3][1]
	C	result matrix/vector C[3][1]

Returns

ESP_OK on success
One of the error codes from DSP library

References A, B, and C.

◆ dspm_mult_3x3x3_f32_ae32()

esp_err_t dspm_mult_3x3x3_f32_ae32	(	const float *	A,
		const float *	B,
		float *	C )

Matrix multiplication A[3x3]xB[3x3].

Matrix multiplication for two square 3x3 floating point matrices: C[3][3] = A[3][3] * B[3][3] The implementation is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[3][3]
[in]	B	input matrix B[3][3]
	C	result matrix C[3][3]

Returns

ESP_OK on success
One of the error codes from DSP library

References A, B, and C.

◆ dspm_mult_4x4x1_f32_ae32()

esp_err_t dspm_mult_4x4x1_f32_ae32	(	const float *	A,
		const float *	B,
		float *	C )

Matrix multiplication A[4x4]xB[4x1].

Matrix multiplication for two floating point matrices 4x4 and 4x1: C[4][1] = A[4][4] * B[4][1]. The implementation is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[4][4]
[in]	B	input matrix/vector B[4][1]
	C	result matrix/vector C[4][1]

Returns

ESP_OK on success
One of the error codes from DSP library

References A, B, and C.

◆ dspm_mult_4x4x4_f32_ae32()

esp_err_t dspm_mult_4x4x4_f32_ae32	(	const float *	A,
		const float *	B,
		float *	C )

Matrix multiplication A[4x4]xB[4x4].

Matrix multiplication for two square 4x4 floating point matrices: C[4][4] = A[4][4] * B[4][4]. The implementation is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[4][4]
[in]	B	input matrix B[4][4]
	C	result matrix C[4][4]

Returns

ESP_OK on success
One of the error codes from DSP library

References A, B, C, k, m, and n.

◆ dspm_mult_ex_f32_ae32()

esp_err_t dspm_mult_ex_f32_ae32	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k,
		int	A_padd,
		int	B_padd,
		int	C_padd )

References A, B, C, k, m, and n.

◆ dspm_mult_ex_f32_aes3()

esp_err_t dspm_mult_ex_f32_aes3	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k,
		int	A_padd,
		int	B_padd,
		int	C_padd )

References A, B, C, k, m, and n.

◆ dspm_mult_ex_f32_ansi()

esp_err_t dspm_mult_ex_f32_ansi	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k,
		int	A_padd,
		int	B_padd,
		int	C_padd )

Matrix subset multiplication.

One or all of the matrices are matrix subsets, described with pointers and strides. Matrix multiplication for two floating point matrices: C[m][k] = A[m][n] * B[n][k]. The extension (_ansi) uses ANSI C and can be compiled and run on any platform. The extension (_ae32) is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[m][n]
[in]	B	input matrix B[n][k]
[out]	C	result matrix C[m][k]
[in]	m	matrix dimension
[in]	n	matrix dimension
[in]	k	matrix dimension
[in]	A_padd	input matrix A padding
[in]	B_padd	input matrix B padding
[in]	C_padd	result matrix C padding

Returns

ESP_OK on success
One of the error codes from DSP library

Definition at line 12 of file dspm_mult_ex_f32_ansi.c.

{
    // Body of the padded ("matrix subset") float multiply: C = A * B, where each
    // matrix row may be followed by extra elements that are skipped.
    // NOTE(review): this body uses A_rows / A_cols / B_cols / A_padding /
    // B_padding / C_padding, while the rendered prototype names the same
    // parameters m / n / k / A_padd / B_padd / C_padd — presumably the
    // definition uses the longer names; confirm against the .c file.

    // Reject missing buffers.
    if (NULL == A) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
    if (NULL == B) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
    if (NULL == C) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
 
    // Every dimension must be strictly positive; the loops below read
    // A[i * A_step] and B[j] unconditionally, so at least one column is needed.
    if (A_rows <= 0) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
    if (A_cols <= 0) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
    if (B_cols <= 0) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
 
    // Padding may be zero but never negative.
    if (A_padding < 0) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
    if (B_padding < 0) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
    if (C_padding < 0) {
        return ESP_ERR_DSP_PARAM_OUTOFRANGE;
    }
 
    // Distance, in elements, between the starts of consecutive rows.
    // C has B_cols columns, hence C_step is derived from B_cols.
    const int A_step = A_cols + A_padding;
    const int B_step = B_cols + B_padding;
    const int C_step = B_cols + C_padding;
 
    for (int i = 0; i < A_rows; i++) {
        for (int j = 0; j < B_cols; j++) {
            // Seed the output element with the s == 0 term so C does not need
            // to be zeroed first; the inner loop then starts at s == 1.
            C[i * C_step + j] = A[i * A_step] * B[j];
            for (int s = 1; s < A_cols; s++) {
                // Accumulates directly in C[], one product at a time.
                C[i * C_step + j] += A[i * A_step + s] * B[s * B_step + j];
            }
        }
    }
    return ESP_OK;
}

References A, B, C, ESP_ERR_DSP_PARAM_OUTOFRANGE, and ESP_OK.

◆ dspm_mult_ex_f32_arp4()

esp_err_t dspm_mult_ex_f32_arp4	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k,
		int	A_padd,
		int	B_padd,
		int	C_padd )

References A, B, C, k, m, and n.

◆ dspm_mult_f32_ae32()

esp_err_t dspm_mult_f32_ae32	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k )

References A, B, C, k, m, and n.

Referenced by test_mmult().

Here is the caller graph for this function:

◆ dspm_mult_f32_aes3()

esp_err_t dspm_mult_f32_aes3	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k )

References A, B, C, k, m, and n.

Referenced by test_mmult().

Here is the caller graph for this function:

◆ dspm_mult_f32_ansi()

esp_err_t dspm_mult_f32_ansi	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k )

Matrix multiplication.

Matrix multiplication for two floating point matrices: C[m][k] = A[m][n] * B[n][k]. The extension (_ansi) uses ANSI C and can be compiled and run on any platform. The extension (_ae32) is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[m][n]
[in]	B	input matrix B[n][k]
	C	result matrix C[m][k]
[in]	m	matrix dimension
[in]	n	matrix dimension
[in]	k	matrix dimension

Returns

ESP_OK on success
One of the error codes from DSP library

Definition at line 22 of file dspm_mult_f32_ansi.c.

{
    // Body of the dense row-major float multiply: C[m][k] = A[m][n] * B[n][k].
    // NOTE(review): no argument validation is performed here — A, B and C are
    // dereferenced without NULL checks, and A[i * n] / B[j] are read even when
    // n <= 0 (as long as m and k are positive). Callers must pass valid
    // buffers and n >= 1.
    for (int i = 0 ; i < m ; i++) {
        for (int j = 0 ; j < k ; j++) {
            // Seed the output element with the s == 0 term so C does not need
            // to be zeroed first; the inner loop then starts at s == 1.
            C[i * k + j] = A[i * n] * B[j];
            for (int s = 1; s < n ; s++) {
                // Accumulates directly in C[], one product at a time.
                C[i * k + j] += A[i * n + s] * B[s * k + j];
            }
        }
    }
    // This body has no failure path; it always reports success.
    return ESP_OK;
}

References A, B, C, ESP_OK, k, m, and n.

◆ dspm_mult_f32_arp4()

esp_err_t dspm_mult_f32_arp4	(	const float *	A,
		const float *	B,
		float *	C,
		int	m,
		int	n,
		int	k )

References A, B, C, k, m, and n.

◆ dspm_mult_s16_ae32()

esp_err_t dspm_mult_s16_ae32	(	const int16_t *	A,
		const int16_t *	B,
		int16_t *	C,
		int	m,
		int	n,
		int	k,
		int	shift )

References A, B, C, k, m, and n.

◆ dspm_mult_s16_aes3()

esp_err_t dspm_mult_s16_aes3	(	const int16_t *	A,
		const int16_t *	B,
		int16_t *	C,
		int	m,
		int	n,
		int	k,
		int	shift )

References A, B, C, k, m, and n.

◆ dspm_mult_s16_ansi()

esp_err_t dspm_mult_s16_ansi	(	const int16_t *	A,
		const int16_t *	B,
		int16_t *	C,
		int	m,
		int	n,
		int	k,
		int	shift )

Matrix multiplication, 16-bit signed int.

Matrix multiplication for two signed 16-bit fixed point matrices: C[m][k] = (A[m][n] * B[n][k]) >> (15 - shift). The extension (_ansi) uses ANSI C and can be compiled and run on any platform. The extension (_ae32) is optimized for ESP32 chip.

Parameters

[in]	A	input matrix A[m][n]
[in]	B	input matrix B[n][k]
	C	result matrix C[m][k]
[in]	m	matrix dimension
[in]	n	matrix dimension
[in]	k	matrix dimension
[in]	shift	every result will be shifted and stored as 16 bit signed value.

Returns

ESP_OK on success
One of the error codes from DSP library

Definition at line 21 of file dspm_mult_s16_ansi.c.

{
    // Body of the 16-bit fixed-point multiply: each output element is the
    // dot product of a row of A and a column of B, rescaled by (shift - 15).
    // NOTE(review): no argument validation is performed here; A, B and C are
    // dereferenced without NULL checks.

    // Net scaling applied to the accumulator: positive means shift left,
    // zero or negative means shift right by (15 - shift).
    int final_shift = shift - 15;
    for (int i = 0 ; i < m ; i++) {
        for (int j = 0 ; j < k ; j++) {
            // This code also could be used
            //dsps_dotprode_f32_ae32(&A[i*n],&B[j],&C[i*k + j],n,1,n);
            // The accumulator starts at 0x7fff >> shift rather than 0 —
            // presumably a rounding bias for the right shift below; confirm.
            long long acc = 0x7fff >> shift;
            for (int s = 0; s < n ; s++) {
                // Operands are widened to 32 bits before multiplying; the sum
                // is kept in a long long.
                acc += (int32_t)A[i * n + s] * (int32_t)B[s * k + j];
            }
            // The shifted accumulator is assigned to the output element with an
            // implicit narrowing conversion; no saturation/clamping is done here.
            if (final_shift > 0) {
                C[i * k + j] = (acc << final_shift);
            } else {
                C[i * k + j] = (acc >> (-final_shift));
            }
        }
    }
    // This body has no failure path; it always reports success.
    return ESP_OK;
}

References A, B, C, ESP_OK, k, m, and n.

◆ dspm_mult_s16_arp4()

esp_err_t dspm_mult_s16_arp4	(	const int16_t *	A,
		const int16_t *	B,
		int16_t *	C,
		int	m,
		int	n,
		int	k,
		int	shift )

References A, B, C, k, m, and n.

Functions

Macro Definition Documentation

◆ dspm_mult_3x3x1_f32

◆ dspm_mult_3x3x3_f32

◆ dspm_mult_4x4x1_f32

◆ dspm_mult_4x4x4_f32

◆ dspm_mult_ex_f32

◆ dspm_mult_f32

◆ dspm_mult_s16

◆ dsps_add_f32

◆ dsps_sub_f32

Function Documentation

◆ dspm_mult_3x3x1_f32_ae32()

◆ dspm_mult_3x3x3_f32_ae32()

◆ dspm_mult_4x4x1_f32_ae32()

◆ dspm_mult_4x4x4_f32_ae32()

◆ dspm_mult_ex_f32_ae32()

◆ dspm_mult_ex_f32_aes3()

◆ dspm_mult_ex_f32_ansi()

◆ dspm_mult_ex_f32_arp4()

◆ dspm_mult_f32_ae32()

◆ dspm_mult_f32_aes3()

◆ dspm_mult_f32_ansi()

◆ dspm_mult_f32_arp4()

◆ dspm_mult_s16_ae32()

◆ dspm_mult_s16_aes3()

◆ dspm_mult_s16_ansi()

◆ dspm_mult_s16_arp4()