Files
kunlun/dtest/bee_afft_test/afft_test.c

508 lines
17 KiB
C
Raw Normal View History

2024-09-28 14:24:04 +08:00
#include "os_types.h"
#include "os_mem_api.h"
#include "dbg_io.h"
#include "iot_diag.h"
#include "iot_io.h"
#include "ahb_hw.h"
#include "afft_hw.h"
#include "iot_afft_api.h"
#include "iot_simd_api.h"
#include "cpu.h"
#include "math.h"
#include "fft_input_real.h"
#include "ifft_input_real.h"
#include "fft_output_real.h"
#include "ifft_output_real.h"
#include "fft_input_complex.h"
#include "ifft_input_complex.h"
#include "fft_output_complex.h"
#include "ifft_output_complex.h"
// test different data mode
#include "input_real.h"
#include "input_ireal.h"
#define AFFT_FFT_REAL_24 (1 << 0)
#define AFFT_IFFT_REAL_24 (1 << 1)
#define AFFT_FFT_COMPLEX_24 (1 << 2)
#define AFFT_IFFT_COMPLEX_24 (1 << 3)
#define AFFT_ALL (AFFT_FFT_REAL_24 | AFFT_IFFT_REAL_24 \
| AFFT_FFT_COMPLEX_24 | AFFT_IFFT_COMPLEX_24)
#define TEST_CASE_AFFT (AFFT_ALL)
#define AFFT_FFT_LOW_24 (1 << 0)
#define AFFT_FFT_HIGH_24 (1 << 1)
#define AFFT_FFT_16_REAL (1 << 2)
#define AFFT_FFT_FLOAT (1 << 3)
#define AFFT_IFFT_LOW_24 (1 << 4)
#define AFFT_IFFT_HIGH_24 (1 << 5)
#define AFFT_IFFT_16_REAL (1 << 6)
#define AFFT_IFFT_FLOAT (1 << 7)
#define AFFT_FFT_COMPLEX_LOW_24 (1 << 8)
#define AFFT_IFFT_COMPLEX_LOW_24 (1 << 9)
#define AFFT_TEST_DM_ALL (AFFT_IFFT_LOW_24 | AFFT_IFFT_HIGH_24 | \
AFFT_IFFT_16_REAL |AFFT_IFFT_FLOAT)
#define TEST_CASE_DATA_MODE (AFFT_FFT_COMPLEX_LOW_24|AFFT_IFFT_COMPLEX_LOW_24|AFFT_FFT_LOW_24|AFFT_IFFT_LOW_24|AFFT_IFFT_HIGH_24|AFFT_FFT_HIGH_24) //(AFFT_FFT_FLOAT)
typedef struct _mcycle_cnt {
uint64_t fft_float; // 512w fft float cost
uint64_t sw_dma_itoi; // 512w
uint64_t sw_dma_ftoi;
uint32_t sw_dma_itof;
} mcycle_cnt_t;
typedef struct _cycle_cpy {
uint64_t memcpy_ram2ram;
uint64_t memcpy_ram2fft;
uint64_t memcpy_fft2ram;
uint64_t simd_ram2ram;
uint64_t simd_ram2fft;
uint64_t simd_fft2ram;
uint64_t swdma_ram2ram;
uint64_t swdma_ram2fft;
uint64_t swdma_fft2ram;
} mcycle_cpy_t;
mcycle_cnt_t g_mcycle_cnt = {0};
mcycle_cpy_t g_mcycle_cpy = {0};
uint32_t result[1024] = {0};
void output_compare(uint32_t *dst, uint32_t *src, uint32_t size)
{
uint32_t s = 0;
uint32_t d = 0;
uint32_t inc = 0;
uint32_t err_cnt = 0;
for(uint32_t i = 0; i < size; i++) {
s = (*(src + i) & ~0xff000000);
d = (*(dst + i) & ~0xff000000);
if (s >= d) {
inc = s - d;
} else {
inc = d - s;
}
if (inc > 5) {
if(err_cnt<20)
iot_printf("error i: %d, val: [result:%d - %d], inc: %d\n",
i, (int32_t)(*(src + i)), (int32_t)(*(dst + i)), inc);
err_cnt++;
//return;
}
}
if(err_cnt==0)
iot_printf("successful.....\n");
else
iot_printf("ERROR: err_cnt %d.....\n",err_cnt);
}
void output_print(uint32_t *dst, uint32_t *src, uint32_t size)
{
for(uint32_t i = 0; i < size; i++) {
int32_t tmp;
tmp = (int32_t )(*(dst+i));
iot_printf("%08x\n", tmp);
}
iot_printf("successful.....\n");
}
void data_left_shift(void *dst, void *src, uint32_t len, uint8_t bit)
{
uint32_t *d = (uint32_t *)dst;
uint32_t *s = (uint32_t *) src;
for(uint32_t i = 0; i < len; i++) {
*(d + i) = (*(s +i) << bit);
}
}
void data_bind(void *dst, void *src, uint32_t len)
{
uint32_t *d = (uint32_t *)dst;
uint32_t *s = (uint32_t *) src;
for(uint32_t i = 0; i < len/2; i++) {
*(d + i) = (*(s +i*2)&0xffff) + (*(s + 2*i+1) << 16);
}
}
void data_right_shift(void *dst, void *src, uint32_t len, uint8_t bit)
{
int32_t *d = (int32_t *)dst;
int32_t *s = (int32_t *) src;
for(uint32_t i = 0; i < len; i++) {
*(d + i) = (*(s +i) >> bit);
}
}
void afft_new_test()
{
uint64_t org = cpu_get_mcycle();
iot_printf("----------------------mcycle org: %d-------------------\n", org);
#if (TEST_CASE_DATA_MODE & AFFT_FFT_LOW_24)
iot_printf("afft test fft 256 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_fft(result, (uint32_t *)input_real_256, 256,
AFFT_FMT_LOW_24BIT, AFFT_REAL_256); //result
output_compare((uint32_t *)result, (uint32_t *)output_real_256, 256);
iot_printf("afft test fft 512 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_fft(result, (uint32_t *)input_real_512, 512,
AFFT_FMT_LOW_24BIT, AFFT_REAL_512); //result
output_compare((uint32_t *)result, (uint32_t *)output_real_512, 512);
iot_printf("afft test fft 1024 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_fft(result, (uint32_t *)input_real_1024, 1024,
AFFT_FMT_LOW_24BIT, AFFT_REAL_1024); //result
output_compare((uint32_t *)result, (uint32_t *)output_real_1024, 1024);
iot_printf("afft test fft 64 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_init();
iot_afft_real_fft(result, (uint32_t *)input_real_64, 64,
AFFT_FMT_LOW_24BIT, AFFT_REAL_64); //result
output_compare((uint32_t *)result, (uint32_t *)output_real_64, 64);
iot_printf("afft test fft 128 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_fft(result, (uint32_t *)input_real_128, 128,
AFFT_FMT_LOW_24BIT, AFFT_REAL_128); //result
output_compare((uint32_t *)result, (uint32_t *)output_real_128, 128);
#endif
#if (TEST_CASE_DATA_MODE & AFFT_FFT_HIGH_24)
iot_printf("afft test fft 256 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_real_256_h24, input_real_256, 256, 8);
iot_afft_real_fft(result, (uint32_t *)input_real_256_h24, 256,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_256); //result
data_right_shift(result, result, 256, 8);
output_compare((uint32_t *)result, (uint32_t *)output_real_256, 256);
iot_printf("afft test fft 512 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_real_512_h24, input_real_512, 512, 8);
iot_afft_real_fft(result, (uint32_t *)input_real_512_h24, 512,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_512);
data_right_shift(result, result, 512, 8);
output_compare((uint32_t *)result, (uint32_t *)output_real_512, 512);
iot_printf("afft test fft 1024 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_real_1024_h24, input_real_1024, 1024, 8);
iot_afft_real_fft(result, (uint32_t *)input_real_1024_h24, 1024,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_1024); //result
data_right_shift(result, result, 1024, 8);
output_compare((uint32_t *)result, (uint32_t *)output_real_1024, 1024);
iot_printf("afft test fft 64 high 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_init();
data_left_shift(input_real_64_h24, input_real_64, 64, 8);
iot_afft_real_fft(result, (uint32_t *)input_real_64_h24, 64,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_64);
data_right_shift(result, result, 64, 8);
output_compare((uint32_t *)result, (uint32_t *)output_real_64, 64);
iot_printf("afft test fft 128 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_real_128_h24, input_real_128, 128, 8);
iot_afft_real_fft(result, (uint32_t *)input_real_128_h24, 128,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_128);
data_right_shift(result, result, 128, 8);
output_compare((uint32_t *)result, (uint32_t *)output_real_128, 128);
#endif
#if (TEST_CASE_DATA_MODE & AFFT_FFT_16_REAL)
iot_printf("afft test fft 512 16-16bit real data\n");
os_mem_set(result, 0, 1024);
data_bind(input_real_512_1616, input_real_512, 512);
iot_afft_real_fft(result, (uint32_t *)input_real_512_1616, 256,
AFFT_FMT_16BIT, AFFT_REAL_512);
iot_printf("output fft real 24:\n");
for(uint32_t i = 0; i < 256; i++) {
uint32_t tmp;
tmp = (uint32_t )(*(result+i));
iot_printf("0x%08x\n", tmp);
iot_printf("-\n");
}
for(uint32_t i = 0; i < 256; i++) {
int16_t low;
int16_t high;
low = (int16_t)(result[i] & 0xffff);
high = (int16_t)((result[i] & 0xffff0000) >> 16);
iot_printf("%d\n", low);
iot_printf("%d\n", high);
}
iot_printf("AFFT_FFT_REAL_24 done....\n");
#endif
#if (TEST_CASE_DATA_MODE & AFFT_FFT_FLOAT)
iot_printf("afft test fft 512 float real data\n");
os_mem_set(result, 0, 1024);
org = cpu_get_mcycle();
iot_afft_real_fft(result, (uint32_t *)input_float_512, 512,
AFFT_FMT_FLOAT_32BIT, AFFT_REAL_512);
g_mcycle_cnt.fft_float = cpu_get_mcycle() - org;
iot_printf("output fft real 24:\n");
for(uint32_t i = 0; i < 512; i++) {
uint32_t tmp;
tmp = (uint32_t )(*(result+i));
iot_printf("0x%08x\n", tmp);
}
iot_printf("AFFT_FFT_REAL_24 done....\n");
#endif
#if (TEST_CASE_DATA_MODE & AFFT_IFFT_LOW_24)
iot_printf("afft test ifft 256 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_256, 256,
AFFT_FMT_LOW_24BIT, AFFT_REAL_256);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_256, 256);
iot_printf("afft test ifft 512 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_512, 512,
AFFT_FMT_LOW_24BIT, AFFT_REAL_512);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_512, 512);
iot_printf("afft test ifft 1024 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_1024, 1024,
AFFT_FMT_LOW_24BIT, AFFT_REAL_1024);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_1024, 1024);
iot_printf("afft test ifft 64 low 24bit real data\n");
iot_afft_init();
os_mem_set(result, 0, 1024);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_64, 64,
AFFT_FMT_LOW_24BIT, AFFT_REAL_64);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_64, 64);
iot_printf("afft test ifft 128 low 24bit real data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_128, 128,
AFFT_FMT_LOW_24BIT, AFFT_REAL_128);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_128, 128);
#endif
#if (TEST_CASE_DATA_MODE & AFFT_IFFT_HIGH_24)
iot_printf("afft test ifft 256 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_ireal_256_h24, input_ireal_256, 256, 8);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_256_h24, 256,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_256);
data_right_shift(result, result, 256, 8);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_256, 256);
iot_printf("afft test ifft 512 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_ireal_512_h24, input_ireal_512, 512, 8);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_512_h24, 512,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_512);
data_right_shift(result, result, 512, 8);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_512, 512);
iot_printf("afft test ifft 1024 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_ireal_1024_h24, input_ireal_1024, 1024, 8);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_1024_h24, 1024,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_1024);
data_right_shift(result, result, 1024, 8);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_1024, 1024);
iot_printf("afft test ifft 64 high 24bit real data\n");
iot_afft_init();
os_mem_set(result, 0, 1024);
data_left_shift(input_ireal_64_h24, input_ireal_64, 64, 8);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_64_h24, 64,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_64);
data_right_shift(result, result, 64, 8);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_64, 64);
iot_printf("afft test ifft 128 high 24bit real data\n");
os_mem_set(result, 0, 1024);
data_left_shift(input_ireal_128_h24, input_ireal_128, 128, 8);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_128_h24, 128,
AFFT_FMT_HIGH_24BIT, AFFT_REAL_128);
data_right_shift(result, result, 128, 8);
output_compare((uint32_t *)result, (uint32_t *)output_ireal_128, 128);
#endif
#if (TEST_CASE_DATA_MODE & AFFT_IFFT_16_REAL)
iot_printf("afft test ifft 512 16-16bit real data\n");
os_mem_set(result, 0, 1024);
data_bind(input_ireal_512_1616, input_ireal_512, 512);
iot_afft_real_ifft(result, (uint32_t *)input_ireal_512_1616, 256,
AFFT_FMT_16BIT, AFFT_REAL_512);
iot_printf("output fft real 24:\n");
for(uint32_t i = 0; i < 256; i++) {
uint32_t tmp;
tmp = (uint32_t )(*(result+i));
iot_printf("0x%08x\n", tmp);
iot_printf("-\n");
}
for(uint32_t i = 0; i < 256; i++) {
int16_t low;
int16_t high;
low = (int16_t)(result[i] & 0xffff);
high = (int16_t)((result[i] & 0xffff0000) >> 16);
iot_printf("%d\n", low);
iot_printf("%d\n", high);
}
iot_printf("AFFT_FFT_REAL_24 done....\n");
#endif
#if (TEST_CASE_DATA_MODE & AFFT_IFFT_FLOAT)
iot_printf("afft test ifft 512 float data\n");
os_mem_set(result, 0, 1024);
iot_afft_real_ifft(result, (uint32_t *)input_ifloat_512, 512,
AFFT_FMT_FLOAT_32BIT, AFFT_REAL_512);
iot_printf("output fft real 24:\n");
for(uint32_t i = 0; i < 512; i++) {
uint32_t tmp;
tmp = (uint32_t )(*(result+i));
iot_printf("0x%08x\n", tmp);
}
iot_printf("AFFT_FFT_REAL_24 done....\n");
#endif
#if (TEST_CASE_DATA_MODE & AFFT_FFT_COMPLEX_LOW_24)
iot_printf("afft test fft 256 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_fft(result, fft_input_256_complex, 256,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_128);
output_compare((uint32_t *)result, fft_output_256_complex, 256);
iot_printf("afft test fft 512 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_fft(result, fft_input_512_complex, 512,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_256);
output_compare((uint32_t *)result, fft_output_512_complex, 512);
iot_printf("afft test fft 1K 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_fft(result, fft_input_complex, 1024,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_512);
output_compare((uint32_t *)result, fft_output_complex, 1024);
iot_printf("afft test fft 64 24bit complex data\n");
iot_afft_init();
os_mem_set(result, 0, 1024);
iot_afft_complex_fft(result, fft_input_64_complex, 64,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_32);
output_compare((uint32_t *)result, fft_output_64_complex, 64);
iot_printf("afft test fft 128 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_fft(result, fft_input_128_complex, 128,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_64);
output_compare((uint32_t *)result, fft_output_128_complex, 128);
#endif
#if (TEST_CASE_DATA_MODE & AFFT_IFFT_COMPLEX_LOW_24)
iot_printf("afft test ifft 256 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_ifft(result, ifft_input_256_complex, 256,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_128);
output_compare((uint32_t *)result, ifft_output_256_complex, 256);
iot_printf("afft test ifft 512 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_ifft(result, ifft_input_512_complex, 512,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_256);
output_compare((uint32_t *)result, ifft_output_512_complex, 512);
iot_printf("afft test ifft 1K 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_ifft(result, ifft_input_complex, 1024,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_512);
output_compare((uint32_t *)result, ifft_output_complex, 1024);
iot_printf("afft test ifft 64 24bit complex data\n");
iot_afft_init();
os_mem_set(result, 0, 1024);
iot_afft_complex_ifft(result, ifft_input_64_complex, 64,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_32);
output_compare((uint32_t *)result, ifft_output_64_complex, 64);
iot_printf("afft test ifft 128 24bit complex data\n");
os_mem_set(result, 0, 1024);
iot_afft_complex_ifft(result, ifft_input_128_complex, 128,
AFFT_FMT_LOW_24BIT, AFFT_COMPLEX_64);
output_compare((uint32_t *)result, ifft_output_128_complex, 128);
#endif
}
float sw_dma_test[512] = {0};
float sw_out[512] = {0};
extern void sw_dma_memcpy(void *dest, void *src, uint16_t total_len);
extern void* memcpy(void* dest, const void* src, uint32_t size);
int main(void)
{
volatile uint32_t mstatus = 0x8001f888;
asm volatile ("csrw mstatus, %0" : "=r"(mstatus));
dbg_uart_init();
//iot_dbg_uart_set_port(IOT_UART_PORT0, 3000000, 0, 8, 1);
iot_printf("\n-------AUDIO FFT TEST---------\n");
iot_afft_init();
while(1) {
afft_new_test();
}
iot_printf("\n-------AUDIO FFT TEST FINISH---------\n");
while(1);
return 0;
}