部署算法需要完成以下四个方面的功能:
- 创建DSP算法组件目录及编写代码
- 在DSP上录音
- 使用算法加速库加速算法
- 核间通讯
- DUMP 数据到PC
创建DSP算法组件目录创建并进入目录:
code">mkdir -p lichee/rtos-components/thirdparty/my_dsp_asr/srcmkdir -p lichee/rtos-components/thirdparty/my_dsp_asr/inccd lichee/rtos-components/thirdparty/my_dsp_asr/编写 Kconfig 文件:
code">menu "my dsp asr"config COMPONENTS_MY_DSP_ASR bool "my dsp asr" depends on ARCH_DSP default n help to doendmenu修改 Kconfig后建议重新 menuconfig
在 lichee/rtos-components/thirdparty/Kconfig 中追加:
code">source "components/common/thirdparty/my_dsp_asr/Kconfig"编写 Makefile:
code">obj-y += src/my_dsp_asr.o#selfCFLAGS += -Icomponents/common/aw/asr_demo/inc/在 lichee/rtos-components/thirdparty/Makefile 中追加:
code">obj-$(CONFIG_COMPONENTS_MY_DSP_ASR) += my_dsp_asr/编写基础代码 code">#include #include #include #include #include #include #include static void my_dsp_asr_thread(void *arg){ size_t loop = (size_t)arg; printf("%s enter\n", __func__); while (loop--) { printf("%s %u\n", __func__, loop); vTaskDelay(500 / portTICK_PERIOD_MS); } printf("%s exit\n", __func__); vTaskDelete(NULL);}const char *thread_name = "my_dsp_asr_thread";size_t stack_size = 0x4000;size_t thread_priority = 1;int cmd_my_dsp_asr(int argc, char *argv[]){ size_t loop = 10; TaskHandle_t handle = NULL; printf("%s enter\n", __func__); if(xTaskCreate(my_dsp_asr_thread, thread_name, stack_size, (void *)loop, thread_priority, &handle) != pdPASS) { printf("xTaskCreate %s failed!\n", thread_name); } printf("%s exit\n", __func__); return 0;}FINSH_FUNCTION_EXPORT_CMD(cmd_my_dsp_asr, my_dsp_asr, my dsp asr);./build.sh menuconfig,选择以下配置:
code">CONFIG_COMPONENTS_MY_DSP_ASR(会根据 Kconfig 的 select 字段自动选上依赖的组件)
检查是否编译进固件:
code">grep -r cmd_my_dsp_asr ./out/ --include=*.bin可以看到:
code">lichee/dsp$ grep -r cmd_my_dsp_asr ./out/ --include=*.binBinary file ./out/r128s3/evb1/r128s2_dsp0_evb1.bin matchesBinary file ./out/r128s3/evb1/r128s2_dsp0_evb1_raw.bin matchesBinary file ./out/r128s3/evb1/r128s2_dsp0_evb1_xcc.bin matches烧录固件即可在串口终端输入:
code">rpccli dsp my_dsp_asr后期可以添加开机自启:
code">diff --git a/arch/sun20iw2/init-sun20iw2.c b/arch/sun20iw2/init-sun20iw2.cindex cfb2d45d..9b5c2a5d 100644--- a/arch/sun20iw2/init-sun20iw2.c+++ b/arch/sun20iw2/init-sun20iw2.c@@ -160,5 +160,10 @@ void app_init(void) rpdata_ctrl_init(); #endif+#ifdef CONFIG_COMPONENTS_MY_DSP_ASR+ int cmd_my_dsp_asr(int argc, char *argv[]);+ cmd_my_dsp_asr(0, NULL);+#endif+ }在DSP上录音在Kconfig中添加:
code"> bool "my dsp asr" depends on ARCH_DSP+ select COMPONENTS_AW_AUDIO_SYSTEM default n help在Makefile中添加
code">#audio systemCFLAGS += -Icomponents/common/aw/AudioSystem/include/参考代码:
code">#include "AudioRecord.h"#define MS_PER_FRAME (10)#define RECORD_RATE (16000)#define RECORD_NAME "capture"static const size_t record_time_ms = 10 * 1000;static const uint32_t rate = RECORD_RATE;static const uint8_t channels = 3;static const uint8_t bitwidth = 16;static int16_t record_buffer[RECORD_RATE * MS_PER_FRAME * 3 / 1000];static void my_record_thread(void *arg){ tAudioRecord *pAudioRecord = NULL; int ret; size_t time_ms = 0; printf("%s enter\n", __func__); pAudioRecord = AudioRecordCreate(RECORD_NAME); if (!pAudioRecord) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } ret = AudioRecordSetup(pAudioRecord, rate, channels, bitwidth); if (ret) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } while (time_ms < record_time_ms) { ret = AudioRecordRead(pAudioRecord, record_buffer, sizeof(record_buffer)); if (ret < 0) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } time_ms += MS_PER_FRAME; printf("%ums: read %d\n", time_ms, ret); } AudioRecordStop(pAudioRecord); AudioRecordDestroy(pAudioRecord); printf("%s exit\n", __func__); vTaskDelete(NULL);}使用算法加速库本节只是代码演示,对于有HIFI5授权的客户可以向 Candence 获取 NatureDSP_Signal 和 xa_nnlib_api 的源码包,其中包含api的说明文档:
- libxa_nnlib/doc/HiFi5-NNLib-ProgrammersGuide-API.pdf
- hifi5_library/doc/NatureDSP_Signal_Library_Reference_HiFi5.pdf
在Kconfig中添加:
code"> bool "my dsp asr" depends on ARCH_DSP select COMPONENTS_AW_AUDIO_SYSTEM+ select COMPONENTS_XTENSA_HIFI5_NNLIB_LIBRARY+ select COMPONENTS_XTENSA_HIFI5_VFPU_LIBRARY default n help在Makefile中添加
code">CFLAGS += -I components/thirdparty/xtensa/hifi5_nn_v170_library/includeCFLAGS += -I components/thirdparty/xtensa/hifi5_vfpu_v200_library/include(链接加速库的动作已经在 lichee/dsp/Makefile 中添加,无需重复添加)
FFT 参考代码:
code">#include #include "NatureDSP_Signal.h"#include "xa_nnlib_api.h"#ifndef PI#define PI (3.141592653f)#endifstruct cplxf_t { float r; float i;};static inline void make_src_cplxf_from_record_buffer(struct cplxf_t *output, int16_t *input, int N, uint8_t chs, uint8_t ch_index){ int i = 0; for (i = 0; i < N; i++) { output.r = input[i * chs + ch_index]; output.i = 0.0f; }}// N*3/4 *twdstepstatic inline void make_twd_cplxf(struct cplxf_t *output, const int N, const int twdstep){ int n, m; for (n = 0; n < (twdstep * N) / 4; n++) { for (m = 0; m < 3; m++) { float phi = 2 * PI * (m + 1) * n / (twdstep * N); output[n * 3 + m].r = cosf(phi); output[n * 3 + m].i = sinf(phi); } }}int get_max(const struct cplxf_t *input_cplxf, int N){ float max = 0.0f; float index = 0; int i = 0; for (i = 0; i < N; i++) { float cur = input_cplxf.r * input_cplxf.r + input_cplxf.i * input_cplxf.i; if (cur > max) { max = cur; index = i; } } return index;}#define FFT_SIZE (1024)static struct cplxf_t g_tmp_cplxf[FFT_SIZE];static int record_data_handler(struct cplxf_t *output_cplxf, const struct cplxf_t *input_cplxf, const struct cplxf_t *twd_cplxf, int N){ if (N != FFT_SIZE) { printf("%s incorrect data length: %d\n", __func__, N); return -1; } memcpy(g_tmp_cplxf, input_cplxf, sizeof(g_tmp_cplxf)); fft_cplxf_ie( (complex_float *)output_cplxf, (complex_float *)g_tmp_cplxf, (const complex_float *)twd_cplxf, 1, FFT_SIZE); return 0;}在录音代码中添加:
code"> ret = AudioRecordSetup(pAudioRecord, rate, channels, bitwidth); if (ret) { printf("%s:%u error!\n", __func__, __LINE__); // TODO }+ static struct cplxf_t g_input_cplxf[FFT_SIZE];+ static struct cplxf_t g_output_cplxf[FFT_SIZE];+ static struct cplxf_t g_twd_cplxf[FFT_SIZE];+ int N = rate * MS_PER_FRAME / 1000;+ int twdstep = 1;+ int max_index = -1;+ make_twd_cplxf(g_twd_cplxf, N, twdstep); while (time_ms < record_time_ms) { ret = AudioRecordRead(pAudioRecord, record_buffer, sizeof(record_buffer)); if (ret < 0) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } time_ms += MS_PER_FRAME;+ max_index = -1;+ make_src_cplxf_from_record_buffer(g_input_cplxf, record_buffer, N, channels, 0);+ if( !record_data_handler(g_output_cplxf, g_input_cplxf, g_twd_cplxf, N)) {+ max_index = get_max(g_output_cplxf, N);+ } printf("%ums: read %d, max: %d\n", time_ms, ret, max_index); }核间通讯代码仅供参考,不包含实际业务代码
在Kconfig中添加:
code"> bool "my dsp asr" depends on ARCH_DSP select COMPONENTS_AW_AUDIO_SYSTEM+ select COMPONENTS_RPDATA select COMPONENTS_XTENSA_HIFI5_NNLIB_LIBRARY select COMPONENTS_XTENSA_HIFI5_VFPU_LIBRARY default n help在Makefile中添加
code">#rpdataCFLAGS += -Icomponents/common/aw/rpdata/include/由于核间通讯需要RV核配合,故还需编写RV端控制及接收数据的组件,可以参照编写DSP算法组件的方法编写: Kconfig:
code">menu "my rv asr"config COMPONENTS_MY_RV_ASR bool "my RV asr" depends on !ARCH_DSP select COMPONENTS_RPDATA default n help to doendmenu(注意是 !ARCH_DSP)
其它修改类似第一节内容,不再重复说明; rv 端 menuconfig命令为 mrtos_menuconfig rv端执行代码不需要"rpccli dsp";
通用代码:
code">#include struct my_rpd_t { rpdata_t *rpd; // both void *addr; // both size_t buf_len; // send void (*cb)(void *priv, void *data, unsigned int data_len); // recv void *priv; // recv};struct my_rpd_cfg_t { int dir; // both const char *type; // both const char *name; // both size_t buf_len; // send void (*cb)(void *priv, void *data, unsigned int data_len); // recv void *priv; // recv};static void rpd_ch_deinit(struct my_rpd_t *hdl){ if (hdl->rpd) { rpdata_t *rpd = hdl->rpd; hdl->cb = NULL; hdl->priv = NULL; hdl->buf_len = 0; hdl->addr = NULL; hdl->rpd = NULL; rpdata_destroy(rpd); }}static int rpd_recv_ch_callback(rpdata_t *rpd, void *data, unsigned int data_len){ struct my_rpd_t *hdl = (struct my_rpd_t *)rpdata_get_private_data(rpd); if (hdl->cb) hdl->cb(hdl->priv, data, data_len); return 0;}static struct rpdata_cbs rpd_recv_cb = { .recv_cb = rpd_recv_ch_callback,};static int rpd_recv_ch_init(struct my_rpd_t *hdl, struct my_rpd_cfg_t *cfg){ printf("recv rpd dir:%d, type:%s, name:%s\n", cfg->dir, cfg->type, cfg->name); hdl->rpd = rpdata_connect(cfg->dir, cfg->type, cfg->name); if (!hdl->rpd) { printf("rpdata_connect failed!\n"); return -1; } hdl->addr = rpdata_buffer_addr(hdl->rpd); if (!hdl->addr) { printf("rpdata_buffer_addr failed!\n"); rpd_ch_deinit(hdl); return -1; } hdl->cb = cfg->cb; hdl->priv = cfg->priv; rpdata_set_private_data(hdl->rpd, hdl); rpdata_set_recv_cb(hdl->rpd, &rpd_recv_cb); return 0;}static int rpd_send_ch_init(struct my_rpd_t *hdl, struct my_rpd_cfg_t *cfg){ printf("send rpd dir:%d, type:%s, name:%s, buf_len:%u\n", cfg->dir, cfg->type, cfg->name, cfg->buf_len); hdl->rpd = rpdata_create(cfg->dir, cfg->type, cfg->name, cfg->buf_len); if (!hdl->rpd) { printf("rpdata_create failed!\n"); goto err; } hdl->addr = rpdata_buffer_addr(hdl->rpd); if (!hdl->addr) { printf("rpdata_buffer_addr failed!\n"); goto err; } hdl->buf_len = cfg->buf_len; return 0;err: rpd_ch_deinit(hdl); return -1;}static int rpd_send(struct my_rpd_t *hdl, void *data){ memcpy(hdl->addr, data, hdl->buf_len); rpdata_wait_connect(hdl->rpd); return rpdata_send(hdl->rpd, 0, hdl->buf_len);}// RV to DSP 控制通道#define RPD_CTL_TYPE ("RVtoDSPCtl")#define RPD_CTL_NAME ("RVtoDSPCtlCh")#define RPD_CTL_SIZE (4)// DSP to RV 数据通道#define RPD_DATA_TYPE ("DSPtoRVData")#define RPD_DATA_NAME ("DSPtoRVDataCh")#define RPD_DATA_SIZE (64)DSP端代码:
code">static int g_run = 0;static void my_rpd_dsp_recv_cb(void *priv, void *data, unsigned int data_len){ printf("%s recv:%d\n", __func__, data_len); memcpy(&g_run, data, sizeof(g_run));}static void my_rpd_thread(void *arg){ struct my_rpd_t send_ch; struct my_rpd_cfg_t send_cfg = { .dir = 2, .type = RPD_DATA_TYPE, .name = RPD_DATA_NAME, .buf_len = RPD_DATA_SIZE, }; struct my_rpd_t recv_ch; struct my_rpd_cfg_t recv_cfg = { .dir = 2, .type = RPD_CTL_TYPE, .name = RPD_CTL_NAME, .cb = my_rpd_dsp_recv_cb, .priv = NULL, }; unsigned char data[RPD_DATA_SIZE]; int i = 0; for (i = 0; i < RPD_DATA_SIZE; i++) { data = '0' + 1; } g_run = 1; printf("%s start\n", __func__); if (rpd_send_ch_init(&send_ch, &send_cfg)) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } if (rpd_recv_ch_init(&recv_ch, &recv_cfg)) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } while(g_run) { rpd_send(&send_ch, data); vTaskDelay(500 / portTICK_PERIOD_MS); } rpd_ch_deinit(&recv_ch); rpd_ch_deinit(&send_ch); printf("%s exit\n", __func__); vTaskDelete(NULL);}RV端代码:
code">static int g_run = 0;static void my_rpd_rv_recv_cb(void *priv, void *data, unsigned int data_len){ printf("%s recv:%d\n", __func__, data_len);}static void my_rpd_thread(void *arg){ struct my_rpd_t send_ch; struct my_rpd_cfg_t send_cfg = { .dir = 3, .type = RPD_CTL_TYPE, .name = RPD_CTL_NAME, .buf_len = RPD_CTL_SIZE, }; struct my_rpd_t recv_ch; struct my_rpd_cfg_t recv_cfg = { .dir = 3, .type = RPD_DATA_TYPE, .name = RPD_DATA_NAME, .cb = my_rpd_rv_recv_cb, .priv = NULL, }; g_run = 1; printf("%s start\n", __func__); if (rpd_send_ch_init(&send_ch, &send_cfg)) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } if (rpd_recv_ch_init(&recv_ch, &recv_cfg)) { printf("%s:%u error!\n", __func__, __LINE__); // TODO } while(1) { int run = g_run; rpd_send(&send_ch, &run); if (!run) break; vTaskDelay(500 / portTICK_PERIOD_MS); } rpd_ch_deinit(&recv_ch); rpd_ch_deinit(&send_ch); printf("%s exit\n", __func__); vTaskDelete(NULL);}RV 端和 DSP 端各自创建处理线程;
DSP 定时将数据发给 RV,RV 定时将运行标志发给 DSP;
RV 端修改 g_run 的值为 0,RV 将 g_run 的值发送给 DSP 后退出,DSP 收到 g_run 也将退出;
DUMP 数据到PCDSP 端没有文件系统,所以数据需要先通过核间通讯发送给 RV 核,再由 RV 核通过某种方式保存或发送;
在 RV核上 可以使用 adb forward 实时将数据传输到 PC,或者也可以保存数据到 flash,然后使用 adb pull 到 PC;
本节的代码都是跑在RV核上的;
可以使用现有封装接口:
code">// file_path和port只需指定一个即可,另一个填NULL或0// 指定file_path表示保存数据到flash,指定port表示提供adb传输数据到PCvoid *data_save_create(const char *name, const char *file_path, int port);void data_save_destroy(void *_hdl);int data_save_request(void *_hdl, void *data, int size, int timeout_ms);// 需要保存后续数据到另一文件时调用,用于分割音频数据int data_save_flush(void *_hdl, int timeout_ms);可以复制 lichee/rtos-components/aw/asr_demo/inc/data_save.h 和 lichee/rtos-components/aw/asr_demo/src/data_save.c 到自己的组件中使用,或者选上 CONFIG_COMPONENTS_ASR_DEMO 时可以直接使用;
- 通过标准文件操作接口保存到flash或data_save组件指定文件路径保存到 flash
- 按以下步骤通过 adb forward 传输数据到 PC:
① 设备端:
code">reboot(重启设备)(等待设备重启完成)adb shell af -p [代码中填写的port] -r② PC端:
code">adb forward tcp:11112 tcp:[代码中填写的port]adb_record.py(或adb_record_3.py,2个文件都在lichee/rtos-components/aw/asr_demo/tools/,接收到的数据会保存在脚本执行目录下)③ 设备端开始调用data_save接口创建通道并发送数据(可以参照第一节添加start和stop传输的命令)
|