forked from xiaozhi/xiaozhi-esp32
243 lines
7.5 KiB
C++
243 lines
7.5 KiB
C++
#include "AudioDevice.h"
|
|
#include "Board.h"
|
|
|
|
#include <esp_log.h>
|
|
#include <cstring>
|
|
#include <cmath>
|
|
|
|
#define TAG "AudioDevice"
|
|
|
|
AudioDevice::AudioDevice()
|
|
: input_sample_rate_(AUDIO_INPUT_SAMPLE_RATE),
|
|
output_sample_rate_(AUDIO_OUTPUT_SAMPLE_RATE) {
|
|
}
|
|
|
|
AudioDevice::~AudioDevice() {
|
|
if (audio_input_task_ != nullptr) {
|
|
vTaskDelete(audio_input_task_);
|
|
}
|
|
if (rx_handle_ != nullptr) {
|
|
ESP_ERROR_CHECK(i2s_channel_disable(rx_handle_));
|
|
}
|
|
if (tx_handle_ != nullptr) {
|
|
ESP_ERROR_CHECK(i2s_channel_disable(tx_handle_));
|
|
}
|
|
}
|
|
|
|
void AudioDevice::Initialize() {
|
|
#ifdef AUDIO_I2S_METHOD_SIMPLEX
|
|
CreateSimplexChannels();
|
|
#else
|
|
CreateDuplexChannels();
|
|
#endif
|
|
}
|
|
|
|
void AudioDevice::CreateDuplexChannels() {
|
|
#ifndef AUDIO_I2S_METHOD_SIMPLEX
|
|
duplex_ = true;
|
|
|
|
i2s_chan_config_t chan_cfg = {
|
|
.id = I2S_NUM_0,
|
|
.role = I2S_ROLE_MASTER,
|
|
.dma_desc_num = 6,
|
|
.dma_frame_num = 240,
|
|
.auto_clear_after_cb = false,
|
|
.auto_clear_before_cb = false,
|
|
.intr_priority = 0,
|
|
};
|
|
ESP_ERROR_CHECK(i2s_new_channel(&chan_cfg, &tx_handle_, &rx_handle_));
|
|
|
|
i2s_std_config_t std_cfg = {
|
|
.clk_cfg = {
|
|
.sample_rate_hz = (uint32_t)output_sample_rate_,
|
|
.clk_src = I2S_CLK_SRC_DEFAULT,
|
|
.ext_clk_freq_hz = 0,
|
|
.mclk_multiple = I2S_MCLK_MULTIPLE_256
|
|
},
|
|
.slot_cfg = {
|
|
.data_bit_width = I2S_DATA_BIT_WIDTH_32BIT,
|
|
.slot_bit_width = I2S_SLOT_BIT_WIDTH_AUTO,
|
|
.slot_mode = I2S_SLOT_MODE_MONO,
|
|
.slot_mask = I2S_STD_SLOT_LEFT,
|
|
.ws_width = I2S_DATA_BIT_WIDTH_32BIT,
|
|
.ws_pol = false,
|
|
.bit_shift = true,
|
|
.left_align = true,
|
|
.big_endian = false,
|
|
.bit_order_lsb = false
|
|
},
|
|
.gpio_cfg = {
|
|
.mclk = I2S_GPIO_UNUSED,
|
|
.bclk = (gpio_num_t)AUDIO_I2S_GPIO_BCLK,
|
|
.ws = (gpio_num_t)AUDIO_I2S_GPIO_LRCK,
|
|
.dout = (gpio_num_t)AUDIO_I2S_GPIO_DOUT,
|
|
.din = (gpio_num_t)AUDIO_I2S_GPIO_DIN,
|
|
.invert_flags = {
|
|
.mclk_inv = false,
|
|
.bclk_inv = false,
|
|
.ws_inv = false
|
|
}
|
|
}
|
|
};
|
|
ESP_ERROR_CHECK(i2s_channel_init_std_mode(tx_handle_, &std_cfg));
|
|
ESP_ERROR_CHECK(i2s_channel_init_std_mode(rx_handle_, &std_cfg));
|
|
ESP_ERROR_CHECK(i2s_channel_enable(tx_handle_));
|
|
ESP_ERROR_CHECK(i2s_channel_enable(rx_handle_));
|
|
ESP_LOGI(TAG, "Duplex channels created");
|
|
#endif
|
|
}
|
|
|
|
void AudioDevice::CreateSimplexChannels() {
|
|
#ifdef AUDIO_I2S_METHOD_SIMPLEX
|
|
// Create a new channel for speaker
|
|
i2s_chan_config_t chan_cfg = {
|
|
.id = I2S_NUM_0,
|
|
.role = I2S_ROLE_MASTER,
|
|
.dma_desc_num = 6,
|
|
.dma_frame_num = 240,
|
|
.auto_clear_after_cb = true,
|
|
.auto_clear_before_cb = false,
|
|
.intr_priority = 0,
|
|
};
|
|
ESP_ERROR_CHECK(i2s_new_channel(&chan_cfg, &tx_handle_, nullptr));
|
|
|
|
i2s_std_config_t std_cfg = {
|
|
.clk_cfg = {
|
|
.sample_rate_hz = (uint32_t)output_sample_rate_,
|
|
.clk_src = I2S_CLK_SRC_DEFAULT,
|
|
.ext_clk_freq_hz = 0,
|
|
.mclk_multiple = I2S_MCLK_MULTIPLE_256
|
|
},
|
|
.slot_cfg = {
|
|
.data_bit_width = I2S_DATA_BIT_WIDTH_32BIT,
|
|
.slot_bit_width = I2S_SLOT_BIT_WIDTH_AUTO,
|
|
.slot_mode = I2S_SLOT_MODE_MONO,
|
|
.slot_mask = I2S_STD_SLOT_LEFT,
|
|
.ws_width = I2S_DATA_BIT_WIDTH_32BIT,
|
|
.ws_pol = false,
|
|
.bit_shift = true,
|
|
.left_align = true,
|
|
.big_endian = false,
|
|
.bit_order_lsb = false
|
|
},
|
|
.gpio_cfg = {
|
|
.mclk = I2S_GPIO_UNUSED,
|
|
.bclk = (gpio_num_t)AUDIO_I2S_SPK_GPIO_BCLK,
|
|
.ws = (gpio_num_t)AUDIO_I2S_SPK_GPIO_LRCK,
|
|
.dout = (gpio_num_t)AUDIO_I2S_SPK_GPIO_DOUT,
|
|
.din = I2S_GPIO_UNUSED,
|
|
.invert_flags = {
|
|
.mclk_inv = false,
|
|
.bclk_inv = false,
|
|
.ws_inv = false
|
|
}
|
|
}
|
|
};
|
|
ESP_ERROR_CHECK(i2s_channel_init_std_mode(tx_handle_, &std_cfg));
|
|
|
|
// Create a new channel for MIC
|
|
chan_cfg.id = I2S_NUM_1;
|
|
ESP_ERROR_CHECK(i2s_new_channel(&chan_cfg, nullptr, &rx_handle_));
|
|
std_cfg.clk_cfg.sample_rate_hz = (uint32_t)input_sample_rate_;
|
|
std_cfg.gpio_cfg.bclk = (gpio_num_t)AUDIO_I2S_MIC_GPIO_SCK;
|
|
std_cfg.gpio_cfg.ws = (gpio_num_t)AUDIO_I2S_MIC_GPIO_WS;
|
|
std_cfg.gpio_cfg.dout = I2S_GPIO_UNUSED;
|
|
std_cfg.gpio_cfg.din = (gpio_num_t)AUDIO_I2S_MIC_GPIO_DIN;
|
|
ESP_ERROR_CHECK(i2s_channel_init_std_mode(rx_handle_, &std_cfg));
|
|
|
|
ESP_ERROR_CHECK(i2s_channel_enable(tx_handle_));
|
|
ESP_ERROR_CHECK(i2s_channel_enable(rx_handle_));
|
|
ESP_LOGI(TAG, "Simplex channels created");
|
|
#endif
|
|
}
|
|
|
|
int AudioDevice::Write(const int16_t* data, int samples) {
|
|
int32_t buffer[samples];
|
|
|
|
// output_volume_: 0-100
|
|
// volume_factor_: 0-65536
|
|
int32_t volume_factor = pow(double(output_volume_) / 100.0, 2) * 65536;
|
|
for (int i = 0; i < samples; i++) {
|
|
int64_t temp = int64_t(data[i]) * volume_factor; // 使用 int64_t 进行乘法运算
|
|
if (temp > INT32_MAX) {
|
|
buffer[i] = INT32_MAX;
|
|
} else if (temp < INT32_MIN) {
|
|
buffer[i] = INT32_MIN;
|
|
} else {
|
|
buffer[i] = static_cast<int32_t>(temp);
|
|
}
|
|
}
|
|
|
|
size_t bytes_written;
|
|
ESP_ERROR_CHECK(i2s_channel_write(tx_handle_, buffer, samples * sizeof(int32_t), &bytes_written, portMAX_DELAY));
|
|
return bytes_written / sizeof(int32_t);
|
|
}
|
|
|
|
int AudioDevice::Read(int16_t* dest, int samples) {
|
|
size_t bytes_read;
|
|
|
|
int32_t bit32_buffer[samples];
|
|
if (i2s_channel_read(rx_handle_, bit32_buffer, samples * sizeof(int32_t), &bytes_read, portMAX_DELAY) != ESP_OK) {
|
|
ESP_LOGE(TAG, "Read Failed!");
|
|
return 0;
|
|
}
|
|
|
|
samples = bytes_read / sizeof(int32_t);
|
|
for (int i = 0; i < samples; i++) {
|
|
int32_t value = bit32_buffer[i] >> 12;
|
|
dest[i] = (value > INT16_MAX) ? INT16_MAX : (value < -INT16_MAX) ? -INT16_MAX : (int16_t)value;
|
|
}
|
|
return samples;
|
|
}
|
|
|
|
void AudioDevice::OnInputData(std::function<void(std::vector<int16_t>&& data)> callback) {
|
|
on_input_data_ = callback;
|
|
|
|
// 创建音频输入任务
|
|
if (audio_input_task_ == nullptr) {
|
|
xTaskCreate([](void* arg) {
|
|
auto audio_device = (AudioDevice*)arg;
|
|
audio_device->InputTask();
|
|
}, "audio_input", 4096 * 2, this, 3, &audio_input_task_);
|
|
}
|
|
}
|
|
|
|
void AudioDevice::OutputData(std::vector<int16_t>& data) {
|
|
Write(data.data(), data.size());
|
|
}
|
|
|
|
void AudioDevice::InputTask() {
|
|
int duration = 30;
|
|
int input_frame_size = input_sample_rate_ / 1000 * duration * input_channels_;
|
|
while (true) {
|
|
std::vector<int16_t> input_data(input_frame_size);
|
|
int samples = Read(input_data.data(), input_data.size());
|
|
if (samples > 0) {
|
|
if (on_input_data_) {
|
|
on_input_data_(std::move(input_data));
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
void AudioDevice::SetOutputVolume(int volume) {
|
|
output_volume_ = volume;
|
|
ESP_LOGI(TAG, "Set output volume to %d", output_volume_);
|
|
}
|
|
|
|
void AudioDevice::EnableInput(bool enable) {
|
|
if (enable == input_enabled_) {
|
|
return;
|
|
}
|
|
input_enabled_ = enable;
|
|
ESP_LOGI(TAG, "Set input enable to %s", enable ? "true" : "false");
|
|
}
|
|
|
|
void AudioDevice::EnableOutput(bool enable) {
|
|
if (enable == output_enabled_) {
|
|
return;
|
|
}
|
|
output_enabled_ = enable;
|
|
ESP_LOGI(TAG, "Set output enable to %s", enable ? "true" : "false");
|
|
}
|