webrtc 3A移植以及实时处理
#include <stdio.h>
#include <stdlib.h>
#include <alsa/asoundlib.h>
#include <pthread.h>
#include <errno.h>
#include <mutex>
#include "modules/audio_processing/include/audio_processing.h"
constexpr int sample_rate_hz = 16000; // 假设采样率为16kHz
constexpr size_t num_channels = 1; // 假设单声道
constexpr size_t frame_size = sample_rate_hz / 100; // 10ms 帧大小
#define CHANNELS 2
#define SAMPLE_RATE 16000
#define PERIOD_SIZE 160
#define BUFFER_SIZE (PERIOD_SIZE * 2)
bool gRun = true;
typedef struct
{
snd_pcm_t *playback_handle;
FILE *pcm_file;
int8_t m_pPlayoutBuffer[PERIOD_SIZE * 2 * 2];
int m_nPlayoutBufferSizeIn20MS = PERIOD_SIZE * 2 * 2;
int m_nPlayoutFramesLeft = 0;
snd_pcm_t *capture_handle;
FILE *pcm_out_file;
int8_t m_pRecordBuffer[PERIOD_SIZE * 2 * 2];
int m_nRecordBufferSizeIn20MS = PERIOD_SIZE * 2 * 2;
int m_nRecordingFramesLeft = PERIOD_SIZE;
FILE *pcm_3a_file;
FILE *pcm_ref_file;
int8_t m_pRefBuffer[PERIOD_SIZE * 2];
int8_t m_p3ABuffer[PERIOD_SIZE * 2]; // in byte
int8_t m_pNearBuffer[PERIOD_SIZE * 2]; // in byte
rtc::scoped_refptr<webrtc::AudioProcessing> apm;
} audio_data_t;
void monoTurnStereo(const int16_t *pSrc, int16_t *pDts, size_t size)
{
for (int j = 0; j < size; j++)
{
pDts[2 * j] = pSrc[j];
pDts[2 * j + 1] = pSrc[j];
}
}
void stereoTurnMono(const unsigned char *pSrc, unsigned char *pDts, size_t size)
{
int nLeftCount = 0;
for (size_t i = 0; i < size; i += 4)
{
pDts[nLeftCount] = pSrc[i];
pDts[nLeftCount + 1] = pSrc[i + 1];
nLeftCount += 2;
}
}
int32_t errorRecovery(int32_t nRet, snd_pcm_t *pDeviceHandle)
{
int st = snd_pcm_state(pDeviceHandle);
printf("Trying to recover from %s error: %s nRet:(%d) (state:%d)\n",
((snd_pcm_stream(pDeviceHandle) ==
SND_PCM_STREAM_CAPTURE)
? "capture"
: "playout"),
snd_strerror(nRet),
nRet,
st);
int res = snd_pcm_recover(pDeviceHandle, nRet, 1);
if (0 == res)
{
printf("Recovery - snd_pcm_recover OK\n");
if ((nRet == -EPIPE || nRet == -ESTRPIPE) &&
snd_pcm_stream(pDeviceHandle) == SND_PCM_STREAM_CAPTURE)
{
// For capture streams we also have to repeat the explicit start()
// to get data flowing again.
int nRet = snd_pcm_start(pDeviceHandle);
if (nRet != 0)
{
printf("Recovery - snd_pcm_start error: %d\n", nRet);
return -1;
}
}
if ((nRet == -EPIPE || nRet == -ESTRPIPE) &&
snd_pcm_stream(pDeviceHandle) == SND_PCM_STREAM_PLAYBACK)
{
// For capture streams we also have to repeat the explicit start() to get
// data flowing again.
snd_pcm_state_t state = snd_pcm_state(pDeviceHandle);
if (state != SND_PCM_STATE_PREPARED)
{
snd_pcm_prepare(pDeviceHandle);
}
int nRet = snd_pcm_start(pDeviceHandle);
if (nRet != 0)
{
printf("Recovery - snd_pcm_start error: %s\n", snd_strerror(nRet));
return -1;
}
}
return -EPIPE == nRet ? 1 : 0;
}
else
{
printf("Unrecoverable alsa stream error: %d\n", res);
}
return res;
}
void *playback_thread(void *arg)
{
printf("playback_thread\n");
audio_data_t *data = (audio_data_t *)arg;
const int policy = SCHED_FIFO;
const int min_prio = sched_get_priority_min(policy);
const int max_prio = sched_get_priority_max(policy);
sched_param param;
const int top_prio = max_prio - 1;
const int low_prio = min_prio + 1;
param.sched_priority = top_prio;
pthread_setschedparam(pthread_self(), policy, ¶m);
while (gRun)
{
int nRet;
snd_pcm_sframes_t sndFrames;
snd_pcm_sframes_t sndAvailFrames;
sndAvailFrames = snd_pcm_avail_update(data->playback_handle);
if (sndAvailFrames < 0)
{
printf("playout snd_pcm_avail_update error: %s\n", snd_strerror(sndAvailFrames));
errorRecovery(sndAvailFrames, data->playback_handle);
continue;
}
else if (sndAvailFrames == 0)
{
nRet = snd_pcm_wait(data->playback_handle, 2);
// if (nRet == 0)
// printf("playout snd_pcm_wait timeout\n");
continue;
}
if (data->m_nPlayoutFramesLeft <= 0)
{
size_t frames = fread(data->m_pRefBuffer, 2, PERIOD_SIZE, data->pcm_file);
if (frames == 0 || frames != PERIOD_SIZE)
{ // 文件播放完毕,重新开始
fseek(data->pcm_file, 0, SEEK_SET);
continue;
}
monoTurnStereo((int16_t *)data->m_pRefBuffer, (int16_t *)data->m_pPlayoutBuffer, PERIOD_SIZE);
data->m_nPlayoutFramesLeft = frames;
}
if ((uint32_t)(sndAvailFrames) > data->m_nPlayoutFramesLeft)
{
sndAvailFrames = (uint32_t)data->m_nPlayoutFramesLeft;
}
int size = snd_pcm_frames_to_bytes(data->playback_handle, data->m_nPlayoutFramesLeft);
sndFrames = snd_pcm_writei(data->playback_handle, &data->m_pPlayoutBuffer[data->m_nPlayoutBufferSizeIn20MS - size], sndAvailFrames);
if (sndFrames < 0)
{
printf("playout snd_pcm_writei error: %s\n", snd_strerror(sndFrames));
data->m_nPlayoutFramesLeft = 0;
errorRecovery(sndFrames, data->playback_handle);
continue;
}
else
{
fwrite(&data->m_pRefBuffer[PERIOD_SIZE * 2 - data->m_nPlayoutFramesLeft * 2], 1, sndFrames * 2, data->pcm_ref_file);
data->m_nPlayoutFramesLeft -= sndFrames;
}
}
return NULL;
}
void *capture_thread(void *arg)
{
printf("capture_thread\n");
audio_data_t *data = (audio_data_t *)arg;
const int policy = SCHED_FIFO;
const int min_prio = sched_get_priority_min(policy);
const int max_prio = sched_get_priority_max(policy);
sched_param param;
const int top_prio = max_prio - 1;
const int low_prio = min_prio + 1;
param.sched_priority = top_prio;
pthread_setschedparam(pthread_self(), policy, ¶m);
while (gRun)
{
int nRet;
snd_pcm_sframes_t sndFrames;
snd_pcm_sframes_t sndAvailFrames;
int8_t buffer[data->m_nRecordBufferSizeIn20MS];
sndAvailFrames = snd_pcm_avail_update(data->capture_handle);
if (sndAvailFrames < 0)
{
printf("capture snd_pcm_avail_update error: %s\n", snd_strerror(sndAvailFrames));
errorRecovery(sndAvailFrames, data->capture_handle);
continue;
}
else if (sndAvailFrames == 0)
{
continue;
}
if ((uint32_t)(sndAvailFrames) > data->m_nRecordingFramesLeft)
sndAvailFrames = data->m_nRecordingFramesLeft;
sndFrames = snd_pcm_readi(data->capture_handle, buffer, sndAvailFrames);
if (sndFrames < 0)
{
printf("capture snd_pcm_readi error: %s\n", snd_strerror(sndFrames));
errorRecovery(sndFrames, data->capture_handle);
continue;
}
else if (sndFrames > 0)
{
int nLeftSize = snd_pcm_frames_to_bytes(data->capture_handle, data->m_nRecordingFramesLeft);
int size = snd_pcm_frames_to_bytes(data->capture_handle, sndFrames);
memcpy(&data->m_pRecordBuffer[data->m_nRecordBufferSizeIn20MS - nLeftSize], buffer, size);
data->m_nRecordingFramesLeft -= sndFrames;
}
if (!data->m_nRecordingFramesLeft)
{
data->m_nRecordingFramesLeft = PERIOD_SIZE;
stereoTurnMono((unsigned char *)data->m_pRecordBuffer, (unsigned char *)data->m_pNearBuffer, PERIOD_SIZE * 2 * 2);
fwrite(data->m_pNearBuffer, 1, PERIOD_SIZE * 2, data->pcm_out_file);
webrtc::StreamConfig stream_config(sample_rate_hz, num_channels);
if (data->apm->ProcessReverseStream((int16_t *)data->m_pRefBuffer, stream_config, stream_config, (int16_t *)data->m_pRefBuffer) != webrtc::AudioProcessing::kNoError)
{
printf("ProcessReverseStream fail\n");
}
if (data->apm->ProcessStream((int16_t *)data->m_pNearBuffer, stream_config, stream_config, (int16_t *)data->m_p3ABuffer) != webrtc::AudioProcessing::kNoError)
{
printf("ProcessStream fail\n");
}
fwrite(data->m_p3ABuffer, 1, PERIOD_SIZE * 2, data->pcm_3a_file);
}
}
return NULL;
}
int setup_pcm_device(snd_pcm_t **handle, const char *device, snd_pcm_stream_t stream)
{
snd_pcm_hw_params_t *params;
int err;
if ((err = snd_pcm_open(handle, device, stream, SND_PCM_NONBLOCK)) < 0)
{
printf("无法打开 PCM 设备 %s: %s\n", device, snd_strerror(err));
return err;
}
snd_pcm_hw_params_alloca(¶ms);
snd_pcm_hw_params_any(*handle, params);
snd_pcm_hw_params_set_access(*handle, params, SND_PCM_ACCESS_RW_INTERLEAVED);
snd_pcm_hw_params_set_format(*handle, params, SND_PCM_FORMAT_S16_LE);
snd_pcm_hw_params_set_channels(*handle, params, CHANNELS);
snd_pcm_hw_params_set_rate(*handle, params, SAMPLE_RATE, 0);
snd_pcm_hw_params_set_period_size(*handle, params, PERIOD_SIZE, 0);
snd_pcm_hw_params_set_buffer_size(*handle, params, PERIOD_SIZE * 4);
if ((err = snd_pcm_hw_params(*handle, params)) < 0)
{
printf("设置 PCM 参数失败: %s\n", snd_strerror(err));
snd_pcm_close(*handle);
return err;
}
return 0;
}
int main(int argc, char *argv[])
{
audio_data_t data;
if ((data.pcm_file = fopen("./far.pcm", "rb")) == NULL ||
(data.pcm_3a_file = fopen("./3a.pcm", "wb")) == NULL ||
(data.pcm_out_file = fopen("./near.pcm", "wb")) == NULL ||
(data.pcm_ref_file = fopen("./ref.pcm", "wb")) == NULL)
{
printf("fail to open file\n");
return -1;
}
// 3a
data.apm = webrtc::AudioProcessingBuilder().Create();
webrtc::AudioProcessing::Config config;
// 噪声抑制配置
config.noise_suppression.enabled = true;
config.noise_suppression.level = webrtc::AudioProcessing::Config::NoiseSuppression::Level::kHigh;
// 增益控制配置
config.gain_controller1.enabled = true;
config.gain_controller1.mode = webrtc::AudioProcessing::Config::GainController1::Mode::kAdaptiveDigital;
config.gain_controller1.target_level_dbfs = 3; // 目标输出电平
// 回声抑制配置
config.echo_canceller.enabled = true;
config.echo_canceller.mobile_mode = false; // 如果是移动设备可以设置为 true
// 语音活动检测(可选)
config.voice_detection.enabled = true;
// 应用配置
data.apm->ApplyConfig(config);
//
if (setup_pcm_device(&data.playback_handle, "hw:0,0", SND_PCM_STREAM_PLAYBACK) < 0)
{
fclose(data.pcm_file);
return -1;
}
if (setup_pcm_device(&data.capture_handle, "hw:0,0", SND_PCM_STREAM_CAPTURE) < 0)
{
snd_pcm_close(data.playback_handle);
fclose(data.pcm_file);
return -1;
}
pthread_t play_thread, record_thread;
pthread_create(&play_thread, NULL, playback_thread, &data);
int nRet = snd_pcm_prepare(data.playback_handle);
if (nRet < 0)
{
printf("playout snd_pcm_prepare failed (%s)\n", snd_strerror(nRet));
}
p