2024-09-06 16:35:51 +08:00
|
|
|
#include "IoContext.h"
|
|
|
|
#include "SpeexDsp.h"
|
|
|
|
#include "WebRtcAecm.h"
|
|
|
|
#include "api/audio/echo_canceller3_config.h"
|
|
|
|
#include "api/audio/echo_canceller3_factory.h"
|
|
|
|
#include "main.h"
|
|
|
|
#include "modules/audio_processing/aec3/echo_canceller3.h"
|
2024-09-06 23:06:54 +08:00
|
|
|
#include "modules/audio_processing/ns/noise_suppressor.h"
|
2024-09-06 16:35:51 +08:00
|
|
|
#include <boost/asio/post.hpp>
|
|
|
|
#include <sstream>
|
|
|
|
|
|
|
|
class ProcessFileTaskPrivate {
|
|
|
|
public:
|
|
|
|
void initialize(int sampleRate, int channels, int period) {
|
|
|
|
std::unique_ptr<webrtc::EchoCanceller3Factory> factory = std::make_unique<webrtc::EchoCanceller3Factory>();
|
|
|
|
echoCanceller = factory->Create(sampleRate, channels, channels);
|
|
|
|
nearendBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
|
|
|
|
farendBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
|
|
|
|
linearOutputBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
|
|
|
|
|
2024-09-06 16:46:55 +08:00
|
|
|
// RKAP_3A_Init(&m_vqe, AEC_TX_TYPE);
|
2024-09-06 23:06:54 +08:00
|
|
|
webrtc::NsConfig config;
|
|
|
|
config.target_level = webrtc::NsConfig::SuppressionLevel::k12dB;
|
|
|
|
noiseSuppressor = std::make_unique<webrtc::NoiseSuppressor>(config, sampleRate, channels);
|
|
|
|
noiseSuppressorBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
|
2024-09-06 16:35:51 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
std::unique_ptr<webrtc::EchoControl> echoCanceller;
|
|
|
|
std::unique_ptr<webrtc::AudioBuffer> nearendBuffer;
|
|
|
|
std::unique_ptr<webrtc::AudioBuffer> farendBuffer;
|
|
|
|
std::unique_ptr<webrtc::AudioBuffer> linearOutputBuffer;
|
|
|
|
|
2024-09-06 23:06:54 +08:00
|
|
|
std::unique_ptr<webrtc::NoiseSuppressor> noiseSuppressor;
|
|
|
|
std::unique_ptr<webrtc::AudioBuffer> noiseSuppressorBuffer;
|
|
|
|
|
2024-09-06 16:46:55 +08:00
|
|
|
// RKAP_AEC_State m_vqe;
|
2024-09-06 16:35:51 +08:00
|
|
|
};
|
|
|
|
|
|
|
|
ProcessFileTask::ProcessFileTask() : m_d{new ProcessFileTaskPrivate()} {
|
|
|
|
}
|
|
|
|
|
|
|
|
ProcessFileTask::~ProcessFileTask() {
|
|
|
|
if (m_d != nullptr) {
|
|
|
|
delete m_d;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
void ProcessFileTask::setDsp(Dsp dsp) {
|
|
|
|
if (m_dsp != dsp) {
|
|
|
|
m_dsp = dsp;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2024-09-07 21:51:11 +08:00
|
|
|
// ./build/Record/Record --file --dsp=aecm
|
2024-09-06 16:35:51 +08:00
|
|
|
// ./Record --file --dsp=aecm
|
|
|
|
void ProcessFileTask::run() {
|
2024-09-07 21:51:11 +08:00
|
|
|
#ifdef __RV1109__
|
|
|
|
constexpr auto MicFile = "/sdcard/micin_16k.pcm";
|
|
|
|
constexpr auto SpeakerFile = "/sdcard/speaker_16k.pcm";
|
|
|
|
|
|
|
|
#else
|
|
|
|
constexpr auto MicFile = "resources/micin_16k.pcm";
|
|
|
|
constexpr auto SpeakerFile = "resources/speaker_16k.pcm";
|
|
|
|
#endif
|
|
|
|
m_speakerIfs = std::make_shared<std::ifstream>(SpeakerFile, std::ifstream::binary);
|
|
|
|
m_micIfs = std::make_shared<std::ifstream>(MicFile, std::ifstream::binary);
|
2024-09-06 16:35:51 +08:00
|
|
|
|
|
|
|
std::ostringstream oss;
|
2024-09-07 21:51:11 +08:00
|
|
|
oss << DumpPath << "/out_" << dspToString(m_dsp) << "_16k.wav";
|
2024-09-06 16:35:51 +08:00
|
|
|
m_outFilename = oss.str();
|
2024-09-07 21:51:11 +08:00
|
|
|
m_ofs = std::make_shared<WavWriter<int16_t>>(m_outFilename, 1, 16000);
|
2024-09-06 16:35:51 +08:00
|
|
|
|
2024-09-06 23:06:54 +08:00
|
|
|
oss.str("");
|
|
|
|
oss << DumpPath << "/ns_" << dspToString(m_dsp) << "_16k.pcm";
|
|
|
|
m_nsOfs = std::make_shared<std::ofstream>(oss.str(), std::ofstream::binary);
|
|
|
|
|
2024-09-06 16:35:51 +08:00
|
|
|
// m_speakerIfs = std::make_shared<std::ifstream>("/sdcard/speaker_8k.pcm", std::ifstream::binary);
|
|
|
|
// m_micIfs = std::make_shared<std::ifstream>("/sdcard/micin_8k.pcm", std::ifstream::binary);
|
|
|
|
// m_ofs = std::make_shared<std::ofstream>("/sdcard/out_8k.pcm", std::ofstream::binary);
|
|
|
|
|
|
|
|
m_webRtcAecm = std::make_shared<WebRtcAecm>();
|
|
|
|
m_webRtcAecm->start(16000, 1, 10);
|
|
|
|
|
|
|
|
m_speex = std::make_shared<SpeexDsp>();
|
|
|
|
m_speex->start(16000, 1, 10);
|
|
|
|
|
|
|
|
m_d->initialize(16000, 1, 10);
|
|
|
|
m_begin = std::chrono::system_clock::now();
|
|
|
|
process();
|
|
|
|
}
|
|
|
|
|
|
|
|
void ProcessFileTask::process() {
|
|
|
|
using namespace Amass;
|
|
|
|
auto ioConext = Singleton<IoContext>::instance();
|
|
|
|
if (m_speakerIfs && m_micIfs && *m_speakerIfs && *m_micIfs) {
|
|
|
|
char farendBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
|
|
|
|
char nearendBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
|
2024-09-06 23:06:54 +08:00
|
|
|
char noiseSuppressorOutBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
|
2024-09-06 16:35:51 +08:00
|
|
|
char outBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
|
2024-09-06 23:06:54 +08:00
|
|
|
webrtc::StreamConfig config(16000, 1); // 单声道
|
|
|
|
|
2024-09-06 16:35:51 +08:00
|
|
|
// char farendBuffer[sizeof(int16_t) * 8000 / 1000 * 10] = {0};
|
|
|
|
// char nearendBuffer[sizeof(int16_t) * 8000 / 1000 * 10] = {0};
|
|
|
|
// char outBuffer[sizeof(int16_t) * 8000 / 1000 * 10] = {0};
|
|
|
|
|
|
|
|
m_speakerIfs->read(farendBuffer, sizeof(farendBuffer));
|
|
|
|
m_micIfs->read(nearendBuffer, sizeof(nearendBuffer));
|
2024-09-06 23:06:54 +08:00
|
|
|
m_d->nearendBuffer->CopyFrom(reinterpret_cast<const int16_t *>(nearendBuffer), config);
|
2024-09-06 16:35:51 +08:00
|
|
|
if (m_dsp == Speex) {
|
|
|
|
m_speex->echoPlayback(reinterpret_cast<const int16_t *>(farendBuffer));
|
|
|
|
m_speex->echoCapture(reinterpret_cast<const int16_t *>(nearendBuffer), reinterpret_cast<int16_t *>(outBuffer));
|
|
|
|
} else if (m_dsp == AecMobile) {
|
2024-09-06 23:06:54 +08:00
|
|
|
m_d->noiseSuppressor->Analyze(*m_d->nearendBuffer);
|
|
|
|
m_d->noiseSuppressor->Process(m_d->nearendBuffer.get());
|
|
|
|
m_d->nearendBuffer->CopyTo(config, reinterpret_cast<int16_t *>(noiseSuppressorOutBuffer));
|
|
|
|
m_nsOfs->write(noiseSuppressorOutBuffer, sizeof(noiseSuppressorOutBuffer));
|
|
|
|
// LOG(info) << " " << m_d->noiseSuppressorBuffer->num_frames() << " " << m_d->nearendBuffer->num_frames();
|
|
|
|
|
2024-09-06 16:35:51 +08:00
|
|
|
m_webRtcAecm->echoPlayback(reinterpret_cast<const int16_t *>(farendBuffer), sizeof(farendBuffer) / 2);
|
2024-09-06 23:06:54 +08:00
|
|
|
m_webRtcAecm->echoCancellation(reinterpret_cast<int16_t *>(nearendBuffer),
|
|
|
|
reinterpret_cast<int16_t *>(noiseSuppressorOutBuffer), reinterpret_cast<int16_t *>(outBuffer),
|
2024-09-06 16:35:51 +08:00
|
|
|
sizeof(farendBuffer) / 2);
|
|
|
|
} else if (m_dsp == Aec3) {
|
|
|
|
|
|
|
|
m_d->farendBuffer->CopyFrom(reinterpret_cast<const int16_t *>(farendBuffer), config);
|
|
|
|
|
|
|
|
m_d->echoCanceller->AnalyzeRender(m_d->farendBuffer.get());
|
|
|
|
m_d->echoCanceller->AnalyzeCapture(m_d->nearendBuffer.get());
|
|
|
|
m_d->echoCanceller->ProcessCapture(m_d->nearendBuffer.get(), false);
|
|
|
|
// m_d->echoCanceller->ProcessCapture(&nearendBuffer, &linearOutputBuffer, /*level_change=*/false);
|
|
|
|
|
|
|
|
m_d->nearendBuffer->CopyTo(config, reinterpret_cast<int16_t *>(outBuffer));
|
|
|
|
} else if (m_dsp == Vqe) {
|
|
|
|
}
|
|
|
|
|
|
|
|
m_ofs->write(outBuffer, sizeof(outBuffer));
|
|
|
|
boost::asio::post(*ioConext->ioContext(), [this]() { process(); });
|
|
|
|
} else {
|
|
|
|
auto elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(std::chrono::system_clock::now() - m_begin);
|
|
|
|
LOG(info) << "process file finished, out: " << m_outFilename << ", elapsed: " << elapsed;
|
2024-09-07 21:51:11 +08:00
|
|
|
ioConext->stop();
|
2024-09-06 16:35:51 +08:00
|
|
|
}
|
|
|
|
}
|