FaceAccess/Record/ProcessFile.cpp

143 lines
6.5 KiB
C++
Raw Normal View History

2024-09-06 16:35:51 +08:00
#include "IoContext.h"
#include "SpeexDsp.h"
#include "WebRtcAecm.h"
#include "api/audio/echo_canceller3_config.h"
#include "api/audio/echo_canceller3_factory.h"
#include "main.h"
#include "modules/audio_processing/aec3/echo_canceller3.h"
2024-09-06 23:06:54 +08:00
#include "modules/audio_processing/ns/noise_suppressor.h"
2024-09-06 16:35:51 +08:00
#include <boost/asio/post.hpp>
#include <sstream>
class ProcessFileTaskPrivate {
public:
void initialize(int sampleRate, int channels, int period) {
std::unique_ptr<webrtc::EchoCanceller3Factory> factory = std::make_unique<webrtc::EchoCanceller3Factory>();
echoCanceller = factory->Create(sampleRate, channels, channels);
nearendBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
farendBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
linearOutputBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
2024-09-06 16:46:55 +08:00
// RKAP_3A_Init(&m_vqe, AEC_TX_TYPE);
2024-09-06 23:06:54 +08:00
webrtc::NsConfig config;
config.target_level = webrtc::NsConfig::SuppressionLevel::k12dB;
noiseSuppressor = std::make_unique<webrtc::NoiseSuppressor>(config, sampleRate, channels);
noiseSuppressorBuffer = std::make_unique<webrtc::AudioBuffer>(sampleRate, channels, sampleRate, channels, sampleRate, channels);
2024-09-06 16:35:51 +08:00
}
std::unique_ptr<webrtc::EchoControl> echoCanceller;
std::unique_ptr<webrtc::AudioBuffer> nearendBuffer;
std::unique_ptr<webrtc::AudioBuffer> farendBuffer;
std::unique_ptr<webrtc::AudioBuffer> linearOutputBuffer;
2024-09-06 23:06:54 +08:00
std::unique_ptr<webrtc::NoiseSuppressor> noiseSuppressor;
std::unique_ptr<webrtc::AudioBuffer> noiseSuppressorBuffer;
2024-09-06 16:46:55 +08:00
// RKAP_AEC_State m_vqe;
2024-09-06 16:35:51 +08:00
};
ProcessFileTask::ProcessFileTask() : m_d{new ProcessFileTaskPrivate()} {
}
ProcessFileTask::~ProcessFileTask() {
if (m_d != nullptr) {
delete m_d;
}
}
void ProcessFileTask::setDsp(Dsp dsp) {
if (m_dsp != dsp) {
m_dsp = dsp;
}
}
2024-09-07 21:51:11 +08:00
// ./build/Record/Record --file --dsp=aecm
2024-09-06 16:35:51 +08:00
// ./Record --file --dsp=aecm
void ProcessFileTask::run() {
2024-09-07 21:51:11 +08:00
#ifdef __RV1109__
constexpr auto MicFile = "/sdcard/micin_16k.pcm";
constexpr auto SpeakerFile = "/sdcard/speaker_16k.pcm";
#else
constexpr auto MicFile = "resources/micin_16k.pcm";
constexpr auto SpeakerFile = "resources/speaker_16k.pcm";
#endif
m_speakerIfs = std::make_shared<std::ifstream>(SpeakerFile, std::ifstream::binary);
m_micIfs = std::make_shared<std::ifstream>(MicFile, std::ifstream::binary);
2024-09-06 16:35:51 +08:00
std::ostringstream oss;
2024-09-07 21:51:11 +08:00
oss << DumpPath << "/out_" << dspToString(m_dsp) << "_16k.wav";
2024-09-06 16:35:51 +08:00
m_outFilename = oss.str();
2024-09-07 21:51:11 +08:00
m_ofs = std::make_shared<WavWriter<int16_t>>(m_outFilename, 1, 16000);
2024-09-06 16:35:51 +08:00
2024-09-06 23:06:54 +08:00
oss.str("");
oss << DumpPath << "/ns_" << dspToString(m_dsp) << "_16k.pcm";
m_nsOfs = std::make_shared<std::ofstream>(oss.str(), std::ofstream::binary);
2024-09-06 16:35:51 +08:00
// m_speakerIfs = std::make_shared<std::ifstream>("/sdcard/speaker_8k.pcm", std::ifstream::binary);
// m_micIfs = std::make_shared<std::ifstream>("/sdcard/micin_8k.pcm", std::ifstream::binary);
// m_ofs = std::make_shared<std::ofstream>("/sdcard/out_8k.pcm", std::ofstream::binary);
m_webRtcAecm = std::make_shared<WebRtcAecm>();
m_webRtcAecm->start(16000, 1, 10);
m_speex = std::make_shared<SpeexDsp>();
m_speex->start(16000, 1, 10);
m_d->initialize(16000, 1, 10);
m_begin = std::chrono::system_clock::now();
process();
}
void ProcessFileTask::process() {
using namespace Amass;
auto ioConext = Singleton<IoContext>::instance();
if (m_speakerIfs && m_micIfs && *m_speakerIfs && *m_micIfs) {
char farendBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
char nearendBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
2024-09-06 23:06:54 +08:00
char noiseSuppressorOutBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
2024-09-06 16:35:51 +08:00
char outBuffer[sizeof(int16_t) * 16000 / 1000 * 10] = {0};
2024-09-06 23:06:54 +08:00
webrtc::StreamConfig config(16000, 1); // 单声道
2024-09-06 16:35:51 +08:00
// char farendBuffer[sizeof(int16_t) * 8000 / 1000 * 10] = {0};
// char nearendBuffer[sizeof(int16_t) * 8000 / 1000 * 10] = {0};
// char outBuffer[sizeof(int16_t) * 8000 / 1000 * 10] = {0};
m_speakerIfs->read(farendBuffer, sizeof(farendBuffer));
m_micIfs->read(nearendBuffer, sizeof(nearendBuffer));
2024-09-06 23:06:54 +08:00
m_d->nearendBuffer->CopyFrom(reinterpret_cast<const int16_t *>(nearendBuffer), config);
2024-09-06 16:35:51 +08:00
if (m_dsp == Speex) {
m_speex->echoPlayback(reinterpret_cast<const int16_t *>(farendBuffer));
m_speex->echoCapture(reinterpret_cast<const int16_t *>(nearendBuffer), reinterpret_cast<int16_t *>(outBuffer));
} else if (m_dsp == AecMobile) {
2024-09-06 23:06:54 +08:00
m_d->noiseSuppressor->Analyze(*m_d->nearendBuffer);
m_d->noiseSuppressor->Process(m_d->nearendBuffer.get());
m_d->nearendBuffer->CopyTo(config, reinterpret_cast<int16_t *>(noiseSuppressorOutBuffer));
m_nsOfs->write(noiseSuppressorOutBuffer, sizeof(noiseSuppressorOutBuffer));
// LOG(info) << " " << m_d->noiseSuppressorBuffer->num_frames() << " " << m_d->nearendBuffer->num_frames();
2024-09-06 16:35:51 +08:00
m_webRtcAecm->echoPlayback(reinterpret_cast<const int16_t *>(farendBuffer), sizeof(farendBuffer) / 2);
2024-09-06 23:06:54 +08:00
m_webRtcAecm->echoCancellation(reinterpret_cast<int16_t *>(nearendBuffer),
reinterpret_cast<int16_t *>(noiseSuppressorOutBuffer), reinterpret_cast<int16_t *>(outBuffer),
2024-09-06 16:35:51 +08:00
sizeof(farendBuffer) / 2);
} else if (m_dsp == Aec3) {
m_d->farendBuffer->CopyFrom(reinterpret_cast<const int16_t *>(farendBuffer), config);
m_d->echoCanceller->AnalyzeRender(m_d->farendBuffer.get());
m_d->echoCanceller->AnalyzeCapture(m_d->nearendBuffer.get());
m_d->echoCanceller->ProcessCapture(m_d->nearendBuffer.get(), false);
// m_d->echoCanceller->ProcessCapture(&nearendBuffer, &linearOutputBuffer, /*level_change=*/false);
m_d->nearendBuffer->CopyTo(config, reinterpret_cast<int16_t *>(outBuffer));
} else if (m_dsp == Vqe) {
}
m_ofs->write(outBuffer, sizeof(outBuffer));
boost::asio::post(*ioConext->ioContext(), [this]() { process(); });
} else {
auto elapsed = std::chrono::duration_cast<std::chrono::milliseconds>(std::chrono::system_clock::now() - m_begin);
LOG(info) << "process file finished, out: " << m_outFilename << ", elapsed: " << elapsed;
2024-09-07 21:51:11 +08:00
ioConext->stop();
2024-09-06 16:35:51 +08:00
}
}