205 lines
7.0 KiB
C
205 lines
7.0 KiB
C
|
/*
|
||
|
* Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
|
||
|
*
|
||
|
* Use of this source code is governed by a BSD-style license
|
||
|
* that can be found in the LICENSE file in the root of the source
|
||
|
* tree. An additional intellectual property rights grant can be found
|
||
|
* in the file PATENTS. All contributing project authors may
|
||
|
* be found in the AUTHORS file in the root of the source tree.
|
||
|
*/
|
||
|
|
||
|
#ifndef COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_
|
||
|
#define COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_
|
||
|
|
||
|
#include <stdint.h>
|
||
|
|
||
|
#include <algorithm>
|
||
|
#include <cmath>
|
||
|
#include <cstring>
|
||
|
#include <limits>
|
||
|
|
||
|
#include "api/audio/audio_view.h"
|
||
|
#include "rtc_base/checks.h"
|
||
|
|
||
|
namespace webrtc {
|
||
|
|
||
|
typedef std::numeric_limits<int16_t> limits_int16;
|
||
|
|
||
|
// TODO(tommi, peah): Move these constants to their own header, e.g.
|
||
|
// `audio_constants.h`. Also consider if they should be in api/.
|
||
|
|
||
|
// Absolute highest acceptable sample rate supported for audio processing,
|
||
|
// capture and codecs. Note that for some components some cases a lower limit
|
||
|
// applies which typically is 48000 but in some cases is lower.
|
||
|
constexpr int kMaxSampleRateHz = 384000;
|
||
|
|
||
|
// Number of samples per channel for 10ms of audio at the highest sample rate.
|
||
|
constexpr size_t kMaxSamplesPerChannel10ms = kMaxSampleRateHz / 100u;
|
||
|
|
||
|
// The conversion functions use the following naming convention:
|
||
|
// S16: int16_t [-32768, 32767]
|
||
|
// Float: float [-1.0, 1.0]
|
||
|
// FloatS16: float [-32768.0, 32768.0]
|
||
|
// Dbfs: float [-20.0*log(10, 32768), 0] = [-90.3, 0]
|
||
|
// The ratio conversion functions use this naming convention:
|
||
|
// Ratio: float (0, +inf)
|
||
|
// Db: float (-inf, +inf)
|
||
|
static inline float S16ToFloat(int16_t v) {
|
||
|
constexpr float kScaling = 1.f / 32768.f;
|
||
|
return v * kScaling;
|
||
|
}
|
||
|
|
||
|
static inline int16_t FloatS16ToS16(float v) {
|
||
|
v = std::min(v, 32767.f);
|
||
|
v = std::max(v, -32768.f);
|
||
|
return static_cast<int16_t>(v + std::copysign(0.5f, v));
|
||
|
}
|
||
|
|
||
|
static inline int16_t FloatToS16(float v) {
|
||
|
v *= 32768.f;
|
||
|
v = std::min(v, 32767.f);
|
||
|
v = std::max(v, -32768.f);
|
||
|
return static_cast<int16_t>(v + std::copysign(0.5f, v));
|
||
|
}
|
||
|
|
||
|
static inline float FloatToFloatS16(float v) {
|
||
|
v = std::min(v, 1.f);
|
||
|
v = std::max(v, -1.f);
|
||
|
return v * 32768.f;
|
||
|
}
|
||
|
|
||
|
static inline float FloatS16ToFloat(float v) {
|
||
|
v = std::min(v, 32768.f);
|
||
|
v = std::max(v, -32768.f);
|
||
|
constexpr float kScaling = 1.f / 32768.f;
|
||
|
return v * kScaling;
|
||
|
}
|
||
|
|
||
|
void FloatToS16(const float* src, size_t size, int16_t* dest);
|
||
|
void S16ToFloat(const int16_t* src, size_t size, float* dest);
|
||
|
void S16ToFloatS16(const int16_t* src, size_t size, float* dest);
|
||
|
void FloatS16ToS16(const float* src, size_t size, int16_t* dest);
|
||
|
void FloatToFloatS16(const float* src, size_t size, float* dest);
|
||
|
void FloatS16ToFloat(const float* src, size_t size, float* dest);
|
||
|
|
||
|
inline float DbToRatio(float v) {
|
||
|
return std::pow(10.0f, v / 20.0f);
|
||
|
}
|
||
|
|
||
|
inline float DbfsToFloatS16(float v) {
|
||
|
static constexpr float kMaximumAbsFloatS16 = -limits_int16::min();
|
||
|
return DbToRatio(v) * kMaximumAbsFloatS16;
|
||
|
}
|
||
|
|
||
|
inline float FloatS16ToDbfs(float v) {
|
||
|
RTC_DCHECK_GE(v, 0);
|
||
|
|
||
|
// kMinDbfs is equal to -20.0 * log10(-limits_int16::min())
|
||
|
static constexpr float kMinDbfs = -90.30899869919436f;
|
||
|
if (v <= 1.0f) {
|
||
|
return kMinDbfs;
|
||
|
}
|
||
|
// Equal to 20 * log10(v / (-limits_int16::min()))
|
||
|
return 20.0f * std::log10(v) + kMinDbfs;
|
||
|
}
|
||
|
|
||
|
// Copy audio from `src` channels to `dest` channels unless `src` and `dest`
|
||
|
// point to the same address. `src` and `dest` must have the same number of
|
||
|
// channels, and there must be sufficient space allocated in `dest`.
|
||
|
// TODO: b/335805780 - Accept ArrayView.
|
||
|
template <typename T>
|
||
|
void CopyAudioIfNeeded(const T* const* src,
|
||
|
int num_frames,
|
||
|
int num_channels,
|
||
|
T* const* dest) {
|
||
|
for (int i = 0; i < num_channels; ++i) {
|
||
|
if (src[i] != dest[i]) {
|
||
|
std::copy(src[i], src[i] + num_frames, dest[i]);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Deinterleave audio from `interleaved` to the channel buffers pointed to
|
||
|
// by `deinterleaved`. There must be sufficient space allocated in the
|
||
|
// `deinterleaved` buffers (`num_channel` buffers with `samples_per_channel`
|
||
|
// per buffer).
|
||
|
template <typename T>
|
||
|
void Deinterleave(const InterleavedView<const T>& interleaved,
|
||
|
const DeinterleavedView<T>& deinterleaved) {
|
||
|
RTC_DCHECK_EQ(NumChannels(interleaved), NumChannels(deinterleaved));
|
||
|
RTC_DCHECK_EQ(SamplesPerChannel(interleaved),
|
||
|
SamplesPerChannel(deinterleaved));
|
||
|
const auto num_channels = NumChannels(interleaved);
|
||
|
const auto samples_per_channel = SamplesPerChannel(interleaved);
|
||
|
for (size_t i = 0; i < num_channels; ++i) {
|
||
|
MonoView<T> channel = deinterleaved[i];
|
||
|
size_t interleaved_idx = i;
|
||
|
for (size_t j = 0; j < samples_per_channel; ++j) {
|
||
|
channel[j] = interleaved[interleaved_idx];
|
||
|
interleaved_idx += num_channels;
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Interleave audio from the channel buffers pointed to by `deinterleaved` to
|
||
|
// `interleaved`. There must be sufficient space allocated in `interleaved`
|
||
|
// (`samples_per_channel` * `num_channels`).
|
||
|
template <typename T>
|
||
|
void Interleave(const DeinterleavedView<const T>& deinterleaved,
|
||
|
const InterleavedView<T>& interleaved) {
|
||
|
RTC_DCHECK_EQ(NumChannels(interleaved), NumChannels(deinterleaved));
|
||
|
RTC_DCHECK_EQ(SamplesPerChannel(interleaved),
|
||
|
SamplesPerChannel(deinterleaved));
|
||
|
for (size_t i = 0; i < deinterleaved.num_channels(); ++i) {
|
||
|
const auto channel = deinterleaved[i];
|
||
|
size_t interleaved_idx = i;
|
||
|
for (size_t j = 0; j < deinterleaved.samples_per_channel(); ++j) {
|
||
|
interleaved[interleaved_idx] = channel[j];
|
||
|
interleaved_idx += deinterleaved.num_channels();
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// Downmixes an interleaved multichannel signal to a single channel by averaging
|
||
|
// all channels.
|
||
|
// TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
|
||
|
template <typename T, typename Intermediate>
|
||
|
void DownmixInterleavedToMonoImpl(const T* interleaved,
|
||
|
size_t num_frames,
|
||
|
int num_channels,
|
||
|
T* deinterleaved) {
|
||
|
RTC_DCHECK_GT(num_channels, 0);
|
||
|
RTC_DCHECK_GT(num_frames, 0);
|
||
|
|
||
|
const T* const end = interleaved + num_frames * num_channels;
|
||
|
|
||
|
while (interleaved < end) {
|
||
|
const T* const frame_end = interleaved + num_channels;
|
||
|
|
||
|
Intermediate value = *interleaved++;
|
||
|
while (interleaved < frame_end) {
|
||
|
value += *interleaved++;
|
||
|
}
|
||
|
|
||
|
*deinterleaved++ = value / num_channels;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
// TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
|
||
|
template <typename T>
|
||
|
void DownmixInterleavedToMono(const T* interleaved,
|
||
|
size_t num_frames,
|
||
|
int num_channels,
|
||
|
T* deinterleaved);
|
||
|
|
||
|
// TODO: b/335805780 - Accept InterleavedView and DeinterleavedView.
|
||
|
template <>
|
||
|
void DownmixInterleavedToMono<int16_t>(const int16_t* interleaved,
|
||
|
size_t num_frames,
|
||
|
int num_channels,
|
||
|
int16_t* deinterleaved);
|
||
|
|
||
|
} // namespace webrtc
|
||
|
|
||
|
#endif // COMMON_AUDIO_INCLUDE_AUDIO_UTIL_H_
|