#include "media/base/audio_converter.h"
#include <stddef.h>
#include <algorithm>
#include <memory>
#include <tuple>
#include "base/strings/string_number_conversions.h"
#include "media/base/audio_bus.h"
#include "media/base/audio_timestamp_helper.h"
#include "media/base/fake_audio_render_callback.h"
#include "testing/gmock/include/gmock/gmock.h"
#include "testing/gtest/include/gtest/gtest.h"
namespace media {
static const int kConvertInputs = 8;
static const int kConvertCycles = 3;
static constexpr ChannelLayout kChannelLayout = CHANNEL_LAYOUT_STEREO;
static const int kHighLatencyBufferSize = 2048;
static const int kLowLatencyBufferSize = 256;
static const int kSampleRate = 48000;
static const int kSineCycles = 4;
typedef std::tuple<int, int, ChannelLayoutConfig, double>
AudioConverterTestData;
class AudioConverterTest
: public testing::TestWithParam<AudioConverterTestData> {
public:
AudioConverterTest() : epsilon_(std::get<3>(GetParam())) {
input_parameters_ =
AudioParameters(AudioParameters::AUDIO_PCM_LINEAR,
ChannelLayoutConfig::FromLayout<kChannelLayout>(),
std::get<0>(GetParam()), kHighLatencyBufferSize);
output_parameters_ = AudioParameters(
AudioParameters::AUDIO_PCM_LOW_LATENCY, std::get<2>(GetParam()),
std::get<1>(GetParam()), kLowLatencyBufferSize);
converter_ = std::make_unique<AudioConverter>(input_parameters_,
output_parameters_, false);
audio_bus_ = AudioBus::Create(output_parameters_);
expected_audio_bus_ = AudioBus::Create(output_parameters_);
double step = kSineCycles / static_cast<double>(
output_parameters_.frames_per_buffer());
expected_callback_ =
std::make_unique<FakeAudioRenderCallback>(step, kSampleRate);
}
AudioConverterTest(const AudioConverterTest&) = delete;
AudioConverterTest& operator=(const AudioConverterTest&) = delete;
void InitializeInputs(int count) {
double scale_factor = input_parameters_.sample_rate() /
static_cast<double>(output_parameters_.sample_rate());
double step = kSineCycles / (scale_factor *
static_cast<double>(output_parameters_.frames_per_buffer()));
for (int i = 0; i < count; ++i) {
fake_callbacks_.push_back(
std::make_unique<FakeAudioRenderCallback>(step, kSampleRate));
converter_->AddInput(fake_callbacks_[i].get());
}
}
void Reset() {
converter_->Reset();
for (const auto& fake_callback : fake_callbacks_) {
fake_callback->reset();
}
expected_callback_->reset();
}
void SetVolume(float volume) {
for (const auto& fake_callback : fake_callbacks_) {
fake_callback->set_volume(volume);
}
}
bool ValidateAudioData(int index, int frames, float scale) {
for (int ch = 0; ch < audio_bus_->channels(); ++ch) {
auto channel_data = audio_bus_->channel_span(ch);
auto expected_channel_data = expected_audio_bus_->channel_span(ch);
for (int j = index; j < frames; ++j) {
double error = fabs(channel_data[j] - expected_channel_data[j] * scale);
if (error > epsilon_) {
EXPECT_NEAR(expected_channel_data[j] * scale, channel_data[j],
epsilon_)
<< " ch=" << ch << ", j=" << j;
return false;
}
}
}
return true;
}
bool RenderAndValidateAudioData(float scale) {
converter_->Convert(audio_bus_.get());
expected_callback_->Render(base::TimeDelta(), base::TimeTicks::Now(), {},
expected_audio_bus_.get());
for (int i = input_parameters_.channels();
i < output_parameters_.channels(); ++i) {
std::ranges::fill(expected_audio_bus_->channel_span(i), 0);
}
return ValidateAudioData(0, audio_bus_->frames(), scale);
}
void FillAudioData(float value) {
for (auto channel : audio_bus_->AllChannels()) {
std::ranges::fill(channel, value);
}
}
void RunTest(int inputs) {
InitializeInputs(inputs);
SetVolume(0);
for (int i = 0; i < kConvertCycles; ++i)
ASSERT_TRUE(RenderAndValidateAudioData(0));
Reset();
float total_scale = 0;
for (size_t i = 0; i < fake_callbacks_.size(); ++i) {
float volume = static_cast<float>(i) / fake_callbacks_.size();
total_scale += volume;
fake_callbacks_[i]->set_volume(volume);
}
for (int i = 0; i < kConvertCycles; ++i)
ASSERT_TRUE(RenderAndValidateAudioData(total_scale));
Reset();
for (size_t i = 1; i < fake_callbacks_.size(); i += 2)
converter_->RemoveInput(fake_callbacks_[i].get());
SetVolume(1);
float scale = inputs > 1 ? inputs / 2.0f : inputs;
for (int i = 0; i < kConvertCycles; ++i)
ASSERT_TRUE(RenderAndValidateAudioData(scale));
}
protected:
virtual ~AudioConverterTest() = default;
std::unique_ptr<AudioConverter> converter_;
AudioParameters input_parameters_;
AudioParameters output_parameters_;
std::unique_ptr<AudioBus> audio_bus_;
std::unique_ptr<AudioBus> expected_audio_bus_;
std::vector<std::unique_ptr<FakeAudioRenderCallback>> fake_callbacks_;
std::unique_ptr<FakeAudioRenderCallback> expected_callback_;
double epsilon_;
};
TEST(AudioConverterTest, AudioDelayAndDiscreteChannelCount) {
AudioParameters input_parameters(AudioParameters::AUDIO_PCM_LINEAR,
{CHANNEL_LAYOUT_DISCRETE, 10}, kSampleRate,
kLowLatencyBufferSize);
AudioParameters output_parameters(AudioParameters::AUDIO_PCM_LINEAR,
{CHANNEL_LAYOUT_DISCRETE, 5},
kSampleRate * 2, kHighLatencyBufferSize);
AudioConverter converter(input_parameters, output_parameters, false);
FakeAudioRenderCallback callback(0.2, kSampleRate);
std::unique_ptr<AudioBus> audio_bus = AudioBus::Create(output_parameters);
converter.AddInput(&callback);
converter.Convert(audio_bus.get());
int kExpectedDelay = 960;
auto expected_delay =
AudioTimestampHelper::FramesToTime(kExpectedDelay, kSampleRate);
EXPECT_EQ(expected_delay, callback.last_delay());
EXPECT_EQ(input_parameters.channels(), callback.last_channel_count());
}
TEST(AudioConverterTest, PropagatesGlitchInfo) {
AudioParameters input_parameters(AudioParameters::AUDIO_PCM_LINEAR,
ChannelLayoutConfig::Stereo(), kSampleRate,
kLowLatencyBufferSize);
AudioParameters output_parameters(AudioParameters::AUDIO_PCM_LINEAR,
ChannelLayoutConfig::Stereo(),
kSampleRate * 2, kHighLatencyBufferSize);
AudioGlitchInfo glitch_info{.duration = base::Seconds(5), .count = 123};
AudioConverter converter(input_parameters, output_parameters, false);
FakeAudioRenderCallback callback1(0.2, kSampleRate);
FakeAudioRenderCallback callback2(0.2, kSampleRate);
std::unique_ptr<AudioBus> audio_bus = AudioBus::Create(output_parameters);
converter.AddInput(&callback1);
converter.AddInput(&callback2);
converter.ConvertWithInfo(0, {}, audio_bus.get());
EXPECT_EQ(callback1.cumulative_glitch_info(), AudioGlitchInfo());
EXPECT_EQ(callback2.cumulative_glitch_info(), AudioGlitchInfo());
converter.ConvertWithInfo(0, glitch_info, audio_bus.get());
EXPECT_EQ(callback1.cumulative_glitch_info(), glitch_info);
EXPECT_EQ(callback2.cumulative_glitch_info(), glitch_info);
converter.ConvertWithInfo(0, {}, audio_bus.get());
EXPECT_EQ(callback1.cumulative_glitch_info(), glitch_info);
EXPECT_EQ(callback2.cumulative_glitch_info(), glitch_info);
}
TEST_P(AudioConverterTest, ArbitraryOutputRequestSize) {
audio_bus_ = AudioBus::Create(output_parameters_.channels(),
output_parameters_.frames_per_buffer() / 2);
RunTest(1);
}
TEST_P(AudioConverterTest, NoInputs) {
FillAudioData(1.0f);
EXPECT_TRUE(RenderAndValidateAudioData(0.0f));
}
TEST_P(AudioConverterTest, OneInput) {
RunTest(1);
}
TEST_P(AudioConverterTest, ManyInputs) {
RunTest(kConvertInputs);
}
INSTANTIATE_TEST_SUITE_P(
AudioConverterTest,
AudioConverterTest,
testing::Values(
std::make_tuple(44100,
44100,
ChannelLayoutConfig::Stereo(),
0.00000048),
std::make_tuple(44100,
48000,
ChannelLayoutConfig::FromLayout<CHANNEL_LAYOUT_QUAD>(),
0.033),
std::make_tuple(48000, 41000, ChannelLayoutConfig::Mono(), 0.042)));
}