blob: fef3c3c1e414826045053836667efc64b959aef4 [file] [log] [blame]
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +00001/*
2 * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000011#include <stdlib.h>
12
Alessio Bazzicab28e57e2020-02-13 09:18:24 +010013#include <array>
kwiberg2d0c3322016-02-14 09:28:33 -080014#include <memory>
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000015#include <string>
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000016#include <vector>
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000017
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020018#include "api/audio_codecs/opus/audio_encoder_opus.h"
19#include "modules/audio_coding/codecs/g711/audio_decoder_pcm.h"
20#include "modules/audio_coding/codecs/g711/audio_encoder_pcm.h"
21#include "modules/audio_coding/codecs/g722/audio_decoder_g722.h"
22#include "modules/audio_coding/codecs/g722/audio_encoder_g722.h"
23#include "modules/audio_coding/codecs/ilbc/audio_decoder_ilbc.h"
24#include "modules/audio_coding/codecs/ilbc/audio_encoder_ilbc.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "modules/audio_coding/codecs/opus/audio_decoder_opus.h"
26#include "modules/audio_coding/codecs/pcm16b/audio_decoder_pcm16b.h"
27#include "modules/audio_coding/codecs/pcm16b/audio_encoder_pcm16b.h"
28#include "modules/audio_coding/neteq/tools/resample_input_audio_file.h"
Artem Titovee966752021-08-06 14:18:10 +020029#include "rtc_base/system/arch.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020030#include "test/gtest.h"
Steve Anton10542f22019-01-11 09:11:00 -080031#include "test/testsupport/file_utils.h"
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000032
33namespace webrtc {
34
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000035namespace {
Jakob Ivarsson36274f92020-10-22 13:01:07 +020036
37constexpr int kOverheadBytesPerPacket = 50;
38
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000039// The absolute difference between the input and output (the first channel) is
Artem Titovd00ce742021-07-28 20:00:17 +020040// compared vs `tolerance`. The parameter `delay` is used to correct for codec
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000041// delays.
42void CompareInputOutput(const std::vector<int16_t>& input,
43 const std::vector<int16_t>& output,
44 size_t num_samples,
45 size_t channels,
46 int tolerance,
47 int delay) {
48 ASSERT_LE(num_samples, input.size());
49 ASSERT_LE(num_samples * channels, output.size());
50 for (unsigned int n = 0; n < num_samples - delay; ++n) {
51 ASSERT_NEAR(input[n], output[channels * n + delay], tolerance)
52 << "Exit test on first diff; n = " << n;
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000053 }
54}
55
Artem Titovd00ce742021-07-28 20:00:17 +020056// The absolute difference between the first two channels in `output` is
57// compared vs `tolerance`.
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000058void CompareTwoChannels(const std::vector<int16_t>& output,
59 size_t samples_per_channel,
60 size_t channels,
61 int tolerance) {
62 ASSERT_GE(channels, 2u);
63 ASSERT_LE(samples_per_channel * channels, output.size());
64 for (unsigned int n = 0; n < samples_per_channel; ++n)
65 ASSERT_NEAR(output[channels * n], output[channels * n + 1], tolerance)
66 << "Stereo samples differ.";
67}
68
69// Calculates mean-squared error between input and output (the first channel).
Artem Titovd00ce742021-07-28 20:00:17 +020070// The parameter `delay` is used to correct for codec delays.
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000071double MseInputOutput(const std::vector<int16_t>& input,
72 const std::vector<int16_t>& output,
73 size_t num_samples,
74 size_t channels,
75 int delay) {
Mirko Bonadei25ab3222021-07-08 20:08:20 +020076 RTC_DCHECK_LT(delay, static_cast<int>(num_samples));
77 RTC_DCHECK_LE(num_samples, input.size());
78 RTC_DCHECK_LE(num_samples * channels, output.size());
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000079 if (num_samples == 0)
80 return 0.0;
81 double squared_sum = 0.0;
82 for (unsigned int n = 0; n < num_samples - delay; ++n) {
83 squared_sum += (input[n] - output[channels * n + delay]) *
84 (input[n] - output[channels * n + delay]);
85 }
86 return squared_sum / (num_samples - delay);
87}
88} // namespace
89
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000090class AudioDecoderTest : public ::testing::Test {
91 protected:
92 AudioDecoderTest()
kjellander02060002016-02-16 22:06:12 -080093 : input_audio_(
94 webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"),
95 32000),
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +000096 codec_input_rate_hz_(32000), // Legacy default value.
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +000097 frame_size_(0),
98 data_length_(0),
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +000099 channels_(1),
henrik.lundin@webrtc.org7f1dfa52014-12-02 12:08:39 +0000100 payload_type_(17),
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000101 decoder_(NULL) {}
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000102
Mirko Bonadei682aac52018-07-20 13:59:20 +0200103 ~AudioDecoderTest() override {}
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000104
Mirko Bonadei682aac52018-07-20 13:59:20 +0200105 void SetUp() override {
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000106 if (audio_encoder_)
kwiberg@webrtc.org05211272015-02-18 12:00:32 +0000107 codec_input_rate_hz_ = audio_encoder_->SampleRateHz();
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000108 // Create arrays.
109 ASSERT_GT(data_length_, 0u) << "The test must set data_length_ > 0";
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000110 }
111
Mirko Bonadei682aac52018-07-20 13:59:20 +0200112 void TearDown() override {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000113 delete decoder_;
114 decoder_ = NULL;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000115 }
116
Yves Gerey665174f2018-06-19 15:03:05 +0200117 virtual void InitEncoder() {}
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000118
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000119 // TODO(henrik.lundin) Change return type to size_t once most/all overriding
120 // implementations are gone.
121 virtual int EncodeFrame(const int16_t* input,
122 size_t input_len_samples,
ossu10a029e2016-03-01 00:41:31 -0800123 rtc::Buffer* output) {
124 AudioEncoder::EncodedInfo encoded_info;
kwiberg@webrtc.org05211272015-02-18 12:00:32 +0000125 const size_t samples_per_10ms = audio_encoder_->SampleRateHz() / 100;
henrikg91d6ede2015-09-17 00:24:34 -0700126 RTC_CHECK_EQ(samples_per_10ms * audio_encoder_->Num10MsFramesInNextPacket(),
127 input_len_samples);
kwiberg2d0c3322016-02-14 09:28:33 -0800128 std::unique_ptr<int16_t[]> interleaved_input(
henrik.lundin@webrtc.org130fef82014-12-08 21:07:59 +0000129 new int16_t[channels_ * samples_per_10ms]);
Peter Kastingdce40cf2015-08-24 14:52:23 -0700130 for (size_t i = 0; i < audio_encoder_->Num10MsFramesInNextPacket(); ++i) {
ossu10a029e2016-03-01 00:41:31 -0800131 EXPECT_EQ(0u, encoded_info.encoded_bytes);
kwiberg@webrtc.org663fdd02014-10-29 07:28:36 +0000132
133 // Duplicate the mono input signal to however many channels the test
134 // wants.
henrik.lundin@webrtc.org130fef82014-12-08 21:07:59 +0000135 test::InputAudioFile::DuplicateInterleaved(input + i * samples_per_10ms,
136 samples_per_10ms, channels_,
137 interleaved_input.get());
kwiberg@webrtc.org663fdd02014-10-29 07:28:36 +0000138
Yves Gerey665174f2018-06-19 15:03:05 +0200139 encoded_info =
140 audio_encoder_->Encode(0,
141 rtc::ArrayView<const int16_t>(
142 interleaved_input.get(),
143 audio_encoder_->NumChannels() *
144 audio_encoder_->SampleRateHz() / 100),
145 output);
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000146 }
ossu10a029e2016-03-01 00:41:31 -0800147 EXPECT_EQ(payload_type_, encoded_info.payload_type);
148 return static_cast<int>(encoded_info.encoded_bytes);
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000149 }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000150
151 // Encodes and decodes audio. The absolute difference between the input and
Artem Titovd00ce742021-07-28 20:00:17 +0200152 // output is compared vs `tolerance`, and the mean-squared error is compared
153 // with `mse`. The encoded stream should contain `expected_bytes`. For stereo
minyue@webrtc.orgecbe0aa2013-08-12 06:48:09 +0000154 // audio, the absolute difference between the two channels is compared vs
Artem Titovd00ce742021-07-28 20:00:17 +0200155 // `channel_diff_tolerance`.
Yves Gerey665174f2018-06-19 15:03:05 +0200156 void EncodeDecodeTest(size_t expected_bytes,
157 int tolerance,
158 double mse,
159 int delay = 0,
160 int channel_diff_tolerance = 0) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000161 ASSERT_GE(tolerance, 0) << "Test must define a tolerance >= 0";
Yves Gerey665174f2018-06-19 15:03:05 +0200162 ASSERT_GE(channel_diff_tolerance, 0)
163 << "Test must define a channel_diff_tolerance >= 0";
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000164 size_t processed_samples = 0u;
ossu10a029e2016-03-01 00:41:31 -0800165 size_t encoded_bytes = 0u;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000166 InitEncoder();
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000167 std::vector<int16_t> input;
168 std::vector<int16_t> decoded;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000169 while (processed_samples + frame_size_ <= data_length_) {
Artem Titovd00ce742021-07-28 20:00:17 +0200170 // Extend input vector with `frame_size_`.
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000171 input.resize(input.size() + frame_size_, 0);
172 // Read from input file.
173 ASSERT_GE(input.size() - processed_samples, frame_size_);
Yves Gerey665174f2018-06-19 15:03:05 +0200174 ASSERT_TRUE(input_audio_.Read(frame_size_, codec_input_rate_hz_,
175 &input[processed_samples]));
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100176 rtc::Buffer encoded;
Yves Gerey665174f2018-06-19 15:03:05 +0200177 size_t enc_len =
178 EncodeFrame(&input[processed_samples], frame_size_, &encoded);
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000179 // Make sure that frame_size_ * channels_ samples are allocated and free.
180 decoded.resize((processed_samples + frame_size_) * channels_, 0);
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100181
182 const std::vector<AudioDecoder::ParseResult> parse_result =
183 decoder_->ParsePayload(std::move(encoded), /*timestamp=*/0);
184 RTC_CHECK_EQ(parse_result.size(), size_t{1});
185 auto decode_result = parse_result[0].frame->Decode(
186 rtc::ArrayView<int16_t>(&decoded[processed_samples * channels_],
187 frame_size_ * channels_ * sizeof(int16_t)));
188 RTC_CHECK(decode_result.has_value());
189 EXPECT_EQ(frame_size_ * channels_, decode_result->num_decoded_samples);
ossu10a029e2016-03-01 00:41:31 -0800190 encoded_bytes += enc_len;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000191 processed_samples += frame_size_;
192 }
tina.legrand@webrtc.org8418e962013-11-29 09:30:43 +0000193 // For some codecs it doesn't make sense to check expected number of bytes,
Alessio Bazzicab46c4bf2022-11-11 16:52:46 +0100194 // since the number can vary for different platforms. Opus is such a codec.
195 // In this case expected_bytes is set to 0.
tina.legrand@webrtc.org8418e962013-11-29 09:30:43 +0000196 if (expected_bytes) {
ossu10a029e2016-03-01 00:41:31 -0800197 EXPECT_EQ(expected_bytes, encoded_bytes);
tina.legrand@webrtc.org8418e962013-11-29 09:30:43 +0000198 }
Yves Gerey665174f2018-06-19 15:03:05 +0200199 CompareInputOutput(input, decoded, processed_samples, channels_, tolerance,
200 delay);
minyue@webrtc.orgecbe0aa2013-08-12 06:48:09 +0000201 if (channels_ == 2)
Yves Gerey665174f2018-06-19 15:03:05 +0200202 CompareTwoChannels(decoded, processed_samples, channels_,
203 channel_diff_tolerance);
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000204 EXPECT_LE(
205 MseInputOutput(input, decoded, processed_samples, channels_, delay),
206 mse);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000207 }
208
209 // Encodes a payload and decodes it twice with decoder re-init before each
210 // decode. Verifies that the decoded result is the same.
211 void ReInitTest() {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000212 InitEncoder();
kwiberg2d0c3322016-02-14 09:28:33 -0800213 std::unique_ptr<int16_t[]> input(new int16_t[frame_size_]);
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000214 ASSERT_TRUE(
215 input_audio_.Read(frame_size_, codec_input_rate_hz_, input.get()));
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100216 std::array<rtc::Buffer, 2> encoded;
217 EncodeFrame(input.get(), frame_size_, &encoded[0]);
218 // Make a copy.
219 encoded[1].SetData(encoded[0].data(), encoded[0].size());
220
221 std::array<std::vector<int16_t>, 2> outputs;
222 for (size_t i = 0; i < outputs.size(); ++i) {
223 outputs[i].resize(frame_size_ * channels_);
224 decoder_->Reset();
225 const std::vector<AudioDecoder::ParseResult> parse_result =
226 decoder_->ParsePayload(std::move(encoded[i]), /*timestamp=*/0);
227 RTC_CHECK_EQ(parse_result.size(), size_t{1});
228 auto decode_result = parse_result[0].frame->Decode(outputs[i]);
229 RTC_CHECK(decode_result.has_value());
230 EXPECT_EQ(frame_size_ * channels_, decode_result->num_decoded_samples);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000231 }
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100232 EXPECT_EQ(outputs[0], outputs[1]);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000233 }
234
235 // Call DecodePlc and verify that the correct number of samples is produced.
236 void DecodePlcTest() {
237 InitEncoder();
kwiberg2d0c3322016-02-14 09:28:33 -0800238 std::unique_ptr<int16_t[]> input(new int16_t[frame_size_]);
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000239 ASSERT_TRUE(
240 input_audio_.Read(frame_size_, codec_input_rate_hz_, input.get()));
ossu10a029e2016-03-01 00:41:31 -0800241 rtc::Buffer encoded;
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100242 EncodeFrame(input.get(), frame_size_, &encoded);
Karl Wiberg43766482015-08-27 15:22:11 +0200243 decoder_->Reset();
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100244 std::vector<int16_t> output(frame_size_ * channels_);
245 const std::vector<AudioDecoder::ParseResult> parse_result =
246 decoder_->ParsePayload(std::move(encoded), /*timestamp=*/0);
247 RTC_CHECK_EQ(parse_result.size(), size_t{1});
248 auto decode_result = parse_result[0].frame->Decode(output);
249 RTC_CHECK(decode_result.has_value());
250 EXPECT_EQ(frame_size_ * channels_, decode_result->num_decoded_samples);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000251 // Call DecodePlc and verify that we get one frame of data.
252 // (Overwrite the output from the above Decode call, but that does not
253 // matter.)
Alessio Bazzicab28e57e2020-02-13 09:18:24 +0100254 size_t dec_len =
255 decoder_->DecodePlc(/*num_frames=*/1, /*decoded=*/output.data());
turaj@webrtc.org6ad6a072013-09-30 20:07:39 +0000256 EXPECT_EQ(frame_size_ * channels_, dec_len);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000257 }
258
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000259 test::ResampleInputAudioFile input_audio_;
260 int codec_input_rate_hz_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000261 size_t frame_size_;
262 size_t data_length_;
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000263 size_t channels_;
henrik.lundin@webrtc.org7f1dfa52014-12-02 12:08:39 +0000264 const int payload_type_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000265 AudioDecoder* decoder_;
kwiberg2d0c3322016-02-14 09:28:33 -0800266 std::unique_ptr<AudioEncoder> audio_encoder_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000267};
268
269class AudioDecoderPcmUTest : public AudioDecoderTest {
270 protected:
271 AudioDecoderPcmUTest() : AudioDecoderTest() {
272 frame_size_ = 160;
273 data_length_ = 10 * frame_size_;
kwiberg89671832015-09-22 14:06:29 -0700274 decoder_ = new AudioDecoderPcmU(1);
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000275 AudioEncoderPcmU::Config config;
276 config.frame_size_ms = static_cast<int>(frame_size_ / 8);
henrik.lundin@webrtc.org7f1dfa52014-12-02 12:08:39 +0000277 config.payload_type = payload_type_;
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000278 audio_encoder_.reset(new AudioEncoderPcmU(config));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000279 }
280};
281
282class AudioDecoderPcmATest : public AudioDecoderTest {
283 protected:
284 AudioDecoderPcmATest() : AudioDecoderTest() {
285 frame_size_ = 160;
286 data_length_ = 10 * frame_size_;
kwiberg89671832015-09-22 14:06:29 -0700287 decoder_ = new AudioDecoderPcmA(1);
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000288 AudioEncoderPcmA::Config config;
289 config.frame_size_ms = static_cast<int>(frame_size_ / 8);
henrik.lundin@webrtc.org7f1dfa52014-12-02 12:08:39 +0000290 config.payload_type = payload_type_;
henrik.lundin@webrtc.orgdef1e972014-10-21 12:48:29 +0000291 audio_encoder_.reset(new AudioEncoderPcmA(config));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000292 }
293};
294
295class AudioDecoderPcm16BTest : public AudioDecoderTest {
296 protected:
297 AudioDecoderPcm16BTest() : AudioDecoderTest() {
henrik.lundin@webrtc.org817e50d2014-12-11 10:47:19 +0000298 codec_input_rate_hz_ = 16000;
299 frame_size_ = 20 * codec_input_rate_hz_ / 1000;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000300 data_length_ = 10 * frame_size_;
kwiberg6c2eab32016-05-31 02:46:20 -0700301 decoder_ = new AudioDecoderPcm16B(codec_input_rate_hz_, 1);
Mirko Bonadei25ab3222021-07-08 20:08:20 +0200302 RTC_DCHECK(decoder_);
henrik.lundin@webrtc.org817e50d2014-12-11 10:47:19 +0000303 AudioEncoderPcm16B::Config config;
304 config.sample_rate_hz = codec_input_rate_hz_;
305 config.frame_size_ms =
306 static_cast<int>(frame_size_ / (config.sample_rate_hz / 1000));
307 config.payload_type = payload_type_;
308 audio_encoder_.reset(new AudioEncoderPcm16B(config));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000309 }
310};
311
312class AudioDecoderIlbcTest : public AudioDecoderTest {
313 protected:
314 AudioDecoderIlbcTest() : AudioDecoderTest() {
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000315 codec_input_rate_hz_ = 8000;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000316 frame_size_ = 240;
317 data_length_ = 10 * frame_size_;
solenbergdb3c9b02017-06-28 02:05:04 -0700318 decoder_ = new AudioDecoderIlbcImpl;
Mirko Bonadei25ab3222021-07-08 20:08:20 +0200319 RTC_DCHECK(decoder_);
solenbergdb3c9b02017-06-28 02:05:04 -0700320 AudioEncoderIlbcConfig config;
kwiberg@webrtc.orgcb858ba2014-12-08 17:11:44 +0000321 config.frame_size_ms = 30;
solenbergdb3c9b02017-06-28 02:05:04 -0700322 audio_encoder_.reset(new AudioEncoderIlbcImpl(config, payload_type_));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000323 }
324
325 // Overload the default test since iLBC's function WebRtcIlbcfix_NetEqPlc does
326 // not return any data. It simply resets a few states and returns 0.
327 void DecodePlcTest() {
328 InitEncoder();
kwiberg2d0c3322016-02-14 09:28:33 -0800329 std::unique_ptr<int16_t[]> input(new int16_t[frame_size_]);
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000330 ASSERT_TRUE(
331 input_audio_.Read(frame_size_, codec_input_rate_hz_, input.get()));
ossu10a029e2016-03-01 00:41:31 -0800332 rtc::Buffer encoded;
333 size_t enc_len = EncodeFrame(input.get(), frame_size_, &encoded);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000334 AudioDecoder::SpeechType speech_type;
Karl Wiberg43766482015-08-27 15:22:11 +0200335 decoder_->Reset();
kwiberg2d0c3322016-02-14 09:28:33 -0800336 std::unique_ptr<int16_t[]> output(new int16_t[frame_size_ * channels_]);
Yves Gerey665174f2018-06-19 15:03:05 +0200337 size_t dec_len = decoder_->Decode(
338 encoded.data(), enc_len, codec_input_rate_hz_,
339 frame_size_ * channels_ * sizeof(int16_t), output.get(), &speech_type);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000340 EXPECT_EQ(frame_size_, dec_len);
341 // Simply call DecodePlc and verify that we get 0 as return value.
Peter Kastingdce40cf2015-08-24 14:52:23 -0700342 EXPECT_EQ(0U, decoder_->DecodePlc(1, output.get()));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000343 }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000344};
345
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000346class AudioDecoderG722Test : public AudioDecoderTest {
347 protected:
348 AudioDecoderG722Test() : AudioDecoderTest() {
henrik.lundin@webrtc.orga37f1dd2014-10-27 12:58:18 +0000349 codec_input_rate_hz_ = 16000;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000350 frame_size_ = 160;
351 data_length_ = 10 * frame_size_;
kwibergb1ed7f02017-06-17 17:30:09 -0700352 decoder_ = new AudioDecoderG722Impl;
Mirko Bonadei25ab3222021-07-08 20:08:20 +0200353 RTC_DCHECK(decoder_);
kwibergb8727ae2017-06-17 17:41:59 -0700354 AudioEncoderG722Config config;
kwiberg@webrtc.org0cd55582014-12-02 11:45:51 +0000355 config.frame_size_ms = 10;
356 config.num_channels = 1;
kwibergb8727ae2017-06-17 17:41:59 -0700357 audio_encoder_.reset(new AudioEncoderG722Impl(config, payload_type_));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000358 }
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000359};
360
kwiberg@webrtc.org0cd55582014-12-02 11:45:51 +0000361class AudioDecoderG722StereoTest : public AudioDecoderTest {
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000362 protected:
kwiberg@webrtc.org0cd55582014-12-02 11:45:51 +0000363 AudioDecoderG722StereoTest() : AudioDecoderTest() {
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000364 channels_ = 2;
kwiberg@webrtc.org0cd55582014-12-02 11:45:51 +0000365 codec_input_rate_hz_ = 16000;
366 frame_size_ = 160;
367 data_length_ = 10 * frame_size_;
kwiberg1b97e262017-06-26 04:19:43 -0700368 decoder_ = new AudioDecoderG722StereoImpl;
Mirko Bonadei25ab3222021-07-08 20:08:20 +0200369 RTC_DCHECK(decoder_);
kwibergb8727ae2017-06-17 17:41:59 -0700370 AudioEncoderG722Config config;
kwiberg@webrtc.org0cd55582014-12-02 11:45:51 +0000371 config.frame_size_ms = 10;
372 config.num_channels = 2;
kwibergb8727ae2017-06-17 17:41:59 -0700373 audio_encoder_.reset(new AudioEncoderG722Impl(config, payload_type_));
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000374 }
375};
376
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200377class AudioDecoderOpusTest
378 : public AudioDecoderTest,
379 public testing::WithParamInterface<std::tuple<int, int>> {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000380 protected:
381 AudioDecoderOpusTest() : AudioDecoderTest() {
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200382 channels_ = opus_num_channels_;
383 codec_input_rate_hz_ = opus_sample_rate_hz_;
384 frame_size_ = rtc::CheckedDivExact(opus_sample_rate_hz_, 100);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000385 data_length_ = 10 * frame_size_;
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200386 decoder_ =
387 new AudioDecoderOpusImpl(opus_num_channels_, opus_sample_rate_hz_);
kwiberg96da0112017-06-30 04:23:22 -0700388 AudioEncoderOpusConfig config;
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200389 config.frame_size_ms = 10;
390 config.sample_rate_hz = opus_sample_rate_hz_;
391 config.num_channels = opus_num_channels_;
392 config.application = opus_num_channels_ == 1
393 ? AudioEncoderOpusConfig::ApplicationMode::kVoip
394 : AudioEncoderOpusConfig::ApplicationMode::kAudio;
kwiberg96da0112017-06-30 04:23:22 -0700395 audio_encoder_ = AudioEncoderOpus::MakeAudioEncoder(config, payload_type_);
Jakob Ivarsson36274f92020-10-22 13:01:07 +0200396 audio_encoder_->OnReceivedOverhead(kOverheadBytesPerPacket);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000397 }
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200398 const int opus_sample_rate_hz_{std::get<0>(GetParam())};
399 const int opus_num_channels_{std::get<1>(GetParam())};
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000400};
401
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200402INSTANTIATE_TEST_SUITE_P(Param,
403 AudioDecoderOpusTest,
404 testing::Combine(testing::Values(16000, 48000),
405 testing::Values(1, 2)));
minyue@webrtc.orgecbe0aa2013-08-12 06:48:09 +0000406
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000407TEST_F(AudioDecoderPcmUTest, EncodeDecode) {
408 int tolerance = 251;
409 double mse = 1734.0;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000410 EncodeDecodeTest(data_length_, tolerance, mse);
411 ReInitTest();
412 EXPECT_FALSE(decoder_->HasDecodePlc());
413}
414
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200415namespace {
416int SetAndGetTargetBitrate(AudioEncoder* audio_encoder, int rate) {
Danil Chapovalovb6021232018-06-19 13:26:36 +0200417 audio_encoder->OnReceivedUplinkBandwidth(rate, absl::nullopt);
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200418 return audio_encoder->GetTargetBitrate();
419}
420void TestSetAndGetTargetBitratesWithFixedCodec(AudioEncoder* audio_encoder,
421 int fixed_rate) {
422 EXPECT_EQ(fixed_rate, SetAndGetTargetBitrate(audio_encoder, 32000));
423 EXPECT_EQ(fixed_rate, SetAndGetTargetBitrate(audio_encoder, fixed_rate - 1));
424 EXPECT_EQ(fixed_rate, SetAndGetTargetBitrate(audio_encoder, fixed_rate));
425 EXPECT_EQ(fixed_rate, SetAndGetTargetBitrate(audio_encoder, fixed_rate + 1));
426}
427} // namespace
428
429TEST_F(AudioDecoderPcmUTest, SetTargetBitrate) {
430 TestSetAndGetTargetBitratesWithFixedCodec(audio_encoder_.get(), 64000);
431}
432
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000433TEST_F(AudioDecoderPcmATest, EncodeDecode) {
434 int tolerance = 308;
435 double mse = 1931.0;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000436 EncodeDecodeTest(data_length_, tolerance, mse);
437 ReInitTest();
438 EXPECT_FALSE(decoder_->HasDecodePlc());
439}
440
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200441TEST_F(AudioDecoderPcmATest, SetTargetBitrate) {
442 TestSetAndGetTargetBitratesWithFixedCodec(audio_encoder_.get(), 64000);
443}
444
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000445TEST_F(AudioDecoderPcm16BTest, EncodeDecode) {
446 int tolerance = 0;
447 double mse = 0.0;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000448 EncodeDecodeTest(2 * data_length_, tolerance, mse);
449 ReInitTest();
450 EXPECT_FALSE(decoder_->HasDecodePlc());
451}
452
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200453TEST_F(AudioDecoderPcm16BTest, SetTargetBitrate) {
454 TestSetAndGetTargetBitratesWithFixedCodec(audio_encoder_.get(),
455 codec_input_rate_hz_ * 16);
456}
457
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000458TEST_F(AudioDecoderIlbcTest, EncodeDecode) {
459 int tolerance = 6808;
460 double mse = 2.13e6;
461 int delay = 80; // Delay from input to output.
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000462 EncodeDecodeTest(500, tolerance, mse, delay);
463 ReInitTest();
464 EXPECT_TRUE(decoder_->HasDecodePlc());
465 DecodePlcTest();
466}
467
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200468TEST_F(AudioDecoderIlbcTest, SetTargetBitrate) {
469 TestSetAndGetTargetBitratesWithFixedCodec(audio_encoder_.get(), 13333);
470}
471
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000472TEST_F(AudioDecoderG722Test, EncodeDecode) {
473 int tolerance = 6176;
474 double mse = 238630.0;
475 int delay = 22; // Delay from input to output.
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000476 EncodeDecodeTest(data_length_ / 2, tolerance, mse, delay);
477 ReInitTest();
478 EXPECT_FALSE(decoder_->HasDecodePlc());
479}
480
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200481TEST_F(AudioDecoderG722Test, SetTargetBitrate) {
482 TestSetAndGetTargetBitratesWithFixedCodec(audio_encoder_.get(), 64000);
483}
484
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000485TEST_F(AudioDecoderG722StereoTest, EncodeDecode) {
486 int tolerance = 6176;
minyue@webrtc.orgecbe0aa2013-08-12 06:48:09 +0000487 int channel_diff_tolerance = 0;
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000488 double mse = 238630.0;
489 int delay = 22; // Delay from input to output.
minyue@webrtc.orgecbe0aa2013-08-12 06:48:09 +0000490 EncodeDecodeTest(data_length_, tolerance, mse, delay, channel_diff_tolerance);
henrik.lundin@webrtc.orgaaad6132013-02-01 11:49:28 +0000491 ReInitTest();
492 EXPECT_FALSE(decoder_->HasDecodePlc());
493}
494
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200495TEST_F(AudioDecoderG722StereoTest, SetTargetBitrate) {
496 TestSetAndGetTargetBitratesWithFixedCodec(audio_encoder_.get(), 128000);
497}
498
Jakob Ivarsson213dc2c2021-03-10 12:38:34 +0100499// TODO(http://bugs.webrtc.org/12518): Enable the test after Opus has been
500// updated.
501TEST_P(AudioDecoderOpusTest, DISABLED_EncodeDecode) {
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200502 constexpr int tolerance = 6176;
Ivo Creusen16ddae92020-03-04 17:16:59 +0100503 constexpr int channel_diff_tolerance = 6;
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200504 constexpr double mse = 238630.0;
505 constexpr int delay = 22; // Delay from input to output.
tina.legrand@webrtc.org8418e962013-11-29 09:30:43 +0000506 EncodeDecodeTest(0, tolerance, mse, delay, channel_diff_tolerance);
minyue@webrtc.orgecbe0aa2013-08-12 06:48:09 +0000507 ReInitTest();
508 EXPECT_FALSE(decoder_->HasDecodePlc());
509}
510
Karl Wiberg7eb0a5e2019-05-29 13:46:09 +0200511TEST_P(AudioDecoderOpusTest, SetTargetBitrate) {
Jakob Ivarsson36274f92020-10-22 13:01:07 +0200512 const int overhead_rate =
513 8 * kOverheadBytesPerPacket * codec_input_rate_hz_ / frame_size_;
514 EXPECT_EQ(6000,
515 SetAndGetTargetBitrate(audio_encoder_.get(), 5999 + overhead_rate));
516 EXPECT_EQ(6000,
517 SetAndGetTargetBitrate(audio_encoder_.get(), 6000 + overhead_rate));
518 EXPECT_EQ(32000, SetAndGetTargetBitrate(audio_encoder_.get(),
519 32000 + overhead_rate));
520 EXPECT_EQ(510000, SetAndGetTargetBitrate(audio_encoder_.get(),
521 510000 + overhead_rate));
522 EXPECT_EQ(510000, SetAndGetTargetBitrate(audio_encoder_.get(),
523 511000 + overhead_rate));
Henrik Lundin3e89dbf2015-06-18 14:58:34 +0200524}
525
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000526} // namespace webrtc