blob: 010fe55b41524322dd898fd8c5e50d08256f8671 [file] [log] [blame]
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +00001/*
2 * Copyright (c) 2011 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020011#include "modules/audio_coding/neteq/include/neteq.h"
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000012
pbos@webrtc.org3ecc1622014-03-07 15:23:34 +000013#include <math.h>
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000014#include <stdlib.h>
15#include <string.h> // memset
16
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +000017#include <algorithm>
kwiberg2d0c3322016-02-14 09:28:33 -080018#include <memory>
turaj@webrtc.org78b41a02013-11-22 20:27:07 +000019#include <set>
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000020#include <string>
21#include <vector>
22
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020023#include "api/audio_codecs/builtin_audio_decoder_factory.h"
24#include "common_types.h"
25#include "modules/audio_coding/codecs/pcm16b/pcm16b.h"
26#include "modules/audio_coding/neteq/tools/audio_loop.h"
27#include "modules/audio_coding/neteq/tools/rtp_file_source.h"
28#include "modules/include/module_common_types.h"
29#include "rtc_base/flags.h"
30#include "rtc_base/ignore_wundef.h"
31#include "rtc_base/protobuf_utils.h"
32#include "rtc_base/sha1digest.h"
33#include "rtc_base/stringencode.h"
34#include "test/gtest.h"
35#include "test/testsupport/fileutils.h"
36#include "typedefs.h"
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000037
minyue5f026d02015-12-16 07:36:04 -080038#ifdef WEBRTC_NETEQ_UNITTEST_BITEXACT
kwiberg77eab702016-09-28 17:42:01 -070039RTC_PUSH_IGNORING_WUNDEF()
minyue5f026d02015-12-16 07:36:04 -080040#ifdef WEBRTC_ANDROID_PLATFORM_BUILD
41#include "external/webrtc/webrtc/modules/audio_coding/neteq/neteq_unittest.pb.h"
42#else
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020043#include "modules/audio_coding/neteq/neteq_unittest.pb.h"
minyue5f026d02015-12-16 07:36:04 -080044#endif
kwiberg77eab702016-09-28 17:42:01 -070045RTC_POP_IGNORING_WUNDEF()
minyue5f026d02015-12-16 07:36:04 -080046#endif
47
turaj@webrtc.orga6101d72013-10-01 22:01:09 +000048DEFINE_bool(gen_ref, false, "Generate reference files.");
49
kwiberg5adaf732016-10-04 09:33:27 -070050namespace webrtc {
51
minyue5f026d02015-12-16 07:36:04 -080052namespace {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +000053
minyue4f906772016-04-29 11:05:14 -070054const std::string& PlatformChecksum(const std::string& checksum_general,
55 const std::string& checksum_android,
56 const std::string& checksum_win_32,
57 const std::string& checksum_win_64) {
kwiberg77eab702016-09-28 17:42:01 -070058#if defined(WEBRTC_ANDROID)
minyue4f906772016-04-29 11:05:14 -070059 return checksum_android;
kwiberg77eab702016-09-28 17:42:01 -070060#elif defined(WEBRTC_WIN)
minyue4f906772016-04-29 11:05:14 -070061 #ifdef WEBRTC_ARCH_64_BITS
62 return checksum_win_64;
63 #else
64 return checksum_win_32;
65 #endif // WEBRTC_ARCH_64_BITS
66#else
67 return checksum_general;
68#endif // WEBRTC_WIN
69}
70
minyue5f026d02015-12-16 07:36:04 -080071#ifdef WEBRTC_NETEQ_UNITTEST_BITEXACT
72void Convert(const webrtc::NetEqNetworkStatistics& stats_raw,
73 webrtc::neteq_unittest::NetEqNetworkStatistics* stats) {
74 stats->set_current_buffer_size_ms(stats_raw.current_buffer_size_ms);
75 stats->set_preferred_buffer_size_ms(stats_raw.preferred_buffer_size_ms);
76 stats->set_jitter_peaks_found(stats_raw.jitter_peaks_found);
77 stats->set_packet_loss_rate(stats_raw.packet_loss_rate);
minyue5f026d02015-12-16 07:36:04 -080078 stats->set_expand_rate(stats_raw.expand_rate);
79 stats->set_speech_expand_rate(stats_raw.speech_expand_rate);
80 stats->set_preemptive_rate(stats_raw.preemptive_rate);
81 stats->set_accelerate_rate(stats_raw.accelerate_rate);
82 stats->set_secondary_decoded_rate(stats_raw.secondary_decoded_rate);
minyue-webrtc0c3ca752017-08-23 15:59:38 +020083 stats->set_secondary_discarded_rate(stats_raw.secondary_discarded_rate);
minyue5f026d02015-12-16 07:36:04 -080084 stats->set_clockdrift_ppm(stats_raw.clockdrift_ppm);
85 stats->set_added_zero_samples(stats_raw.added_zero_samples);
86 stats->set_mean_waiting_time_ms(stats_raw.mean_waiting_time_ms);
87 stats->set_median_waiting_time_ms(stats_raw.median_waiting_time_ms);
88 stats->set_min_waiting_time_ms(stats_raw.min_waiting_time_ms);
89 stats->set_max_waiting_time_ms(stats_raw.max_waiting_time_ms);
90}
91
92void Convert(const webrtc::RtcpStatistics& stats_raw,
93 webrtc::neteq_unittest::RtcpStatistics* stats) {
94 stats->set_fraction_lost(stats_raw.fraction_lost);
srte186d9c32017-08-04 05:03:53 -070095 stats->set_cumulative_lost(stats_raw.packets_lost);
minyue5f026d02015-12-16 07:36:04 -080096 stats->set_extended_max_sequence_number(
srte186d9c32017-08-04 05:03:53 -070097 stats_raw.extended_highest_sequence_number);
minyue5f026d02015-12-16 07:36:04 -080098 stats->set_jitter(stats_raw.jitter);
99}
100
minyue4f906772016-04-29 11:05:14 -0700101void AddMessage(FILE* file, rtc::MessageDigest* digest,
102 const std::string& message) {
minyue5f026d02015-12-16 07:36:04 -0800103 int32_t size = message.length();
minyue4f906772016-04-29 11:05:14 -0700104 if (file)
105 ASSERT_EQ(1u, fwrite(&size, sizeof(size), 1, file));
106 digest->Update(&size, sizeof(size));
107
108 if (file)
109 ASSERT_EQ(static_cast<size_t>(size),
110 fwrite(message.data(), sizeof(char), size, file));
111 digest->Update(message.data(), sizeof(char) * size);
minyue5f026d02015-12-16 07:36:04 -0800112}
113
minyue5f026d02015-12-16 07:36:04 -0800114#endif // WEBRTC_NETEQ_UNITTEST_BITEXACT
115
henrik.lundin7a926812016-05-12 13:51:28 -0700116void LoadDecoders(webrtc::NetEq* neteq) {
kwiberg5adaf732016-10-04 09:33:27 -0700117 ASSERT_EQ(true,
118 neteq->RegisterPayloadType(0, SdpAudioFormat("pcmu", 8000, 1)));
119 // Use non-SdpAudioFormat argument when registering PCMa, so that we get test
120 // coverage for that as well.
henrik.lundin7a926812016-05-12 13:51:28 -0700121 ASSERT_EQ(0, neteq->RegisterPayloadType(webrtc::NetEqDecoder::kDecoderPCMa,
122 "pcma", 8));
123#ifdef WEBRTC_CODEC_ILBC
kwiberg5adaf732016-10-04 09:33:27 -0700124 ASSERT_EQ(true,
125 neteq->RegisterPayloadType(102, SdpAudioFormat("ilbc", 8000, 1)));
henrik.lundin7a926812016-05-12 13:51:28 -0700126#endif
127#if defined(WEBRTC_CODEC_ISAC) || defined(WEBRTC_CODEC_ISACFX)
kwiberg5adaf732016-10-04 09:33:27 -0700128 ASSERT_EQ(true,
129 neteq->RegisterPayloadType(103, SdpAudioFormat("isac", 16000, 1)));
henrik.lundin7a926812016-05-12 13:51:28 -0700130#endif
131#ifdef WEBRTC_CODEC_ISAC
kwiberg5adaf732016-10-04 09:33:27 -0700132 ASSERT_EQ(true,
133 neteq->RegisterPayloadType(104, SdpAudioFormat("isac", 32000, 1)));
henrik.lundin7a926812016-05-12 13:51:28 -0700134#endif
135#ifdef WEBRTC_CODEC_OPUS
kwiberg5adaf732016-10-04 09:33:27 -0700136 ASSERT_EQ(true,
137 neteq->RegisterPayloadType(
138 111, SdpAudioFormat("opus", 48000, 2, {{"stereo", "0"}})));
henrik.lundin7a926812016-05-12 13:51:28 -0700139#endif
kwiberg5adaf732016-10-04 09:33:27 -0700140 ASSERT_EQ(true,
141 neteq->RegisterPayloadType(93, SdpAudioFormat("L16", 8000, 1)));
142 ASSERT_EQ(true,
143 neteq->RegisterPayloadType(94, SdpAudioFormat("L16", 16000, 1)));
144 ASSERT_EQ(true,
145 neteq->RegisterPayloadType(95, SdpAudioFormat("L16", 32000, 1)));
146 ASSERT_EQ(true,
147 neteq->RegisterPayloadType(13, SdpAudioFormat("cn", 8000, 1)));
148 ASSERT_EQ(true,
149 neteq->RegisterPayloadType(98, SdpAudioFormat("cn", 16000, 1)));
henrik.lundin7a926812016-05-12 13:51:28 -0700150}
minyue5f026d02015-12-16 07:36:04 -0800151} // namespace
152
minyue4f906772016-04-29 11:05:14 -0700153class ResultSink {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000154 public:
minyue4f906772016-04-29 11:05:14 -0700155 explicit ResultSink(const std::string& output_file);
156 ~ResultSink();
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000157
yujo36b1a5f2017-06-12 12:45:32 -0700158 template<typename T> void AddResult(const T* test_results, size_t length);
minyue4f906772016-04-29 11:05:14 -0700159
160 void AddResult(const NetEqNetworkStatistics& stats);
161 void AddResult(const RtcpStatistics& stats);
162
163 void VerifyChecksum(const std::string& ref_check_sum);
164
165 private:
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000166 FILE* output_fp_;
minyue4f906772016-04-29 11:05:14 -0700167 std::unique_ptr<rtc::MessageDigest> digest_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000168};
169
minyue4f906772016-04-29 11:05:14 -0700170ResultSink::ResultSink(const std::string &output_file)
171 : output_fp_(nullptr),
172 digest_(new rtc::Sha1Digest()) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000173 if (!output_file.empty()) {
174 output_fp_ = fopen(output_file.c_str(), "wb");
175 EXPECT_TRUE(output_fp_ != NULL);
176 }
177}
178
minyue4f906772016-04-29 11:05:14 -0700179ResultSink::~ResultSink() {
180 if (output_fp_)
181 fclose(output_fp_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000182}
183
yujo36b1a5f2017-06-12 12:45:32 -0700184template<typename T>
185void ResultSink::AddResult(const T* test_results, size_t length) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000186 if (output_fp_) {
yujo36b1a5f2017-06-12 12:45:32 -0700187 ASSERT_EQ(length, fwrite(test_results, sizeof(T), length, output_fp_));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000188 }
yujo36b1a5f2017-06-12 12:45:32 -0700189 digest_->Update(test_results, sizeof(T) * length);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000190}
191
minyue4f906772016-04-29 11:05:14 -0700192void ResultSink::AddResult(const NetEqNetworkStatistics& stats_raw) {
minyue5f026d02015-12-16 07:36:04 -0800193#ifdef WEBRTC_NETEQ_UNITTEST_BITEXACT
minyue5f026d02015-12-16 07:36:04 -0800194 neteq_unittest::NetEqNetworkStatistics stats;
195 Convert(stats_raw, &stats);
196
mbonadei7c2c8432017-04-07 00:59:12 -0700197 ProtoString stats_string;
minyue5f026d02015-12-16 07:36:04 -0800198 ASSERT_TRUE(stats.SerializeToString(&stats_string));
minyue4f906772016-04-29 11:05:14 -0700199 AddMessage(output_fp_, digest_.get(), stats_string);
minyue5f026d02015-12-16 07:36:04 -0800200#else
201 FAIL() << "Writing to reference file requires Proto Buffer.";
202#endif // WEBRTC_NETEQ_UNITTEST_BITEXACT
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000203}
204
minyue4f906772016-04-29 11:05:14 -0700205void ResultSink::AddResult(const RtcpStatistics& stats_raw) {
minyue5f026d02015-12-16 07:36:04 -0800206#ifdef WEBRTC_NETEQ_UNITTEST_BITEXACT
minyue5f026d02015-12-16 07:36:04 -0800207 neteq_unittest::RtcpStatistics stats;
208 Convert(stats_raw, &stats);
209
mbonadei7c2c8432017-04-07 00:59:12 -0700210 ProtoString stats_string;
minyue5f026d02015-12-16 07:36:04 -0800211 ASSERT_TRUE(stats.SerializeToString(&stats_string));
minyue4f906772016-04-29 11:05:14 -0700212 AddMessage(output_fp_, digest_.get(), stats_string);
minyue5f026d02015-12-16 07:36:04 -0800213#else
214 FAIL() << "Writing to reference file requires Proto Buffer.";
215#endif // WEBRTC_NETEQ_UNITTEST_BITEXACT
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000216}
217
minyue4f906772016-04-29 11:05:14 -0700218void ResultSink::VerifyChecksum(const std::string& checksum) {
219 std::vector<char> buffer;
220 buffer.resize(digest_->Size());
221 digest_->Finish(&buffer[0], buffer.size());
222 const std::string result = rtc::hex_encode(&buffer[0], digest_->Size());
223 EXPECT_EQ(checksum, result);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000224}
225
226class NetEqDecodingTest : public ::testing::Test {
227 protected:
228 // NetEQ must be polled for data once every 10 ms. Thus, neither of the
229 // constants below can be changed.
230 static const int kTimeStepMs = 10;
Peter Kastingdce40cf2015-08-24 14:52:23 -0700231 static const size_t kBlockSize8kHz = kTimeStepMs * 8;
232 static const size_t kBlockSize16kHz = kTimeStepMs * 16;
233 static const size_t kBlockSize32kHz = kTimeStepMs * 32;
minyue93c08b72015-12-22 09:57:41 -0800234 static const size_t kBlockSize48kHz = kTimeStepMs * 48;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000235 static const int kInitSampleRateHz = 8000;
236
237 NetEqDecodingTest();
238 virtual void SetUp();
239 virtual void TearDown();
240 void SelectDecoders(NetEqDecoder* used_codec);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000241 void OpenInputFile(const std::string &rtp_file);
henrik.lundin6d8e0112016-03-04 10:34:21 -0800242 void Process();
minyue5f026d02015-12-16 07:36:04 -0800243
henrik.lundin@webrtc.org4e4b0982014-08-11 14:48:49 +0000244 void DecodeAndCompare(const std::string& rtp_file,
minyue4f906772016-04-29 11:05:14 -0700245 const std::string& output_checksum,
246 const std::string& network_stats_checksum,
247 const std::string& rtcp_stats_checksum,
248 bool gen_ref);
minyue5f026d02015-12-16 07:36:04 -0800249
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000250 static void PopulateRtpInfo(int frame_index,
251 int timestamp,
henrik.lundin246ef3e2017-04-24 09:14:32 -0700252 RTPHeader* rtp_info);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000253 static void PopulateCng(int frame_index,
254 int timestamp,
henrik.lundin246ef3e2017-04-24 09:14:32 -0700255 RTPHeader* rtp_info,
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000256 uint8_t* payload,
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000257 size_t* payload_len);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000258
turaj@webrtc.org78b41a02013-11-22 20:27:07 +0000259 void WrapTest(uint16_t start_seq_no, uint32_t start_timestamp,
260 const std::set<uint16_t>& drop_seq_numbers,
261 bool expect_seq_no_wrap, bool expect_timestamp_wrap);
262
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000263 void LongCngWithClockDrift(double drift_factor,
264 double network_freeze_ms,
265 bool pull_audio_during_freeze,
266 int delay_tolerance_ms,
267 int max_time_to_speech_ms);
268
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +0000269 void DuplicateCng();
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000270
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000271 NetEq* neteq_;
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000272 NetEq::Config config_;
kwiberg2d0c3322016-02-14 09:28:33 -0800273 std::unique_ptr<test::RtpFileSource> rtp_source_;
274 std::unique_ptr<test::Packet> packet_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000275 unsigned int sim_clock_;
henrik.lundin6d8e0112016-03-04 10:34:21 -0800276 AudioFrame out_frame_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000277 int output_sample_rate_;
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +0000278 int algorithmic_delay_ms_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000279};
280
281// Allocating the static const so that it can be passed by reference.
282const int NetEqDecodingTest::kTimeStepMs;
Peter Kastingdce40cf2015-08-24 14:52:23 -0700283const size_t NetEqDecodingTest::kBlockSize8kHz;
284const size_t NetEqDecodingTest::kBlockSize16kHz;
285const size_t NetEqDecodingTest::kBlockSize32kHz;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000286const int NetEqDecodingTest::kInitSampleRateHz;
287
288NetEqDecodingTest::NetEqDecodingTest()
289 : neteq_(NULL),
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000290 config_(),
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000291 sim_clock_(0),
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +0000292 output_sample_rate_(kInitSampleRateHz),
293 algorithmic_delay_ms_(0) {
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000294 config_.sample_rate_hz = kInitSampleRateHz;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000295}
296
297void NetEqDecodingTest::SetUp() {
ossue3525782016-05-25 07:37:43 -0700298 neteq_ = NetEq::Create(config_, CreateBuiltinAudioDecoderFactory());
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +0000299 NetEqNetworkStatistics stat;
300 ASSERT_EQ(0, neteq_->NetworkStatistics(&stat));
301 algorithmic_delay_ms_ = stat.current_buffer_size_ms;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000302 ASSERT_TRUE(neteq_);
henrik.lundin7a926812016-05-12 13:51:28 -0700303 LoadDecoders(neteq_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000304}
305
306void NetEqDecodingTest::TearDown() {
307 delete neteq_;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000308}
309
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000310void NetEqDecodingTest::OpenInputFile(const std::string &rtp_file) {
henrik.lundin@webrtc.org966a7082014-11-17 09:08:38 +0000311 rtp_source_.reset(test::RtpFileSource::Create(rtp_file));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000312}
313
henrik.lundin6d8e0112016-03-04 10:34:21 -0800314void NetEqDecodingTest::Process() {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000315 // Check if time to receive.
henrik.lundin@webrtc.org966a7082014-11-17 09:08:38 +0000316 while (packet_ && sim_clock_ >= packet_->time_ms()) {
317 if (packet_->payload_length_bytes() > 0) {
ivoc72c08ed2016-01-20 07:26:24 -0800318#ifndef WEBRTC_CODEC_ISAC
319 // Ignore payload type 104 (iSAC-swb) if ISAC is not supported.
henrik.lundin246ef3e2017-04-24 09:14:32 -0700320 if (packet_->header().payloadType != 104)
ivoc72c08ed2016-01-20 07:26:24 -0800321#endif
Henrik Lundin70c09bd2017-04-24 15:56:56 +0200322 ASSERT_EQ(0,
323 neteq_->InsertPacket(
henrik.lundin246ef3e2017-04-24 09:14:32 -0700324 packet_->header(),
Henrik Lundin70c09bd2017-04-24 15:56:56 +0200325 rtc::ArrayView<const uint8_t>(
326 packet_->payload(), packet_->payload_length_bytes()),
327 static_cast<uint32_t>(packet_->time_ms() *
328 (output_sample_rate_ / 1000))));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000329 }
330 // Get next packet.
henrik.lundin46ba49c2016-05-24 22:50:47 -0700331 packet_ = rtp_source_->NextPacket();
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000332 }
333
henrik.lundin@webrtc.orge1d468c2013-01-30 07:37:20 +0000334 // Get audio from NetEq.
henrik.lundin7a926812016-05-12 13:51:28 -0700335 bool muted;
336 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
337 ASSERT_FALSE(muted);
henrik.lundin6d8e0112016-03-04 10:34:21 -0800338 ASSERT_TRUE((out_frame_.samples_per_channel_ == kBlockSize8kHz) ||
339 (out_frame_.samples_per_channel_ == kBlockSize16kHz) ||
340 (out_frame_.samples_per_channel_ == kBlockSize32kHz) ||
341 (out_frame_.samples_per_channel_ == kBlockSize48kHz));
342 output_sample_rate_ = out_frame_.sample_rate_hz_;
henrik.lundind89814b2015-11-23 06:49:25 -0800343 EXPECT_EQ(output_sample_rate_, neteq_->last_output_sample_rate_hz());
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000344
345 // Increase time.
346 sim_clock_ += kTimeStepMs;
347}
348
minyue4f906772016-04-29 11:05:14 -0700349void NetEqDecodingTest::DecodeAndCompare(
350 const std::string& rtp_file,
351 const std::string& output_checksum,
352 const std::string& network_stats_checksum,
353 const std::string& rtcp_stats_checksum,
354 bool gen_ref) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000355 OpenInputFile(rtp_file);
356
minyue4f906772016-04-29 11:05:14 -0700357 std::string ref_out_file =
358 gen_ref ? webrtc::test::OutputPath() + "neteq_universal_ref.pcm" : "";
359 ResultSink output(ref_out_file);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000360
minyue4f906772016-04-29 11:05:14 -0700361 std::string stat_out_file =
362 gen_ref ? webrtc::test::OutputPath() + "neteq_network_stats.dat" : "";
363 ResultSink network_stats(stat_out_file);
henrik.lundin@webrtc.org4e4b0982014-08-11 14:48:49 +0000364
minyue4f906772016-04-29 11:05:14 -0700365 std::string rtcp_out_file =
366 gen_ref ? webrtc::test::OutputPath() + "neteq_rtcp_stats.dat" : "";
367 ResultSink rtcp_stats(rtcp_out_file);
henrik.lundin@webrtc.org4e4b0982014-08-11 14:48:49 +0000368
henrik.lundin46ba49c2016-05-24 22:50:47 -0700369 packet_ = rtp_source_->NextPacket();
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000370 int i = 0;
henrik.lundin@webrtc.org966a7082014-11-17 09:08:38 +0000371 while (packet_) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000372 std::ostringstream ss;
373 ss << "Lap number " << i++ << " in DecodeAndCompare while loop";
374 SCOPED_TRACE(ss.str()); // Print out the parameter values on failure.
henrik.lundin6d8e0112016-03-04 10:34:21 -0800375 ASSERT_NO_FATAL_FAILURE(Process());
minyue4f906772016-04-29 11:05:14 -0700376 ASSERT_NO_FATAL_FAILURE(output.AddResult(
yujo36b1a5f2017-06-12 12:45:32 -0700377 out_frame_.data(), out_frame_.samples_per_channel_));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000378
379 // Query the network statistics API once per second
380 if (sim_clock_ % 1000 == 0) {
381 // Process NetworkStatistics.
minyue4f906772016-04-29 11:05:14 -0700382 NetEqNetworkStatistics current_network_stats;
383 ASSERT_EQ(0, neteq_->NetworkStatistics(&current_network_stats));
384 ASSERT_NO_FATAL_FAILURE(network_stats.AddResult(current_network_stats));
385
henrik.lundin9c3efd02015-08-27 13:12:22 -0700386 // Compare with CurrentDelay, which should be identical.
minyue4f906772016-04-29 11:05:14 -0700387 EXPECT_EQ(current_network_stats.current_buffer_size_ms,
388 neteq_->CurrentDelayMs());
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000389
390 // Process RTCPstat.
minyue4f906772016-04-29 11:05:14 -0700391 RtcpStatistics current_rtcp_stats;
392 neteq_->GetRtcpStatistics(&current_rtcp_stats);
393 ASSERT_NO_FATAL_FAILURE(rtcp_stats.AddResult(current_rtcp_stats));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000394 }
395 }
minyue4f906772016-04-29 11:05:14 -0700396
397 SCOPED_TRACE("Check output audio.");
398 output.VerifyChecksum(output_checksum);
399 SCOPED_TRACE("Check network stats.");
400 network_stats.VerifyChecksum(network_stats_checksum);
401 SCOPED_TRACE("Check rtcp stats.");
402 rtcp_stats.VerifyChecksum(rtcp_stats_checksum);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000403}
404
405void NetEqDecodingTest::PopulateRtpInfo(int frame_index,
406 int timestamp,
henrik.lundin246ef3e2017-04-24 09:14:32 -0700407 RTPHeader* rtp_info) {
408 rtp_info->sequenceNumber = frame_index;
409 rtp_info->timestamp = timestamp;
410 rtp_info->ssrc = 0x1234; // Just an arbitrary SSRC.
411 rtp_info->payloadType = 94; // PCM16b WB codec.
412 rtp_info->markerBit = 0;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000413}
414
415void NetEqDecodingTest::PopulateCng(int frame_index,
416 int timestamp,
henrik.lundin246ef3e2017-04-24 09:14:32 -0700417 RTPHeader* rtp_info,
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000418 uint8_t* payload,
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000419 size_t* payload_len) {
henrik.lundin246ef3e2017-04-24 09:14:32 -0700420 rtp_info->sequenceNumber = frame_index;
421 rtp_info->timestamp = timestamp;
422 rtp_info->ssrc = 0x1234; // Just an arbitrary SSRC.
423 rtp_info->payloadType = 98; // WB CNG.
424 rtp_info->markerBit = 0;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000425 payload[0] = 64; // Noise level -64 dBov, quite arbitrarily chosen.
426 *payload_len = 1; // Only noise level, no spectral parameters.
427}
428
ivoc72c08ed2016-01-20 07:26:24 -0800429#if !defined(WEBRTC_IOS) && defined(WEBRTC_NETEQ_UNITTEST_BITEXACT) && \
430 (defined(WEBRTC_CODEC_ISAC) || defined(WEBRTC_CODEC_ISACFX)) && \
431 defined(WEBRTC_CODEC_ILBC) && defined(WEBRTC_CODEC_G722) && \
pbosc7a65692016-05-06 12:50:04 -0700432 !defined(WEBRTC_ARCH_ARM64)
minyue5f026d02015-12-16 07:36:04 -0800433#define MAYBE_TestBitExactness TestBitExactness
kwiberg98ab3a42015-09-30 21:54:21 -0700434#else
minyue5f026d02015-12-16 07:36:04 -0800435#define MAYBE_TestBitExactness DISABLED_TestBitExactness
kwiberg98ab3a42015-09-30 21:54:21 -0700436#endif
minyue5f026d02015-12-16 07:36:04 -0800437TEST_F(NetEqDecodingTest, MAYBE_TestBitExactness) {
minyue49c454e2016-01-08 11:30:14 -0800438 const std::string input_rtp_file =
439 webrtc::test::ResourcePath("audio_coding/neteq_universal_new", "rtp");
henrik.lundin@webrtc.org4e4b0982014-08-11 14:48:49 +0000440
minyue4f906772016-04-29 11:05:14 -0700441 const std::string output_checksum = PlatformChecksum(
soren9f2c18e2017-04-10 02:22:46 -0700442 "09fa7646e2ad032a0b156177b95f09012430f81f",
443 "1c64eb8b55ce8878676c6a1e6ddd78f48de0668b",
444 "09fa7646e2ad032a0b156177b95f09012430f81f",
445 "759fef89a5de52bd17e733dc255c671ce86be909");
minyue4f906772016-04-29 11:05:14 -0700446
henrik.lundin2979f552017-05-05 05:04:16 -0700447 const std::string network_stats_checksum =
minyue-webrtc0c3ca752017-08-23 15:59:38 +0200448 PlatformChecksum("5b4262ca328e5f066af5d34f3380521583dd20de",
449 "80235b6d727281203acb63b98f9a9e85d95f7ec0",
450 "5b4262ca328e5f066af5d34f3380521583dd20de",
451 "5b4262ca328e5f066af5d34f3380521583dd20de");
minyue4f906772016-04-29 11:05:14 -0700452
453 const std::string rtcp_stats_checksum = PlatformChecksum(
454 "b8880bf9fed2487efbddcb8d94b9937a29ae521d",
455 "f3f7b3d3e71d7e635240b5373b57df6a7e4ce9d4",
456 "b8880bf9fed2487efbddcb8d94b9937a29ae521d",
457 "b8880bf9fed2487efbddcb8d94b9937a29ae521d");
458
459 DecodeAndCompare(input_rtp_file,
460 output_checksum,
461 network_stats_checksum,
462 rtcp_stats_checksum,
oprypin9b2f20c2017-08-29 05:51:57 -0700463 FLAG_gen_ref);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000464}
465
minyue93c08b72015-12-22 09:57:41 -0800466#if !defined(WEBRTC_IOS) && !defined(WEBRTC_ANDROID) && \
467 defined(WEBRTC_NETEQ_UNITTEST_BITEXACT) && \
minyue-webrtc516711c2017-07-27 17:45:49 +0200468 defined(WEBRTC_CODEC_OPUS)
minyue93c08b72015-12-22 09:57:41 -0800469#define MAYBE_TestOpusBitExactness TestOpusBitExactness
470#else
471#define MAYBE_TestOpusBitExactness DISABLED_TestOpusBitExactness
472#endif
minyue-webrtcadb58b82017-07-26 17:59:59 +0200473TEST_F(NetEqDecodingTest, MAYBE_TestOpusBitExactness) {
minyue93c08b72015-12-22 09:57:41 -0800474 const std::string input_rtp_file =
475 webrtc::test::ResourcePath("audio_coding/neteq_opus", "rtp");
minyue93c08b72015-12-22 09:57:41 -0800476
minyue4f906772016-04-29 11:05:14 -0700477 const std::string output_checksum = PlatformChecksum(
minyue-webrtcadb58b82017-07-26 17:59:59 +0200478 "721e1e0c6effe4b2401536a4eef11512c9fb709c",
479 "721e1e0c6effe4b2401536a4eef11512c9fb709c",
480 "721e1e0c6effe4b2401536a4eef11512c9fb709c",
481 "721e1e0c6effe4b2401536a4eef11512c9fb709c");
minyue4f906772016-04-29 11:05:14 -0700482
henrik.lundin2979f552017-05-05 05:04:16 -0700483 const std::string network_stats_checksum =
minyue-webrtc0c3ca752017-08-23 15:59:38 +0200484 PlatformChecksum("4e749c46e2611877120ac7a20cbbe555cfbd70ea",
485 "4e749c46e2611877120ac7a20cbbe555cfbd70ea",
486 "4e749c46e2611877120ac7a20cbbe555cfbd70ea",
487 "4e749c46e2611877120ac7a20cbbe555cfbd70ea");
minyue4f906772016-04-29 11:05:14 -0700488
489 const std::string rtcp_stats_checksum = PlatformChecksum(
490 "e37c797e3de6a64dda88c9ade7a013d022a2e1e0",
491 "e37c797e3de6a64dda88c9ade7a013d022a2e1e0",
492 "e37c797e3de6a64dda88c9ade7a013d022a2e1e0",
493 "e37c797e3de6a64dda88c9ade7a013d022a2e1e0");
494
495 DecodeAndCompare(input_rtp_file,
496 output_checksum,
497 network_stats_checksum,
498 rtcp_stats_checksum,
oprypin9b2f20c2017-08-29 05:51:57 -0700499 FLAG_gen_ref);
minyue93c08b72015-12-22 09:57:41 -0800500}
501
henrik.lundin@webrtc.org7cbc4f92014-10-07 06:37:39 +0000502// Use fax mode to avoid time-scaling. This is to simplify the testing of
503// packet waiting times in the packet buffer.
504class NetEqDecodingTestFaxMode : public NetEqDecodingTest {
505 protected:
506 NetEqDecodingTestFaxMode() : NetEqDecodingTest() {
507 config_.playout_mode = kPlayoutFax;
508 }
509};
510
511TEST_F(NetEqDecodingTestFaxMode, TestFrameWaitingTimeStatistics) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000512 // Insert 30 dummy packets at once. Each packet contains 10 ms 16 kHz audio.
513 size_t num_frames = 30;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000514 const size_t kSamples = 10 * 16;
515 const size_t kPayloadBytes = kSamples * 2;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000516 for (size_t i = 0; i < num_frames; ++i) {
kwibergee2bac22015-11-11 10:34:00 -0800517 const uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700518 RTPHeader rtp_info;
519 rtp_info.sequenceNumber = i;
520 rtp_info.timestamp = i * kSamples;
521 rtp_info.ssrc = 0x1234; // Just an arbitrary SSRC.
522 rtp_info.payloadType = 94; // PCM16b WB codec.
523 rtp_info.markerBit = 0;
524 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000525 }
526 // Pull out all data.
527 for (size_t i = 0; i < num_frames; ++i) {
henrik.lundin7a926812016-05-12 13:51:28 -0700528 bool muted;
529 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800530 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000531 }
532
Henrik Lundin1bb8cf82015-08-25 13:08:04 +0200533 NetEqNetworkStatistics stats;
534 EXPECT_EQ(0, neteq_->NetworkStatistics(&stats));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000535 // Since all frames are dumped into NetEQ at once, but pulled out with 10 ms
536 // spacing (per definition), we expect the delay to increase with 10 ms for
Henrik Lundin1bb8cf82015-08-25 13:08:04 +0200537 // each packet. Thus, we are calculating the statistics for a series from 10
538 // to 300, in steps of 10 ms.
539 EXPECT_EQ(155, stats.mean_waiting_time_ms);
540 EXPECT_EQ(155, stats.median_waiting_time_ms);
541 EXPECT_EQ(10, stats.min_waiting_time_ms);
542 EXPECT_EQ(300, stats.max_waiting_time_ms);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000543
544 // Check statistics again and make sure it's been reset.
Henrik Lundin1bb8cf82015-08-25 13:08:04 +0200545 EXPECT_EQ(0, neteq_->NetworkStatistics(&stats));
546 EXPECT_EQ(-1, stats.mean_waiting_time_ms);
547 EXPECT_EQ(-1, stats.median_waiting_time_ms);
548 EXPECT_EQ(-1, stats.min_waiting_time_ms);
549 EXPECT_EQ(-1, stats.max_waiting_time_ms);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000550}
551
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000552TEST_F(NetEqDecodingTest, TestAverageInterArrivalTimeNegative) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000553 const int kNumFrames = 3000; // Needed for convergence.
554 int frame_index = 0;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000555 const size_t kSamples = 10 * 16;
556 const size_t kPayloadBytes = kSamples * 2;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000557 while (frame_index < kNumFrames) {
558 // Insert one packet each time, except every 10th time where we insert two
559 // packets at once. This will create a negative clock-drift of approx. 10%.
560 int num_packets = (frame_index % 10 == 0 ? 2 : 1);
561 for (int n = 0; n < num_packets; ++n) {
562 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700563 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000564 PopulateRtpInfo(frame_index, frame_index * kSamples, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700565 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000566 ++frame_index;
567 }
568
569 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700570 bool muted;
571 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800572 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000573 }
574
575 NetEqNetworkStatistics network_stats;
576 ASSERT_EQ(0, neteq_->NetworkStatistics(&network_stats));
henrik.lundin0d838572016-10-13 03:35:55 -0700577 EXPECT_EQ(-103192, network_stats.clockdrift_ppm);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000578}
579
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000580TEST_F(NetEqDecodingTest, TestAverageInterArrivalTimePositive) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000581 const int kNumFrames = 5000; // Needed for convergence.
582 int frame_index = 0;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000583 const size_t kSamples = 10 * 16;
584 const size_t kPayloadBytes = kSamples * 2;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000585 for (int i = 0; i < kNumFrames; ++i) {
586 // Insert one packet each time, except every 10th time where we don't insert
587 // any packet. This will create a positive clock-drift of approx. 11%.
588 int num_packets = (i % 10 == 9 ? 0 : 1);
589 for (int n = 0; n < num_packets; ++n) {
590 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700591 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000592 PopulateRtpInfo(frame_index, frame_index * kSamples, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700593 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000594 ++frame_index;
595 }
596
597 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700598 bool muted;
599 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800600 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000601 }
602
603 NetEqNetworkStatistics network_stats;
604 ASSERT_EQ(0, neteq_->NetworkStatistics(&network_stats));
henrik.lundin0d838572016-10-13 03:35:55 -0700605 EXPECT_EQ(110953, network_stats.clockdrift_ppm);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000606}
607
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000608void NetEqDecodingTest::LongCngWithClockDrift(double drift_factor,
609 double network_freeze_ms,
610 bool pull_audio_during_freeze,
611 int delay_tolerance_ms,
612 int max_time_to_speech_ms) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000613 uint16_t seq_no = 0;
614 uint32_t timestamp = 0;
615 const int kFrameSizeMs = 30;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000616 const size_t kSamples = kFrameSizeMs * 16;
617 const size_t kPayloadBytes = kSamples * 2;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000618 double next_input_time_ms = 0.0;
619 double t_ms;
henrik.lundin7a926812016-05-12 13:51:28 -0700620 bool muted;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000621
622 // Insert speech for 5 seconds.
623 const int kSpeechDurationMs = 5000;
624 for (t_ms = 0; t_ms < kSpeechDurationMs; t_ms += 10) {
625 // Each turn in this for loop is 10 ms.
626 while (next_input_time_ms <= t_ms) {
627 // Insert one 30 ms speech frame.
628 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700629 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000630 PopulateRtpInfo(seq_no, timestamp, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700631 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000632 ++seq_no;
633 timestamp += kSamples;
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000634 next_input_time_ms += static_cast<double>(kFrameSizeMs) * drift_factor;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000635 }
636 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700637 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800638 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000639 }
640
henrik.lundin55480f52016-03-08 02:37:57 -0800641 EXPECT_EQ(AudioFrame::kNormalSpeech, out_frame_.speech_type_);
henrik.lundin114c1b32017-04-26 07:47:32 -0700642 rtc::Optional<uint32_t> playout_timestamp = neteq_->GetPlayoutTimestamp();
henrik.lundin0d96ab72016-04-06 12:28:26 -0700643 ASSERT_TRUE(playout_timestamp);
644 int32_t delay_before = timestamp - *playout_timestamp;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000645
646 // Insert CNG for 1 minute (= 60000 ms).
647 const int kCngPeriodMs = 100;
648 const int kCngPeriodSamples = kCngPeriodMs * 16; // Period in 16 kHz samples.
649 const int kCngDurationMs = 60000;
650 for (; t_ms < kSpeechDurationMs + kCngDurationMs; t_ms += 10) {
651 // Each turn in this for loop is 10 ms.
652 while (next_input_time_ms <= t_ms) {
653 // Insert one CNG frame each 100 ms.
654 uint8_t payload[kPayloadBytes];
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000655 size_t payload_len;
henrik.lundin246ef3e2017-04-24 09:14:32 -0700656 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000657 PopulateCng(seq_no, timestamp, &rtp_info, payload, &payload_len);
kwibergee2bac22015-11-11 10:34:00 -0800658 ASSERT_EQ(0, neteq_->InsertPacket(
henrik.lundin246ef3e2017-04-24 09:14:32 -0700659 rtp_info,
kwibergee2bac22015-11-11 10:34:00 -0800660 rtc::ArrayView<const uint8_t>(payload, payload_len), 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000661 ++seq_no;
662 timestamp += kCngPeriodSamples;
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000663 next_input_time_ms += static_cast<double>(kCngPeriodMs) * drift_factor;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000664 }
665 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700666 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800667 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000668 }
669
henrik.lundin55480f52016-03-08 02:37:57 -0800670 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000671
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000672 if (network_freeze_ms > 0) {
673 // First keep pulling audio for |network_freeze_ms| without inserting
674 // any data, then insert CNG data corresponding to |network_freeze_ms|
675 // without pulling any output audio.
676 const double loop_end_time = t_ms + network_freeze_ms;
677 for (; t_ms < loop_end_time; t_ms += 10) {
678 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700679 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800680 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -0800681 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000682 }
683 bool pull_once = pull_audio_during_freeze;
684 // If |pull_once| is true, GetAudio will be called once half-way through
685 // the network recovery period.
686 double pull_time_ms = (t_ms + next_input_time_ms) / 2;
687 while (next_input_time_ms <= t_ms) {
688 if (pull_once && next_input_time_ms >= pull_time_ms) {
689 pull_once = false;
690 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700691 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800692 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -0800693 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000694 t_ms += 10;
695 }
696 // Insert one CNG frame each 100 ms.
697 uint8_t payload[kPayloadBytes];
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000698 size_t payload_len;
henrik.lundin246ef3e2017-04-24 09:14:32 -0700699 RTPHeader rtp_info;
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000700 PopulateCng(seq_no, timestamp, &rtp_info, payload, &payload_len);
kwibergee2bac22015-11-11 10:34:00 -0800701 ASSERT_EQ(0, neteq_->InsertPacket(
henrik.lundin246ef3e2017-04-24 09:14:32 -0700702 rtp_info,
kwibergee2bac22015-11-11 10:34:00 -0800703 rtc::ArrayView<const uint8_t>(payload, payload_len), 0));
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000704 ++seq_no;
705 timestamp += kCngPeriodSamples;
706 next_input_time_ms += kCngPeriodMs * drift_factor;
707 }
708 }
709
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000710 // Insert speech again until output type is speech.
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000711 double speech_restart_time_ms = t_ms;
henrik.lundin55480f52016-03-08 02:37:57 -0800712 while (out_frame_.speech_type_ != AudioFrame::kNormalSpeech) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000713 // Each turn in this for loop is 10 ms.
714 while (next_input_time_ms <= t_ms) {
715 // Insert one 30 ms speech frame.
716 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700717 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000718 PopulateRtpInfo(seq_no, timestamp, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700719 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000720 ++seq_no;
721 timestamp += kSamples;
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000722 next_input_time_ms += kFrameSizeMs * drift_factor;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000723 }
724 // Pull out data once.
henrik.lundin7a926812016-05-12 13:51:28 -0700725 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800726 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000727 // Increase clock.
728 t_ms += 10;
729 }
730
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000731 // Check that the speech starts again within reasonable time.
732 double time_until_speech_returns_ms = t_ms - speech_restart_time_ms;
733 EXPECT_LT(time_until_speech_returns_ms, max_time_to_speech_ms);
henrik.lundin114c1b32017-04-26 07:47:32 -0700734 playout_timestamp = neteq_->GetPlayoutTimestamp();
henrik.lundin0d96ab72016-04-06 12:28:26 -0700735 ASSERT_TRUE(playout_timestamp);
736 int32_t delay_after = timestamp - *playout_timestamp;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000737 // Compare delay before and after, and make sure it differs less than 20 ms.
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000738 EXPECT_LE(delay_after, delay_before + delay_tolerance_ms * 16);
739 EXPECT_GE(delay_after, delay_before - delay_tolerance_ms * 16);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000740}
741
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000742TEST_F(NetEqDecodingTest, LongCngWithNegativeClockDrift) {
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000743 // Apply a clock drift of -25 ms / s (sender faster than receiver).
744 const double kDriftFactor = 1000.0 / (1000.0 + 25.0);
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000745 const double kNetworkFreezeTimeMs = 0.0;
746 const bool kGetAudioDuringFreezeRecovery = false;
747 const int kDelayToleranceMs = 20;
748 const int kMaxTimeToSpeechMs = 100;
749 LongCngWithClockDrift(kDriftFactor,
750 kNetworkFreezeTimeMs,
751 kGetAudioDuringFreezeRecovery,
752 kDelayToleranceMs,
753 kMaxTimeToSpeechMs);
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000754}
755
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000756TEST_F(NetEqDecodingTest, LongCngWithPositiveClockDrift) {
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000757 // Apply a clock drift of +25 ms / s (sender slower than receiver).
758 const double kDriftFactor = 1000.0 / (1000.0 - 25.0);
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000759 const double kNetworkFreezeTimeMs = 0.0;
760 const bool kGetAudioDuringFreezeRecovery = false;
761 const int kDelayToleranceMs = 20;
762 const int kMaxTimeToSpeechMs = 100;
763 LongCngWithClockDrift(kDriftFactor,
764 kNetworkFreezeTimeMs,
765 kGetAudioDuringFreezeRecovery,
766 kDelayToleranceMs,
767 kMaxTimeToSpeechMs);
768}
769
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000770TEST_F(NetEqDecodingTest, LongCngWithNegativeClockDriftNetworkFreeze) {
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000771 // Apply a clock drift of -25 ms / s (sender faster than receiver).
772 const double kDriftFactor = 1000.0 / (1000.0 + 25.0);
773 const double kNetworkFreezeTimeMs = 5000.0;
774 const bool kGetAudioDuringFreezeRecovery = false;
775 const int kDelayToleranceMs = 50;
776 const int kMaxTimeToSpeechMs = 200;
777 LongCngWithClockDrift(kDriftFactor,
778 kNetworkFreezeTimeMs,
779 kGetAudioDuringFreezeRecovery,
780 kDelayToleranceMs,
781 kMaxTimeToSpeechMs);
782}
783
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000784TEST_F(NetEqDecodingTest, LongCngWithPositiveClockDriftNetworkFreeze) {
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000785 // Apply a clock drift of +25 ms / s (sender slower than receiver).
786 const double kDriftFactor = 1000.0 / (1000.0 - 25.0);
787 const double kNetworkFreezeTimeMs = 5000.0;
788 const bool kGetAudioDuringFreezeRecovery = false;
789 const int kDelayToleranceMs = 20;
790 const int kMaxTimeToSpeechMs = 100;
791 LongCngWithClockDrift(kDriftFactor,
792 kNetworkFreezeTimeMs,
793 kGetAudioDuringFreezeRecovery,
794 kDelayToleranceMs,
795 kMaxTimeToSpeechMs);
796}
797
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000798TEST_F(NetEqDecodingTest, LongCngWithPositiveClockDriftNetworkFreezeExtraPull) {
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000799 // Apply a clock drift of +25 ms / s (sender slower than receiver).
800 const double kDriftFactor = 1000.0 / (1000.0 - 25.0);
801 const double kNetworkFreezeTimeMs = 5000.0;
802 const bool kGetAudioDuringFreezeRecovery = true;
803 const int kDelayToleranceMs = 20;
804 const int kMaxTimeToSpeechMs = 100;
805 LongCngWithClockDrift(kDriftFactor,
806 kNetworkFreezeTimeMs,
807 kGetAudioDuringFreezeRecovery,
808 kDelayToleranceMs,
809 kMaxTimeToSpeechMs);
810}
811
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000812TEST_F(NetEqDecodingTest, LongCngWithoutClockDrift) {
henrik.lundin@webrtc.org24779fe2014-03-14 12:40:05 +0000813 const double kDriftFactor = 1.0; // No drift.
814 const double kNetworkFreezeTimeMs = 0.0;
815 const bool kGetAudioDuringFreezeRecovery = false;
816 const int kDelayToleranceMs = 10;
817 const int kMaxTimeToSpeechMs = 50;
818 LongCngWithClockDrift(kDriftFactor,
819 kNetworkFreezeTimeMs,
820 kGetAudioDuringFreezeRecovery,
821 kDelayToleranceMs,
822 kMaxTimeToSpeechMs);
henrik.lundin@webrtc.orgfcfc6a92014-02-13 11:42:28 +0000823}
824
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000825TEST_F(NetEqDecodingTest, UnknownPayloadType) {
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000826 const size_t kPayloadBytes = 100;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000827 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700828 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000829 PopulateRtpInfo(0, 0, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700830 rtp_info.payloadType = 1; // Not registered as a decoder.
831 EXPECT_EQ(NetEq::kFail, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000832}
833
Peter Boströme2976c82016-01-04 22:44:05 +0100834#if defined(WEBRTC_CODEC_ISAC) || defined(WEBRTC_CODEC_ISACFX)
ivoc72c08ed2016-01-20 07:26:24 -0800835#define MAYBE_DecoderError DecoderError
836#else
837#define MAYBE_DecoderError DISABLED_DecoderError
838#endif
839
Peter Boströme2976c82016-01-04 22:44:05 +0100840TEST_F(NetEqDecodingTest, MAYBE_DecoderError) {
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +0000841 const size_t kPayloadBytes = 100;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000842 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -0700843 RTPHeader rtp_info;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000844 PopulateRtpInfo(0, 0, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700845 rtp_info.payloadType = 103; // iSAC, but the payload is invalid.
846 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000847 // Set all of |out_data_| to 1, and verify that it was set to 0 by the call
848 // to GetAudio.
yujo36b1a5f2017-06-12 12:45:32 -0700849 int16_t* out_frame_data = out_frame_.mutable_data();
henrik.lundin6d8e0112016-03-04 10:34:21 -0800850 for (size_t i = 0; i < AudioFrame::kMaxDataSizeSamples; ++i) {
yujo36b1a5f2017-06-12 12:45:32 -0700851 out_frame_data[i] = 1;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000852 }
henrik.lundin7a926812016-05-12 13:51:28 -0700853 bool muted;
854 EXPECT_EQ(NetEq::kFail, neteq_->GetAudio(&out_frame_, &muted));
855 ASSERT_FALSE(muted);
ivoc72c08ed2016-01-20 07:26:24 -0800856
yujo36b1a5f2017-06-12 12:45:32 -0700857 // Verify that the first 160 samples are set to 0.
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000858 static const int kExpectedOutputLength = 160; // 10 ms at 16 kHz sample rate.
yujo36b1a5f2017-06-12 12:45:32 -0700859 const int16_t* const_out_frame_data = out_frame_.data();
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000860 for (int i = 0; i < kExpectedOutputLength; ++i) {
861 std::ostringstream ss;
862 ss << "i = " << i;
863 SCOPED_TRACE(ss.str()); // Print out the parameter values on failure.
yujo36b1a5f2017-06-12 12:45:32 -0700864 EXPECT_EQ(0, const_out_frame_data[i]);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000865 }
866}
867
henrik.lundin@webrtc.orgb4e80e02014-05-15 07:14:00 +0000868TEST_F(NetEqDecodingTest, GetAudioBeforeInsertPacket) {
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000869 // Set all of |out_data_| to 1, and verify that it was set to 0 by the call
870 // to GetAudio.
yujo36b1a5f2017-06-12 12:45:32 -0700871 int16_t* out_frame_data = out_frame_.mutable_data();
henrik.lundin6d8e0112016-03-04 10:34:21 -0800872 for (size_t i = 0; i < AudioFrame::kMaxDataSizeSamples; ++i) {
yujo36b1a5f2017-06-12 12:45:32 -0700873 out_frame_data[i] = 1;
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000874 }
henrik.lundin7a926812016-05-12 13:51:28 -0700875 bool muted;
876 EXPECT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
877 ASSERT_FALSE(muted);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000878 // Verify that the first block of samples is set to 0.
879 static const int kExpectedOutputLength =
880 kInitSampleRateHz / 100; // 10 ms at initial sample rate.
yujo36b1a5f2017-06-12 12:45:32 -0700881 const int16_t* const_out_frame_data = out_frame_.data();
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000882 for (int i = 0; i < kExpectedOutputLength; ++i) {
883 std::ostringstream ss;
884 ss << "i = " << i;
885 SCOPED_TRACE(ss.str()); // Print out the parameter values on failure.
yujo36b1a5f2017-06-12 12:45:32 -0700886 EXPECT_EQ(0, const_out_frame_data[i]);
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000887 }
henrik.lundind89814b2015-11-23 06:49:25 -0800888 // Verify that the sample rate did not change from the initial configuration.
889 EXPECT_EQ(config_.sample_rate_hz, neteq_->last_output_sample_rate_hz());
henrik.lundin@webrtc.orgd94659d2013-01-29 12:09:21 +0000890}
turaj@webrtc.orgff43c852013-09-25 00:07:27 +0000891
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000892class NetEqBgnTest : public NetEqDecodingTest {
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000893 protected:
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000894 virtual void TestCondition(double sum_squared_noise,
895 bool should_be_faded) = 0;
turaj@webrtc.orgff43c852013-09-25 00:07:27 +0000896
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000897 void CheckBgn(int sampling_rate_hz) {
Peter Kastingdce40cf2015-08-24 14:52:23 -0700898 size_t expected_samples_per_channel = 0;
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000899 uint8_t payload_type = 0xFF; // Invalid.
900 if (sampling_rate_hz == 8000) {
901 expected_samples_per_channel = kBlockSize8kHz;
902 payload_type = 93; // PCM 16, 8 kHz.
903 } else if (sampling_rate_hz == 16000) {
904 expected_samples_per_channel = kBlockSize16kHz;
905 payload_type = 94; // PCM 16, 16 kHZ.
906 } else if (sampling_rate_hz == 32000) {
907 expected_samples_per_channel = kBlockSize32kHz;
908 payload_type = 95; // PCM 16, 32 kHz.
909 } else {
910 ASSERT_TRUE(false); // Unsupported test case.
911 }
turaj@webrtc.orgff43c852013-09-25 00:07:27 +0000912
henrik.lundin6d8e0112016-03-04 10:34:21 -0800913 AudioFrame output;
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000914 test::AudioLoop input;
915 // We are using the same 32 kHz input file for all tests, regardless of
916 // |sampling_rate_hz|. The output may sound weird, but the test is still
917 // valid.
918 ASSERT_TRUE(input.Init(
919 webrtc::test::ResourcePath("audio_coding/testfile32kHz", "pcm"),
920 10 * sampling_rate_hz, // Max 10 seconds loop length.
Peter Kastingdce40cf2015-08-24 14:52:23 -0700921 expected_samples_per_channel));
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000922
923 // Payload of 10 ms of PCM16 32 kHz.
924 uint8_t payload[kBlockSize32kHz * sizeof(int16_t)];
henrik.lundin246ef3e2017-04-24 09:14:32 -0700925 RTPHeader rtp_info;
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000926 PopulateRtpInfo(0, 0, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -0700927 rtp_info.payloadType = payload_type;
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000928
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000929 uint32_t receive_timestamp = 0;
henrik.lundin7a926812016-05-12 13:51:28 -0700930 bool muted;
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000931 for (int n = 0; n < 10; ++n) { // Insert few packets and get audio.
kwiberg288886b2015-11-06 01:21:35 -0800932 auto block = input.GetNextBlock();
933 ASSERT_EQ(expected_samples_per_channel, block.size());
934 size_t enc_len_bytes =
935 WebRtcPcm16b_Encode(block.data(), block.size(), payload);
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000936 ASSERT_EQ(enc_len_bytes, expected_samples_per_channel * 2);
937
Henrik Lundin70c09bd2017-04-24 15:56:56 +0200938 ASSERT_EQ(0, neteq_->InsertPacket(
henrik.lundin246ef3e2017-04-24 09:14:32 -0700939 rtp_info,
Henrik Lundin70c09bd2017-04-24 15:56:56 +0200940 rtc::ArrayView<const uint8_t>(payload, enc_len_bytes),
941 receive_timestamp));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800942 output.Reset();
henrik.lundin7a926812016-05-12 13:51:28 -0700943 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800944 ASSERT_EQ(1u, output.num_channels_);
945 ASSERT_EQ(expected_samples_per_channel, output.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -0800946 ASSERT_EQ(AudioFrame::kNormalSpeech, output.speech_type_);
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000947
948 // Next packet.
henrik.lundin246ef3e2017-04-24 09:14:32 -0700949 rtp_info.timestamp += expected_samples_per_channel;
950 rtp_info.sequenceNumber++;
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000951 receive_timestamp += expected_samples_per_channel;
952 }
953
henrik.lundin6d8e0112016-03-04 10:34:21 -0800954 output.Reset();
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000955
956 // Get audio without inserting packets, expecting PLC and PLC-to-CNG. Pull
957 // one frame without checking speech-type. This is the first frame pulled
958 // without inserting any packet, and might not be labeled as PLC.
henrik.lundin7a926812016-05-12 13:51:28 -0700959 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -0800960 ASSERT_EQ(1u, output.num_channels_);
961 ASSERT_EQ(expected_samples_per_channel, output.samples_per_channel_);
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000962
963 // To be able to test the fading of background noise we need at lease to
964 // pull 611 frames.
965 const int kFadingThreshold = 611;
966
967 // Test several CNG-to-PLC packet for the expected behavior. The number 20
968 // is arbitrary, but sufficiently large to test enough number of frames.
969 const int kNumPlcToCngTestFrames = 20;
970 bool plc_to_cng = false;
971 for (int n = 0; n < kFadingThreshold + kNumPlcToCngTestFrames; ++n) {
henrik.lundin6d8e0112016-03-04 10:34:21 -0800972 output.Reset();
yujo36b1a5f2017-06-12 12:45:32 -0700973 // Set to non-zero.
974 memset(output.mutable_data(), 1, AudioFrame::kMaxDataSizeBytes);
henrik.lundin7a926812016-05-12 13:51:28 -0700975 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
976 ASSERT_FALSE(muted);
henrik.lundin6d8e0112016-03-04 10:34:21 -0800977 ASSERT_EQ(1u, output.num_channels_);
978 ASSERT_EQ(expected_samples_per_channel, output.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -0800979 if (output.speech_type_ == AudioFrame::kPLCCNG) {
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000980 plc_to_cng = true;
981 double sum_squared = 0;
yujo36b1a5f2017-06-12 12:45:32 -0700982 const int16_t* output_data = output.data();
henrik.lundin6d8e0112016-03-04 10:34:21 -0800983 for (size_t k = 0;
984 k < output.num_channels_ * output.samples_per_channel_; ++k)
yujo36b1a5f2017-06-12 12:45:32 -0700985 sum_squared += output_data[k] * output_data[k];
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000986 TestCondition(sum_squared, n > kFadingThreshold);
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000987 } else {
henrik.lundin55480f52016-03-08 02:37:57 -0800988 EXPECT_EQ(AudioFrame::kPLC, output.speech_type_);
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +0000989 }
990 }
991 EXPECT_TRUE(plc_to_cng); // Just to be sure that PLC-to-CNG has occurred.
992 }
993};
994
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +0000995class NetEqBgnTestOn : public NetEqBgnTest {
996 protected:
997 NetEqBgnTestOn() : NetEqBgnTest() {
998 config_.background_noise_mode = NetEq::kBgnOn;
999 }
1000
1001 void TestCondition(double sum_squared_noise, bool /*should_be_faded*/) {
1002 EXPECT_NE(0, sum_squared_noise);
1003 }
1004};
1005
1006class NetEqBgnTestOff : public NetEqBgnTest {
1007 protected:
1008 NetEqBgnTestOff() : NetEqBgnTest() {
1009 config_.background_noise_mode = NetEq::kBgnOff;
1010 }
1011
1012 void TestCondition(double sum_squared_noise, bool /*should_be_faded*/) {
1013 EXPECT_EQ(0, sum_squared_noise);
1014 }
1015};
1016
1017class NetEqBgnTestFade : public NetEqBgnTest {
1018 protected:
1019 NetEqBgnTestFade() : NetEqBgnTest() {
1020 config_.background_noise_mode = NetEq::kBgnFade;
1021 }
1022
1023 void TestCondition(double sum_squared_noise, bool should_be_faded) {
1024 if (should_be_faded)
1025 EXPECT_EQ(0, sum_squared_noise);
1026 }
1027};
1028
henrika1d34fe92015-06-16 10:04:20 +02001029TEST_F(NetEqBgnTestOn, RunTest) {
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +00001030 CheckBgn(8000);
1031 CheckBgn(16000);
1032 CheckBgn(32000);
turaj@webrtc.orgff43c852013-09-25 00:07:27 +00001033}
turaj@webrtc.org7b75ac62013-09-26 00:27:56 +00001034
henrika1d34fe92015-06-16 10:04:20 +02001035TEST_F(NetEqBgnTestOff, RunTest) {
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +00001036 CheckBgn(8000);
1037 CheckBgn(16000);
1038 CheckBgn(32000);
1039}
1040
henrika1d34fe92015-06-16 10:04:20 +02001041TEST_F(NetEqBgnTestFade, RunTest) {
henrik.lundin@webrtc.org9b8102c2014-08-21 08:27:44 +00001042 CheckBgn(8000);
1043 CheckBgn(16000);
1044 CheckBgn(32000);
1045}
henrik.lundin@webrtc.orgea257842014-08-07 12:27:37 +00001046
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001047void NetEqDecodingTest::WrapTest(uint16_t start_seq_no,
1048 uint32_t start_timestamp,
1049 const std::set<uint16_t>& drop_seq_numbers,
1050 bool expect_seq_no_wrap,
1051 bool expect_timestamp_wrap) {
1052 uint16_t seq_no = start_seq_no;
1053 uint32_t timestamp = start_timestamp;
1054 const int kBlocksPerFrame = 3; // Number of 10 ms blocks per frame.
1055 const int kFrameSizeMs = kBlocksPerFrame * kTimeStepMs;
1056 const int kSamples = kBlockSize16kHz * kBlocksPerFrame;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +00001057 const size_t kPayloadBytes = kSamples * sizeof(int16_t);
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001058 double next_input_time_ms = 0.0;
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001059 uint32_t receive_timestamp = 0;
1060
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001061 // Insert speech for 2 seconds.
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001062 const int kSpeechDurationMs = 2000;
1063 int packets_inserted = 0;
1064 uint16_t last_seq_no;
1065 uint32_t last_timestamp;
1066 bool timestamp_wrapped = false;
1067 bool seq_no_wrapped = false;
1068 for (double t_ms = 0; t_ms < kSpeechDurationMs; t_ms += 10) {
1069 // Each turn in this for loop is 10 ms.
1070 while (next_input_time_ms <= t_ms) {
1071 // Insert one 30 ms speech frame.
1072 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -07001073 RTPHeader rtp_info;
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001074 PopulateRtpInfo(seq_no, timestamp, &rtp_info);
1075 if (drop_seq_numbers.find(seq_no) == drop_seq_numbers.end()) {
1076 // This sequence number was not in the set to drop. Insert it.
henrik.lundin246ef3e2017-04-24 09:14:32 -07001077 ASSERT_EQ(0,
1078 neteq_->InsertPacket(rtp_info, payload, receive_timestamp));
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001079 ++packets_inserted;
1080 }
1081 NetEqNetworkStatistics network_stats;
1082 ASSERT_EQ(0, neteq_->NetworkStatistics(&network_stats));
1083
1084 // Due to internal NetEq logic, preferred buffer-size is about 4 times the
1085 // packet size for first few packets. Therefore we refrain from checking
1086 // the criteria.
1087 if (packets_inserted > 4) {
1088 // Expect preferred and actual buffer size to be no more than 2 frames.
1089 EXPECT_LE(network_stats.preferred_buffer_size_ms, kFrameSizeMs * 2);
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +00001090 EXPECT_LE(network_stats.current_buffer_size_ms, kFrameSizeMs * 2 +
1091 algorithmic_delay_ms_);
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001092 }
1093 last_seq_no = seq_no;
1094 last_timestamp = timestamp;
1095
1096 ++seq_no;
1097 timestamp += kSamples;
1098 receive_timestamp += kSamples;
1099 next_input_time_ms += static_cast<double>(kFrameSizeMs);
1100
1101 seq_no_wrapped |= seq_no < last_seq_no;
1102 timestamp_wrapped |= timestamp < last_timestamp;
1103 }
1104 // Pull out data once.
henrik.lundin6d8e0112016-03-04 10:34:21 -08001105 AudioFrame output;
henrik.lundin7a926812016-05-12 13:51:28 -07001106 bool muted;
1107 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001108 ASSERT_EQ(kBlockSize16kHz, output.samples_per_channel_);
1109 ASSERT_EQ(1u, output.num_channels_);
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001110
1111 // Expect delay (in samples) to be less than 2 packets.
henrik.lundin114c1b32017-04-26 07:47:32 -07001112 rtc::Optional<uint32_t> playout_timestamp = neteq_->GetPlayoutTimestamp();
henrik.lundin0d96ab72016-04-06 12:28:26 -07001113 ASSERT_TRUE(playout_timestamp);
1114 EXPECT_LE(timestamp - *playout_timestamp,
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001115 static_cast<uint32_t>(kSamples * 2));
turaj@webrtc.org78b41a02013-11-22 20:27:07 +00001116 }
1117 // Make sure we have actually tested wrap-around.
1118 ASSERT_EQ(expect_seq_no_wrap, seq_no_wrapped);
1119 ASSERT_EQ(expect_timestamp_wrap, timestamp_wrapped);
1120}
1121
1122TEST_F(NetEqDecodingTest, SequenceNumberWrap) {
1123 // Start with a sequence number that will soon wrap.
1124 std::set<uint16_t> drop_seq_numbers; // Don't drop any packets.
1125 WrapTest(0xFFFF - 10, 0, drop_seq_numbers, true, false);
1126}
1127
1128TEST_F(NetEqDecodingTest, SequenceNumberWrapAndDrop) {
1129 // Start with a sequence number that will soon wrap.
1130 std::set<uint16_t> drop_seq_numbers;
1131 drop_seq_numbers.insert(0xFFFF);
1132 drop_seq_numbers.insert(0x0);
1133 WrapTest(0xFFFF - 10, 0, drop_seq_numbers, true, false);
1134}
1135
1136TEST_F(NetEqDecodingTest, TimestampWrap) {
1137 // Start with a timestamp that will soon wrap.
1138 std::set<uint16_t> drop_seq_numbers;
1139 WrapTest(0, 0xFFFFFFFF - 3000, drop_seq_numbers, false, true);
1140}
1141
1142TEST_F(NetEqDecodingTest, TimestampAndSequenceNumberWrap) {
1143 // Start with a timestamp and a sequence number that will wrap at the same
1144 // time.
1145 std::set<uint16_t> drop_seq_numbers;
1146 WrapTest(0xFFFF - 10, 0xFFFFFFFF - 5000, drop_seq_numbers, true, true);
1147}
1148
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001149void NetEqDecodingTest::DuplicateCng() {
1150 uint16_t seq_no = 0;
1151 uint32_t timestamp = 0;
1152 const int kFrameSizeMs = 10;
1153 const int kSampleRateKhz = 16;
1154 const int kSamples = kFrameSizeMs * kSampleRateKhz;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +00001155 const size_t kPayloadBytes = kSamples * 2;
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001156
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +00001157 const int algorithmic_delay_samples = std::max(
1158 algorithmic_delay_ms_ * kSampleRateKhz, 5 * kSampleRateKhz / 8);
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001159 // Insert three speech packets. Three are needed to get the frame length
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001160 // correct.
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001161 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -07001162 RTPHeader rtp_info;
henrik.lundin7a926812016-05-12 13:51:28 -07001163 bool muted;
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001164 for (int i = 0; i < 3; ++i) {
1165 PopulateRtpInfo(seq_no, timestamp, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001166 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001167 ++seq_no;
1168 timestamp += kSamples;
1169
1170 // Pull audio once.
henrik.lundin7a926812016-05-12 13:51:28 -07001171 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001172 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001173 }
1174 // Verify speech output.
henrik.lundin55480f52016-03-08 02:37:57 -08001175 EXPECT_EQ(AudioFrame::kNormalSpeech, out_frame_.speech_type_);
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001176
1177 // Insert same CNG packet twice.
1178 const int kCngPeriodMs = 100;
1179 const int kCngPeriodSamples = kCngPeriodMs * kSampleRateKhz;
pkasting@chromium.org4591fbd2014-11-20 22:28:14 +00001180 size_t payload_len;
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001181 PopulateCng(seq_no, timestamp, &rtp_info, payload, &payload_len);
1182 // This is the first time this CNG packet is inserted.
henrik.lundin246ef3e2017-04-24 09:14:32 -07001183 ASSERT_EQ(
1184 0, neteq_->InsertPacket(
1185 rtp_info, rtc::ArrayView<const uint8_t>(payload, payload_len), 0));
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001186
1187 // Pull audio once and make sure CNG is played.
henrik.lundin7a926812016-05-12 13:51:28 -07001188 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001189 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -08001190 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
henrik.lundin114c1b32017-04-26 07:47:32 -07001191 EXPECT_FALSE(
1192 neteq_->GetPlayoutTimestamp()); // Returns empty value during CNG.
henrik.lundin0d96ab72016-04-06 12:28:26 -07001193 EXPECT_EQ(timestamp - algorithmic_delay_samples,
1194 out_frame_.timestamp_ + out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001195
1196 // Insert the same CNG packet again. Note that at this point it is old, since
1197 // we have already decoded the first copy of it.
henrik.lundin246ef3e2017-04-24 09:14:32 -07001198 ASSERT_EQ(
1199 0, neteq_->InsertPacket(
1200 rtp_info, rtc::ArrayView<const uint8_t>(payload, payload_len), 0));
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001201
1202 // Pull audio until we have played |kCngPeriodMs| of CNG. Start at 10 ms since
1203 // we have already pulled out CNG once.
1204 for (int cng_time_ms = 10; cng_time_ms < kCngPeriodMs; cng_time_ms += 10) {
henrik.lundin7a926812016-05-12 13:51:28 -07001205 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001206 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -08001207 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
henrik.lundin114c1b32017-04-26 07:47:32 -07001208 EXPECT_FALSE(
1209 neteq_->GetPlayoutTimestamp()); // Returns empty value during CNG.
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +00001210 EXPECT_EQ(timestamp - algorithmic_delay_samples,
henrik.lundin0d96ab72016-04-06 12:28:26 -07001211 out_frame_.timestamp_ + out_frame_.samples_per_channel_);
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001212 }
1213
1214 // Insert speech again.
1215 ++seq_no;
1216 timestamp += kCngPeriodSamples;
1217 PopulateRtpInfo(seq_no, timestamp, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001218 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001219
1220 // Pull audio once and verify that the output is speech again.
henrik.lundin7a926812016-05-12 13:51:28 -07001221 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001222 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -08001223 EXPECT_EQ(AudioFrame::kNormalSpeech, out_frame_.speech_type_);
henrik.lundin114c1b32017-04-26 07:47:32 -07001224 rtc::Optional<uint32_t> playout_timestamp = neteq_->GetPlayoutTimestamp();
henrik.lundin0d96ab72016-04-06 12:28:26 -07001225 ASSERT_TRUE(playout_timestamp);
turaj@webrtc.org8d1cdaa2014-04-11 18:47:55 +00001226 EXPECT_EQ(timestamp + kSamples - algorithmic_delay_samples,
henrik.lundin0d96ab72016-04-06 12:28:26 -07001227 *playout_timestamp);
wu@webrtc.org94454b72014-06-05 20:34:08 +00001228}
1229
henrik.lundin@webrtc.orgca8cb952014-03-12 10:26:52 +00001230TEST_F(NetEqDecodingTest, DiscardDuplicateCng) { DuplicateCng(); }
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001231
1232TEST_F(NetEqDecodingTest, CngFirst) {
1233 uint16_t seq_no = 0;
1234 uint32_t timestamp = 0;
1235 const int kFrameSizeMs = 10;
1236 const int kSampleRateKhz = 16;
1237 const int kSamples = kFrameSizeMs * kSampleRateKhz;
1238 const int kPayloadBytes = kSamples * 2;
1239 const int kCngPeriodMs = 100;
1240 const int kCngPeriodSamples = kCngPeriodMs * kSampleRateKhz;
1241 size_t payload_len;
1242
1243 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -07001244 RTPHeader rtp_info;
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001245
1246 PopulateCng(seq_no, timestamp, &rtp_info, payload, &payload_len);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001247 ASSERT_EQ(
1248 NetEq::kOK,
1249 neteq_->InsertPacket(
1250 rtp_info, rtc::ArrayView<const uint8_t>(payload, payload_len), 0));
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001251 ++seq_no;
1252 timestamp += kCngPeriodSamples;
1253
1254 // Pull audio once and make sure CNG is played.
henrik.lundin7a926812016-05-12 13:51:28 -07001255 bool muted;
1256 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001257 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin55480f52016-03-08 02:37:57 -08001258 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001259
1260 // Insert some speech packets.
henrik.lundin549d80b2016-08-25 00:44:24 -07001261 const uint32_t first_speech_timestamp = timestamp;
1262 int timeout_counter = 0;
1263 do {
1264 ASSERT_LT(timeout_counter++, 20) << "Test timed out";
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001265 PopulateRtpInfo(seq_no, timestamp, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001266 ASSERT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001267 ++seq_no;
1268 timestamp += kSamples;
1269
1270 // Pull audio once.
henrik.lundin7a926812016-05-12 13:51:28 -07001271 ASSERT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
henrik.lundin6d8e0112016-03-04 10:34:21 -08001272 ASSERT_EQ(kBlockSize16kHz, out_frame_.samples_per_channel_);
henrik.lundin549d80b2016-08-25 00:44:24 -07001273 } while (!IsNewerTimestamp(out_frame_.timestamp_, first_speech_timestamp));
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001274 // Verify speech output.
henrik.lundin55480f52016-03-08 02:37:57 -08001275 EXPECT_EQ(AudioFrame::kNormalSpeech, out_frame_.speech_type_);
henrik.lundin@webrtc.orgc93437e2014-12-01 11:42:42 +00001276}
henrik.lundin7a926812016-05-12 13:51:28 -07001277
1278class NetEqDecodingTestWithMutedState : public NetEqDecodingTest {
1279 public:
1280 NetEqDecodingTestWithMutedState() : NetEqDecodingTest() {
1281 config_.enable_muted_state = true;
1282 }
1283
1284 protected:
1285 static constexpr size_t kSamples = 10 * 16;
1286 static constexpr size_t kPayloadBytes = kSamples * 2;
1287
1288 void InsertPacket(uint32_t rtp_timestamp) {
1289 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -07001290 RTPHeader rtp_info;
henrik.lundin7a926812016-05-12 13:51:28 -07001291 PopulateRtpInfo(0, rtp_timestamp, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001292 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
henrik.lundin7a926812016-05-12 13:51:28 -07001293 }
1294
henrik.lundin42feb512016-09-20 06:51:40 -07001295 void InsertCngPacket(uint32_t rtp_timestamp) {
1296 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -07001297 RTPHeader rtp_info;
henrik.lundin42feb512016-09-20 06:51:40 -07001298 size_t payload_len;
1299 PopulateCng(0, rtp_timestamp, &rtp_info, payload, &payload_len);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001300 EXPECT_EQ(
1301 NetEq::kOK,
1302 neteq_->InsertPacket(
1303 rtp_info, rtc::ArrayView<const uint8_t>(payload, payload_len), 0));
henrik.lundin42feb512016-09-20 06:51:40 -07001304 }
1305
henrik.lundin7a926812016-05-12 13:51:28 -07001306 bool GetAudioReturnMuted() {
1307 bool muted;
1308 EXPECT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
1309 return muted;
1310 }
1311
1312 void GetAudioUntilMuted() {
1313 while (!GetAudioReturnMuted()) {
1314 ASSERT_LT(counter_++, 1000) << "Test timed out";
1315 }
1316 }
1317
1318 void GetAudioUntilNormal() {
1319 bool muted = false;
1320 while (out_frame_.speech_type_ != AudioFrame::kNormalSpeech) {
1321 EXPECT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
1322 ASSERT_LT(counter_++, 1000) << "Test timed out";
1323 }
1324 EXPECT_FALSE(muted);
1325 }
1326
1327 int counter_ = 0;
1328};
1329
1330// Verifies that NetEq goes in and out of muted state as expected.
1331TEST_F(NetEqDecodingTestWithMutedState, MutedState) {
1332 // Insert one speech packet.
1333 InsertPacket(0);
1334 // Pull out audio once and expect it not to be muted.
1335 EXPECT_FALSE(GetAudioReturnMuted());
1336 // Pull data until faded out.
1337 GetAudioUntilMuted();
henrik.lundina4491072017-07-06 05:23:53 -07001338 EXPECT_TRUE(out_frame_.muted());
henrik.lundin7a926812016-05-12 13:51:28 -07001339
1340 // Verify that output audio is not written during muted mode. Other parameters
1341 // should be correct, though.
1342 AudioFrame new_frame;
yujo36b1a5f2017-06-12 12:45:32 -07001343 int16_t* frame_data = new_frame.mutable_data();
1344 for (size_t i = 0; i < AudioFrame::kMaxDataSizeSamples; i++) {
1345 frame_data[i] = 17;
henrik.lundin7a926812016-05-12 13:51:28 -07001346 }
1347 bool muted;
1348 EXPECT_EQ(0, neteq_->GetAudio(&new_frame, &muted));
1349 EXPECT_TRUE(muted);
henrik.lundina4491072017-07-06 05:23:53 -07001350 EXPECT_TRUE(out_frame_.muted());
yujo36b1a5f2017-06-12 12:45:32 -07001351 for (size_t i = 0; i < AudioFrame::kMaxDataSizeSamples; i++) {
1352 EXPECT_EQ(17, frame_data[i]);
henrik.lundin7a926812016-05-12 13:51:28 -07001353 }
1354 EXPECT_EQ(out_frame_.timestamp_ + out_frame_.samples_per_channel_,
1355 new_frame.timestamp_);
1356 EXPECT_EQ(out_frame_.samples_per_channel_, new_frame.samples_per_channel_);
1357 EXPECT_EQ(out_frame_.sample_rate_hz_, new_frame.sample_rate_hz_);
1358 EXPECT_EQ(out_frame_.num_channels_, new_frame.num_channels_);
1359 EXPECT_EQ(out_frame_.speech_type_, new_frame.speech_type_);
1360 EXPECT_EQ(out_frame_.vad_activity_, new_frame.vad_activity_);
1361
1362 // Insert new data. Timestamp is corrected for the time elapsed since the last
1363 // packet. Verify that normal operation resumes.
1364 InsertPacket(kSamples * counter_);
1365 GetAudioUntilNormal();
henrik.lundina4491072017-07-06 05:23:53 -07001366 EXPECT_FALSE(out_frame_.muted());
henrik.lundin612c25e2016-05-25 08:21:04 -07001367
1368 NetEqNetworkStatistics stats;
1369 EXPECT_EQ(0, neteq_->NetworkStatistics(&stats));
1370 // NetEqNetworkStatistics::expand_rate tells the fraction of samples that were
1371 // concealment samples, in Q14 (16384 = 100%) .The vast majority should be
1372 // concealment samples in this test.
1373 EXPECT_GT(stats.expand_rate, 14000);
1374 // And, it should be greater than the speech_expand_rate.
1375 EXPECT_GT(stats.expand_rate, stats.speech_expand_rate);
henrik.lundin7a926812016-05-12 13:51:28 -07001376}
1377
1378// Verifies that NetEq goes out of muted state when given a delayed packet.
1379TEST_F(NetEqDecodingTestWithMutedState, MutedStateDelayedPacket) {
1380 // Insert one speech packet.
1381 InsertPacket(0);
1382 // Pull out audio once and expect it not to be muted.
1383 EXPECT_FALSE(GetAudioReturnMuted());
1384 // Pull data until faded out.
1385 GetAudioUntilMuted();
1386 // Insert new data. Timestamp is only corrected for the half of the time
1387 // elapsed since the last packet. That is, the new packet is delayed. Verify
1388 // that normal operation resumes.
1389 InsertPacket(kSamples * counter_ / 2);
1390 GetAudioUntilNormal();
1391}
1392
1393// Verifies that NetEq goes out of muted state when given a future packet.
1394TEST_F(NetEqDecodingTestWithMutedState, MutedStateFuturePacket) {
1395 // Insert one speech packet.
1396 InsertPacket(0);
1397 // Pull out audio once and expect it not to be muted.
1398 EXPECT_FALSE(GetAudioReturnMuted());
1399 // Pull data until faded out.
1400 GetAudioUntilMuted();
1401 // Insert new data. Timestamp is over-corrected for the time elapsed since the
1402 // last packet. That is, the new packet is too early. Verify that normal
1403 // operation resumes.
1404 InsertPacket(kSamples * counter_ * 2);
1405 GetAudioUntilNormal();
1406}
1407
1408// Verifies that NetEq goes out of muted state when given an old packet.
1409TEST_F(NetEqDecodingTestWithMutedState, MutedStateOldPacket) {
1410 // Insert one speech packet.
1411 InsertPacket(0);
1412 // Pull out audio once and expect it not to be muted.
1413 EXPECT_FALSE(GetAudioReturnMuted());
1414 // Pull data until faded out.
1415 GetAudioUntilMuted();
1416
1417 EXPECT_NE(AudioFrame::kNormalSpeech, out_frame_.speech_type_);
1418 // Insert packet which is older than the first packet.
1419 InsertPacket(kSamples * (counter_ - 1000));
1420 EXPECT_FALSE(GetAudioReturnMuted());
1421 EXPECT_EQ(AudioFrame::kNormalSpeech, out_frame_.speech_type_);
1422}
1423
henrik.lundin42feb512016-09-20 06:51:40 -07001424// Verifies that NetEq doesn't enter muted state when CNG mode is active and the
1425// packet stream is suspended for a long time.
1426TEST_F(NetEqDecodingTestWithMutedState, DoNotMuteExtendedCngWithoutPackets) {
1427 // Insert one CNG packet.
1428 InsertCngPacket(0);
1429
1430 // Pull 10 seconds of audio (10 ms audio generated per lap).
1431 for (int i = 0; i < 1000; ++i) {
1432 bool muted;
1433 EXPECT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
1434 ASSERT_FALSE(muted);
1435 }
1436 EXPECT_EQ(AudioFrame::kCNG, out_frame_.speech_type_);
1437}
1438
1439// Verifies that NetEq goes back to normal after a long CNG period with the
1440// packet stream suspended.
1441TEST_F(NetEqDecodingTestWithMutedState, RecoverAfterExtendedCngWithoutPackets) {
1442 // Insert one CNG packet.
1443 InsertCngPacket(0);
1444
1445 // Pull 10 seconds of audio (10 ms audio generated per lap).
1446 for (int i = 0; i < 1000; ++i) {
1447 bool muted;
1448 EXPECT_EQ(0, neteq_->GetAudio(&out_frame_, &muted));
1449 }
1450
1451 // Insert new data. Timestamp is corrected for the time elapsed since the last
1452 // packet. Verify that normal operation resumes.
1453 InsertPacket(kSamples * counter_);
1454 GetAudioUntilNormal();
1455}
1456
henrik.lundin7a926812016-05-12 13:51:28 -07001457class NetEqDecodingTestTwoInstances : public NetEqDecodingTest {
1458 public:
1459 NetEqDecodingTestTwoInstances() : NetEqDecodingTest() {}
1460
1461 void SetUp() override {
1462 NetEqDecodingTest::SetUp();
1463 config2_ = config_;
1464 }
1465
1466 void CreateSecondInstance() {
ossue3525782016-05-25 07:37:43 -07001467 neteq2_.reset(NetEq::Create(config2_, CreateBuiltinAudioDecoderFactory()));
henrik.lundin7a926812016-05-12 13:51:28 -07001468 ASSERT_TRUE(neteq2_);
1469 LoadDecoders(neteq2_.get());
1470 }
1471
1472 protected:
1473 std::unique_ptr<NetEq> neteq2_;
1474 NetEq::Config config2_;
1475};
1476
1477namespace {
1478::testing::AssertionResult AudioFramesEqualExceptData(const AudioFrame& a,
1479 const AudioFrame& b) {
1480 if (a.timestamp_ != b.timestamp_)
1481 return ::testing::AssertionFailure() << "timestamp_ diff (" << a.timestamp_
1482 << " != " << b.timestamp_ << ")";
1483 if (a.sample_rate_hz_ != b.sample_rate_hz_)
1484 return ::testing::AssertionFailure() << "sample_rate_hz_ diff ("
1485 << a.sample_rate_hz_
1486 << " != " << b.sample_rate_hz_ << ")";
1487 if (a.samples_per_channel_ != b.samples_per_channel_)
1488 return ::testing::AssertionFailure()
1489 << "samples_per_channel_ diff (" << a.samples_per_channel_
1490 << " != " << b.samples_per_channel_ << ")";
1491 if (a.num_channels_ != b.num_channels_)
1492 return ::testing::AssertionFailure() << "num_channels_ diff ("
1493 << a.num_channels_
1494 << " != " << b.num_channels_ << ")";
1495 if (a.speech_type_ != b.speech_type_)
1496 return ::testing::AssertionFailure() << "speech_type_ diff ("
1497 << a.speech_type_
1498 << " != " << b.speech_type_ << ")";
1499 if (a.vad_activity_ != b.vad_activity_)
1500 return ::testing::AssertionFailure() << "vad_activity_ diff ("
1501 << a.vad_activity_
1502 << " != " << b.vad_activity_ << ")";
1503 return ::testing::AssertionSuccess();
1504}
1505
1506::testing::AssertionResult AudioFramesEqual(const AudioFrame& a,
1507 const AudioFrame& b) {
1508 ::testing::AssertionResult res = AudioFramesEqualExceptData(a, b);
1509 if (!res)
1510 return res;
1511 if (memcmp(
yujo36b1a5f2017-06-12 12:45:32 -07001512 a.data(), b.data(),
1513 a.samples_per_channel_ * a.num_channels_ * sizeof(*a.data())) != 0) {
henrik.lundin7a926812016-05-12 13:51:28 -07001514 return ::testing::AssertionFailure() << "data_ diff";
1515 }
1516 return ::testing::AssertionSuccess();
1517}
1518
1519} // namespace
1520
1521TEST_F(NetEqDecodingTestTwoInstances, CompareMutedStateOnOff) {
1522 ASSERT_FALSE(config_.enable_muted_state);
1523 config2_.enable_muted_state = true;
1524 CreateSecondInstance();
1525
1526 // Insert one speech packet into both NetEqs.
1527 const size_t kSamples = 10 * 16;
1528 const size_t kPayloadBytes = kSamples * 2;
1529 uint8_t payload[kPayloadBytes] = {0};
henrik.lundin246ef3e2017-04-24 09:14:32 -07001530 RTPHeader rtp_info;
henrik.lundin7a926812016-05-12 13:51:28 -07001531 PopulateRtpInfo(0, 0, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001532 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
1533 EXPECT_EQ(0, neteq2_->InsertPacket(rtp_info, payload, 0));
henrik.lundin7a926812016-05-12 13:51:28 -07001534
1535 AudioFrame out_frame1, out_frame2;
1536 bool muted;
1537 for (int i = 0; i < 1000; ++i) {
1538 std::ostringstream ss;
1539 ss << "i = " << i;
1540 SCOPED_TRACE(ss.str()); // Print out the loop iterator on failure.
1541 EXPECT_EQ(0, neteq_->GetAudio(&out_frame1, &muted));
1542 EXPECT_FALSE(muted);
1543 EXPECT_EQ(0, neteq2_->GetAudio(&out_frame2, &muted));
1544 if (muted) {
1545 EXPECT_TRUE(AudioFramesEqualExceptData(out_frame1, out_frame2));
1546 } else {
1547 EXPECT_TRUE(AudioFramesEqual(out_frame1, out_frame2));
1548 }
1549 }
1550 EXPECT_TRUE(muted);
1551
1552 // Insert new data. Timestamp is corrected for the time elapsed since the last
1553 // packet.
1554 PopulateRtpInfo(0, kSamples * 1000, &rtp_info);
henrik.lundin246ef3e2017-04-24 09:14:32 -07001555 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
1556 EXPECT_EQ(0, neteq2_->InsertPacket(rtp_info, payload, 0));
henrik.lundin7a926812016-05-12 13:51:28 -07001557
1558 int counter = 0;
1559 while (out_frame1.speech_type_ != AudioFrame::kNormalSpeech) {
1560 ASSERT_LT(counter++, 1000) << "Test timed out";
1561 std::ostringstream ss;
1562 ss << "counter = " << counter;
1563 SCOPED_TRACE(ss.str()); // Print out the loop iterator on failure.
1564 EXPECT_EQ(0, neteq_->GetAudio(&out_frame1, &muted));
1565 EXPECT_FALSE(muted);
1566 EXPECT_EQ(0, neteq2_->GetAudio(&out_frame2, &muted));
1567 if (muted) {
1568 EXPECT_TRUE(AudioFramesEqualExceptData(out_frame1, out_frame2));
1569 } else {
1570 EXPECT_TRUE(AudioFramesEqual(out_frame1, out_frame2));
1571 }
1572 }
1573 EXPECT_FALSE(muted);
1574}
1575
henrik.lundin114c1b32017-04-26 07:47:32 -07001576TEST_F(NetEqDecodingTest, LastDecodedTimestampsEmpty) {
1577 EXPECT_TRUE(neteq_->LastDecodedTimestamps().empty());
1578
1579 // Pull out data once.
1580 AudioFrame output;
1581 bool muted;
1582 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
1583
1584 EXPECT_TRUE(neteq_->LastDecodedTimestamps().empty());
1585}
1586
1587TEST_F(NetEqDecodingTest, LastDecodedTimestampsOneDecoded) {
1588 // Insert one packet with PCM16b WB data (this is what PopulateRtpInfo does by
1589 // default). Make the length 10 ms.
1590 constexpr size_t kPayloadSamples = 16 * 10;
1591 constexpr size_t kPayloadBytes = 2 * kPayloadSamples;
1592 uint8_t payload[kPayloadBytes] = {0};
1593
1594 RTPHeader rtp_info;
1595 constexpr uint32_t kRtpTimestamp = 0x1234;
1596 PopulateRtpInfo(0, kRtpTimestamp, &rtp_info);
1597 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
1598
1599 // Pull out data once.
1600 AudioFrame output;
1601 bool muted;
1602 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
1603
1604 EXPECT_EQ(std::vector<uint32_t>({kRtpTimestamp}),
1605 neteq_->LastDecodedTimestamps());
1606
1607 // Nothing decoded on the second call.
1608 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
1609 EXPECT_TRUE(neteq_->LastDecodedTimestamps().empty());
1610}
1611
1612TEST_F(NetEqDecodingTest, LastDecodedTimestampsTwoDecoded) {
1613 // Insert two packets with PCM16b WB data (this is what PopulateRtpInfo does
1614 // by default). Make the length 5 ms so that NetEq must decode them both in
1615 // the same GetAudio call.
1616 constexpr size_t kPayloadSamples = 16 * 5;
1617 constexpr size_t kPayloadBytes = 2 * kPayloadSamples;
1618 uint8_t payload[kPayloadBytes] = {0};
1619
1620 RTPHeader rtp_info;
1621 constexpr uint32_t kRtpTimestamp1 = 0x1234;
1622 PopulateRtpInfo(0, kRtpTimestamp1, &rtp_info);
1623 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
1624 constexpr uint32_t kRtpTimestamp2 = kRtpTimestamp1 + kPayloadSamples;
1625 PopulateRtpInfo(1, kRtpTimestamp2, &rtp_info);
1626 EXPECT_EQ(0, neteq_->InsertPacket(rtp_info, payload, 0));
1627
1628 // Pull out data once.
1629 AudioFrame output;
1630 bool muted;
1631 ASSERT_EQ(0, neteq_->GetAudio(&output, &muted));
1632
1633 EXPECT_EQ(std::vector<uint32_t>({kRtpTimestamp1, kRtpTimestamp2}),
1634 neteq_->LastDecodedTimestamps());
1635}
1636
henrik.lundin@webrtc.orge7ce4372014-01-09 14:01:55 +00001637} // namespace webrtc