andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (c) 2013 The WebRTC project authors. All Rights Reserved. |
| 3 | * |
| 4 | * Use of this source code is governed by a BSD-style license |
| 5 | * that can be found in the LICENSE file in the root of the source |
| 6 | * tree. An additional intellectual property rights grant can be found |
| 7 | * in the file PATENTS. All contributing project authors may |
| 8 | * be found in the AUTHORS file in the root of the source tree. |
| 9 | */ |
| 10 | |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 11 | #include "modules/audio_coding/acm2/acm_receiver.h" |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 12 | |
| 13 | #include <algorithm> // std::min |
kwiberg | 16c5a96 | 2016-02-15 02:27:22 -0800 | [diff] [blame] | 14 | #include <memory> |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 15 | |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 16 | #include "absl/types/optional.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 17 | #include "api/audio_codecs/builtin_audio_decoder_factory.h" |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 18 | #include "api/audio_codecs/builtin_audio_encoder_factory.h" |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 19 | #include "modules/audio_coding/codecs/cng/audio_encoder_cng.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 20 | #include "modules/audio_coding/include/audio_coding_module.h" |
| 21 | #include "modules/audio_coding/neteq/tools/rtp_generator.h" |
Fredrik Solenberg | bbf21a3 | 2018-04-12 22:44:09 +0200 | [diff] [blame] | 22 | #include "modules/include/module_common_types.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 23 | #include "rtc_base/checks.h" |
Karl Wiberg | e40468b | 2017-11-22 10:42:26 +0100 | [diff] [blame] | 24 | #include "rtc_base/numerics/safe_conversions.h" |
Mirko Bonadei | 92ea95e | 2017-09-15 06:47:31 +0200 | [diff] [blame] | 25 | #include "system_wrappers/include/clock.h" |
| 26 | #include "test/gtest.h" |
Steve Anton | 10542f2 | 2019-01-11 09:11:00 -0800 | [diff] [blame] | 27 | #include "test/testsupport/file_utils.h" |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 28 | |
| 29 | namespace webrtc { |
| 30 | |
| 31 | namespace acm2 { |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 32 | |
| 33 | class AcmReceiverTestOldApi : public AudioPacketizationCallback, |
| 34 | public ::testing::Test { |
| 35 | protected: |
| 36 | AcmReceiverTestOldApi() |
| 37 | : timestamp_(0), |
| 38 | packet_sent_(false), |
| 39 | last_packet_send_timestamp_(timestamp_), |
Niels Möller | c936cb6 | 2019-03-19 14:10:16 +0100 | [diff] [blame] | 40 | last_frame_type_(AudioFrameType::kEmptyFrame) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 41 | config_.decoder_factory = decoder_factory_; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 42 | } |
| 43 | |
| 44 | ~AcmReceiverTestOldApi() {} |
| 45 | |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 46 | void SetUp() override { |
kwiberg | c13ded5 | 2016-06-17 06:00:45 -0700 | [diff] [blame] | 47 | acm_.reset(AudioCodingModule::Create(config_)); |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 48 | receiver_.reset(new AcmReceiver(config_)); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 49 | ASSERT_TRUE(receiver_.get() != NULL); |
| 50 | ASSERT_TRUE(acm_.get() != NULL); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 51 | acm_->InitializeReceiver(); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 52 | acm_->RegisterTransportCallback(this); |
| 53 | |
Niels Möller | afb5dbb | 2019-02-15 15:21:47 +0100 | [diff] [blame] | 54 | rtp_header_.sequenceNumber = 0; |
| 55 | rtp_header_.timestamp = 0; |
| 56 | rtp_header_.markerBit = false; |
| 57 | rtp_header_.ssrc = 0x12345678; // Arbitrary. |
| 58 | rtp_header_.numCSRCs = 0; |
| 59 | rtp_header_.payloadType = 0; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 60 | } |
| 61 | |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 62 | void TearDown() override {} |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 63 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 64 | AudioCodecInfo SetEncoder(int payload_type, |
| 65 | const SdpAudioFormat& format, |
| 66 | const std::map<int, int> cng_payload_types = {}) { |
| 67 | // Create the speech encoder. |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 68 | absl::optional<AudioCodecInfo> info = |
| 69 | encoder_factory_->QueryAudioEncoder(format); |
| 70 | RTC_CHECK(info.has_value()); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 71 | std::unique_ptr<AudioEncoder> enc = |
| 72 | encoder_factory_->MakeAudioEncoder(payload_type, format, absl::nullopt); |
| 73 | |
| 74 | // If we have a compatible CN specification, stack a CNG on top. |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 75 | auto it = cng_payload_types.find(info->sample_rate_hz); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 76 | if (it != cng_payload_types.end()) { |
Karl Wiberg | 2365936 | 2018-11-01 11:13:44 +0100 | [diff] [blame] | 77 | AudioEncoderCngConfig config; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 78 | config.speech_encoder = std::move(enc); |
| 79 | config.num_channels = 1; |
| 80 | config.payload_type = it->second; |
| 81 | config.vad_mode = Vad::kVadNormal; |
Karl Wiberg | 2365936 | 2018-11-01 11:13:44 +0100 | [diff] [blame] | 82 | enc = CreateComfortNoiseEncoder(std::move(config)); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 83 | } |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 84 | |
| 85 | // Actually start using the new encoder. |
| 86 | acm_->SetEncoder(std::move(enc)); |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 87 | return *info; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 88 | } |
| 89 | |
| 90 | int InsertOnePacketOfSilence(const AudioCodecInfo& info) { |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 91 | // Frame setup according to the codec. |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 92 | AudioFrame frame; |
| 93 | frame.sample_rate_hz_ = info.sample_rate_hz; |
| 94 | frame.samples_per_channel_ = info.sample_rate_hz / 100; // 10 ms. |
| 95 | frame.num_channels_ = info.num_channels; |
yujo | 36b1a5f | 2017-06-12 12:45:32 -0700 | [diff] [blame] | 96 | frame.Mute(); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 97 | packet_sent_ = false; |
| 98 | last_packet_send_timestamp_ = timestamp_; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 99 | int num_10ms_frames = 0; |
henrik.lundin@webrtc.org | f56c162 | 2015-03-02 12:29:30 +0000 | [diff] [blame] | 100 | while (!packet_sent_) { |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 101 | frame.timestamp_ = timestamp_; |
Mirko Bonadei | 737e073 | 2017-10-19 09:00:17 +0200 | [diff] [blame] | 102 | timestamp_ += rtc::checked_cast<uint32_t>(frame.samples_per_channel_); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 103 | EXPECT_GE(acm_->Add10MsData(frame), 0); |
| 104 | ++num_10ms_frames; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 105 | } |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 106 | return num_10ms_frames; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 107 | } |
| 108 | |
Niels Möller | 87e2d78 | 2019-03-07 10:18:23 +0100 | [diff] [blame] | 109 | int SendData(AudioFrameType frame_type, |
kjellander@webrtc.org | 14665ff | 2015-03-04 12:58:35 +0000 | [diff] [blame] | 110 | uint8_t payload_type, |
| 111 | uint32_t timestamp, |
| 112 | const uint8_t* payload_data, |
Minyue Li | ff0e4db | 2020-01-23 13:45:50 +0100 | [diff] [blame] | 113 | size_t payload_len_bytes, |
| 114 | int64_t absolute_capture_timestamp_ms) override { |
Niels Möller | c936cb6 | 2019-03-19 14:10:16 +0100 | [diff] [blame] | 115 | if (frame_type == AudioFrameType::kEmptyFrame) |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 116 | return 0; |
| 117 | |
Niels Möller | afb5dbb | 2019-02-15 15:21:47 +0100 | [diff] [blame] | 118 | rtp_header_.payloadType = payload_type; |
| 119 | rtp_header_.timestamp = timestamp; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 120 | |
kwiberg | ee2bac2 | 2015-11-11 10:34:00 -0800 | [diff] [blame] | 121 | int ret_val = receiver_->InsertPacket( |
| 122 | rtp_header_, |
| 123 | rtc::ArrayView<const uint8_t>(payload_data, payload_len_bytes)); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 124 | if (ret_val < 0) { |
Artem Titov | d325196 | 2021-11-15 16:57:07 +0100 | [diff] [blame] | 125 | RTC_DCHECK_NOTREACHED(); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 126 | return -1; |
| 127 | } |
Niels Möller | afb5dbb | 2019-02-15 15:21:47 +0100 | [diff] [blame] | 128 | rtp_header_.sequenceNumber++; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 129 | packet_sent_ = true; |
| 130 | last_frame_type_ = frame_type; |
| 131 | return 0; |
| 132 | } |
| 133 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 134 | const rtc::scoped_refptr<AudioEncoderFactory> encoder_factory_ = |
| 135 | CreateBuiltinAudioEncoderFactory(); |
| 136 | const rtc::scoped_refptr<AudioDecoderFactory> decoder_factory_ = |
| 137 | CreateBuiltinAudioDecoderFactory(); |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 138 | AudioCodingModule::Config config_; |
kwiberg | 16c5a96 | 2016-02-15 02:27:22 -0800 | [diff] [blame] | 139 | std::unique_ptr<AcmReceiver> receiver_; |
kwiberg | 16c5a96 | 2016-02-15 02:27:22 -0800 | [diff] [blame] | 140 | std::unique_ptr<AudioCodingModule> acm_; |
Niels Möller | afb5dbb | 2019-02-15 15:21:47 +0100 | [diff] [blame] | 141 | RTPHeader rtp_header_; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 142 | uint32_t timestamp_; |
| 143 | bool packet_sent_; // Set when SendData is called reset when inserting audio. |
| 144 | uint32_t last_packet_send_timestamp_; |
Niels Möller | 87e2d78 | 2019-03-07 10:18:23 +0100 | [diff] [blame] | 145 | AudioFrameType last_frame_type_; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 146 | }; |
| 147 | |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 148 | #if defined(WEBRTC_ANDROID) |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 149 | #define MAYBE_SampleRate DISABLED_SampleRate |
| 150 | #else |
| 151 | #define MAYBE_SampleRate SampleRate |
| 152 | #endif |
| 153 | TEST_F(AcmReceiverTestOldApi, MAYBE_SampleRate) { |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 154 | const std::map<int, SdpAudioFormat> codecs = {{0, {"OPUS", 48000, 2}}}; |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 155 | receiver_->SetCodecs(codecs); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 156 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 157 | constexpr int kOutSampleRateHz = 8000; // Different than codec sample rate. |
| 158 | for (size_t i = 0; i < codecs.size(); ++i) { |
| 159 | const int payload_type = rtc::checked_cast<int>(i); |
| 160 | const int num_10ms_frames = |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 161 | InsertOnePacketOfSilence(SetEncoder(payload_type, codecs.at(i))); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 162 | for (int k = 0; k < num_10ms_frames; ++k) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 163 | AudioFrame frame; |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 164 | bool muted; |
| 165 | EXPECT_EQ(0, receiver_->GetAudio(kOutSampleRateHz, &frame, &muted)); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 166 | } |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 167 | EXPECT_EQ(encoder_factory_->QueryAudioEncoder(codecs.at(i))->sample_rate_hz, |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 168 | receiver_->last_output_sample_rate_hz()); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 169 | } |
| 170 | } |
| 171 | |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 172 | class AcmReceiverTestFaxModeOldApi : public AcmReceiverTestOldApi { |
| 173 | protected: |
| 174 | AcmReceiverTestFaxModeOldApi() { |
Henrik Lundin | 7687ad5 | 2018-07-02 10:14:46 +0200 | [diff] [blame] | 175 | config_.neteq_config.for_test_no_time_stretching = true; |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 176 | } |
| 177 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 178 | void RunVerifyAudioFrame(const SdpAudioFormat& codec) { |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 179 | // Make sure "fax mode" is enabled. This will avoid delay changes unless the |
| 180 | // packet-loss concealment is made. We do this in order to make the |
| 181 | // timestamp increments predictable; in normal mode, NetEq may decide to do |
| 182 | // accelerate or pre-emptive expand operations after some time, offsetting |
| 183 | // the timestamp. |
Henrik Lundin | 7687ad5 | 2018-07-02 10:14:46 +0200 | [diff] [blame] | 184 | EXPECT_TRUE(config_.neteq_config.for_test_no_time_stretching); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 185 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 186 | constexpr int payload_type = 17; |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 187 | receiver_->SetCodecs({{payload_type, codec}}); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 188 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 189 | const AudioCodecInfo info = SetEncoder(payload_type, codec); |
| 190 | const int output_sample_rate_hz = info.sample_rate_hz; |
| 191 | const size_t output_channels = info.num_channels; |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 192 | const size_t samples_per_ms = rtc::checked_cast<size_t>( |
| 193 | rtc::CheckedDivExact(output_sample_rate_hz, 1000)); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 194 | const AudioFrame::VADActivity expected_vad_activity = |
| 195 | output_sample_rate_hz > 16000 ? AudioFrame::kVadActive |
| 196 | : AudioFrame::kVadPassive; |
| 197 | |
| 198 | // Expect the first output timestamp to be 5*fs/8000 samples before the |
| 199 | // first inserted timestamp (because of NetEq's look-ahead). (This value is |
| 200 | // defined in Expand::overlap_length_.) |
Yves Gerey | 665174f | 2018-06-19 15:03:05 +0200 | [diff] [blame] | 201 | uint32_t expected_output_ts = |
| 202 | last_packet_send_timestamp_ - |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 203 | rtc::CheckedDivExact(5 * output_sample_rate_hz, 8000); |
| 204 | |
| 205 | AudioFrame frame; |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 206 | bool muted; |
| 207 | EXPECT_EQ(0, receiver_->GetAudio(output_sample_rate_hz, &frame, &muted)); |
henrik.lundin | 15c51e3 | 2016-04-06 08:38:56 -0700 | [diff] [blame] | 208 | // Expect timestamp = 0 before first packet is inserted. |
| 209 | EXPECT_EQ(0u, frame.timestamp_); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 210 | for (int i = 0; i < 5; ++i) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 211 | const int num_10ms_frames = InsertOnePacketOfSilence(info); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 212 | for (int k = 0; k < num_10ms_frames; ++k) { |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 213 | EXPECT_EQ(0, |
| 214 | receiver_->GetAudio(output_sample_rate_hz, &frame, &muted)); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 215 | EXPECT_EQ(expected_output_ts, frame.timestamp_); |
Mirko Bonadei | 737e073 | 2017-10-19 09:00:17 +0200 | [diff] [blame] | 216 | expected_output_ts += rtc::checked_cast<uint32_t>(10 * samples_per_ms); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 217 | EXPECT_EQ(10 * samples_per_ms, frame.samples_per_channel_); |
| 218 | EXPECT_EQ(output_sample_rate_hz, frame.sample_rate_hz_); |
| 219 | EXPECT_EQ(output_channels, frame.num_channels_); |
| 220 | EXPECT_EQ(AudioFrame::kNormalSpeech, frame.speech_type_); |
| 221 | EXPECT_EQ(expected_vad_activity, frame.vad_activity_); |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 222 | EXPECT_FALSE(muted); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 223 | } |
| 224 | } |
| 225 | } |
| 226 | }; |
| 227 | |
| 228 | #if defined(WEBRTC_ANDROID) |
| 229 | #define MAYBE_VerifyAudioFramePCMU DISABLED_VerifyAudioFramePCMU |
| 230 | #else |
| 231 | #define MAYBE_VerifyAudioFramePCMU VerifyAudioFramePCMU |
| 232 | #endif |
| 233 | TEST_F(AcmReceiverTestFaxModeOldApi, MAYBE_VerifyAudioFramePCMU) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 234 | RunVerifyAudioFrame({"PCMU", 8000, 1}); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 235 | } |
| 236 | |
| 237 | #if defined(WEBRTC_ANDROID) |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 238 | #define MAYBE_VerifyAudioFrameOpus DISABLED_VerifyAudioFrameOpus |
| 239 | #else |
| 240 | #define MAYBE_VerifyAudioFrameOpus VerifyAudioFrameOpus |
| 241 | #endif |
| 242 | TEST_F(AcmReceiverTestFaxModeOldApi, MAYBE_VerifyAudioFrameOpus) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 243 | RunVerifyAudioFrame({"opus", 48000, 2}); |
henrik.lundin | 7dc6889 | 2016-04-06 01:03:02 -0700 | [diff] [blame] | 244 | } |
| 245 | |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 246 | #if defined(WEBRTC_ANDROID) |
| 247 | #define MAYBE_PostdecodingVad DISABLED_PostdecodingVad |
| 248 | #else |
| 249 | #define MAYBE_PostdecodingVad PostdecodingVad |
| 250 | #endif |
| 251 | TEST_F(AcmReceiverTestOldApi, MAYBE_PostdecodingVad) { |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 252 | EXPECT_TRUE(config_.neteq_config.enable_post_decode_vad); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 253 | constexpr int payload_type = 34; |
| 254 | const SdpAudioFormat codec = {"L16", 16000, 1}; |
| 255 | const AudioCodecInfo info = SetEncoder(payload_type, codec); |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 256 | receiver_->SetCodecs({{payload_type, codec}}); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 257 | constexpr int kNumPackets = 5; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 258 | AudioFrame frame; |
| 259 | for (int n = 0; n < kNumPackets; ++n) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 260 | const int num_10ms_frames = InsertOnePacketOfSilence(info); |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 261 | for (int k = 0; k < num_10ms_frames; ++k) { |
| 262 | bool muted; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 263 | ASSERT_EQ(0, receiver_->GetAudio(info.sample_rate_hz, &frame, &muted)); |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 264 | } |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 265 | } |
| 266 | EXPECT_EQ(AudioFrame::kVadPassive, frame.vad_activity_); |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 267 | } |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 268 | |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 269 | class AcmReceiverTestPostDecodeVadPassiveOldApi : public AcmReceiverTestOldApi { |
| 270 | protected: |
| 271 | AcmReceiverTestPostDecodeVadPassiveOldApi() { |
| 272 | config_.neteq_config.enable_post_decode_vad = false; |
| 273 | } |
| 274 | }; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 275 | |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 276 | #if defined(WEBRTC_ANDROID) |
| 277 | #define MAYBE_PostdecodingVad DISABLED_PostdecodingVad |
| 278 | #else |
| 279 | #define MAYBE_PostdecodingVad PostdecodingVad |
| 280 | #endif |
| 281 | TEST_F(AcmReceiverTestPostDecodeVadPassiveOldApi, MAYBE_PostdecodingVad) { |
| 282 | EXPECT_FALSE(config_.neteq_config.enable_post_decode_vad); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 283 | constexpr int payload_type = 34; |
| 284 | const SdpAudioFormat codec = {"L16", 16000, 1}; |
| 285 | const AudioCodecInfo info = SetEncoder(payload_type, codec); |
Jerome Humbert | 3e3c551 | 2020-01-13 11:58:26 +0000 | [diff] [blame] | 286 | auto const value = encoder_factory_->QueryAudioEncoder(codec); |
| 287 | ASSERT_TRUE(value.has_value()); |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 288 | receiver_->SetCodecs({{payload_type, codec}}); |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 289 | const int kNumPackets = 5; |
henrik.lundin | 500c04b | 2016-03-08 02:36:04 -0800 | [diff] [blame] | 290 | AudioFrame frame; |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 291 | for (int n = 0; n < kNumPackets; ++n) { |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 292 | const int num_10ms_frames = InsertOnePacketOfSilence(info); |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 293 | for (int k = 0; k < num_10ms_frames; ++k) { |
| 294 | bool muted; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 295 | ASSERT_EQ(0, receiver_->GetAudio(info.sample_rate_hz, &frame, &muted)); |
henrik.lundin | 834a6ea | 2016-05-13 03:45:24 -0700 | [diff] [blame] | 296 | } |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 297 | } |
| 298 | EXPECT_EQ(AudioFrame::kVadUnknown, frame.vad_activity_); |
| 299 | } |
| 300 | |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 301 | #if defined(WEBRTC_ANDROID) |
| 302 | #define MAYBE_LastAudioCodec DISABLED_LastAudioCodec |
kwiberg | 98ab3a4 | 2015-09-30 21:54:21 -0700 | [diff] [blame] | 303 | #else |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 304 | #define MAYBE_LastAudioCodec LastAudioCodec |
kwiberg | 98ab3a4 | 2015-09-30 21:54:21 -0700 | [diff] [blame] | 305 | #endif |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 306 | #if defined(WEBRTC_CODEC_OPUS) |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 307 | TEST_F(AcmReceiverTestOldApi, MAYBE_LastAudioCodec) { |
Alessio Bazzica | b46c4bf | 2022-11-11 16:52:46 +0100 | [diff] [blame] | 308 | const std::map<int, SdpAudioFormat> codecs = { |
| 309 | {0, {"PCMU", 8000, 1}}, {1, {"PCMA", 8000, 1}}, {2, {"L16", 32000, 1}}}; |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 310 | const std::map<int, int> cng_payload_types = { |
| 311 | {8000, 100}, {16000, 101}, {32000, 102}}; |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 312 | { |
| 313 | std::map<int, SdpAudioFormat> receive_codecs = codecs; |
| 314 | for (const auto& cng_type : cng_payload_types) { |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 315 | receive_codecs.emplace(std::make_pair( |
| 316 | cng_type.second, SdpAudioFormat("CN", cng_type.first, 1))); |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 317 | } |
| 318 | receiver_->SetCodecs(receive_codecs); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 319 | } |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 320 | |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 321 | // No audio payload is received. |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 322 | EXPECT_EQ(absl::nullopt, receiver_->LastDecoder()); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 323 | |
| 324 | // Start with sending DTX. |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 325 | packet_sent_ = false; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 326 | InsertOnePacketOfSilence( |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 327 | SetEncoder(0, codecs.at(0), cng_payload_types)); // Enough to test |
Jonas Olsson | a4d8737 | 2019-07-05 19:08:33 +0200 | [diff] [blame] | 328 | // with one codec. |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 329 | ASSERT_TRUE(packet_sent_); |
Niels Möller | c936cb6 | 2019-03-19 14:10:16 +0100 | [diff] [blame] | 330 | EXPECT_EQ(AudioFrameType::kAudioFrameCN, last_frame_type_); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 331 | |
| 332 | // Has received, only, DTX. Last Audio codec is undefined. |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 333 | EXPECT_EQ(absl::nullopt, receiver_->LastDecoder()); |
| 334 | EXPECT_EQ(absl::nullopt, receiver_->last_packet_sample_rate_hz()); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 335 | |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 336 | for (size_t i = 0; i < codecs.size(); ++i) { |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 337 | // Set DTX off to send audio payload. |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 338 | packet_sent_ = false; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 339 | const int payload_type = rtc::checked_cast<int>(i); |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 340 | const AudioCodecInfo info_without_cng = |
| 341 | SetEncoder(payload_type, codecs.at(i)); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 342 | InsertOnePacketOfSilence(info_without_cng); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 343 | |
| 344 | // Sanity check if Actually an audio payload received, and it should be |
| 345 | // of type "speech." |
| 346 | ASSERT_TRUE(packet_sent_); |
Niels Möller | c936cb6 | 2019-03-19 14:10:16 +0100 | [diff] [blame] | 347 | ASSERT_EQ(AudioFrameType::kAudioFrameSpeech, last_frame_type_); |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 348 | EXPECT_EQ(info_without_cng.sample_rate_hz, |
| 349 | receiver_->last_packet_sample_rate_hz()); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 350 | |
| 351 | // Set VAD on to send DTX. Then check if the "Last Audio codec" returns |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 352 | // the expected codec. Encode repeatedly until a DTX is sent. |
| 353 | const AudioCodecInfo info_with_cng = |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 354 | SetEncoder(payload_type, codecs.at(i), cng_payload_types); |
Niels Möller | c936cb6 | 2019-03-19 14:10:16 +0100 | [diff] [blame] | 355 | while (last_frame_type_ != AudioFrameType::kAudioFrameCN) { |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 356 | packet_sent_ = false; |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 357 | InsertOnePacketOfSilence(info_with_cng); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 358 | ASSERT_TRUE(packet_sent_); |
| 359 | } |
Karl Wiberg | 377a231 | 2018-09-24 14:52:51 +0200 | [diff] [blame] | 360 | EXPECT_EQ(info_with_cng.sample_rate_hz, |
| 361 | receiver_->last_packet_sample_rate_hz()); |
Fredrik Solenberg | f693bfa | 2018-12-11 12:22:10 +0100 | [diff] [blame] | 362 | EXPECT_EQ(codecs.at(i), receiver_->LastDecoder()->second); |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 363 | } |
| 364 | } |
Peter Boström | e2976c8 | 2016-01-04 22:44:05 +0100 | [diff] [blame] | 365 | #endif |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 366 | |
Niels Möller | 3247244 | 2019-09-04 10:14:51 +0200 | [diff] [blame] | 367 | // Check if the statistics are initialized correctly. Before any call to ACM |
| 368 | // all fields have to be zero. |
| 369 | #if defined(WEBRTC_ANDROID) |
| 370 | #define MAYBE_InitializedToZero DISABLED_InitializedToZero |
| 371 | #else |
| 372 | #define MAYBE_InitializedToZero InitializedToZero |
| 373 | #endif |
| 374 | TEST_F(AcmReceiverTestOldApi, MAYBE_InitializedToZero) { |
| 375 | AudioDecodingCallStats stats; |
| 376 | receiver_->GetDecodingCallStatistics(&stats); |
| 377 | EXPECT_EQ(0, stats.calls_to_neteq); |
| 378 | EXPECT_EQ(0, stats.calls_to_silence_generator); |
| 379 | EXPECT_EQ(0, stats.decoded_normal); |
| 380 | EXPECT_EQ(0, stats.decoded_cng); |
| 381 | EXPECT_EQ(0, stats.decoded_neteq_plc); |
| 382 | EXPECT_EQ(0, stats.decoded_plc_cng); |
| 383 | EXPECT_EQ(0, stats.decoded_muted_output); |
| 384 | } |
| 385 | |
| 386 | // Insert some packets and pull audio. Check statistics are valid. Then, |
| 387 | // simulate packet loss and check if PLC and PLC-to-CNG statistics are |
| 388 | // correctly updated. |
| 389 | #if defined(WEBRTC_ANDROID) |
| 390 | #define MAYBE_NetEqCalls DISABLED_NetEqCalls |
| 391 | #else |
| 392 | #define MAYBE_NetEqCalls NetEqCalls |
| 393 | #endif |
| 394 | TEST_F(AcmReceiverTestOldApi, MAYBE_NetEqCalls) { |
| 395 | AudioDecodingCallStats stats; |
| 396 | const int kNumNormalCalls = 10; |
| 397 | const int kSampleRateHz = 16000; |
| 398 | const int kNumSamples10ms = kSampleRateHz / 100; |
| 399 | const int kFrameSizeMs = 10; // Multiple of 10. |
| 400 | const int kFrameSizeSamples = kFrameSizeMs / 10 * kNumSamples10ms; |
| 401 | const int kPayloadSizeBytes = kFrameSizeSamples * sizeof(int16_t); |
| 402 | const uint8_t kPayloadType = 111; |
| 403 | RTPHeader rtp_header; |
| 404 | AudioFrame audio_frame; |
| 405 | bool muted; |
| 406 | |
| 407 | receiver_->SetCodecs( |
| 408 | {{kPayloadType, SdpAudioFormat("L16", kSampleRateHz, 1)}}); |
| 409 | rtp_header.sequenceNumber = 0xABCD; |
| 410 | rtp_header.timestamp = 0xABCDEF01; |
| 411 | rtp_header.payloadType = kPayloadType; |
| 412 | rtp_header.markerBit = false; |
| 413 | rtp_header.ssrc = 0x1234; |
| 414 | rtp_header.numCSRCs = 0; |
| 415 | rtp_header.payload_type_frequency = kSampleRateHz; |
| 416 | |
| 417 | for (int num_calls = 0; num_calls < kNumNormalCalls; ++num_calls) { |
| 418 | const uint8_t kPayload[kPayloadSizeBytes] = {0}; |
| 419 | ASSERT_EQ(0, receiver_->InsertPacket(rtp_header, kPayload)); |
| 420 | ++rtp_header.sequenceNumber; |
| 421 | rtp_header.timestamp += kFrameSizeSamples; |
| 422 | ASSERT_EQ(0, receiver_->GetAudio(-1, &audio_frame, &muted)); |
| 423 | EXPECT_FALSE(muted); |
| 424 | } |
| 425 | receiver_->GetDecodingCallStatistics(&stats); |
| 426 | EXPECT_EQ(kNumNormalCalls, stats.calls_to_neteq); |
| 427 | EXPECT_EQ(0, stats.calls_to_silence_generator); |
| 428 | EXPECT_EQ(kNumNormalCalls, stats.decoded_normal); |
| 429 | EXPECT_EQ(0, stats.decoded_cng); |
| 430 | EXPECT_EQ(0, stats.decoded_neteq_plc); |
| 431 | EXPECT_EQ(0, stats.decoded_plc_cng); |
| 432 | EXPECT_EQ(0, stats.decoded_muted_output); |
| 433 | |
| 434 | const int kNumPlc = 3; |
| 435 | const int kNumPlcCng = 5; |
| 436 | |
| 437 | // Simulate packet-loss. NetEq first performs PLC then PLC fades to CNG. |
| 438 | for (int n = 0; n < kNumPlc + kNumPlcCng; ++n) { |
| 439 | ASSERT_EQ(0, receiver_->GetAudio(-1, &audio_frame, &muted)); |
| 440 | EXPECT_FALSE(muted); |
| 441 | } |
| 442 | receiver_->GetDecodingCallStatistics(&stats); |
| 443 | EXPECT_EQ(kNumNormalCalls + kNumPlc + kNumPlcCng, stats.calls_to_neteq); |
| 444 | EXPECT_EQ(0, stats.calls_to_silence_generator); |
| 445 | EXPECT_EQ(kNumNormalCalls, stats.decoded_normal); |
| 446 | EXPECT_EQ(0, stats.decoded_cng); |
| 447 | EXPECT_EQ(kNumPlc, stats.decoded_neteq_plc); |
| 448 | EXPECT_EQ(kNumPlcCng, stats.decoded_plc_cng); |
| 449 | EXPECT_EQ(0, stats.decoded_muted_output); |
| 450 | // TODO(henrik.lundin) Add a test with muted state enabled. |
| 451 | } |
| 452 | |
andresp@webrtc.org | 4f6f22f | 2014-09-23 11:37:57 +0000 | [diff] [blame] | 453 | } // namespace acm2 |
| 454 | |
| 455 | } // namespace webrtc |