Blame - audio/audio_transport_impl.cc - webrtc.googlesource.com/src

blob: 44e95aa909a66967f750af5c3887bc8f2896cd91 [file] [log] [blame]

Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	1	/*
				2	* Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
				3	*
				4	* Use of this source code is governed by a BSD-style license
				5	* that can be found in the LICENSE file in the root of the source
				6	* tree. An additional intellectual property rights grant can be found
				7	* in the file PATENTS. All contributing project authors may
				8	* be found in the AUTHORS file in the root of the source tree.
				9	*/
				10
				11	#include "audio/audio_transport_impl.h"
				12
				13	#include <algorithm>
				14	#include <memory>
				15	#include <utility>
				16
Fredrik Solenberg	a8b7c7f	2018-01-17 11:18:31 +0100	[diff] [blame]	17	#include "audio/remix_resample.h"
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	18	#include "audio/utility/audio_frame_operations.h"
				19	#include "call/audio_send_stream.h"
				20	#include "rtc_base/logging.h"
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	21
				22	namespace webrtc {
				23
				24	namespace {
				25
				26	// We want to process at the lowest sample rate and channel count possible
				27	// without losing information. Choose the lowest native rate at least equal to
				28	// the minimum of input and codec rates, choose lowest channel count, and
				29	// configure the audio frame.
				30	void InitializeCaptureFrame(int input_sample_rate,
				31	int send_sample_rate_hz,
				32	size_t input_num_channels,
				33	size_t send_num_channels,
				34	AudioFrame* audio_frame) {
				35	RTC_DCHECK(audio_frame);
				36	int min_processing_rate_hz = std::min(input_sample_rate, send_sample_rate_hz);
				37	for (int native_rate_hz : AudioProcessing::kNativeSampleRatesHz) {
				38	audio_frame->sample_rate_hz_ = native_rate_hz;
				39	if (audio_frame->sample_rate_hz_ >= min_processing_rate_hz) {
				40	break;
				41	}
				42	}
				43	audio_frame->num_channels_ = std::min(input_num_channels, send_num_channels);
				44	}
				45
henrika	649a385	2017-12-22 13:58:29 +0100	[diff] [blame]	46	void ProcessCaptureFrame(uint32_t delay_ms,
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	47	bool key_pressed,
				48	bool swap_stereo_channels,
				49	AudioProcessing* audio_processing,
				50	AudioFrame* audio_frame) {
				51	RTC_DCHECK(audio_processing);
				52	RTC_DCHECK(audio_frame);
				53	RTC_DCHECK(
				54	!audio_processing->echo_cancellation()->is_drift_compensation_enabled());
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	55	audio_processing->set_stream_delay_ms(delay_ms);
				56	audio_processing->set_stream_key_pressed(key_pressed);
henrika	649a385	2017-12-22 13:58:29 +0100	[diff] [blame]	57	int error = audio_processing->ProcessStream(audio_frame);
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	58	RTC_DCHECK_EQ(0, error) << "ProcessStream() error: " << error;
				59	if (swap_stereo_channels) {
				60	AudioFrameOperations::SwapStereoChannels(audio_frame);
				61	}
				62	}
				63
				64	// Resample audio in \|frame\| to given sample rate preserving the
				65	// channel count and place the result in \|destination\|.
				66	int Resample(const AudioFrame& frame,
				67	const int destination_sample_rate,
				68	PushResampler<int16_t>* resampler,
				69	int16_t* destination) {
				70	const int number_of_channels = static_cast<int>(frame.num_channels_);
				71	const int target_number_of_samples_per_channel =
				72	destination_sample_rate / 100;
				73	resampler->InitializeIfNeeded(frame.sample_rate_hz_, destination_sample_rate,
				74	number_of_channels);
				75
				76	// TODO(yujo): make resampler take an AudioFrame, and add special case
				77	// handling of muted frames.
				78	return resampler->Resample(
				79	frame.data(), frame.samples_per_channel_ * number_of_channels,
				80	destination, number_of_channels * target_number_of_samples_per_channel);
				81	}
				82	} // namespace
				83
				84	AudioTransportImpl::AudioTransportImpl(AudioMixer* mixer,
henrika	649a385	2017-12-22 13:58:29 +0100	[diff] [blame]	85	AudioProcessing* audio_processing)
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame^]	86	: audio_processing_(audio_processing), mixer_(mixer) {
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	87	RTC_DCHECK(mixer);
				88	RTC_DCHECK(audio_processing);
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	89	}
				90
				91	AudioTransportImpl::~AudioTransportImpl() {}
				92
				93	// Not used in Chromium. Process captured audio and distribute to all sending
				94	// streams, and try to do this at the lowest possible sample rate.
				95	int32_t AudioTransportImpl::RecordedDataIsAvailable(
				96	const void* audio_data,
				97	const size_t number_of_frames,
				98	const size_t bytes_per_sample,
				99	const size_t number_of_channels,
				100	const uint32_t sample_rate,
				101	const uint32_t audio_delay_milliseconds,
				102	const int32_t /clock_drift/,
henrika	649a385	2017-12-22 13:58:29 +0100	[diff] [blame]	103	const uint32_t /volume/,
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	104	const bool key_pressed,
				105	uint32_t& /new_mic_volume/) { // NOLINT: to avoid changing APIs
				106	RTC_DCHECK(audio_data);
				107	RTC_DCHECK_GE(number_of_channels, 1);
				108	RTC_DCHECK_LE(number_of_channels, 2);
				109	RTC_DCHECK_EQ(2 * number_of_channels, bytes_per_sample);
				110	RTC_DCHECK_GE(sample_rate, AudioProcessing::NativeRate::kSampleRate8kHz);
				111	// 100 = 1 second / data duration (10 ms).
				112	RTC_DCHECK_EQ(number_of_frames * 100, sample_rate);
				113	RTC_DCHECK_LE(bytes_per_sample * number_of_frames * number_of_channels,
				114	AudioFrame::kMaxDataSizeBytes);
				115
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	116	int send_sample_rate_hz = 0;
				117	size_t send_num_channels = 0;
				118	bool swap_stereo_channels = false;
				119	{
				120	rtc::CritScope lock(&capture_lock_);
				121	send_sample_rate_hz = send_sample_rate_hz_;
				122	send_num_channels = send_num_channels_;
				123	swap_stereo_channels = swap_stereo_channels_;
				124	}
				125
				126	std::unique_ptr<AudioFrame> audio_frame(new AudioFrame());
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame^]	127	InitializeCaptureFrame(sample_rate, send_sample_rate_hz, number_of_channels,
				128	send_num_channels, audio_frame.get());
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	129	voe::RemixAndResample(static_cast<const int16_t*>(audio_data),
				130	number_of_frames, number_of_channels, sample_rate,
				131	&capture_resampler_, audio_frame.get());
henrika	649a385	2017-12-22 13:58:29 +0100	[diff] [blame]	132	ProcessCaptureFrame(audio_delay_milliseconds, key_pressed,
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	133	swap_stereo_channels, audio_processing_,
				134	audio_frame.get());
				135
				136	// Typing detection (utilizes the APM/VAD decision). We let the VAD determine
				137	// if we're using this feature or not.
				138	// TODO(solenberg): is_enabled() takes a lock. Work around that.
				139	bool typing_detected = false;
				140	if (audio_processing_->voice_detection()->is_enabled()) {
				141	if (audio_frame->vad_activity_ != AudioFrame::kVadUnknown) {
				142	bool vad_active = audio_frame->vad_activity_ == AudioFrame::kVadActive;
				143	typing_detected = typing_detection_.Process(key_pressed, vad_active);
				144	}
				145	}
				146
				147	// Measure audio level of speech after all processing.
				148	double sample_duration = static_cast<double>(number_of_frames) / sample_rate;
				149	audio_level_.ComputeLevel(*audio_frame.get(), sample_duration);
				150
				151	// Copy frame and push to each sending stream. The copy is required since an
				152	// encoding task will be posted internally to each stream.
				153	{
				154	rtc::CritScope lock(&capture_lock_);
				155	typing_noise_detected_ = typing_detected;
				156
				157	RTC_DCHECK_GT(audio_frame->samples_per_channel_, 0);
				158	if (!sending_streams_.empty()) {
				159	auto it = sending_streams_.begin();
				160	while (++it != sending_streams_.end()) {
				161	std::unique_ptr<AudioFrame> audio_frame_copy(new AudioFrame());
				162	audio_frame_copy->CopyFrom(*audio_frame.get());
				163	(*it)->SendAudioData(std::move(audio_frame_copy));
				164	}
				165	// Send the original frame to the first stream w/o copying.
				166	(*sending_streams_.begin())->SendAudioData(std::move(audio_frame));
				167	}
				168	}
				169
				170	return 0;
				171	}
				172
				173	// Mix all received streams, feed the result to the AudioProcessing module, then
				174	// resample the result to the requested output rate.
				175	int32_t AudioTransportImpl::NeedMorePlayData(const size_t nSamples,
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame^]	176	const size_t nBytesPerSample,
				177	const size_t nChannels,
				178	const uint32_t samplesPerSec,
				179	void* audioSamples,
				180	size_t& nSamplesOut,
				181	int64_t* elapsed_time_ms,
				182	int64_t* ntp_time_ms) {
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	183	RTC_DCHECK_EQ(sizeof(int16_t) * nChannels, nBytesPerSample);
				184	RTC_DCHECK_GE(nChannels, 1);
				185	RTC_DCHECK_LE(nChannels, 2);
				186	RTC_DCHECK_GE(
				187	samplesPerSec,
				188	static_cast<uint32_t>(AudioProcessing::NativeRate::kSampleRate8kHz));
				189
				190	// 100 = 1 second / data duration (10 ms).
				191	RTC_DCHECK_EQ(nSamples * 100, samplesPerSec);
				192	RTC_DCHECK_LE(nBytesPerSample * nSamples * nChannels,
				193	AudioFrame::kMaxDataSizeBytes);
				194
				195	mixer_->Mix(nChannels, &mixed_frame_);
				196	*elapsed_time_ms = mixed_frame_.elapsed_time_ms_;
				197	*ntp_time_ms = mixed_frame_.ntp_time_ms_;
				198
				199	const auto error = audio_processing_->ProcessReverseStream(&mixed_frame_);
				200	RTC_DCHECK_EQ(error, AudioProcessing::kNoError);
				201
				202	nSamplesOut = Resample(mixed_frame_, samplesPerSec, &render_resampler_,
				203	static_cast<int16_t*>(audioSamples));
				204	RTC_DCHECK_EQ(nSamplesOut, nChannels * nSamples);
				205	return 0;
				206	}
				207
				208	// Used by Chromium - same as NeedMorePlayData() but because Chrome has its
				209	// own APM instance, does not call audio_processing_->ProcessReverseStream().
				210	void AudioTransportImpl::PullRenderData(int bits_per_sample,
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame^]	211	int sample_rate,
				212	size_t number_of_channels,
				213	size_t number_of_frames,
				214	void* audio_data,
				215	int64_t* elapsed_time_ms,
				216	int64_t* ntp_time_ms) {
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	217	RTC_DCHECK_EQ(bits_per_sample, 16);
				218	RTC_DCHECK_GE(number_of_channels, 1);
				219	RTC_DCHECK_LE(number_of_channels, 2);
				220	RTC_DCHECK_GE(sample_rate, AudioProcessing::NativeRate::kSampleRate8kHz);
				221
				222	// 100 = 1 second / data duration (10 ms).
				223	RTC_DCHECK_EQ(number_of_frames * 100, sample_rate);
				224
				225	// 8 = bits per byte.
				226	RTC_DCHECK_LE(bits_per_sample / 8 * number_of_frames * number_of_channels,
				227	AudioFrame::kMaxDataSizeBytes);
				228	mixer_->Mix(number_of_channels, &mixed_frame_);
				229	*elapsed_time_ms = mixed_frame_.elapsed_time_ms_;
				230	*ntp_time_ms = mixed_frame_.ntp_time_ms_;
				231
				232	auto output_samples = Resample(mixed_frame_, sample_rate, &render_resampler_,
				233	static_cast<int16_t*>(audio_data));
				234	RTC_DCHECK_EQ(output_samples, number_of_channels * number_of_frames);
				235	}
				236
				237	void AudioTransportImpl::UpdateSendingStreams(
Yves Gerey	665174f	2018-06-19 15:03:05 +0200	[diff] [blame^]	238	std::vector<AudioSendStream*> streams,
				239	int send_sample_rate_hz,
Fredrik Solenberg	2a87797	2017-12-15 16:42:15 +0100	[diff] [blame]	240	size_t send_num_channels) {
				241	rtc::CritScope lock(&capture_lock_);
				242	sending_streams_ = std::move(streams);
				243	send_sample_rate_hz_ = send_sample_rate_hz;
				244	send_num_channels_ = send_num_channels;
				245	}
				246
				247	void AudioTransportImpl::SetStereoChannelSwapping(bool enable) {
				248	rtc::CritScope lock(&capture_lock_);
				249	swap_stereo_channels_ = enable;
				250	}
				251
				252	bool AudioTransportImpl::typing_noise_detected() const {
				253	rtc::CritScope lock(&capture_lock_);
				254	return typing_noise_detected_;
				255	}
				256	} // namespace webrtc