Blame - modules/audio_processing/audio_buffer.cc - webrtc.googlesource.com/src

2011-07-07 08:21:25 +0000

[diff] [blame]

1

/*

andrew@webrtc.org

63a5098

2012-05-02 23:56:37 +0000

[diff] [blame]

2

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

3

*

4

* Use of this source code is governed by a BSD-style license

5

* that can be found in the LICENSE file in the root of the source

6

* tree. An additional intellectual property rights grant can be found

7

* in the file PATENTS. All contributing project authors may

8

* be found in the AUTHORS file in the root of the source tree.

9

*/

10

Mirko Bonadei

92ea95e

2017-09-15 06:47:31 +0200

[diff] [blame]

11

#include "modules/audio_processing/audio_buffer.h"

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

12

Yves Gerey

988cc08

2018-10-23 12:03:01 +0200

[diff] [blame]

13

#include <string.h>

Jonas Olsson

a4d8737

2019-07-05 19:08:33 +0200

[diff] [blame]

14

Yves Gerey

988cc08

2018-10-23 12:03:01 +0200

[diff] [blame]

15

#include <cstdint>

16

Mirko Bonadei

92ea95e

2017-09-15 06:47:31 +0200

[diff] [blame]

17

#include "common_audio/channel_buffer.h"

18

#include "common_audio/include/audio_util.h"

19

#include "common_audio/resampler/push_sinc_resampler.h"

Yves Gerey

988cc08

2018-10-23 12:03:01 +0200

[diff] [blame]

20

#include "modules/audio_processing/splitting_filter.h"

Mirko Bonadei

92ea95e

2017-09-15 06:47:31 +0200

[diff] [blame]

21

#include "rtc_base/checks.h"

andrew@webrtc.org

755b04a

2011-11-15 16:57:56 +0000

[diff] [blame]

22

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

namespace webrtc {

namespace {

// Per-channel frame sizes recognised by this file.
constexpr size_t kSamplesPer32kHzChannel = 320;
constexpr size_t kSamplesPer48kHzChannel = 480;
constexpr size_t kSamplesPer192kHzChannel = 1920;
// Capacity of the per-channel scratch arrays declared in this file.
constexpr size_t kMaxSamplesPerChannel = kSamplesPer192kHzChannel;

// Maps a per-channel frame count to the number of frequency bands the buffer
// is split into: 2 bands for 320 frames, 3 bands for 480 frames, and a single
// band for every other size.
size_t NumBandsFromFramesPerChannel(size_t num_frames) {
  switch (num_frames) {
    case kSamplesPer32kHzChannel:
      return 2;
    case kSamplesPer48kHzChannel:
      return 3;
    default:
      return 1;
  }
}

}  // namespace

42

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

43

// Builds a buffer that takes audio in at `input_rate`, holds it at
// `buffer_rate` and hands it out at `output_rate`. Each per-channel frame
// count is the corresponding rate divided by 100. Resamplers are created only
// for the directions whose frame count differs from the buffer's, and the
// band-splitting state is created only when the buffer frame size maps to
// more than one band.
AudioBuffer::AudioBuffer(size_t input_rate,
                         size_t input_num_channels,
                         size_t buffer_rate,
                         size_t buffer_num_channels,
                         size_t output_rate)
    : input_num_frames_(
          rtc::CheckedDivExact(static_cast<int>(input_rate), 100)),
      input_num_channels_(input_num_channels),
      buffer_num_frames_(
          rtc::CheckedDivExact(static_cast<int>(buffer_rate), 100)),
      buffer_num_channels_(buffer_num_channels),
      output_num_frames_(
          rtc::CheckedDivExact(static_cast<int>(output_rate), 100)),
      num_channels_(buffer_num_channels),
      num_bands_(NumBandsFromFramesPerChannel(buffer_num_frames_)),
      num_split_frames_(rtc::CheckedDivExact(buffer_num_frames_, num_bands_)),
      data_(new ChannelBuffer<float>(buffer_num_frames_, buffer_num_channels_)),
      output_buffer_(
          new ChannelBuffer<float>(output_num_frames_, num_channels_)) {
  // Sanity checks on the derived sizes (debug builds only).
  RTC_DCHECK_GT(input_num_frames_, 0);
  RTC_DCHECK_GT(buffer_num_frames_, 0);
  RTC_DCHECK_GT(output_num_frames_, 0);
  RTC_DCHECK_GT(input_num_channels_, 0);
  RTC_DCHECK_GT(buffer_num_channels_, 0);
  RTC_DCHECK_LE(buffer_num_channels_, input_num_channels_);

  // One input resampler per buffer channel, only if the sizes differ.
  if (input_num_frames_ != buffer_num_frames_) {
    for (size_t ch = 0; ch != buffer_num_channels_; ++ch) {
      input_resamplers_.push_back(std::unique_ptr<PushSincResampler>(
          new PushSincResampler(input_num_frames_, buffer_num_frames_)));
    }
  }

  // Likewise for the output direction.
  if (output_num_frames_ != buffer_num_frames_) {
    for (size_t ch = 0; ch != buffer_num_channels_; ++ch) {
      output_resamplers_.push_back(std::unique_ptr<PushSincResampler>(
          new PushSincResampler(buffer_num_frames_, output_num_frames_)));
    }
  }

  // A single band needs neither split storage nor a splitting filter.
  if (num_bands_ <= 1) {
    return;
  }
  split_data_.reset(new ChannelBuffer<float>(
      buffer_num_frames_, buffer_num_channels_, num_bands_));
  splitting_filter_.reset(new SplittingFilter(
      buffer_num_channels_, num_bands_, buffer_num_frames_));
}

andrew@webrtc.org

2014-04-24 18:28:56 +0000

[diff] [blame]

94

// Nothing to release by hand; the members clean up after themselves.
AudioBuffer::~AudioBuffer() = default;

95

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

96

void AudioBuffer::set_downmixing_to_specific_channel(size_t channel) {

97

downmix_by_averaging_ = false;

98

RTC_DCHECK_GT(input_num_channels_, channel);

99

channel_for_downmixing_ = std::min(channel, input_num_channels_ - 1);

100

}

101

102

void AudioBuffer::set_downmixing_by_averaging() {

103

downmix_by_averaging_ = true;

104

}

105

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

106

void AudioBuffer::CopyFrom(const float* const* data,

Michael Graczyk

86c6d33

2015-07-23 11:41:39 -0700

[diff] [blame]

107

const StreamConfig& stream_config) {

kwiberg

2016-09-14 05:23:22 -0700

[diff] [blame]

108

RTC_DCHECK_EQ(stream_config.num_frames(), input_num_frames_);

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

109

RTC_DCHECK_EQ(stream_config.num_channels(), input_num_channels_);

110

RestoreNumChannels();

111

const bool downmix_needed = input_num_channels_ > 1 && num_channels_ == 1;

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

112

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

113

const bool resampling_needed = input_num_frames_ != buffer_num_frames_;

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

114

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

115

if (downmix_needed) {

116

RTC_DCHECK_GT(kMaxSamplesPerChannel, input_num_frames_);

117

118

std::array<float, kMaxSamplesPerChannel> downmix;

119

if (downmix_by_averaging_) {

120

const float kOneByNumChannels = 1.f / input_num_channels_;

121

for (size_t i = 0; i < input_num_frames_; ++i) {

122

float value = data[0][i];

123

for (size_t j = 1; j < input_num_channels_; ++j) {

124

value += data[j][i];

125

}

126

downmix[i] = value * kOneByNumChannels;

127

}

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

128

}

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

129

const float* downmixed_data =

130

downmix_by_averaging_ ? downmix.data() : data[channel_for_downmixing_];

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

131

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

132

if (resampling_needed) {

133

input_resamplers_[0]->Resample(downmixed_data, input_num_frames_,

134

data_->channels()[0], buffer_num_frames_);

135

}

136

const float* data_to_convert =

137

resampling_needed ? data_->channels()[0] : downmixed_data;

138

FloatToFloatS16(data_to_convert, buffer_num_frames_, data_->channels()[0]);

139

} else {

140

if (resampling_needed) {

141

for (size_t i = 0; i < num_channels_; ++i) {

142

input_resamplers_[i]->Resample(data[i], input_num_frames_,

143

data_->channels()[i],

144

buffer_num_frames_);

145

FloatToFloatS16(data_->channels()[i], buffer_num_frames_,

146

data_->channels()[i]);

147

}

148

} else {

149

for (size_t i = 0; i < num_channels_; ++i) {

150

FloatToFloatS16(data[i], buffer_num_frames_, data_->channels()[i]);

151

}

152

}

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

}

}

Michael Graczyk

2015-07-23 11:41:39 -0700

[diff] [blame]

156

void AudioBuffer::CopyTo(const StreamConfig& stream_config,

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

157

float* const* data) {

kwiberg

2016-09-14 05:23:22 -0700

[diff] [blame]

158

RTC_DCHECK_EQ(stream_config.num_frames(), output_num_frames_);

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

159

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

160

const bool resampling_needed = output_num_frames_ != buffer_num_frames_;

161

if (resampling_needed) {

Peter Kasting

6955870

2016-01-12 16:26:35 -0800

[diff] [blame]

162

for (size_t i = 0; i < num_channels_; ++i) {

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

163

FloatS16ToFloat(data_->channels()[i], buffer_num_frames_,

164

data_->channels()[i]);

165

output_resamplers_[i]->Resample(data_->channels()[i], buffer_num_frames_,

166

data[i], output_num_frames_);

167

}

168

} else {

169

for (size_t i = 0; i < num_channels_; ++i) {

170

FloatS16ToFloat(data_->channels()[i], buffer_num_frames_, data[i]);

andrew@webrtc.org

2014-04-22 21:00:04 +0000

[diff] [blame]

171

}

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

172

}

aluebs

b2328d1

2016-01-11 20:32:29 -0800

[diff] [blame]

173

Peter Kasting

6955870

2016-01-12 16:26:35 -0800

[diff] [blame]

174

for (size_t i = num_channels_; i < stream_config.num_channels(); ++i) {

aluebs

b2328d1

2016-01-11 20:32:29 -0800

[diff] [blame]

175

memcpy(data[i], data[0], output_num_frames_ * sizeof(**data));

176

}

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

177

}

178

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

179

void AudioBuffer::RestoreNumChannels() {

180

num_channels_ = buffer_num_channels_;

181

data_->set_num_channels(buffer_num_channels_);

Alejandro Luebs

a181c9a

2016-06-30 15:33:37 -0700

[diff] [blame]

182

if (split_data_.get()) {

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

183

split_data_->set_num_channels(buffer_num_channels_);

Alejandro Luebs

a181c9a

2016-06-30 15:33:37 -0700

[diff] [blame]

184

}

andrew@webrtc.org

17e4064

2014-03-04 20:58:13 +0000

[diff] [blame]

185

}

186

Peter Kasting

6955870

2016-01-12 16:26:35 -0800

[diff] [blame]

187

void AudioBuffer::set_num_channels(size_t num_channels) {

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

188

RTC_DCHECK_GE(buffer_num_channels_, num_channels);

aluebs@webrtc.org

27d106b

2014-12-11 17:09:21 +0000

[diff] [blame]

189

num_channels_ = num_channels;

Alejandro Luebs

a181c9a

2016-06-30 15:33:37 -0700

[diff] [blame]

190

data_->set_num_channels(num_channels);

191

if (split_data_.get()) {

192

split_data_->set_num_channels(num_channels);

193

}

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

194

}

195

Alejandro Luebs

05c7605

2015-05-20 14:39:39 -0700

[diff] [blame]

196

// The resampler is only for supporting 48kHz to 16kHz in the reverse stream.

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

197

void AudioBuffer::CopyFrom(const AudioFrame* frame) {

198

RTC_DCHECK_EQ(frame->num_channels_, input_num_channels_);

kwiberg

2016-09-14 05:23:22 -0700

[diff] [blame]

199

RTC_DCHECK_EQ(frame->samples_per_channel_, input_num_frames_);

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

200

RestoreNumChannels();

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

201

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

202

const bool resampling_required = input_num_frames_ != buffer_num_frames_;

Alejandro Luebs

05c7605

2015-05-20 14:39:39 -0700

[diff] [blame]

203

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

204

const int16_t* interleaved = frame->data();

205

if (num_channels_ == 1) {

206

if (input_num_channels_ == 1) {

207

if (resampling_required) {

208

std::array<float, kMaxSamplesPerChannel> float_buffer;

209

S16ToFloatS16(interleaved, input_num_frames_, float_buffer.data());

210

input_resamplers_[0]->Resample(float_buffer.data(), input_num_frames_,

211

data_->channels()[0],

212

buffer_num_frames_);

213

} else {

214

S16ToFloatS16(interleaved, input_num_frames_, data_->channels()[0]);

215

}

216

} else {

217

std::array<float, kMaxSamplesPerChannel> float_buffer;

218

float* downmixed_data =

219

resampling_required ? float_buffer.data() : data_->channels()[0];

220

if (downmix_by_averaging_) {

221

for (size_t j = 0, k = 0; j < input_num_frames_; ++j) {

222

int32_t sum = 0;

223

for (size_t i = 0; i < input_num_channels_; ++i, ++k) {

224

sum += interleaved[k];

225

}

226

downmixed_data[j] = sum / static_cast<int16_t>(input_num_channels_);

227

}

228

} else {

229

for (size_t j = 0, k = channel_for_downmixing_; j < input_num_frames_;

230

++j, k += input_num_channels_) {

231

downmixed_data[j] = interleaved[k];

}

}

if (resampling_required) {

236

input_resamplers_[0]->Resample(downmixed_data, input_num_frames_,

237

data_->channels()[0],

buffer_num_frames_);

}

}

} else {

auto deinterleave_channel = [](size_t channel, size_t num_channels,

243

size_t samples_per_channel, const int16_t* x,

244

float* y) {

245

for (size_t j = 0, k = channel; j < samples_per_channel;

246

++j, k += num_channels) {

y[j] = x[k];

}

};

if (resampling_required) {

252

std::array<float, kMaxSamplesPerChannel> float_buffer;

253

for (size_t i = 0; i < num_channels_; ++i) {

254

deinterleave_channel(i, num_channels_, input_num_frames_, interleaved,

255

float_buffer.data());

256

input_resamplers_[i]->Resample(float_buffer.data(), input_num_frames_,

257

data_->channels()[i],

buffer_num_frames_);

}

} else {

for (size_t i = 0; i < num_channels_; ++i) {

262

deinterleave_channel(i, num_channels_, input_num_frames_, interleaved,

263

data_->channels()[i]);

264

}

niklase@google.com

2011-07-07 08:21:25 +0000

[diff] [blame]

}

}

}

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

269

// Writes the buffer contents to `frame` as interleaved 16-bit audio.
//
// `frame` must have `output_num_frames_` samples per channel and either the
// same channel count as the buffer or, for a mono buffer, any channel count
// (both checked in debug builds). The audio is resampled when the buffer and
// output frame sizes differ, and each sample is converted with
// FloatS16ToS16().
//
// A mono buffer is replicated to every channel of `frame`. For a
// multi-channel buffer each channel is interleaved into its own slot; should
// `frame` have more channels than the buffer, the extra ones are filled with
// a copy of channel 0.
void AudioBuffer::CopyTo(AudioFrame* frame) const {
  RTC_DCHECK(frame->num_channels_ == num_channels_ || num_channels_ == 1);
  RTC_DCHECK_EQ(frame->samples_per_channel_, output_num_frames_);

  const bool resampling_required = buffer_num_frames_ != output_num_frames_;

  int16_t* interleaved = frame->mutable_data();
  if (num_channels_ == 1) {
    std::array<float, kMaxSamplesPerChannel> float_buffer;

    if (resampling_required) {
      output_resamplers_[0]->Resample(data_->channels()[0], buffer_num_frames_,
                                      float_buffer.data(), output_num_frames_);
    }
    const float* deinterleaved =
        resampling_required ? float_buffer.data() : data_->channels()[0];

    if (frame->num_channels_ == 1) {
      for (size_t j = 0; j < output_num_frames_; ++j) {
        interleaved[j] = FloatS16ToS16(deinterleaved[j]);
      }
    } else {
      // Convert each sample once and write it to every output channel.
      for (size_t i = 0, k = 0; i < output_num_frames_; ++i) {
        const int16_t sample = FloatS16ToS16(deinterleaved[i]);
        for (size_t j = 0; j < frame->num_channels_; ++j, ++k) {
          interleaved[k] = sample;
        }
      }
    }
  } else {
    // Converts `x` and writes it to slot `channel` of `y`, which is
    // interleaved with `num_channels` channels.
    auto interleave_channel = [](size_t channel, size_t num_channels,
                                 size_t samples_per_channel, const float* x,
                                 int16_t* y) {
      for (size_t k = 0, j = channel; k < samples_per_channel;
           ++k, j += num_channels) {
        y[j] = FloatS16ToS16(x[k]);
      }
    };

    if (resampling_required) {
      for (size_t i = 0; i < num_channels_; ++i) {
        std::array<float, kMaxSamplesPerChannel> float_buffer;
        output_resamplers_[i]->Resample(data_->channels()[i],
                                        buffer_num_frames_, float_buffer.data(),
                                        output_num_frames_);
        interleave_channel(i, frame->num_channels_, output_num_frames_,
                           float_buffer.data(), interleaved);
      }
    } else {
      for (size_t i = 0; i < num_channels_; ++i) {
        interleave_channel(i, frame->num_channels_, output_num_frames_,
                           data_->channels()[i], interleaved);
      }
    }

    // Fill any output channels beyond those held in the buffer. The source is
    // channel 0, which has just been written above; reading from channel
    // index `num_channels_` would copy samples this function never produced.
    for (size_t i = num_channels_; i < frame->num_channels_; ++i) {
      for (size_t j = 0, k = i, n = 0; j < output_num_frames_;
           ++j, k += frame->num_channels_, n += frame->num_channels_) {
        interleaved[k] = interleaved[n];
      }
    }
  }
}

332

aluebs@webrtc.org

be05c74

2014-11-14 22:18:10 +0000

[diff] [blame]

333

void AudioBuffer::SplitIntoFrequencyBands() {

aluebs@webrtc.org

2015-02-10 22:52:15 +0000

[diff] [blame]

334

splitting_filter_->Analysis(data_.get(), split_data_.get());

aluebs@webrtc.org

be05c74

2014-11-14 22:18:10 +0000

[diff] [blame]

335

}

336

337

void AudioBuffer::MergeFrequencyBands() {

aluebs@webrtc.org

2015-02-10 22:52:15 +0000

[diff] [blame]

338

splitting_filter_->Synthesis(split_data_.get(), data_.get());

aluebs@webrtc.org

be05c74

2014-11-14 22:18:10 +0000

[diff] [blame]

339

}

340

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

341

void AudioBuffer::ExportSplitChannelData(size_t channel,

Per Åhgren

2019-08-20 09:19:21 +0200

[diff] [blame]

342

int16_t* const* split_band_data) {

343

for (size_t k = 0; k < num_bands(); ++k) {

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

344

const float* band_data = split_bands(channel)[k];

345

Per Åhgren

2019-08-20 09:19:21 +0200

[diff] [blame]

346

RTC_DCHECK(split_band_data[k]);

347

RTC_DCHECK(band_data);

348

for (size_t i = 0; i < num_frames_per_band(); ++i) {

349

split_band_data[k][i] = FloatS16ToS16(band_data[i]);

}

}

}

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

354

void AudioBuffer::ImportSplitChannelData(

Per Åhgren

2019-08-20 09:19:21 +0200

[diff] [blame]

355

size_t channel,

356

const int16_t* const* split_band_data) {

357

for (size_t k = 0; k < num_bands(); ++k) {

Per Åhgren

2019-08-21 15:02:37 +0200

[diff] [blame]

358

float* band_data = split_bands(channel)[k];

Per Åhgren