blob: dd6f7296df433b59ab95ffe6394e595b5ab48fae [file] [log] [blame]
aleloi24899e52017-02-21 13:06:291/*
2 * Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
3 *
4 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
9 */
10
Mirko Bonadei92ea95e2017-09-15 04:47:3111#include "modules/audio_mixer/frame_combiner.h"
aleloi24899e52017-02-21 13:06:2912
13#include <algorithm>
14#include <array>
Yves Gerey3e707812018-11-28 15:47:4915#include <cstdint>
16#include <iterator>
17#include <string>
aleloi24899e52017-02-21 13:06:2918
Mirko Bonadei92ea95e2017-09-15 04:47:3119#include "api/array_view.h"
Alex Loiko507e8d12018-02-27 12:51:4720#include "common_audio/include/audio_util.h"
Mirko Bonadei92ea95e2017-09-15 04:47:3121#include "modules/audio_mixer/audio_frame_manipulator.h"
22#include "modules/audio_mixer/audio_mixer_impl.h"
Yves Gerey3e707812018-11-28 15:47:4923#include "modules/audio_processing/include/audio_frame_view.h"
Alex Loiko8396e342018-06-21 10:04:0524#include "modules/audio_processing/include/audio_processing.h"
Alex Loiko507e8d12018-02-27 12:51:4725#include "modules/audio_processing/logging/apm_data_dumper.h"
Alex Loiko6f2fcb42018-03-14 11:27:0526#include "rtc_base/arraysize.h"
Mirko Bonadei92ea95e2017-09-15 04:47:3127#include "rtc_base/checks.h"
Alex Loiko6f2fcb42018-03-14 11:27:0528#include "system_wrappers/include/metrics.h"
aleloi24899e52017-02-21 13:06:2929
30namespace webrtc {
31namespace {
32
33// Stereo, 48 kHz, 10 ms.
Alex Loiko507e8d12018-02-27 12:51:4734constexpr int kMaximumAmountOfChannels = 2;
35constexpr int kMaximumChannelSize = 48 * AudioMixerImpl::kFrameDurationInMs;
aleloi24899e52017-02-21 13:06:2936
Alex Loiko507e8d12018-02-27 12:51:4737using OneChannelBuffer = std::array<float, kMaximumChannelSize>;
aleloi24899e52017-02-21 13:06:2938
Alex Loiko507e8d12018-02-27 12:51:4739void SetAudioFrameFields(const std::vector<AudioFrame*>& mix_list,
40 size_t number_of_channels,
41 int sample_rate,
42 size_t number_of_streams,
43 AudioFrame* audio_frame_for_mixing) {
44 const size_t samples_per_channel = static_cast<size_t>(
45 (sample_rate * webrtc::AudioMixerImpl::kFrameDurationInMs) / 1000);
46
47 // TODO(minyue): Issue bugs.webrtc.org/3390.
48 // Audio frame timestamp. The 'timestamp_' field is set to dummy
49 // value '0', because it is only supported in the one channel case and
50 // is then updated in the helper functions.
51 audio_frame_for_mixing->UpdateFrame(
52 0, nullptr, samples_per_channel, sample_rate, AudioFrame::kUndefined,
53 AudioFrame::kVadUnknown, number_of_channels);
54
55 if (mix_list.empty()) {
56 audio_frame_for_mixing->elapsed_time_ms_ = -1;
57 } else if (mix_list.size() == 1) {
58 audio_frame_for_mixing->timestamp_ = mix_list[0]->timestamp_;
59 audio_frame_for_mixing->elapsed_time_ms_ = mix_list[0]->elapsed_time_ms_;
Niklas Enbomef8a3eb2018-10-04 23:21:4760 audio_frame_for_mixing->ntp_time_ms_ = mix_list[0]->ntp_time_ms_;
Alex Loiko507e8d12018-02-27 12:51:4761 }
62}
63
64void MixFewFramesWithNoLimiter(const std::vector<AudioFrame*>& mix_list,
65 AudioFrame* audio_frame_for_mixing) {
66 if (mix_list.empty()) {
67 audio_frame_for_mixing->Mute();
68 return;
69 }
70 RTC_DCHECK_LE(mix_list.size(), 1);
71 std::copy(mix_list[0]->data(),
72 mix_list[0]->data() +
73 mix_list[0]->num_channels_ * mix_list[0]->samples_per_channel_,
74 audio_frame_for_mixing->mutable_data());
75}
76
77std::array<OneChannelBuffer, kMaximumAmountOfChannels> MixToFloatFrame(
78 const std::vector<AudioFrame*>& mix_list,
79 size_t samples_per_channel,
80 size_t number_of_channels) {
81 // Convert to FloatS16 and mix.
82 using OneChannelBuffer = std::array<float, kMaximumChannelSize>;
83 std::array<OneChannelBuffer, kMaximumAmountOfChannels> mixing_buffer{};
84
85 for (size_t i = 0; i < mix_list.size(); ++i) {
86 const AudioFrame* const frame = mix_list[i];
87 for (size_t j = 0; j < number_of_channels; ++j) {
88 for (size_t k = 0; k < samples_per_channel; ++k) {
89 mixing_buffer[j][k] += frame->data()[number_of_channels * k + j];
90 }
91 }
92 }
93 return mixing_buffer;
94}
95
Alessio Bazzica3e4c77f2018-11-01 20:31:3896void RunLimiter(AudioFrameView<float> mixing_buffer_view, Limiter* limiter) {
Alex Loiko507e8d12018-02-27 12:51:4797 const size_t sample_rate = mixing_buffer_view.samples_per_channel() * 1000 /
98 AudioMixerImpl::kFrameDurationInMs;
Alessio Bazzica3e4c77f2018-11-01 20:31:3899 // TODO(alessiob): Avoid calling SetSampleRate every time.
Alex Loiko8396e342018-06-21 10:04:05100 limiter->SetSampleRate(sample_rate);
101 limiter->Process(mixing_buffer_view);
Alex Loiko507e8d12018-02-27 12:51:47102}
103
104// Both interleaves and rounds.
105void InterleaveToAudioFrame(AudioFrameView<const float> mixing_buffer_view,
106 AudioFrame* audio_frame_for_mixing) {
107 const size_t number_of_channels = mixing_buffer_view.num_channels();
108 const size_t samples_per_channel = mixing_buffer_view.samples_per_channel();
109 // Put data in the result frame.
110 for (size_t i = 0; i < number_of_channels; ++i) {
111 for (size_t j = 0; j < samples_per_channel; ++j) {
112 audio_frame_for_mixing->mutable_data()[number_of_channels * j + i] =
113 FloatS16ToS16(mixing_buffer_view.channel(i)[j]);
114 }
115 }
116}
aleloi24899e52017-02-21 13:06:29117} // namespace
118
Alex Loiko507e8d12018-02-27 12:51:47119FrameCombiner::FrameCombiner(bool use_limiter)
Alex Loiko8396e342018-06-21 10:04:05120 : data_dumper_(new ApmDataDumper(0)),
Alessio Bazzica3e4c77f2018-11-01 20:31:38121 limiter_(static_cast<size_t>(48000), data_dumper_.get(), "AudioMixer"),
122 use_limiter_(use_limiter) {}
aleloi24899e52017-02-21 13:06:29123
124FrameCombiner::~FrameCombiner() = default;
125
126void FrameCombiner::Combine(const std::vector<AudioFrame*>& mix_list,
127 size_t number_of_channels,
128 int sample_rate,
aleloi2c9306e2017-03-29 11:25:16129 size_t number_of_streams,
Alex Loiko507e8d12018-02-27 12:51:47130 AudioFrame* audio_frame_for_mixing) {
aleloi24899e52017-02-21 13:06:29131 RTC_DCHECK(audio_frame_for_mixing);
Alex Loikob9a02e52018-03-19 13:32:05132
133 LogMixingStats(mix_list, sample_rate, number_of_streams);
134
Alex Loiko507e8d12018-02-27 12:51:47135 SetAudioFrameFields(mix_list, number_of_channels, sample_rate,
136 number_of_streams, audio_frame_for_mixing);
137
aleloi24899e52017-02-21 13:06:29138 const size_t samples_per_channel = static_cast<size_t>(
139 (sample_rate * webrtc::AudioMixerImpl::kFrameDurationInMs) / 1000);
140
141 for (const auto* frame : mix_list) {
142 RTC_DCHECK_EQ(samples_per_channel, frame->samples_per_channel_);
143 RTC_DCHECK_EQ(sample_rate, frame->sample_rate_hz_);
144 }
145
Alex Loiko507e8d12018-02-27 12:51:47146 // The 'num_channels_' field of frames in 'mix_list' could be
147 // different from 'number_of_channels'.
aleloi24899e52017-02-21 13:06:29148 for (auto* frame : mix_list) {
149 RemixFrame(number_of_channels, frame);
150 }
151
Alex Loiko507e8d12018-02-27 12:51:47152 if (number_of_streams <= 1) {
153 MixFewFramesWithNoLimiter(mix_list, audio_frame_for_mixing);
154 return;
aleloi24899e52017-02-21 13:06:29155 }
Alex Loiko507e8d12018-02-27 12:51:47156
157 std::array<OneChannelBuffer, kMaximumAmountOfChannels> mixing_buffer =
158 MixToFloatFrame(mix_list, samples_per_channel, number_of_channels);
159
160 // Put float data in an AudioFrameView.
161 std::array<float*, kMaximumAmountOfChannels> channel_pointers{};
162 for (size_t i = 0; i < number_of_channels; ++i) {
163 channel_pointers[i] = &mixing_buffer[i][0];
164 }
165 AudioFrameView<float> mixing_buffer_view(
166 &channel_pointers[0], number_of_channels, samples_per_channel);
167
Alex Loiko8396e342018-06-21 10:04:05168 if (use_limiter_) {
169 RunLimiter(mixing_buffer_view, &limiter_);
Alex Loiko507e8d12018-02-27 12:51:47170 }
171
172 InterleaveToAudioFrame(mixing_buffer_view, audio_frame_for_mixing);
Alex Loiko6f2fcb42018-03-14 11:27:05173}
174
175void FrameCombiner::LogMixingStats(const std::vector<AudioFrame*>& mix_list,
176 int sample_rate,
177 size_t number_of_streams) const {
178 // Log every second.
179 uma_logging_counter_++;
180 if (uma_logging_counter_ > 1000 / AudioMixerImpl::kFrameDurationInMs) {
181 uma_logging_counter_ = 0;
182 RTC_HISTOGRAM_COUNTS_100("WebRTC.Audio.AudioMixer.NumIncomingStreams",
183 static_cast<int>(number_of_streams));
184 RTC_HISTOGRAM_ENUMERATION(
185 "WebRTC.Audio.AudioMixer.NumIncomingActiveStreams",
186 static_cast<int>(mix_list.size()),
187 AudioMixerImpl::kMaximumAmountOfMixedAudioSources);
188
189 using NativeRate = AudioProcessing::NativeRate;
190 static constexpr NativeRate native_rates[] = {
191 NativeRate::kSampleRate8kHz, NativeRate::kSampleRate16kHz,
192 NativeRate::kSampleRate32kHz, NativeRate::kSampleRate48kHz};
193 const auto* rate_position = std::lower_bound(
194 std::begin(native_rates), std::end(native_rates), sample_rate);
195
196 RTC_HISTOGRAM_ENUMERATION(
197 "WebRTC.Audio.AudioMixer.MixingRate",
198 std::distance(std::begin(native_rates), rate_position),
199 arraysize(native_rates));
200 }
aleloi24899e52017-02-21 13:06:29201}
yujo36b1a5f2017-06-12 19:45:32202
aleloi24899e52017-02-21 13:06:29203} // namespace webrtc