xref: /aosp_15_r20/external/webrtc/modules/audio_mixer/audio_mixer_impl.cc (revision d9f758449e529ab9291ac668be2861e7a55c2422)
1 /*
2  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #include "modules/audio_mixer/audio_mixer_impl.h"
12 
13 #include <stdint.h>
14 
15 #include <algorithm>
16 #include <iterator>
17 #include <type_traits>
18 #include <utility>
19 
20 #include "modules/audio_mixer/audio_frame_manipulator.h"
21 #include "modules/audio_mixer/default_output_rate_calculator.h"
22 #include "rtc_base/checks.h"
23 #include "rtc_base/logging.h"
24 #include "rtc_base/trace_event.h"
25 
26 namespace webrtc {
27 
28 struct AudioMixerImpl::SourceStatus {
SourceStatuswebrtc::AudioMixerImpl::SourceStatus29   SourceStatus(Source* audio_source, bool is_mixed, float gain)
30       : audio_source(audio_source), is_mixed(is_mixed), gain(gain) {}
31   Source* audio_source = nullptr;
32   bool is_mixed = false;
33   float gain = 0.0f;
34 
35   // A frame that will be passed to audio_source->GetAudioFrameWithInfo.
36   AudioFrame audio_frame;
37 };
38 
39 namespace {
40 
41 struct SourceFrame {
42   SourceFrame() = default;
43 
SourceFramewebrtc::__anona8e001850111::SourceFrame44   SourceFrame(AudioMixerImpl::SourceStatus* source_status,
45               AudioFrame* audio_frame,
46               bool muted)
47       : source_status(source_status), audio_frame(audio_frame), muted(muted) {
48     RTC_DCHECK(source_status);
49     RTC_DCHECK(audio_frame);
50     if (!muted) {
51       energy = AudioMixerCalculateEnergy(*audio_frame);
52     }
53   }
54 
SourceFramewebrtc::__anona8e001850111::SourceFrame55   SourceFrame(AudioMixerImpl::SourceStatus* source_status,
56               AudioFrame* audio_frame,
57               bool muted,
58               uint32_t energy)
59       : source_status(source_status),
60         audio_frame(audio_frame),
61         muted(muted),
62         energy(energy) {
63     RTC_DCHECK(source_status);
64     RTC_DCHECK(audio_frame);
65   }
66 
67   AudioMixerImpl::SourceStatus* source_status = nullptr;
68   AudioFrame* audio_frame = nullptr;
69   bool muted = true;
70   uint32_t energy = 0;
71 };
72 
73 // ShouldMixBefore(a, b) is used to select mixer sources.
74 // Returns true if `a` is preferred over `b` as a source to be mixed.
ShouldMixBefore(const SourceFrame & a,const SourceFrame & b)75 bool ShouldMixBefore(const SourceFrame& a, const SourceFrame& b) {
76   if (a.muted != b.muted) {
77     return b.muted;
78   }
79 
80   const auto a_activity = a.audio_frame->vad_activity_;
81   const auto b_activity = b.audio_frame->vad_activity_;
82 
83   if (a_activity != b_activity) {
84     return a_activity == AudioFrame::kVadActive;
85   }
86 
87   return a.energy > b.energy;
88 }
89 
RampAndUpdateGain(rtc::ArrayView<const SourceFrame> mixed_sources_and_frames)90 void RampAndUpdateGain(
91     rtc::ArrayView<const SourceFrame> mixed_sources_and_frames) {
92   for (const auto& source_frame : mixed_sources_and_frames) {
93     float target_gain = source_frame.source_status->is_mixed ? 1.0f : 0.0f;
94     Ramp(source_frame.source_status->gain, target_gain,
95          source_frame.audio_frame);
96     source_frame.source_status->gain = target_gain;
97   }
98 }
99 
100 std::vector<std::unique_ptr<AudioMixerImpl::SourceStatus>>::const_iterator
FindSourceInList(AudioMixerImpl::Source const * audio_source,std::vector<std::unique_ptr<AudioMixerImpl::SourceStatus>> const * audio_source_list)101 FindSourceInList(
102     AudioMixerImpl::Source const* audio_source,
103     std::vector<std::unique_ptr<AudioMixerImpl::SourceStatus>> const*
104         audio_source_list) {
105   return std::find_if(
106       audio_source_list->begin(), audio_source_list->end(),
107       [audio_source](const std::unique_ptr<AudioMixerImpl::SourceStatus>& p) {
108         return p->audio_source == audio_source;
109       });
110 }
111 }  // namespace
112 
113 struct AudioMixerImpl::HelperContainers {
resizewebrtc::AudioMixerImpl::HelperContainers114   void resize(size_t size) {
115     audio_to_mix.resize(size);
116     audio_source_mixing_data_list.resize(size);
117     ramp_list.resize(size);
118     preferred_rates.resize(size);
119   }
120 
121   std::vector<AudioFrame*> audio_to_mix;
122   std::vector<SourceFrame> audio_source_mixing_data_list;
123   std::vector<SourceFrame> ramp_list;
124   std::vector<int> preferred_rates;
125 };
126 
AudioMixerImpl(std::unique_ptr<OutputRateCalculator> output_rate_calculator,bool use_limiter,int max_sources_to_mix)127 AudioMixerImpl::AudioMixerImpl(
128     std::unique_ptr<OutputRateCalculator> output_rate_calculator,
129     bool use_limiter,
130     int max_sources_to_mix)
131     : max_sources_to_mix_(max_sources_to_mix),
132       output_rate_calculator_(std::move(output_rate_calculator)),
133       audio_source_list_(),
134       helper_containers_(std::make_unique<HelperContainers>()),
135       frame_combiner_(use_limiter) {
136   RTC_CHECK_GE(max_sources_to_mix, 1) << "At least one source must be mixed";
137   audio_source_list_.reserve(max_sources_to_mix);
138   helper_containers_->resize(max_sources_to_mix);
139 }
140 
~AudioMixerImpl()141 AudioMixerImpl::~AudioMixerImpl() {}
142 
Create(int max_sources_to_mix)143 rtc::scoped_refptr<AudioMixerImpl> AudioMixerImpl::Create(
144     int max_sources_to_mix) {
145   return Create(std::unique_ptr<DefaultOutputRateCalculator>(
146                     new DefaultOutputRateCalculator()),
147                 /*use_limiter=*/true, max_sources_to_mix);
148 }
149 
Create(std::unique_ptr<OutputRateCalculator> output_rate_calculator,bool use_limiter,int max_sources_to_mix)150 rtc::scoped_refptr<AudioMixerImpl> AudioMixerImpl::Create(
151     std::unique_ptr<OutputRateCalculator> output_rate_calculator,
152     bool use_limiter,
153     int max_sources_to_mix) {
154   return rtc::make_ref_counted<AudioMixerImpl>(
155       std::move(output_rate_calculator), use_limiter, max_sources_to_mix);
156 }
157 
Mix(size_t number_of_channels,AudioFrame * audio_frame_for_mixing)158 void AudioMixerImpl::Mix(size_t number_of_channels,
159                          AudioFrame* audio_frame_for_mixing) {
160   TRACE_EVENT0("webrtc", "AudioMixerImpl::Mix");
161   RTC_DCHECK(number_of_channels >= 1);
162   MutexLock lock(&mutex_);
163 
164   size_t number_of_streams = audio_source_list_.size();
165 
166   std::transform(audio_source_list_.begin(), audio_source_list_.end(),
167                  helper_containers_->preferred_rates.begin(),
168                  [&](std::unique_ptr<SourceStatus>& a) {
169                    return a->audio_source->PreferredSampleRate();
170                  });
171 
172   int output_frequency = output_rate_calculator_->CalculateOutputRateFromRange(
173       rtc::ArrayView<const int>(helper_containers_->preferred_rates.data(),
174                                 number_of_streams));
175 
176   frame_combiner_.Combine(GetAudioFromSources(output_frequency),
177                           number_of_channels, output_frequency,
178                           number_of_streams, audio_frame_for_mixing);
179 }
180 
AddSource(Source * audio_source)181 bool AudioMixerImpl::AddSource(Source* audio_source) {
182   RTC_DCHECK(audio_source);
183   MutexLock lock(&mutex_);
184   RTC_DCHECK(FindSourceInList(audio_source, &audio_source_list_) ==
185              audio_source_list_.end())
186       << "Source already added to mixer";
187   audio_source_list_.emplace_back(new SourceStatus(audio_source, false, 0));
188   helper_containers_->resize(audio_source_list_.size());
189   return true;
190 }
191 
RemoveSource(Source * audio_source)192 void AudioMixerImpl::RemoveSource(Source* audio_source) {
193   RTC_DCHECK(audio_source);
194   MutexLock lock(&mutex_);
195   const auto iter = FindSourceInList(audio_source, &audio_source_list_);
196   RTC_DCHECK(iter != audio_source_list_.end()) << "Source not present in mixer";
197   audio_source_list_.erase(iter);
198 }
199 
GetAudioFromSources(int output_frequency)200 rtc::ArrayView<AudioFrame* const> AudioMixerImpl::GetAudioFromSources(
201     int output_frequency) {
202   // Get audio from the audio sources and put it in the SourceFrame vector.
203   int audio_source_mixing_data_count = 0;
204   for (auto& source_and_status : audio_source_list_) {
205     const auto audio_frame_info =
206         source_and_status->audio_source->GetAudioFrameWithInfo(
207             output_frequency, &source_and_status->audio_frame);
208 
209     if (audio_frame_info == Source::AudioFrameInfo::kError) {
210       RTC_LOG_F(LS_WARNING) << "failed to GetAudioFrameWithInfo() from source";
211       continue;
212     }
213     helper_containers_
214         ->audio_source_mixing_data_list[audio_source_mixing_data_count++] =
215         SourceFrame(source_and_status.get(), &source_and_status->audio_frame,
216                     audio_frame_info == Source::AudioFrameInfo::kMuted);
217   }
218   rtc::ArrayView<SourceFrame> audio_source_mixing_data_view(
219       helper_containers_->audio_source_mixing_data_list.data(),
220       audio_source_mixing_data_count);
221 
222   // Sort frames by sorting function.
223   std::sort(audio_source_mixing_data_view.begin(),
224             audio_source_mixing_data_view.end(), ShouldMixBefore);
225 
226   int max_audio_frame_counter = max_sources_to_mix_;
227   int ramp_list_lengh = 0;
228   int audio_to_mix_count = 0;
229   // Go through list in order and put unmuted frames in result list.
230   for (const auto& p : audio_source_mixing_data_view) {
231     // Filter muted.
232     if (p.muted) {
233       p.source_status->is_mixed = false;
234       continue;
235     }
236 
237     // Add frame to result vector for mixing.
238     bool is_mixed = false;
239     if (max_audio_frame_counter > 0) {
240       --max_audio_frame_counter;
241       helper_containers_->audio_to_mix[audio_to_mix_count++] = p.audio_frame;
242       helper_containers_->ramp_list[ramp_list_lengh++] =
243           SourceFrame(p.source_status, p.audio_frame, false, -1);
244       is_mixed = true;
245     }
246     p.source_status->is_mixed = is_mixed;
247   }
248   RampAndUpdateGain(rtc::ArrayView<SourceFrame>(
249       helper_containers_->ramp_list.data(), ramp_list_lengh));
250   return rtc::ArrayView<AudioFrame* const>(
251       helper_containers_->audio_to_mix.data(), audio_to_mix_count);
252 }
253 
GetAudioSourceMixabilityStatusForTest(AudioMixerImpl::Source * audio_source) const254 bool AudioMixerImpl::GetAudioSourceMixabilityStatusForTest(
255     AudioMixerImpl::Source* audio_source) const {
256   MutexLock lock(&mutex_);
257 
258   const auto iter = FindSourceInList(audio_source, &audio_source_list_);
259   if (iter != audio_source_list_.end()) {
260     return (*iter)->is_mixed;
261   }
262 
263   RTC_LOG(LS_ERROR) << "Audio source unknown";
264   return false;
265 }
266 }  // namespace webrtc
267