xref: /aosp_15_r20/external/webrtc/modules/audio_coding/neteq/accelerate.cc (revision d9f758449e529ab9291ac668be2861e7a55c2422)
1*d9f75844SAndroid Build Coastguard Worker /*
2*d9f75844SAndroid Build Coastguard Worker  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
3*d9f75844SAndroid Build Coastguard Worker  *
4*d9f75844SAndroid Build Coastguard Worker  *  Use of this source code is governed by a BSD-style license
5*d9f75844SAndroid Build Coastguard Worker  *  that can be found in the LICENSE file in the root of the source
6*d9f75844SAndroid Build Coastguard Worker  *  tree. An additional intellectual property rights grant can be found
7*d9f75844SAndroid Build Coastguard Worker  *  in the file PATENTS.  All contributing project authors may
8*d9f75844SAndroid Build Coastguard Worker  *  be found in the AUTHORS file in the root of the source tree.
9*d9f75844SAndroid Build Coastguard Worker  */
10*d9f75844SAndroid Build Coastguard Worker 
11*d9f75844SAndroid Build Coastguard Worker #include "modules/audio_coding/neteq/accelerate.h"
12*d9f75844SAndroid Build Coastguard Worker 
13*d9f75844SAndroid Build Coastguard Worker 
14*d9f75844SAndroid Build Coastguard Worker #include "api/array_view.h"
15*d9f75844SAndroid Build Coastguard Worker #include "modules/audio_coding/neteq/audio_multi_vector.h"
16*d9f75844SAndroid Build Coastguard Worker 
17*d9f75844SAndroid Build Coastguard Worker namespace webrtc {
18*d9f75844SAndroid Build Coastguard Worker 
Process(const int16_t * input,size_t input_length,bool fast_accelerate,AudioMultiVector * output,size_t * length_change_samples)19*d9f75844SAndroid Build Coastguard Worker Accelerate::ReturnCodes Accelerate::Process(const int16_t* input,
20*d9f75844SAndroid Build Coastguard Worker                                             size_t input_length,
21*d9f75844SAndroid Build Coastguard Worker                                             bool fast_accelerate,
22*d9f75844SAndroid Build Coastguard Worker                                             AudioMultiVector* output,
23*d9f75844SAndroid Build Coastguard Worker                                             size_t* length_change_samples) {
24*d9f75844SAndroid Build Coastguard Worker   // Input length must be (almost) 30 ms.
25*d9f75844SAndroid Build Coastguard Worker   static const size_t k15ms = 120;  // 15 ms = 120 samples at 8 kHz sample rate.
26*d9f75844SAndroid Build Coastguard Worker   if (num_channels_ == 0 ||
27*d9f75844SAndroid Build Coastguard Worker       input_length / num_channels_ < (2 * k15ms - 1) * fs_mult_) {
28*d9f75844SAndroid Build Coastguard Worker     // Length of input data too short to do accelerate. Simply move all data
29*d9f75844SAndroid Build Coastguard Worker     // from input to output.
30*d9f75844SAndroid Build Coastguard Worker     output->PushBackInterleaved(
31*d9f75844SAndroid Build Coastguard Worker         rtc::ArrayView<const int16_t>(input, input_length));
32*d9f75844SAndroid Build Coastguard Worker     return kError;
33*d9f75844SAndroid Build Coastguard Worker   }
34*d9f75844SAndroid Build Coastguard Worker   return TimeStretch::Process(input, input_length, fast_accelerate, output,
35*d9f75844SAndroid Build Coastguard Worker                               length_change_samples);
36*d9f75844SAndroid Build Coastguard Worker }
37*d9f75844SAndroid Build Coastguard Worker 
SetParametersForPassiveSpeech(size_t,int16_t * best_correlation,size_t *) const38*d9f75844SAndroid Build Coastguard Worker void Accelerate::SetParametersForPassiveSpeech(size_t /*len*/,
39*d9f75844SAndroid Build Coastguard Worker                                                int16_t* best_correlation,
40*d9f75844SAndroid Build Coastguard Worker                                                size_t* /*peak_index*/) const {
41*d9f75844SAndroid Build Coastguard Worker   // When the signal does not contain any active speech, the correlation does
42*d9f75844SAndroid Build Coastguard Worker   // not matter. Simply set it to zero.
43*d9f75844SAndroid Build Coastguard Worker   *best_correlation = 0;
44*d9f75844SAndroid Build Coastguard Worker }
45*d9f75844SAndroid Build Coastguard Worker 
CheckCriteriaAndStretch(const int16_t * input,size_t input_length,size_t peak_index,int16_t best_correlation,bool active_speech,bool fast_mode,AudioMultiVector * output) const46*d9f75844SAndroid Build Coastguard Worker Accelerate::ReturnCodes Accelerate::CheckCriteriaAndStretch(
47*d9f75844SAndroid Build Coastguard Worker     const int16_t* input,
48*d9f75844SAndroid Build Coastguard Worker     size_t input_length,
49*d9f75844SAndroid Build Coastguard Worker     size_t peak_index,
50*d9f75844SAndroid Build Coastguard Worker     int16_t best_correlation,
51*d9f75844SAndroid Build Coastguard Worker     bool active_speech,
52*d9f75844SAndroid Build Coastguard Worker     bool fast_mode,
53*d9f75844SAndroid Build Coastguard Worker     AudioMultiVector* output) const {
54*d9f75844SAndroid Build Coastguard Worker   // Check for strong correlation or passive speech.
55*d9f75844SAndroid Build Coastguard Worker   // Use 8192 (0.5 in Q14) in fast mode.
56*d9f75844SAndroid Build Coastguard Worker   const int correlation_threshold = fast_mode ? 8192 : kCorrelationThreshold;
57*d9f75844SAndroid Build Coastguard Worker   if ((best_correlation > correlation_threshold) || !active_speech) {
58*d9f75844SAndroid Build Coastguard Worker     // Do accelerate operation by overlap add.
59*d9f75844SAndroid Build Coastguard Worker 
60*d9f75844SAndroid Build Coastguard Worker     // Pre-calculate common multiplication with `fs_mult_`.
61*d9f75844SAndroid Build Coastguard Worker     // 120 corresponds to 15 ms.
62*d9f75844SAndroid Build Coastguard Worker     size_t fs_mult_120 = fs_mult_ * 120;
63*d9f75844SAndroid Build Coastguard Worker 
64*d9f75844SAndroid Build Coastguard Worker     if (fast_mode) {
65*d9f75844SAndroid Build Coastguard Worker       // Fit as many multiples of `peak_index` as possible in fs_mult_120.
66*d9f75844SAndroid Build Coastguard Worker       // TODO(henrik.lundin) Consider finding multiple correlation peaks and
67*d9f75844SAndroid Build Coastguard Worker       // pick the one with the longest correlation lag in this case.
68*d9f75844SAndroid Build Coastguard Worker       peak_index = (fs_mult_120 / peak_index) * peak_index;
69*d9f75844SAndroid Build Coastguard Worker     }
70*d9f75844SAndroid Build Coastguard Worker 
71*d9f75844SAndroid Build Coastguard Worker     RTC_DCHECK_GE(fs_mult_120, peak_index);  // Should be handled in Process().
72*d9f75844SAndroid Build Coastguard Worker     // Copy first part; 0 to 15 ms.
73*d9f75844SAndroid Build Coastguard Worker     output->PushBackInterleaved(
74*d9f75844SAndroid Build Coastguard Worker         rtc::ArrayView<const int16_t>(input, fs_mult_120 * num_channels_));
75*d9f75844SAndroid Build Coastguard Worker     // Copy the `peak_index` starting at 15 ms to `temp_vector`.
76*d9f75844SAndroid Build Coastguard Worker     AudioMultiVector temp_vector(num_channels_);
77*d9f75844SAndroid Build Coastguard Worker     temp_vector.PushBackInterleaved(rtc::ArrayView<const int16_t>(
78*d9f75844SAndroid Build Coastguard Worker         &input[fs_mult_120 * num_channels_], peak_index * num_channels_));
79*d9f75844SAndroid Build Coastguard Worker     // Cross-fade `temp_vector` onto the end of `output`.
80*d9f75844SAndroid Build Coastguard Worker     output->CrossFade(temp_vector, peak_index);
81*d9f75844SAndroid Build Coastguard Worker     // Copy the last unmodified part, 15 ms + pitch period until the end.
82*d9f75844SAndroid Build Coastguard Worker     output->PushBackInterleaved(rtc::ArrayView<const int16_t>(
83*d9f75844SAndroid Build Coastguard Worker         &input[(fs_mult_120 + peak_index) * num_channels_],
84*d9f75844SAndroid Build Coastguard Worker         input_length - (fs_mult_120 + peak_index) * num_channels_));
85*d9f75844SAndroid Build Coastguard Worker 
86*d9f75844SAndroid Build Coastguard Worker     if (active_speech) {
87*d9f75844SAndroid Build Coastguard Worker       return kSuccess;
88*d9f75844SAndroid Build Coastguard Worker     } else {
89*d9f75844SAndroid Build Coastguard Worker       return kSuccessLowEnergy;
90*d9f75844SAndroid Build Coastguard Worker     }
91*d9f75844SAndroid Build Coastguard Worker   } else {
92*d9f75844SAndroid Build Coastguard Worker     // Accelerate not allowed. Simply move all data from decoded to outData.
93*d9f75844SAndroid Build Coastguard Worker     output->PushBackInterleaved(
94*d9f75844SAndroid Build Coastguard Worker         rtc::ArrayView<const int16_t>(input, input_length));
95*d9f75844SAndroid Build Coastguard Worker     return kNoStretch;
96*d9f75844SAndroid Build Coastguard Worker   }
97*d9f75844SAndroid Build Coastguard Worker }
98*d9f75844SAndroid Build Coastguard Worker 
Create(int sample_rate_hz,size_t num_channels,const BackgroundNoise & background_noise) const99*d9f75844SAndroid Build Coastguard Worker Accelerate* AccelerateFactory::Create(
100*d9f75844SAndroid Build Coastguard Worker     int sample_rate_hz,
101*d9f75844SAndroid Build Coastguard Worker     size_t num_channels,
102*d9f75844SAndroid Build Coastguard Worker     const BackgroundNoise& background_noise) const {
103*d9f75844SAndroid Build Coastguard Worker   return new Accelerate(sample_rate_hz, num_channels, background_noise);
104*d9f75844SAndroid Build Coastguard Worker }
105*d9f75844SAndroid Build Coastguard Worker 
106*d9f75844SAndroid Build Coastguard Worker }  // namespace webrtc
107