xref: /aosp_15_r20/external/webrtc/modules/audio_processing/aec3/render_delay_buffer.cc (revision d9f758449e529ab9291ac668be2861e7a55c2422)
1 /*
2  *  Copyright (c) 2018 The WebRTC project authors. All Rights Reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #include "modules/audio_processing/aec3/render_delay_buffer.h"
12 
13 #include <string.h>
14 
15 #include <algorithm>
16 #include <atomic>
17 #include <cmath>
18 #include <memory>
19 #include <numeric>
20 #include <vector>
21 
22 #include "absl/types/optional.h"
23 #include "api/array_view.h"
24 #include "api/audio/echo_canceller3_config.h"
25 #include "modules/audio_processing/aec3/aec3_common.h"
26 #include "modules/audio_processing/aec3/aec3_fft.h"
27 #include "modules/audio_processing/aec3/alignment_mixer.h"
28 #include "modules/audio_processing/aec3/block_buffer.h"
29 #include "modules/audio_processing/aec3/decimator.h"
30 #include "modules/audio_processing/aec3/downsampled_render_buffer.h"
31 #include "modules/audio_processing/aec3/fft_buffer.h"
32 #include "modules/audio_processing/aec3/fft_data.h"
33 #include "modules/audio_processing/aec3/render_buffer.h"
34 #include "modules/audio_processing/aec3/spectrum_buffer.h"
35 #include "modules/audio_processing/logging/apm_data_dumper.h"
36 #include "rtc_base/checks.h"
37 #include "rtc_base/logging.h"
38 #include "system_wrappers/include/field_trial.h"
39 
40 namespace webrtc {
41 namespace {
42 
UpdateCaptureCallCounterOnSkippedBlocks()43 bool UpdateCaptureCallCounterOnSkippedBlocks() {
44   return !field_trial::IsEnabled(
45       "WebRTC-Aec3RenderBufferCallCounterUpdateKillSwitch");
46 }
47 
48 class RenderDelayBufferImpl final : public RenderDelayBuffer {
49  public:
50   RenderDelayBufferImpl(const EchoCanceller3Config& config,
51                         int sample_rate_hz,
52                         size_t num_render_channels);
53   RenderDelayBufferImpl() = delete;
54   ~RenderDelayBufferImpl() override;
55 
56   void Reset() override;
57   BufferingEvent Insert(const Block& block) override;
58   BufferingEvent PrepareCaptureProcessing() override;
59   void HandleSkippedCaptureProcessing() override;
60   bool AlignFromDelay(size_t delay) override;
61   void AlignFromExternalDelay() override;
Delay() const62   size_t Delay() const override { return ComputeDelay(); }
MaxDelay() const63   size_t MaxDelay() const override {
64     return blocks_.buffer.size() - 1 - buffer_headroom_;
65   }
GetRenderBuffer()66   RenderBuffer* GetRenderBuffer() override { return &echo_remover_buffer_; }
67 
GetDownsampledRenderBuffer() const68   const DownsampledRenderBuffer& GetDownsampledRenderBuffer() const override {
69     return low_rate_;
70   }
71 
72   int BufferLatency() const;
73   void SetAudioBufferDelay(int delay_ms) override;
74   bool HasReceivedBufferDelay() override;
75 
76  private:
77   static std::atomic<int> instance_count_;
78   std::unique_ptr<ApmDataDumper> data_dumper_;
79   const Aec3Optimization optimization_;
80   const EchoCanceller3Config config_;
81   const bool update_capture_call_counter_on_skipped_blocks_;
82   const float render_linear_amplitude_gain_;
83   const rtc::LoggingSeverity delay_log_level_;
84   size_t down_sampling_factor_;
85   const int sub_block_size_;
86   BlockBuffer blocks_;
87   SpectrumBuffer spectra_;
88   FftBuffer ffts_;
89   absl::optional<size_t> delay_;
90   RenderBuffer echo_remover_buffer_;
91   DownsampledRenderBuffer low_rate_;
92   AlignmentMixer render_mixer_;
93   Decimator render_decimator_;
94   const Aec3Fft fft_;
95   std::vector<float> render_ds_;
96   const int buffer_headroom_;
97   bool last_call_was_render_ = false;
98   int num_api_calls_in_a_row_ = 0;
99   int max_observed_jitter_ = 1;
100   int64_t capture_call_counter_ = 0;
101   int64_t render_call_counter_ = 0;
102   bool render_activity_ = false;
103   size_t render_activity_counter_ = 0;
104   absl::optional<int> external_audio_buffer_delay_;
105   bool external_audio_buffer_delay_verified_after_reset_ = false;
106   size_t min_latency_blocks_ = 0;
107   size_t excess_render_detection_counter_ = 0;
108 
109   int MapDelayToTotalDelay(size_t delay) const;
110   int ComputeDelay() const;
111   void ApplyTotalDelay(int delay);
112   void InsertBlock(const Block& block, int previous_write);
113   bool DetectActiveRender(rtc::ArrayView<const float> x) const;
114   bool DetectExcessRenderBlocks();
115   void IncrementWriteIndices();
116   void IncrementLowRateReadIndices();
117   void IncrementReadIndices();
118   bool RenderOverrun();
119   bool RenderUnderrun();
120 };
121 
122 std::atomic<int> RenderDelayBufferImpl::instance_count_ = 0;
123 
RenderDelayBufferImpl(const EchoCanceller3Config & config,int sample_rate_hz,size_t num_render_channels)124 RenderDelayBufferImpl::RenderDelayBufferImpl(const EchoCanceller3Config& config,
125                                              int sample_rate_hz,
126                                              size_t num_render_channels)
127     : data_dumper_(new ApmDataDumper(instance_count_.fetch_add(1) + 1)),
128       optimization_(DetectOptimization()),
129       config_(config),
130       update_capture_call_counter_on_skipped_blocks_(
131           UpdateCaptureCallCounterOnSkippedBlocks()),
132       render_linear_amplitude_gain_(
133           std::pow(10.0f, config_.render_levels.render_power_gain_db / 20.f)),
134       delay_log_level_(config_.delay.log_warning_on_delay_changes
135                            ? rtc::LS_WARNING
136                            : rtc::LS_VERBOSE),
137       down_sampling_factor_(config.delay.down_sampling_factor),
138       sub_block_size_(static_cast<int>(down_sampling_factor_ > 0
139                                            ? kBlockSize / down_sampling_factor_
140                                            : kBlockSize)),
141       blocks_(GetRenderDelayBufferSize(down_sampling_factor_,
142                                        config.delay.num_filters,
143                                        config.filter.refined.length_blocks),
144               NumBandsForRate(sample_rate_hz),
145               num_render_channels),
146       spectra_(blocks_.buffer.size(), num_render_channels),
147       ffts_(blocks_.buffer.size(), num_render_channels),
148       delay_(config_.delay.default_delay),
149       echo_remover_buffer_(&blocks_, &spectra_, &ffts_),
150       low_rate_(GetDownSampledBufferSize(down_sampling_factor_,
151                                          config.delay.num_filters)),
152       render_mixer_(num_render_channels, config.delay.render_alignment_mixing),
153       render_decimator_(down_sampling_factor_),
154       fft_(),
155       render_ds_(sub_block_size_, 0.f),
156       buffer_headroom_(config.filter.refined.length_blocks) {
157   RTC_DCHECK_EQ(blocks_.buffer.size(), ffts_.buffer.size());
158   RTC_DCHECK_EQ(spectra_.buffer.size(), ffts_.buffer.size());
159   for (size_t i = 0; i < blocks_.buffer.size(); ++i) {
160     RTC_DCHECK_EQ(blocks_.buffer[i].NumChannels(), ffts_.buffer[i].size());
161     RTC_DCHECK_EQ(spectra_.buffer[i].size(), ffts_.buffer[i].size());
162   }
163 
164   Reset();
165 }
166 
// Defaulted out of line: no explicit cleanup is performed here; members such
// as the std::unique_ptr data_dumper_ are destroyed by their own destructors.
167 RenderDelayBufferImpl::~RenderDelayBufferImpl() = default;
168 
169 // Resets the buffer delays and clears the reported delays.
Reset()170 void RenderDelayBufferImpl::Reset() {
171   last_call_was_render_ = false;
172   num_api_calls_in_a_row_ = 1;
173   min_latency_blocks_ = 0;
174   excess_render_detection_counter_ = 0;
175 
176   // Initialize the read index to one sub-block before the write index.
177   low_rate_.read = low_rate_.OffsetIndex(low_rate_.write, sub_block_size_);
178 
179   // Check for any external audio buffer delay and whether it is feasible.
180   if (external_audio_buffer_delay_) {
181     const int headroom = 2;
182     size_t audio_buffer_delay_to_set;
183     // Minimum delay is 1 (like the low-rate render buffer).
184     if (*external_audio_buffer_delay_ <= headroom) {
185       audio_buffer_delay_to_set = 1;
186     } else {
187       audio_buffer_delay_to_set = *external_audio_buffer_delay_ - headroom;
188     }
189 
190     audio_buffer_delay_to_set = std::min(audio_buffer_delay_to_set, MaxDelay());
191 
192     // When an external delay estimate is available, use that delay as the
193     // initial render buffer delay.
194     ApplyTotalDelay(audio_buffer_delay_to_set);
195     delay_ = ComputeDelay();
196 
197     external_audio_buffer_delay_verified_after_reset_ = false;
198   } else {
199     // If an external delay estimate is not available, use that delay as the
200     // initial delay. Set the render buffer delays to the default delay.
201     ApplyTotalDelay(config_.delay.default_delay);
202 
203     // Unset the delays which are set by AlignFromDelay.
204     delay_ = absl::nullopt;
205   }
206 }
207 
208 // Inserts a new block into the render buffers.
Insert(const Block & block)209 RenderDelayBuffer::BufferingEvent RenderDelayBufferImpl::Insert(
210     const Block& block) {
211   ++render_call_counter_;
212   if (delay_) {
213     if (!last_call_was_render_) {
214       last_call_was_render_ = true;
215       num_api_calls_in_a_row_ = 1;
216     } else {
217       if (++num_api_calls_in_a_row_ > max_observed_jitter_) {
218         max_observed_jitter_ = num_api_calls_in_a_row_;
219         RTC_LOG_V(delay_log_level_)
220             << "New max number api jitter observed at render block "
221             << render_call_counter_ << ":  " << num_api_calls_in_a_row_
222             << " blocks";
223       }
224     }
225   }
226 
227   // Increase the write indices to where the new blocks should be written.
228   const int previous_write = blocks_.write;
229   IncrementWriteIndices();
230 
231   // Allow overrun and do a reset when render overrun occurrs due to more render
232   // data being inserted than capture data is received.
233   BufferingEvent event =
234       RenderOverrun() ? BufferingEvent::kRenderOverrun : BufferingEvent::kNone;
235 
236   // Detect and update render activity.
237   if (!render_activity_) {
238     render_activity_counter_ +=
239         DetectActiveRender(block.View(/*band=*/0, /*channel=*/0)) ? 1 : 0;
240     render_activity_ = render_activity_counter_ >= 20;
241   }
242 
243   // Insert the new render block into the specified position.
244   InsertBlock(block, previous_write);
245 
246   if (event != BufferingEvent::kNone) {
247     Reset();
248   }
249 
250   return event;
251 }
252 
HandleSkippedCaptureProcessing()253 void RenderDelayBufferImpl::HandleSkippedCaptureProcessing() {
254   if (update_capture_call_counter_on_skipped_blocks_) {
255     ++capture_call_counter_;
256   }
257 }
258 
259 // Prepares the render buffers for processing another capture block.
260 RenderDelayBuffer::BufferingEvent
PrepareCaptureProcessing()261 RenderDelayBufferImpl::PrepareCaptureProcessing() {
262   RenderDelayBuffer::BufferingEvent event = BufferingEvent::kNone;
263   ++capture_call_counter_;
264 
265   if (delay_) {
266     if (last_call_was_render_) {
267       last_call_was_render_ = false;
268       num_api_calls_in_a_row_ = 1;
269     } else {
270       if (++num_api_calls_in_a_row_ > max_observed_jitter_) {
271         max_observed_jitter_ = num_api_calls_in_a_row_;
272         RTC_LOG_V(delay_log_level_)
273             << "New max number api jitter observed at capture block "
274             << capture_call_counter_ << ":  " << num_api_calls_in_a_row_
275             << " blocks";
276       }
277     }
278   }
279 
280   if (DetectExcessRenderBlocks()) {
281     // Too many render blocks compared to capture blocks. Risk of delay ending
282     // up before the filter used by the delay estimator.
283     RTC_LOG_V(delay_log_level_)
284         << "Excess render blocks detected at block " << capture_call_counter_;
285     Reset();
286     event = BufferingEvent::kRenderOverrun;
287   } else if (RenderUnderrun()) {
288     // Don't increment the read indices of the low rate buffer if there is a
289     // render underrun.
290     RTC_LOG_V(delay_log_level_)
291         << "Render buffer underrun detected at block " << capture_call_counter_;
292     IncrementReadIndices();
293     // Incrementing the buffer index without increasing the low rate buffer
294     // index means that the delay is reduced by one.
295     if (delay_ && *delay_ > 0)
296       delay_ = *delay_ - 1;
297     event = BufferingEvent::kRenderUnderrun;
298   } else {
299     // Increment the read indices in the render buffers to point to the most
300     // recent block to use in the capture processing.
301     IncrementLowRateReadIndices();
302     IncrementReadIndices();
303   }
304 
305   echo_remover_buffer_.SetRenderActivity(render_activity_);
306   if (render_activity_) {
307     render_activity_counter_ = 0;
308     render_activity_ = false;
309   }
310 
311   return event;
312 }
313 
314 // Sets the delay and returns a bool indicating whether the delay was changed.
AlignFromDelay(size_t delay)315 bool RenderDelayBufferImpl::AlignFromDelay(size_t delay) {
316   RTC_DCHECK(!config_.delay.use_external_delay_estimator);
317   if (!external_audio_buffer_delay_verified_after_reset_ &&
318       external_audio_buffer_delay_ && delay_) {
319     int difference = static_cast<int>(delay) - static_cast<int>(*delay_);
320     RTC_LOG_V(delay_log_level_)
321         << "Mismatch between first estimated delay after reset "
322            "and externally reported audio buffer delay: "
323         << difference << " blocks";
324     external_audio_buffer_delay_verified_after_reset_ = true;
325   }
326   if (delay_ && *delay_ == delay) {
327     return false;
328   }
329   delay_ = delay;
330 
331   // Compute the total delay and limit the delay to the allowed range.
332   int total_delay = MapDelayToTotalDelay(*delay_);
333   total_delay =
334       std::min(MaxDelay(), static_cast<size_t>(std::max(total_delay, 0)));
335 
336   // Apply the delay to the buffers.
337   ApplyTotalDelay(total_delay);
338   return true;
339 }
340 
SetAudioBufferDelay(int delay_ms)341 void RenderDelayBufferImpl::SetAudioBufferDelay(int delay_ms) {
342   if (!external_audio_buffer_delay_) {
343     RTC_LOG_V(delay_log_level_)
344         << "Receiving a first externally reported audio buffer delay of "
345         << delay_ms << " ms.";
346   }
347 
348   // Convert delay from milliseconds to blocks (rounded down).
349   external_audio_buffer_delay_ = delay_ms / 4;
350 }
351 
HasReceivedBufferDelay()352 bool RenderDelayBufferImpl::HasReceivedBufferDelay() {
353   return external_audio_buffer_delay_.has_value();
354 }
355 
356 // Maps the externally computed delay to the delay used internally.
MapDelayToTotalDelay(size_t external_delay_blocks) const357 int RenderDelayBufferImpl::MapDelayToTotalDelay(
358     size_t external_delay_blocks) const {
359   const int latency_blocks = BufferLatency();
360   return latency_blocks + static_cast<int>(external_delay_blocks);
361 }
362 
363 // Returns the delay (not including call jitter).
ComputeDelay() const364 int RenderDelayBufferImpl::ComputeDelay() const {
365   const int latency_blocks = BufferLatency();
366   int internal_delay = spectra_.read >= spectra_.write
367                            ? spectra_.read - spectra_.write
368                            : spectra_.size + spectra_.read - spectra_.write;
369 
370   return internal_delay - latency_blocks;
371 }
372 
373 // Set the read indices according to the delay.
ApplyTotalDelay(int delay)374 void RenderDelayBufferImpl::ApplyTotalDelay(int delay) {
375   RTC_LOG_V(delay_log_level_)
376       << "Applying total delay of " << delay << " blocks.";
377   blocks_.read = blocks_.OffsetIndex(blocks_.write, -delay);
378   spectra_.read = spectra_.OffsetIndex(spectra_.write, delay);
379   ffts_.read = ffts_.OffsetIndex(ffts_.write, delay);
380 }
381 
AlignFromExternalDelay()382 void RenderDelayBufferImpl::AlignFromExternalDelay() {
383   RTC_DCHECK(config_.delay.use_external_delay_estimator);
384   if (external_audio_buffer_delay_) {
385     const int64_t delay = render_call_counter_ - capture_call_counter_ +
386                           *external_audio_buffer_delay_;
387     const int64_t delay_with_headroom =
388         delay - config_.delay.delay_headroom_samples / kBlockSize;
389     ApplyTotalDelay(delay_with_headroom);
390   }
391 }
392 
393 // Inserts a block into the render buffers.
InsertBlock(const Block & block,int previous_write)394 void RenderDelayBufferImpl::InsertBlock(const Block& block,
395                                         int previous_write) {
396   auto& b = blocks_;
397   auto& lr = low_rate_;
398   auto& ds = render_ds_;
399   auto& f = ffts_;
400   auto& s = spectra_;
401   const size_t num_bands = b.buffer[b.write].NumBands();
402   const size_t num_render_channels = b.buffer[b.write].NumChannels();
403   RTC_DCHECK_EQ(block.NumBands(), num_bands);
404   RTC_DCHECK_EQ(block.NumChannels(), num_render_channels);
405   for (size_t band = 0; band < num_bands; ++band) {
406     for (size_t ch = 0; ch < num_render_channels; ++ch) {
407       std::copy(block.begin(band, ch), block.end(band, ch),
408                 b.buffer[b.write].begin(band, ch));
409     }
410   }
411 
412   if (render_linear_amplitude_gain_ != 1.f) {
413     for (size_t band = 0; band < num_bands; ++band) {
414       for (size_t ch = 0; ch < num_render_channels; ++ch) {
415         rtc::ArrayView<float, kBlockSize> b_view =
416             b.buffer[b.write].View(band, ch);
417         for (float& sample : b_view) {
418           sample *= render_linear_amplitude_gain_;
419         }
420       }
421     }
422   }
423 
424   std::array<float, kBlockSize> downmixed_render;
425   render_mixer_.ProduceOutput(b.buffer[b.write], downmixed_render);
426   render_decimator_.Decimate(downmixed_render, ds);
427   data_dumper_->DumpWav("aec3_render_decimator_output", ds.size(), ds.data(),
428                         16000 / down_sampling_factor_, 1);
429   std::copy(ds.rbegin(), ds.rend(), lr.buffer.begin() + lr.write);
430   for (int channel = 0; channel < b.buffer[b.write].NumChannels(); ++channel) {
431     fft_.PaddedFft(b.buffer[b.write].View(/*band=*/0, channel),
432                    b.buffer[previous_write].View(/*band=*/0, channel),
433                    &f.buffer[f.write][channel]);
434     f.buffer[f.write][channel].Spectrum(optimization_,
435                                         s.buffer[s.write][channel]);
436   }
437 }
438 
DetectActiveRender(rtc::ArrayView<const float> x) const439 bool RenderDelayBufferImpl::DetectActiveRender(
440     rtc::ArrayView<const float> x) const {
441   const float x_energy = std::inner_product(x.begin(), x.end(), x.begin(), 0.f);
442   return x_energy > (config_.render_levels.active_render_limit *
443                      config_.render_levels.active_render_limit) *
444                         kFftLengthBy2;
445 }
446 
DetectExcessRenderBlocks()447 bool RenderDelayBufferImpl::DetectExcessRenderBlocks() {
448   bool excess_render_detected = false;
449   const size_t latency_blocks = static_cast<size_t>(BufferLatency());
450   // The recently seen minimum latency in blocks. Should be close to 0.
451   min_latency_blocks_ = std::min(min_latency_blocks_, latency_blocks);
452   // After processing a configurable number of blocks the minimum latency is
453   // checked.
454   if (++excess_render_detection_counter_ >=
455       config_.buffering.excess_render_detection_interval_blocks) {
456     // If the minimum latency is not lower than the threshold there have been
457     // more render than capture frames.
458     excess_render_detected = min_latency_blocks_ >
459                              config_.buffering.max_allowed_excess_render_blocks;
460     // Reset the counter and let the minimum latency be the current latency.
461     min_latency_blocks_ = latency_blocks;
462     excess_render_detection_counter_ = 0;
463   }
464 
465   data_dumper_->DumpRaw("aec3_latency_blocks", latency_blocks);
466   data_dumper_->DumpRaw("aec3_min_latency_blocks", min_latency_blocks_);
467   data_dumper_->DumpRaw("aec3_excess_render_detected", excess_render_detected);
468   return excess_render_detected;
469 }
470 
471 // Computes the latency in the buffer (the number of unread sub-blocks).
BufferLatency() const472 int RenderDelayBufferImpl::BufferLatency() const {
473   const DownsampledRenderBuffer& l = low_rate_;
474   int latency_samples = (l.buffer.size() + l.read - l.write) % l.buffer.size();
475   int latency_blocks = latency_samples / sub_block_size_;
476   return latency_blocks;
477 }
478 
479 // Increments the write indices for the render buffers.
IncrementWriteIndices()480 void RenderDelayBufferImpl::IncrementWriteIndices() {
481   low_rate_.UpdateWriteIndex(-sub_block_size_);
482   blocks_.IncWriteIndex();
483   spectra_.DecWriteIndex();
484   ffts_.DecWriteIndex();
485 }
486 
487 // Increments the read indices of the low rate render buffers.
IncrementLowRateReadIndices()488 void RenderDelayBufferImpl::IncrementLowRateReadIndices() {
489   low_rate_.UpdateReadIndex(-sub_block_size_);
490 }
491 
492 // Increments the read indices for the render buffers.
IncrementReadIndices()493 void RenderDelayBufferImpl::IncrementReadIndices() {
494   if (blocks_.read != blocks_.write) {
495     blocks_.IncReadIndex();
496     spectra_.DecReadIndex();
497     ffts_.DecReadIndex();
498   }
499 }
500 
501 // Checks for a render buffer overrun.
RenderOverrun()502 bool RenderDelayBufferImpl::RenderOverrun() {
503   return low_rate_.read == low_rate_.write || blocks_.read == blocks_.write;
504 }
505 
506 // Checks for a render buffer underrun.
RenderUnderrun()507 bool RenderDelayBufferImpl::RenderUnderrun() {
508   return low_rate_.read == low_rate_.write;
509 }
510 
511 }  // namespace
512 
Create(const EchoCanceller3Config & config,int sample_rate_hz,size_t num_render_channels)513 RenderDelayBuffer* RenderDelayBuffer::Create(const EchoCanceller3Config& config,
514                                              int sample_rate_hz,
515                                              size_t num_render_channels) {
516   return new RenderDelayBufferImpl(config, sample_rate_hz, num_render_channels);
517 }
518 
519 }  // namespace webrtc
520