modules/audio_device/audio_device_buffer.cc - src - Git at Google

 /*
  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_device/audio_device_buffer.h"

 #include <string.h>

 #include <cmath>
 #include <cstddef>
 #include <cstdint>

 #include "common_audio/signal_processing/include/signal_processing_library.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/logging.h"
 #include "rtc_base/time_utils.h"
 #include "rtc_base/trace_event.h"
 #include "system_wrappers/include/metrics.h"

 namespace webrtc {

 // Name handed to the task queue factory when the AudioDeviceBuffer
 // constructor creates its task queue.
 static const char kTimerQueueName[] = "AudioDeviceBufferTimer";

 // Time between two successive calls to LogStats().
 static const size_t kTimerIntervalInSeconds = 10;
 static const size_t kTimerIntervalInMilliseconds =
     kTimerIntervalInSeconds * rtc::kNumMillisecsPerSec;
 // Min time required to qualify an audio session as a "call". If playout or
 // recording has been active for less than this time we will not store any
 // logs or UMA stats but instead consider the call as too short.
 static const size_t kMinValidCallTimeTimeInSeconds = 10;
 static const size_t kMinValidCallTimeTimeInMilliseconds =
     kMinValidCallTimeTimeInSeconds * rtc::kNumMillisecsPerSec;
 #ifdef AUDIO_DEVICE_PLAYS_SINUS_TONE
 // 2 * pi. Only compiled when AUDIO_DEVICE_PLAYS_SINUS_TONE is defined.
 static const double k2Pi = 6.28318530717959;
 #endif

 // Constructs the buffer with no audio transport registered, zeroed sample
 // rates, channel counts, delays and statistics counters, and with both
 // playout and recording marked as inactive.
 //
 // `task_queue_factory` is used to create the task queue (named
 // kTimerQueueName) that the posted stats/logging tasks run on.
 // If `create_detached` is true, `main_thread_checker_` is detached.
 AudioDeviceBuffer::AudioDeviceBuffer(TaskQueueFactory* task_queue_factory,
                                      bool create_detached)
     : task_queue_(task_queue_factory->CreateTaskQueue(
           kTimerQueueName,
           TaskQueueFactory::Priority::NORMAL)),
       audio_transport_cb_(nullptr),
       rec_sample_rate_(0),
       play_sample_rate_(0),
       rec_channels_(0),
       play_channels_(0),
       playing_(false),
       recording_(false),
       typing_status_(false),
       play_delay_ms_(0),
       rec_delay_ms_(0),
       num_stat_reports_(0),
       last_timer_task_time_(0),
       rec_stat_count_(0),
       play_stat_count_(0),
       play_start_time_(0),
       only_silence_recorded_(true),
       log_stats_(false) {
   RTC_LOG(LS_INFO) << "AudioDeviceBuffer::ctor";
 #ifdef AUDIO_DEVICE_PLAYS_SINUS_TONE
   // Start the generated tone at phase zero and make the special build loud
   // in the logs.
   phase_ = 0.0;
   RTC_LOG(LS_WARNING) << "AUDIO_DEVICE_PLAYS_SINUS_TONE is defined!";
 #endif
   if (create_detached) {
     main_thread_checker_.Detach();
   }
 }

 // Destroys the buffer. Both playout and recording are expected (DCHECKed) to
 // be stopped already. The task queue is deleted explicitly, while the
 // `task_queue_` pointer is still valid, before any other member goes away.
 AudioDeviceBuffer::~AudioDeviceBuffer() {
   RTC_DCHECK_RUN_ON(&main_thread_checker_);
   RTC_DCHECK(!playing_);
   RTC_DCHECK(!recording_);
   RTC_LOG(LS_INFO) << "AudioDeviceBuffer::~dtor";

   // Delete, and thus stop, the task queue before deleting other members to
   // avoid races with running tasks. Even though !playing_ and !recording_
   // imply that StopPeriodicLogging was called, that stop is asynchronous and
   // may race with the AudioDeviceBuffer destructor. In particular there might
   // be a regular LogStats task that attempts to repost itself to task_queue_.
   // Thus the task queue must be deleted before the pointer to it is
   // invalidated. The std::unique_ptr destructor performs the same two
   // operations in reverse order, as it doesn't expect the member to be used
   // after its destruction has started.
   task_queue_.get_deleter()(task_queue_.get());
   // Drop ownership so the unique_ptr destructor does not delete it again.
   task_queue_.release();
 }

 // Stores `audio_callback` as the audio transport used by the buffer.
 // The transport can only be replaced while neither playout nor recording is
 // active. Returns 0 on success and -1 if media is active.
 int32_t AudioDeviceBuffer::RegisterAudioCallback(
     AudioTransport* audio_callback) {
   RTC_DCHECK_RUN_ON(&main_thread_checker_);
   RTC_DLOG(LS_INFO) << __FUNCTION__;
   const bool media_active = playing_ || recording_;
   if (!media_active) {
     audio_transport_cb_ = audio_callback;
     return 0;
   }
   RTC_LOG(LS_ERROR) << "Failed to set audio transport since media was active";
   return -1;
 }

 // Marks playout as active. A repeated call while already playing is ignored.
 // Playout statistics are reset on the task queue and periodic logging is
 // started unless the recording side is already active.
 void AudioDeviceBuffer::StartPlayout() {
   RTC_DCHECK_RUN_ON(&main_thread_checker_);
   // TODO(henrika): replace with DCHECK(!playing_). The ADM currently tolerates
   // Start(), Start() by ignoring the second call, although allowing only a
   // single call would make more sense.
   if (playing_) {
     return;
   }
   RTC_DLOG(LS_INFO) << __FUNCTION__;
   // Playout stats are owned by the task queue, so reset them there.
   task_queue_->PostTask([this] { ResetPlayStats(); });
   // The periodic timer is shared with recording; only kick it off when the
   // recording side has not done so already.
   const bool timer_already_running = recording_;
   if (!timer_already_running) {
     StartPeriodicLogging();
   }
   // State below is only touched on the main (creating) thread.
   play_start_time_ = rtc::TimeMillis();
   playing_ = true;
 }

 // Marks recording as active. A repeated call while already recording is
 // ignored. Recording statistics are reset on the task queue and periodic
 // logging is started unless the playout side is already active.
 void AudioDeviceBuffer::StartRecording() {
   RTC_DCHECK_RUN_ON(&main_thread_checker_);
   if (recording_) {
     return;
   }
   RTC_DLOG(LS_INFO) << __FUNCTION__;
   // Recording stats are owned by the task queue, so reset them there.
   task_queue_->PostTask([this] { ResetRecStats(); });
   // The periodic timer is shared with playout; only kick it off when the
   // playout side has not done so already.
   const bool timer_already_running = playing_;
   if (!timer_already_running) {
     StartPeriodicLogging();
   }
   // State below is touched on the main (creating) thread.
   rec_start_time_ = rtc::TimeMillis();
   recording_ = true;
   // This flag can also be modified on the native audio thread. Resetting it
   // here is safe because, by design, the owning ADM has not yet started the
   // native audio recording.
   only_silence_recorded_ = true;
 }

 // Marks playout as inactive and logs the total playout time. Does nothing if
 // playout is not active. Periodic logging is stopped when recording is not
 // active either.
 void AudioDeviceBuffer::StopPlayout() {
   RTC_DCHECK_RUN_ON(&main_thread_checker_);
   if (!playing_) {
     return;
   }
   RTC_DLOG(LS_INFO) << __FUNCTION__;
   playing_ = false;
   // The timer is only needed while at least one direction is active.
   const bool recording_still_active = recording_;
   if (!recording_still_active) {
     StopPeriodicLogging();
   }
   RTC_LOG(LS_INFO) << "total playout time: "
                    << rtc::TimeSince(play_start_time_);
 }

 // Marks recording as inactive and logs the total recording time. Does nothing
 // if recording is not active. Periodic logging is stopped when playout is not
 // active either. For sessions longer than kMinValidCallTimeTimeInMilliseconds
 // the WebRTC.Audio.RecordedOnlyZeros histogram is updated.
 void AudioDeviceBuffer::StopRecording() {
   RTC_DCHECK_RUN_ON(&main_thread_checker_);
   if (!recording_) {
     return;
   }
   RTC_DLOG(LS_INFO) << __FUNCTION__;
   recording_ = false;
   // The timer is only needed while at least one direction is active.
   const bool playout_still_active = playing_;
   if (!playout_still_active) {
     StopPeriodicLogging();
   }
   // Report via UMA whether only zeros were recorded. Level measurements (max
   // of absolute level) are taken twice per second, so for e.g. 10 seconds of
   // recorded audio all 20 level estimates must be zero to report "only zeros".
   // `only_silence_recorded_` can only be cleared on the native audio thread
   // that drives audio capture, but by design the audio has stopped when this
   // method is called, hence there should not be any conflicts. Also, since
   // `only_silence_recorded_` can be affected during the complete call, the
   // chance of a conflict with potentially one last callback is very small.
   const size_t recorded_ms = rtc::TimeSince(rec_start_time_);
   const bool long_enough_call =
       recorded_ms > kMinValidCallTimeTimeInMilliseconds;
   if (long_enough_call) {
     const int only_zeros = static_cast<int>(only_silence_recorded_);
     RTC_HISTOGRAM_BOOLEAN("WebRTC.Audio.RecordedOnlyZeros", only_zeros);
     RTC_LOG(LS_INFO) << "HISTOGRAM(WebRTC.Audio.RecordedOnlyZeros): "
                      << only_zeros;
   }
   RTC_LOG(LS_INFO) << "total recording time: " << recorded_ms;
 }

 // Logs and stores `fsHz` as the recording sample rate. Always returns 0.
 int32_t AudioDeviceBuffer::SetRecordingSampleRate(uint32_t fsHz) {
   RTC_LOG(LS_INFO) << "SetRecordingSampleRate(" << fsHz << ")";

   rec_sample_rate_ = fsHz;

   return 0;
 }

 // Logs and stores `fsHz` as the playout sample rate. Always returns 0.
 int32_t AudioDeviceBuffer::SetPlayoutSampleRate(uint32_t fsHz) {
   RTC_LOG(LS_INFO) << "SetPlayoutSampleRate(" << fsHz << ")";

   play_sample_rate_ = fsHz;

   return 0;
 }

 uint32_t AudioDeviceBuffer::RecordingSampleRate() const {
   return rec_sample_rate_;
 }

 uint32_t AudioDeviceBuffer::PlayoutSampleRate() const {
   return play_sample_rate_;
 }

 // Logs and stores `channels` as the number of recording channels.
 // Always returns 0.
 int32_t AudioDeviceBuffer::SetRecordingChannels(size_t channels) {
   RTC_LOG(LS_INFO) << "SetRecordingChannels(" << channels << ")";

   rec_channels_ = channels;

   return 0;
 }

 // Logs and stores `channels` as the number of playout channels.
 // Always returns 0.
 int32_t AudioDeviceBuffer::SetPlayoutChannels(size_t channels) {
   RTC_LOG(LS_INFO) << "SetPlayoutChannels(" << channels << ")";

   play_channels_ = channels;

   return 0;
 }

 size_t AudioDeviceBuffer::RecordingChannels() const {
   return rec_channels_;
 }

 // Returns the number of playout channels last stored by SetPlayoutChannels(),
 // or the constructor's initial value of 0.
 size_t AudioDeviceBuffer::PlayoutChannels() const {
   const size_t channels = play_channels_;
   return channels;
 }

 // Stores `typing_status`; the value is forwarded to the audio transport by
 // DeliverRecordedData(). Always returns 0.
 int32_t AudioDeviceBuffer::SetTypingStatus(bool typing_status) {
   typing_status_ = typing_status;

   return 0;
 }

 // Stores the playout and recording delays (in milliseconds). Their sum is
 // reported to the audio transport by DeliverRecordedData().
 void AudioDeviceBuffer::SetVQEData(int play_delay_ms, int rec_delay_ms) {
   rec_delay_ms_ = rec_delay_ms;
   play_delay_ms_ = play_delay_ms;
 }

 // Convenience overload for callers without a capture timestamp: forwards to
 // the three-argument SetRecordedBuffer() with std::nullopt as the timestamp.
 int32_t AudioDeviceBuffer::SetRecordedBuffer(const void* audio_buffer,
                                              size_t samples_per_channel) {
   const std::optional<int64_t> no_capture_timestamp = std::nullopt;
   return SetRecordedBuffer(audio_buffer, samples_per_channel,
                            no_capture_timestamp);
 }

 int32_t AudioDeviceBuffer::SetRecordedBuffer(
     const void* audio_buffer,
     size_t samples_per_channel,
     std::optional<int64_t> capture_timestamp_ns) {
   // Copy the complete input buffer to the local buffer.
   const size_t old_size = rec_buffer_.size();
   rec_buffer_.SetData(static_cast<const int16_t*>(audio_buffer),
                       rec_channels_ * samples_per_channel);
   // Keep track of the size of the recording buffer. Only updated when the
   // size changes, which is a rare event.
   if (old_size != rec_buffer_.size()) {
     RTC_LOG(LS_INFO) << "Size of recording buffer: " << rec_buffer_.size();
   }

   if (capture_timestamp_ns) {
     int64_t align_offsync_estimation_time = rtc::TimeMicros();
     if (align_offsync_estimation_time -
             rtc::TimestampAligner::kMinFrameIntervalUs >
         align_offsync_estimation_time_) {
       align_offsync_estimation_time_ = align_offsync_estimation_time;
       capture_timestamp_ns_ =
           rtc::kNumNanosecsPerMicrosec *
           timestamp_aligner_.TranslateTimestamp(
               *capture_timestamp_ns / rtc::kNumNanosecsPerMicrosec,
               align_offsync_estimation_time);
     } else {
       // The Timestamp aligner is designed to prevent timestamps that are too
       // similar, and produces warnings if it is called to often. We do not care
       // about that here, so we do this workaround. If we where to call the
       // aligner within a millisecond, we instead call this, that do not update
       // the clock offset estimation. This get us timestamps without generating
       // warnings, but could generate two timestamps within a millisecond.
       capture_timestamp_ns_ =
           rtc::kNumNanosecsPerMicrosec *
           timestamp_aligner_.TranslateTimestamp(*capture_timestamp_ns /
                                                 rtc::kNumNanosecsPerMicrosec);
     }
   }
   // Derive a new level value twice per second and check if it is non-zero.
   int16_t max_abs = 0;
   RTC_DCHECK_LT(rec_stat_count_, 50);
   if (++rec_stat_count_ >= 50) {
     // Returns the largest absolute value in a signed 16-bit vector.
     max_abs = WebRtcSpl_MaxAbsValueW16(rec_buffer_.data(), rec_buffer_.size());
     rec_stat_count_ = 0;
     // Set `only_silence_recorded_` to false as soon as at least one detection
     // of a non-zero audio packet is found. It can only be restored to true
     // again by restarting the call.
     if (max_abs > 0) {
       only_silence_recorded_ = false;
     }
   }
   // Update recording stats which is used as base for periodic logging of the
   // audio input state.
   UpdateRecStats(max_abs, samples_per_channel);
   return 0;
 }

 // Hands the content of the internal recording buffer to the registered audio
 // transport via RecordedDataIsAvailable().
 //
 // Returns 0 when no transport is registered (a warning is logged) and also
 // after the transport has been called, even if the transport reported
 // failure (an error is logged). Returns -1 if the number of recording
 // channels is zero, since the frame count cannot be derived in that case.
 int32_t AudioDeviceBuffer::DeliverRecordedData() {
   if (!audio_transport_cb_) {
     RTC_LOG(LS_WARNING) << "Invalid audio transport";
     return 0;
   }
   // `rec_channels_` is zero until SetRecordingChannels() has been called with
   // a non-zero value; dividing by it below would be undefined behavior.
   if (rec_channels_ == 0) {
     RTC_LOG(LS_ERROR) << "Invalid number of recording channels";
     return -1;
   }
   const size_t frames = rec_buffer_.size() / rec_channels_;
   const size_t bytes_per_frame = rec_channels_ * sizeof(int16_t);
   // The transport writes a new mic level here; the value is not used.
   uint32_t new_mic_level_dummy = 0;
   uint32_t total_delay_ms = play_delay_ms_ + rec_delay_ms_;
   int32_t res = audio_transport_cb_->RecordedDataIsAvailable(
       rec_buffer_.data(), frames, bytes_per_frame, rec_channels_,
       rec_sample_rate_, total_delay_ms, 0, 0, typing_status_,
       new_mic_level_dummy, capture_timestamp_ns_);
   if (res == -1) {
     RTC_LOG(LS_ERROR) << "RecordedDataIsAvailable() failed";
   }
   return 0;
 }

 // Asks the registered audio transport for `samples_per_channel` frames of
 // 16-bit PCM playout audio and stores them in the internal playout buffer,
 // which is resized to `play_channels_ * samples_per_channel` samples first.
 //
 // Returns the number of samples per channel delivered by the transport.
 // Returns 0 if no transport is registered or if the number of playout
 // channels is zero.
 int32_t AudioDeviceBuffer::RequestPlayoutData(size_t samples_per_channel) {
   TRACE_EVENT1("webrtc", "AudioDeviceBuffer::RequestPlayoutData",
                "samples_per_channel", samples_per_channel);

   // The consumer can change the requested size on the fly and we therefore
   // resize the buffer accordingly. Also takes place at the first call to this
   // method.
   const size_t total_samples = play_channels_ * samples_per_channel;
   if (play_buffer_.size() != total_samples) {
     play_buffer_.SetSize(total_samples);
     RTC_LOG(LS_INFO) << "Size of playout buffer: " << play_buffer_.size();
   }

   // It is currently supported to start playout without a valid audio
   // transport object. Leads to warning and silence.
   if (!audio_transport_cb_) {
     RTC_LOG(LS_WARNING) << "Invalid audio transport";
     return 0;
   }

   // `play_channels_` is zero until SetPlayoutChannels() has been called with
   // a non-zero value; dividing by it below would be undefined behavior.
   if (play_channels_ == 0) {
     RTC_LOG(LS_ERROR) << "Invalid number of playout channels";
     return 0;
   }

   // Retrieve new 16-bit PCM audio data using the audio transport instance.
   size_t num_samples_out(0);
   int64_t elapsed_time_ms = -1;
   int64_t ntp_time_ms = -1;
   const size_t bytes_per_frame = play_channels_ * sizeof(int16_t);
   uint32_t res = audio_transport_cb_->NeedMorePlayData(
       samples_per_channel, bytes_per_frame, play_channels_, play_sample_rate_,
       play_buffer_.data(), num_samples_out, &elapsed_time_ms, &ntp_time_ms);
   if (res != 0) {
     RTC_LOG(LS_ERROR) << "NeedMorePlayData() failed";
   }

   // Derive a new level value on every 50th call (twice per second according
   // to the original comment); all other calls report a level of zero.
   int16_t max_abs = 0;
   RTC_DCHECK_LT(play_stat_count_, 50);
   if (++play_stat_count_ >= 50) {
     // Returns the largest absolute value in a signed 16-bit vector.
     max_abs =
         WebRtcSpl_MaxAbsValueW16(play_buffer_.data(), play_buffer_.size());
     play_stat_count_ = 0;
   }
   // Update playout stats which is used as base for periodic logging of the
   // audio output state.
   const size_t samples_per_channel_out = num_samples_out / play_channels_;
   UpdatePlayStats(max_abs, samples_per_channel_out);
   return static_cast<int32_t>(samples_per_channel_out);
 }

 int32_t AudioDeviceBuffer::GetPlayoutData(void* audio_buffer) {
   RTC_DCHECK_GT(play_buffer_.size(), 0);
 #ifdef AUDIO_DEVICE_PLAYS_SINUS_TONE
   const double phase_increment =
       k2Pi * 440.0 / static_cast<double>(play_sample_rate_);
   int16_t* destination_r = reinterpret_cast<int16_t*>(audio_buffer);
   if (play_channels_ == 1) {
     for (size_t i = 0; i < play_buffer_.size(); ++i) {
       destination_r[i] = static_cast<int16_t>((sin(phase_) * (1 << 14)));
       phase_ += phase_increment;
     }
   } else if (play_channels_ == 2) {
     for (size_t i = 0; i < play_buffer_.size() / 2; ++i) {
       destination_r[2 * i] = destination_r[2 * i + 1] =
           static_cast<int16_t>((sin(phase_) * (1 << 14)));
       phase_ += phase_increment;
     }
   }
 #else
   memcpy(audio_buffer, play_buffer_.data(),
          play_buffer_.size() * sizeof(int16_t));
 #endif
   // Return samples per channel or number of frames.
   return static_cast<int32_t>(play_buffer_.size() / play_channels_);
 }

 // Posts a task to the task queue that runs LogStats() in the LOG_START state.
 void AudioDeviceBuffer::StartPeriodicLogging() {
   auto start_logging = [this] { LogStats(AudioDeviceBuffer::LOG_START); };
   task_queue_->PostTask(start_logging);
 }

 // Posts a task to the task queue that runs LogStats() in the LOG_STOP state.
 void AudioDeviceBuffer::StopPeriodicLogging() {
   auto stop_logging = [this] { LogStats(AudioDeviceBuffer::LOG_STOP); };
   task_queue_->PostTask(stop_logging);
 }

 // Runs on the task queue. Depending on `state` it starts (LOG_START), stops
 // (LOG_STOP) or continues (LOG_ACTIVE) the periodic statistics logging.
 // While logging is enabled, each call takes a snapshot of the shared stats,
 // logs recording/playout rates and levels and reports sample-rate offset
 // histograms (skipping the first two rounds after a start), and finally
 // reposts itself as a delayed LOG_ACTIVE task.
 void AudioDeviceBuffer::LogStats(LogState state) {
   RTC_DCHECK_RUN_ON(task_queue_.get());
   const int64_t now_ms = rtc::TimeMillis();

   switch (state) {
     case AudioDeviceBuffer::LOG_START:
       // Reset counters at start. Nothing is logged in this state, but the
       // timer is started by posting a new (delayed) task below.
       num_stat_reports_ = 0;
       last_timer_task_time_ = now_ms;
       log_stats_ = true;
       break;
     case AudioDeviceBuffer::LOG_STOP:
       // Stop logging and posting new tasks.
       log_stats_ = false;
       break;
     default:
       // LOG_ACTIVE: keep logging unless logging was disabled while the task
       // was pending.
       break;
   }

   // Logging is disabled: add no more logs and do not repost.
   if (!log_stats_) {
     return;
   }

   const int64_t next_callback_time = now_ms + kTimerIntervalInMilliseconds;
   const int64_t elapsed_ms = rtc::TimeDiff(now_ms, last_timer_task_time_);
   last_timer_task_time_ = now_ms;

   // Copy the shared stats under the lock and restart level tracking.
   Stats snapshot;
   {
     MutexLock lock(&lock_);
     snapshot = stats_;
     stats_.max_rec_level = 0;
     stats_.max_play_level = 0;
   }

   // Cache current sample rate from atomic members.
   const uint32_t rec_sample_rate = rec_sample_rate_;
   const uint32_t play_sample_rate = play_sample_rate_;

   // Log the latest statistics but skip the first two rounds just after state
   // was set to LOG_START to ensure that we have at least one full stable
   // 10-second interval for sample-rate estimation. Hence, the first printed
   // log will be after ~20 seconds.
   ++num_stat_reports_;
   const bool should_report =
       num_stat_reports_ > 2 &&
       static_cast<size_t>(elapsed_ms) > kTimerIntervalInMilliseconds / 2;
   if (should_report) {
     // Recording side.
     const uint32_t rec_diff_samples =
         snapshot.rec_samples - last_stats_.rec_samples;
     const float rec_rate =
         rec_diff_samples / (static_cast<float>(elapsed_ms) / 1000.0);
     if (rec_sample_rate > 0 && rec_rate > 0) {
       const uint32_t rec_rate_diff_percent = static_cast<uint32_t>(
           0.5f +
           ((100.0f * std::abs(rec_rate - rec_sample_rate)) / rec_sample_rate));
       RTC_HISTOGRAM_PERCENTAGE("WebRTC.Audio.RecordSampleRateOffsetInPercent",
                                rec_rate_diff_percent);
       RTC_LOG(LS_INFO) << "[REC : " << elapsed_ms << "msec, "
                        << rec_sample_rate / 1000 << "kHz] callbacks: "
                        << snapshot.rec_callbacks - last_stats_.rec_callbacks
                        << ", samples: " << rec_diff_samples
                        << ", rate: " << static_cast<int>(rec_rate + 0.5)
                        << ", rate diff: " << rec_rate_diff_percent
                        << "%, level: " << snapshot.max_rec_level;
     }

     // Playout side.
     const uint32_t play_diff_samples =
         snapshot.play_samples - last_stats_.play_samples;
     const float play_rate =
         play_diff_samples / (static_cast<float>(elapsed_ms) / 1000.0);
     if (play_sample_rate > 0 && play_rate > 0) {
       const uint32_t play_rate_diff_percent = static_cast<uint32_t>(
           0.5f + ((100.0f * std::abs(play_rate - play_sample_rate)) /
                   play_sample_rate));
       RTC_HISTOGRAM_PERCENTAGE("WebRTC.Audio.PlayoutSampleRateOffsetInPercent",
                                play_rate_diff_percent);
       RTC_LOG(LS_INFO) << "[PLAY: " << elapsed_ms << "msec, "
                        << play_sample_rate / 1000 << "kHz] callbacks: "
                        << snapshot.play_callbacks - last_stats_.play_callbacks
                        << ", samples: " << play_diff_samples
                        << ", rate: " << static_cast<int>(play_rate + 0.5)
                        << ", rate diff: " << play_rate_diff_percent
                        << "%, level: " << snapshot.max_play_level;
     }
   }
   last_stats_ = snapshot;

   const int64_t time_to_wait_ms = next_callback_time - rtc::TimeMillis();
   RTC_DCHECK_GT(time_to_wait_ms, 0) << "Invalid timer interval";

   // Keep posting new (delayed) tasks until the state is changed to LOG_STOP.
   task_queue_->PostDelayedTask(
       [this] { LogStats(AudioDeviceBuffer::LOG_ACTIVE); },
       TimeDelta::Millis(time_to_wait_ms));
 }

 // Runs on the task queue. Resets the recording part of both the previous
 // snapshot (`last_stats_`) and the shared stats (`stats_`, under `lock_`).
 void AudioDeviceBuffer::ResetRecStats() {
   RTC_DCHECK_RUN_ON(task_queue_.get());
   last_stats_.ResetRecStats();
   {
     MutexLock lock(&lock_);
     stats_.ResetRecStats();
   }
 }

 // Runs on the task queue. Resets the playout part of both the previous
 // snapshot (`last_stats_`) and the shared stats (`stats_`, under `lock_`).
 void AudioDeviceBuffer::ResetPlayStats() {
   RTC_DCHECK_RUN_ON(task_queue_.get());
   last_stats_.ResetPlayStats();
   {
     MutexLock lock(&lock_);
     stats_.ResetPlayStats();
   }
 }

 // Under `lock_`: counts one more recording callback, adds
 // `samples_per_channel` to the recorded sample total and raises the tracked
 // maximum recording level to `max_abs` if it is larger.
 void AudioDeviceBuffer::UpdateRecStats(int16_t max_abs,
                                        size_t samples_per_channel) {
   MutexLock lock(&lock_);
   stats_.rec_samples += samples_per_channel;
   ++stats_.rec_callbacks;
   const bool new_peak = max_abs > stats_.max_rec_level;
   if (new_peak) {
     stats_.max_rec_level = max_abs;
   }
 }

 // Under `lock_`: counts one more playout callback, adds
 // `samples_per_channel` to the played sample total and raises the tracked
 // maximum playout level to `max_abs` if it is larger.
 void AudioDeviceBuffer::UpdatePlayStats(int16_t max_abs,
                                         size_t samples_per_channel) {
   MutexLock lock(&lock_);
   stats_.play_samples += samples_per_channel;
   ++stats_.play_callbacks;
   const bool new_peak = max_abs > stats_.max_play_level;
   if (new_peak) {
     stats_.max_play_level = max_abs;
   }
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_device/audio_device_buffer.h"

	#include <string.h>

	#include <cmath>
	#include <cstddef>
	#include <cstdint>

	#include "common_audio/signal_processing/include/signal_processing_library.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/logging.h"
	#include "rtc_base/time_utils.h"
	#include "rtc_base/trace_event.h"
	#include "system_wrappers/include/metrics.h"

	namespace webrtc {

	// Name handed to the task queue factory when the AudioDeviceBuffer
	// constructor creates its task queue.
	static const char kTimerQueueName[] = "AudioDeviceBufferTimer";

	// Time between two successive calls to LogStats().
	static const size_t kTimerIntervalInSeconds = 10;
	static const size_t kTimerIntervalInMilliseconds =
	kTimerIntervalInSeconds * rtc::kNumMillisecsPerSec;
	// Min time required to qualify an audio session as a "call". If playout or
	// recording has been active for less than this time we will not store any
	// logs or UMA stats but instead consider the call as too short.
	static const size_t kMinValidCallTimeTimeInSeconds = 10;
	static const size_t kMinValidCallTimeTimeInMilliseconds =
	kMinValidCallTimeTimeInSeconds * rtc::kNumMillisecsPerSec;
	#ifdef AUDIO_DEVICE_PLAYS_SINUS_TONE
	// 2 * pi. Only compiled when AUDIO_DEVICE_PLAYS_SINUS_TONE is defined.
	static const double k2Pi = 6.28318530717959;
	#endif

	// Constructs the buffer with no audio transport registered, zeroed sample
	// rates, channel counts, delays and statistics counters, and with both
	// playout and recording marked as inactive.
	//
	// `task_queue_factory` is used to create the task queue (named
	// kTimerQueueName) that the posted stats/logging tasks run on.
	// If `create_detached` is true, `main_thread_checker_` is detached.
	AudioDeviceBuffer::AudioDeviceBuffer(TaskQueueFactory* task_queue_factory,
	bool create_detached)
	: task_queue_(task_queue_factory->CreateTaskQueue(
	kTimerQueueName,
	TaskQueueFactory::Priority::NORMAL)),
	audio_transport_cb_(nullptr),
	rec_sample_rate_(0),
	play_sample_rate_(0),
	rec_channels_(0),
	play_channels_(0),
	playing_(false),
	recording_(false),
	typing_status_(false),
	play_delay_ms_(0),
	rec_delay_ms_(0),
	num_stat_reports_(0),
	last_timer_task_time_(0),
	rec_stat_count_(0),
	play_stat_count_(0),
	play_start_time_(0),
	only_silence_recorded_(true),
	log_stats_(false) {
	RTC_LOG(LS_INFO) << "AudioDeviceBuffer::ctor";
	#ifdef AUDIO_DEVICE_PLAYS_SINUS_TONE
	// Start the generated tone at phase zero and make the special build loud
	// in the logs.
	phase_ = 0.0;
	RTC_LOG(LS_WARNING) << "AUDIO_DEVICE_PLAYS_SINUS_TONE is defined!";
	#endif
	if (create_detached) {
	main_thread_checker_.Detach();
	}
	}

	// Destroys the buffer. Both playout and recording are expected (DCHECKed) to
	// be stopped already. The task queue is deleted explicitly, while the
	// `task_queue_` pointer is still valid, before any other member goes away.
	AudioDeviceBuffer::~AudioDeviceBuffer() {
	RTC_DCHECK_RUN_ON(&main_thread_checker_);
	RTC_DCHECK(!playing_);
	RTC_DCHECK(!recording_);
	RTC_LOG(LS_INFO) << "AudioDeviceBuffer::~dtor";

	// Delete, and thus stop, the task queue before deleting other members to
	// avoid races with running tasks. Even though !playing_ and !recording_
	// imply that StopPeriodicLogging was called, that stop is asynchronous and
	// may race with the AudioDeviceBuffer destructor. In particular there might
	// be a regular LogStats task that attempts to repost itself to task_queue_.
	// Thus the task queue must be deleted before the pointer to it is
	// invalidated. The std::unique_ptr destructor performs the same two
	// operations in reverse order, as it doesn't expect the member to be used
	// after its destruction has started.
	task_queue_.get_deleter()(task_queue_.get());
	// Drop ownership so the unique_ptr destructor does not delete it again.
	task_queue_.release();
	}

	// Stores `audio_callback` as the audio transport used by the buffer.
	// The transport can only be replaced while neither playout nor recording is
	// active. Returns 0 on success and -1 if media is active.
	int32_t AudioDeviceBuffer::RegisterAudioCallback(
	    AudioTransport* audio_callback) {
	  RTC_DCHECK_RUN_ON(&main_thread_checker_);
	  RTC_DLOG(LS_INFO) << __FUNCTION__;
	  // Refuse to swap the transport underneath running media.
	  if (playing_ || recording_) {
	    RTC_LOG(LS_ERROR) << "Failed to set audio transport since media was active";
	    return -1;
	  }
	  audio_transport_cb_ = audio_callback;
	  return 0;
	}

	// Marks playout as active. A repeated call while already playing is ignored.
	// Playout statistics are reset on the task queue and periodic logging is
	// started unless the recording side is already active.
	void AudioDeviceBuffer::StartPlayout() {
	  RTC_DCHECK_RUN_ON(&main_thread_checker_);
	  // TODO(henrika): replace with DCHECK(!playing_). The ADM currently tolerates
	  // Start(), Start() by ignoring the second call, although allowing only a
	  // single call would make more sense.
	  if (playing_) {
	    return;
	  }
	  RTC_DLOG(LS_INFO) << __FUNCTION__;
	  // Playout stats are owned by the task queue, so reset them there.
	  task_queue_->PostTask([this] { ResetPlayStats(); });
	  // The periodic timer is shared with recording; only kick it off when the
	  // recording side has not done so already.
	  const bool timer_already_running = recording_;
	  if (!timer_already_running) {
	    StartPeriodicLogging();
	  }
	  // State below is only touched on the main (creating) thread.
	  play_start_time_ = rtc::TimeMillis();
	  playing_ = true;
	}

	// Marks recording as active. A repeated call while already recording is
	// ignored. Recording statistics are reset on the task queue and periodic
	// logging is started unless the playout side is already active.
	void AudioDeviceBuffer::StartRecording() {
	  RTC_DCHECK_RUN_ON(&main_thread_checker_);
	  if (recording_) {
	    return;
	  }
	  RTC_DLOG(LS_INFO) << __FUNCTION__;
	  // Recording stats are owned by the task queue, so reset them there.
	  task_queue_->PostTask([this] { ResetRecStats(); });
	  // The periodic timer is shared with playout; only kick it off when the
	  // playout side has not done so already.
	  const bool timer_already_running = playing_;
	  if (!timer_already_running) {
	    StartPeriodicLogging();
	  }
	  // State below is touched on the main (creating) thread.
	  rec_start_time_ = rtc::TimeMillis();
	  recording_ = true;
	  // This flag can also be modified on the native audio thread. Resetting it
	  // here is safe because, by design, the owning ADM has not yet started the
	  // native audio recording.
	  only_silence_recorded_ = true;
	}

	// Marks playout as inactive and logs the total playout time. Does nothing if
	// playout is not active. Periodic logging is stopped when recording is not
	// active either.
	void AudioDeviceBuffer::StopPlayout() {
	  RTC_DCHECK_RUN_ON(&main_thread_checker_);
	  if (!playing_) {
	    return;
	  }
	  RTC_DLOG(LS_INFO) << __FUNCTION__;
	  playing_ = false;
	  // The timer is only needed while at least one direction is active.
	  const bool recording_still_active = recording_;
	  if (!recording_still_active) {
	    StopPeriodicLogging();
	  }
	  RTC_LOG(LS_INFO) << "total playout time: "
	                   << rtc::TimeSince(play_start_time_);
	}

	// Marks recording as inactive and logs the total recording time. Does nothing
	// if recording is not active. Periodic logging is stopped when playout is not
	// active either. For sessions longer than kMinValidCallTimeTimeInMilliseconds
	// the WebRTC.Audio.RecordedOnlyZeros histogram is updated.
	void AudioDeviceBuffer::StopRecording() {
	  RTC_DCHECK_RUN_ON(&main_thread_checker_);
	  if (!recording_) {
	    return;
	  }
	  RTC_DLOG(LS_INFO) << __FUNCTION__;
	  recording_ = false;
	  // The timer is only needed while at least one direction is active.
	  const bool playout_still_active = playing_;
	  if (!playout_still_active) {
	    StopPeriodicLogging();
	  }
	  // Report via UMA whether only zeros were recorded. Level measurements (max
	  // of absolute level) are taken twice per second, so for e.g. 10 seconds of
	  // recorded audio all 20 level estimates must be zero to report "only zeros".
	  // `only_silence_recorded_` can only be cleared on the native audio thread
	  // that drives audio capture, but by design the audio has stopped when this
	  // method is called, hence there should not be any conflicts. Also, since
	  // `only_silence_recorded_` can be affected during the complete call, the
	  // chance of a conflict with potentially one last callback is very small.
	  const size_t recorded_ms = rtc::TimeSince(rec_start_time_);
	  const bool long_enough_call =
	      recorded_ms > kMinValidCallTimeTimeInMilliseconds;
	  if (long_enough_call) {
	    const int only_zeros = static_cast<int>(only_silence_recorded_);
	    RTC_HISTOGRAM_BOOLEAN("WebRTC.Audio.RecordedOnlyZeros", only_zeros);
	    RTC_LOG(LS_INFO) << "HISTOGRAM(WebRTC.Audio.RecordedOnlyZeros): "
	                     << only_zeros;
	  }
	  RTC_LOG(LS_INFO) << "total recording time: " << recorded_ms;
	}

	// Logs and stores `fsHz` as the recording sample rate. Always returns 0.
	int32_t AudioDeviceBuffer::SetRecordingSampleRate(uint32_t fsHz) {
	  RTC_LOG(LS_INFO) << "SetRecordingSampleRate(" << fsHz << ")";

	  rec_sample_rate_ = fsHz;

	  return 0;
	}

	// Logs and stores `fsHz` as the playout sample rate. Always returns 0.
	int32_t AudioDeviceBuffer::SetPlayoutSampleRate(uint32_t fsHz) {
	  RTC_LOG(LS_INFO) << "SetPlayoutSampleRate(" << fsHz << ")";

	  play_sample_rate_ = fsHz;

	  return 0;
	}

	uint32_t AudioDeviceBuffer::RecordingSampleRate() const {
	return rec_sample_rate_;
	}

	uint32_t AudioDeviceBuffer::PlayoutSampleRate() const {
	return play_sample_rate_;
	}

	// Logs and stores `channels` as the number of recording channels.
	// Always returns 0.
	int32_t AudioDeviceBuffer::SetRecordingChannels(size_t channels) {
	  RTC_LOG(LS_INFO) << "SetRecordingChannels(" << channels << ")";

	  rec_channels_ = channels;

	  return 0;
	}

	// Logs and stores `channels` as the number of playout channels.
	// Always returns 0.
	int32_t AudioDeviceBuffer::SetPlayoutChannels(size_t channels) {
	  RTC_LOG(LS_INFO) << "SetPlayoutChannels(" << channels << ")";

	  play_channels_ = channels;

	  return 0;
	}

	size_t AudioDeviceBuffer::RecordingChannels() const {
	return rec_channels_;
	}

	// Returns the number of playout channels last stored by SetPlayoutChannels(),
	// or the constructor's initial value of 0.
	size_t AudioDeviceBuffer::PlayoutChannels() const {
	  const size_t channels = play_channels_;
	  return channels;
	}

	// Stores `typing_status`; the value is forwarded to the audio transport by
	// DeliverRecordedData(). Always returns 0.
	int32_t AudioDeviceBuffer::SetTypingStatus(bool typing_status) {
	  typing_status_ = typing_status;

	  return 0;
	}

	// Stores the playout and recording delays (in milliseconds). Their sum is
	// reported to the audio transport by DeliverRecordedData().
	void AudioDeviceBuffer::SetVQEData(int play_delay_ms, int rec_delay_ms) {
	  rec_delay_ms_ = rec_delay_ms;
	  play_delay_ms_ = play_delay_ms;
	}

	// Convenience overload for callers without a capture timestamp: forwards to
	// the three-argument SetRecordedBuffer() with std::nullopt as the timestamp.
	int32_t AudioDeviceBuffer::SetRecordedBuffer(const void* audio_buffer,
	                                             size_t samples_per_channel) {
	  const std::optional<int64_t> no_capture_timestamp = std::nullopt;
	  return SetRecordedBuffer(audio_buffer, samples_per_channel,
	                           no_capture_timestamp);
	}

	int32_t AudioDeviceBuffer::SetRecordedBuffer(
	const void* audio_buffer,
	size_t samples_per_channel,
	std::optional<int64_t> capture_timestamp_ns) {
	// Copy the complete input buffer to the local buffer.
	const size_t old_size = rec_buffer_.size();
	rec_buffer_.SetData(static_cast<const int16_t*>(audio_buffer),
	rec_channels_ * samples_per_channel);
	// Keep track of the size of the recording buffer. Only updated when the
	// size changes, which is a rare event.
	if (old_size != rec_buffer_.size()) {
	RTC_LOG(LS_INFO) << "Size of recording buffer: " << rec_buffer_.size();
	}

	if (capture_timestamp_ns) {
	int64_t align_offsync_estimation_time = rtc::TimeMicros();
	if (align_offsync_estimation_time -
	rtc::TimestampAligner::kMinFrameIntervalUs >
	align_offsync_estimation_time_) {
	align_offsync_estimation_time_ = align_offsync_estimation_time;
	capture_timestamp_ns_ =
	rtc::kNumNanosecsPerMicrosec *
	timestamp_aligner_.TranslateTimestamp(
	*capture_timestamp_ns / rtc::kNumNanosecsPerMicrosec,
	align_offsync_estimation_time);
	} else {
	// The Timestamp aligner is designed to prevent timestamps that are too
	// similar, and produces warnings if it is called to often. We do not care
	// about that here, so we do this workaround. If we where to call the
	// aligner within a millisecond, we instead call this, that do not update
	// the clock offset estimation. This get us timestamps without generating
	// warnings, but could generate two timestamps within a millisecond.
	capture_timestamp_ns_ =
	rtc::kNumNanosecsPerMicrosec *
	timestamp_aligner_.TranslateTimestamp(*capture_timestamp_ns /
	rtc::kNumNanosecsPerMicrosec);
	}
	}
	// Derive a new level value twice per second and check if it is non-zero.
	int16_t max_abs = 0;
	RTC_DCHECK_LT(rec_stat_count_, 50);
	if (++rec_stat_count_ >= 50) {
	// Returns the largest absolute value in a signed 16-bit vector.
	max_abs = WebRtcSpl_MaxAbsValueW16(rec_buffer_.data(), rec_buffer_.size());
	rec_stat_count_ = 0;
	// Set `only_silence_recorded_` to false as soon as at least one detection
	// of a non-zero audio packet is found. It can only be restored to true
	// again by restarting the call.
	if (max_abs > 0) {
	only_silence_recorded_ = false;
	}
	}
	// Update recording stats which is used as base for periodic logging of the
	// audio input state.
	UpdateRecStats(max_abs, samples_per_channel);
	return 0;
	}

	// Hands the content of the internal recording buffer to the registered audio
	// transport via RecordedDataIsAvailable().
	//
	// Returns 0 when no transport is registered (a warning is logged) and also
	// after the transport has been called, even if the transport reported
	// failure (an error is logged). Returns -1 if the number of recording
	// channels is zero, since the frame count cannot be derived in that case.
	int32_t AudioDeviceBuffer::DeliverRecordedData() {
	  if (!audio_transport_cb_) {
	    RTC_LOG(LS_WARNING) << "Invalid audio transport";
	    return 0;
	  }
	  // `rec_channels_` is zero until SetRecordingChannels() has been called with
	  // a non-zero value; dividing by it below would be undefined behavior.
	  if (rec_channels_ == 0) {
	    RTC_LOG(LS_ERROR) << "Invalid number of recording channels";
	    return -1;
	  }
	  const size_t frames = rec_buffer_.size() / rec_channels_;
	  const size_t bytes_per_frame = rec_channels_ * sizeof(int16_t);
	  // The transport writes a new mic level here; the value is not used.
	  uint32_t new_mic_level_dummy = 0;
	  uint32_t total_delay_ms = play_delay_ms_ + rec_delay_ms_;
	  int32_t res = audio_transport_cb_->RecordedDataIsAvailable(
	      rec_buffer_.data(), frames, bytes_per_frame, rec_channels_,
	      rec_sample_rate_, total_delay_ms, 0, 0, typing_status_,
	      new_mic_level_dummy, capture_timestamp_ns_);
	  if (res == -1) {
	    RTC_LOG(LS_ERROR) << "RecordedDataIsAvailable() failed";
	  }
	  return 0;
	}

	// Asks the registered audio transport for `samples_per_channel` frames of
	// 16-bit PCM playout audio and stores the result in `play_buffer_`, which is
	// resized first if the requested amount differs from its current size.
	//
	// Returns the number of frames (samples per channel) reported by the
	// transport, or 0 when no audio transport is registered.
	int32_t AudioDeviceBuffer::RequestPlayoutData(size_t samples_per_channel) {
	  TRACE_EVENT1("webrtc", "AudioDeviceBuffer::RequestPlayoutData",
	               "samples_per_channel", samples_per_channel);

	  // The consumer may request a different amount of audio on any call, so the
	  // buffer is kept in sync with the request. This also covers the very first
	  // call to this method.
	  const size_t required_size = play_channels_ * samples_per_channel;
	  if (required_size != play_buffer_.size()) {
	    play_buffer_.SetSize(required_size);
	    RTC_LOG(LS_INFO) << "Size of playout buffer: " << play_buffer_.size();
	  }

	  // Starting playout without a valid audio transport object is currently
	  // supported; it results in a warning and no data being requested.
	  if (!audio_transport_cb_) {
	    RTC_LOG(LS_WARNING) << "Invalid audio transport";
	    return 0;
	  }

	  // Pull new 16-bit PCM audio from the audio transport instance. A failure is
	  // logged but does not abort the call.
	  size_t samples_out = 0;
	  int64_t elapsed_time_ms = -1;
	  int64_t ntp_time_ms = -1;
	  const size_t frame_size_bytes = play_channels_ * sizeof(int16_t);
	  const uint32_t status = audio_transport_cb_->NeedMorePlayData(
	      samples_per_channel, frame_size_bytes, play_channels_, play_sample_rate_,
	      play_buffer_.data(), samples_out, &elapsed_time_ms, &ntp_time_ms);
	  if (status != 0) {
	    RTC_LOG(LS_ERROR) << "NeedMorePlayData() failed";
	  }

	  // Measure the peak level on every 50th call only (intended to be twice per
	  // second); all other calls report a level of 0.
	  int16_t peak_level = 0;
	  RTC_DCHECK_LT(play_stat_count_, 50);
	  if (++play_stat_count_ >= 50) {
	    // Largest absolute value in the signed 16-bit playout buffer.
	    peak_level =
	        WebRtcSpl_MaxAbsValueW16(play_buffer_.data(), play_buffer_.size());
	    play_stat_count_ = 0;
	  }

	  // Feed the playout statistics that the periodic logging of the audio output
	  // state is based on.
	  const size_t frames_out = samples_out / play_channels_;
	  UpdatePlayStats(peak_level, frames_out);
	  return static_cast<int32_t>(frames_out);
	}

	// Writes one buffer of playout audio into `audio_buffer`, which must have
	// room for `play_buffer_.size()` 16-bit samples.
	//
	// Normally the content of `play_buffer_` is copied verbatim. When
	// AUDIO_DEVICE_PLAYS_SINUS_TONE is defined, a generated 440 Hz sine tone is
	// written instead (mono and stereo only).
	//
	// Returns the number of samples per channel (frames) held by `play_buffer_`.
	int32_t AudioDeviceBuffer::GetPlayoutData(void* audio_buffer) {
	  RTC_DCHECK_GT(play_buffer_.size(), 0);
	#ifdef AUDIO_DEVICE_PLAYS_SINUS_TONE
	  // Phase advance per output frame for a 440 Hz tone at the playout rate.
	  const double phase_step =
	      k2Pi * 440.0 / static_cast<double>(play_sample_rate_);
	  int16_t* const out = static_cast<int16_t*>(audio_buffer);
	  if (play_channels_ == 1) {
	    const size_t num_samples = play_buffer_.size();
	    for (size_t n = 0; n < num_samples; ++n) {
	      out[n] = static_cast<int16_t>((sin(phase_) * (1 << 14)));
	      phase_ += phase_step;
	    }
	  } else if (play_channels_ == 2) {
	    // Interleaved stereo: the same sample goes to both channels of a frame.
	    const size_t num_frames = play_buffer_.size() / 2;
	    for (size_t frame = 0; frame < num_frames; ++frame) {
	      const int16_t sample =
	          static_cast<int16_t>((sin(phase_) * (1 << 14)));
	      out[2 * frame + 1] = sample;
	      out[2 * frame] = sample;
	      phase_ += phase_step;
	    }
	  }
	#else
	  const size_t num_bytes = play_buffer_.size() * sizeof(int16_t);
	  memcpy(audio_buffer, play_buffer_.data(), num_bytes);
	#endif
	  // Samples per channel, i.e. the number of frames.
	  return static_cast<int32_t>(play_buffer_.size() / play_channels_);
	}

	void AudioDeviceBuffer::StartPeriodicLogging() {
	task_queue_->PostTask([this] { LogStats(AudioDeviceBuffer::LOG_START); });
	}

	void AudioDeviceBuffer::StopPeriodicLogging() {
	task_queue_->PostTask([this] { LogStats(AudioDeviceBuffer::LOG_STOP); });
	}

	// Periodic statistics task. Must run on `task_queue_`.
	//
	// `state` selects what happens before the regular work:
	//   LOG_START  - resets the report counter and timer reference and enables
	//                logging.
	//   LOG_STOP   - disables logging; the function returns without posting a
	//                new task, which ends the chain of delayed tasks.
	//   LOG_ACTIVE - regular timer tick; no state is changed.
	//
	// While logging is enabled, each call takes a snapshot of `stats_` (clearing
	// the peak levels), optionally reports sample-rate statistics for recording
	// and playout, stores the snapshot in `last_stats_` and re-posts itself as a
	// delayed LOG_ACTIVE task.
	void AudioDeviceBuffer::LogStats(LogState state) {
	  RTC_DCHECK_RUN_ON(task_queue_.get());
	  const int64_t now_ms = rtc::TimeMillis();

	  if (state == AudioDeviceBuffer::LOG_START) {
	    // Reset counters at start. Nothing is logged in this state, but the timer
	    // will be started further down by posting a new (delayed) task.
	    log_stats_ = true;
	    num_stat_reports_ = 0;
	    last_timer_task_time_ = now_ms;
	  } else if (state == AudioDeviceBuffer::LOG_STOP) {
	    // Stop logging and posting new tasks.
	    log_stats_ = false;
	  }
	  // LOG_ACTIVE needs no update: logging simply continues unless it was
	  // disabled while this task was waiting in the queue.

	  if (!log_stats_) {
	    // We are in STOP mode: add no more logs and post no further task.
	    return;
	  }

	  const int64_t next_deadline_ms = now_ms + kTimerIntervalInMilliseconds;
	  const int64_t elapsed_ms = rtc::TimeDiff(now_ms, last_timer_task_time_);
	  last_timer_task_time_ = now_ms;

	  // Copy the shared stats under the lock and restart peak-level tracking for
	  // the next interval.
	  Stats snapshot;
	  {
	    MutexLock lock(&lock_);
	    snapshot = stats_;
	    stats_.max_rec_level = 0;
	    stats_.max_play_level = 0;
	  }

	  // Cache current sample rate from atomic members.
	  const uint32_t rec_sample_rate = rec_sample_rate_;
	  const uint32_t play_sample_rate = play_sample_rate_;

	  // Report the latest statistics, but skip the first two rounds right after
	  // LOG_START so that at least one full, stable 10-second interval is
	  // available for the sample-rate estimate. The first printed log therefore
	  // appears after ~20 seconds. Rounds that ran much too early (at most half
	  // the timer interval since the previous one) are skipped as well.
	  if (++num_stat_reports_ > 2 &&
	      static_cast<size_t>(elapsed_ms) > kTimerIntervalInMilliseconds / 2) {
	    // Length of the measurement interval in seconds.
	    const double elapsed_sec = static_cast<float>(elapsed_ms) / 1000.0;

	    // Recording side: measured sample rate versus the configured one.
	    {
	      const uint32_t rec_samples_delta =
	          snapshot.rec_samples - last_stats_.rec_samples;
	      const float measured_rate = rec_samples_delta / elapsed_sec;
	      if (rec_sample_rate > 0 && measured_rate > 0) {
	        // Absolute deviation in percent, rounded to the nearest integer.
	        const uint32_t offset_percent = static_cast<uint32_t>(
	            0.5f + ((100.0f * std::abs(measured_rate - rec_sample_rate)) /
	                    rec_sample_rate));
	        RTC_HISTOGRAM_PERCENTAGE("WebRTC.Audio.RecordSampleRateOffsetInPercent",
	                                 offset_percent);
	        RTC_LOG(LS_INFO) << "[REC : " << elapsed_ms << "msec, "
	                         << rec_sample_rate / 1000 << "kHz] callbacks: "
	                         << snapshot.rec_callbacks - last_stats_.rec_callbacks
	                         << ", "
	                            "samples: "
	                         << rec_samples_delta
	                         << ", "
	                            "rate: "
	                         << static_cast<int>(measured_rate + 0.5)
	                         << ", "
	                            "rate diff: "
	                         << offset_percent
	                         << "%, "
	                            "level: "
	                         << snapshot.max_rec_level;
	      }
	    }

	    // Playout side: same computation based on the playout counters.
	    {
	      const uint32_t play_samples_delta =
	          snapshot.play_samples - last_stats_.play_samples;
	      const float measured_rate = play_samples_delta / elapsed_sec;
	      if (play_sample_rate > 0 && measured_rate > 0) {
	        const uint32_t offset_percent = static_cast<uint32_t>(
	            0.5f + ((100.0f * std::abs(measured_rate - play_sample_rate)) /
	                    play_sample_rate));
	        RTC_HISTOGRAM_PERCENTAGE(
	            "WebRTC.Audio.PlayoutSampleRateOffsetInPercent", offset_percent);
	        RTC_LOG(LS_INFO) << "[PLAY: " << elapsed_ms << "msec, "
	                         << play_sample_rate / 1000 << "kHz] callbacks: "
	                         << snapshot.play_callbacks - last_stats_.play_callbacks
	                         << ", "
	                            "samples: "
	                         << play_samples_delta
	                         << ", "
	                            "rate: "
	                         << static_cast<int>(measured_rate + 0.5)
	                         << ", "
	                            "rate diff: "
	                         << offset_percent
	                         << "%, "
	                            "level: "
	                         << snapshot.max_play_level;
	      }
	    }
	  }
	  last_stats_ = snapshot;

	  // Compensate for the time spent in this function so that the next round
	  // starts one timer interval after this one started.
	  const int64_t delay_ms = next_deadline_ms - rtc::TimeMillis();
	  RTC_DCHECK_GT(delay_ms, 0) << "Invalid timer interval";

	  // Keep posting new (delayed) tasks until the state is changed to LOG_STOP.
	  task_queue_->PostDelayedTask(
	      [this] { AudioDeviceBuffer::LogStats(AudioDeviceBuffer::LOG_ACTIVE); },
	      TimeDelta::Millis(delay_ms));
	}

	// Calls ResetRecStats() on both the previously stored snapshot
	// (`last_stats_`) and the live statistics (`stats_`). Must run on
	// `task_queue_`; `stats_` is only touched while `lock_` is held.
	void AudioDeviceBuffer::ResetRecStats() {
	  RTC_DCHECK_RUN_ON(task_queue_.get());
	  last_stats_.ResetRecStats();
	  {
	    MutexLock lock(&lock_);
	    stats_.ResetRecStats();
	  }
	}

	// Calls ResetPlayStats() on both the previously stored snapshot
	// (`last_stats_`) and the live statistics (`stats_`). Must run on
	// `task_queue_`; `stats_` is only touched while `lock_` is held.
	void AudioDeviceBuffer::ResetPlayStats() {
	  RTC_DCHECK_RUN_ON(task_queue_.get());
	  last_stats_.ResetPlayStats();
	  {
	    MutexLock lock(&lock_);
	    stats_.ResetPlayStats();
	  }
	}

	// Accounts for one recording callback in `stats_` while holding `lock_`:
	// adds `samples_per_channel` to the running sample count, increments the
	// callback counter and raises the stored peak level if `max_abs` exceeds it.
	void AudioDeviceBuffer::UpdateRecStats(int16_t max_abs,
	                                       size_t samples_per_channel) {
	  MutexLock lock(&lock_);
	  stats_.rec_samples += samples_per_channel;
	  ++stats_.rec_callbacks;
	  // Only ever raise the peak here.
	  if (stats_.max_rec_level < max_abs) {
	    stats_.max_rec_level = max_abs;
	  }
	}

	// Accounts for one playout callback in `stats_` while holding `lock_`:
	// adds `samples_per_channel` to the running sample count, increments the
	// callback counter and raises the stored peak level if `max_abs` exceeds it.
	void AudioDeviceBuffer::UpdatePlayStats(int16_t max_abs,
	                                        size_t samples_per_channel) {
	  MutexLock lock(&lock_);
	  stats_.play_samples += samples_per_channel;
	  ++stats_.play_callbacks;
	  // Only ever raise the peak here.
	  if (stats_.max_play_level < max_abs) {
	    stats_.max_play_level = max_abs;
	  }
	}

	} // namespace webrtc