modules/audio_coding/codecs/red/audio_encoder_copy_red.cc - src/ - Git at Google

 /*
  *  Copyright (c) 2014 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/audio_coding/codecs/red/audio_encoder_copy_red.h"

 #include <string.h>

 #include <utility>
 #include <vector>

 #include "absl/strings/string_view.h"
 #include "rtc_base/byte_order.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/logging.h"

 namespace webrtc {
 static constexpr const int kRedMaxPacketSize =
     1 << 10;  // RED packets must be less than 1024 bytes to fit the 10 bit
               // block length.
 static constexpr const size_t kRedMaxTimestampDelta =
     1 << 14;  // RED packets can encode a timestamp delta of 14 bits.
 static constexpr const size_t kAudioMaxRtpPacketLen =
     1200;  // The typical MTU is 1200 bytes.

 static constexpr size_t kRedHeaderLength = 4;  // 4 bytes RED header.
 static constexpr size_t kRedLastHeaderLength =
     1;  // reduced size for last RED header.

 static constexpr size_t kRedNumberOfRedundantEncodings =
     1;  // The level of redundancy we support.

 AudioEncoderCopyRed::Config::Config() = default;
 AudioEncoderCopyRed::Config::Config(Config&&) = default;
 AudioEncoderCopyRed::Config::~Config() = default;

 size_t GetMaxRedundancyFromFieldTrial(const FieldTrialsView& field_trials) {
   const std::string red_trial =
       field_trials.Lookup("WebRTC-Audio-Red-For-Opus");
   size_t redundancy = 0;
   if (sscanf(red_trial.c_str(), "Enabled-%zu", &redundancy) != 1 ||
       redundancy > 9) {
     return kRedNumberOfRedundantEncodings;
   }
   return redundancy;
 }

 AudioEncoderCopyRed::AudioEncoderCopyRed(Config&& config,
                                          const FieldTrialsView& field_trials)
     : speech_encoder_(std::move(config.speech_encoder)),
       primary_encoded_(0, kAudioMaxRtpPacketLen),
       max_packet_length_(kAudioMaxRtpPacketLen),
       red_payload_type_(config.payload_type) {
   RTC_CHECK(speech_encoder_) << "Speech encoder not provided.";

   auto number_of_redundant_encodings =
       GetMaxRedundancyFromFieldTrial(field_trials);
   for (size_t i = 0; i < number_of_redundant_encodings; i++) {
     std::pair<EncodedInfo, rtc::Buffer> redundant;
     redundant.second.EnsureCapacity(kAudioMaxRtpPacketLen);
     redundant_encodings_.push_front(std::move(redundant));
   }
 }

 AudioEncoderCopyRed::~AudioEncoderCopyRed() = default;

 int AudioEncoderCopyRed::SampleRateHz() const {
   return speech_encoder_->SampleRateHz();
 }

 size_t AudioEncoderCopyRed::NumChannels() const {
   return speech_encoder_->NumChannels();
 }

 int AudioEncoderCopyRed::RtpTimestampRateHz() const {
   return speech_encoder_->RtpTimestampRateHz();
 }

 size_t AudioEncoderCopyRed::Num10MsFramesInNextPacket() const {
   return speech_encoder_->Num10MsFramesInNextPacket();
 }

 size_t AudioEncoderCopyRed::Max10MsFramesInAPacket() const {
   return speech_encoder_->Max10MsFramesInAPacket();
 }

 int AudioEncoderCopyRed::GetTargetBitrate() const {
   return speech_encoder_->GetTargetBitrate();
 }

 AudioEncoder::EncodedInfo AudioEncoderCopyRed::EncodeImpl(
     uint32_t rtp_timestamp,
     rtc::ArrayView<const int16_t> audio,
     rtc::Buffer* encoded) {
   primary_encoded_.Clear();
   EncodedInfo info =
       speech_encoder_->Encode(rtp_timestamp, audio, &primary_encoded_);
   RTC_CHECK(info.redundant.empty()) << "Cannot use nested redundant encoders.";
   RTC_DCHECK_EQ(primary_encoded_.size(), info.encoded_bytes);

   if (info.encoded_bytes == 0) {
     return info;
   }
   if (info.encoded_bytes >= kRedMaxPacketSize) {
     // Fallback to the primary encoding if the encoded size is more than
     // what RED can encode as redundancy (1024 bytes). This can happen with
     // Opus stereo at the highest bitrate which consumes up to 1276 bytes.
     encoded->AppendData(primary_encoded_);
     return info;
   }
   RTC_DCHECK_GT(max_packet_length_, info.encoded_bytes);

   size_t header_length_bytes = kRedLastHeaderLength;
   size_t bytes_available = max_packet_length_ - info.encoded_bytes;
   auto it = redundant_encodings_.begin();

   // Determine how much redundancy we can fit into our packet by
   // iterating forward. This is determined both by the length as well
   // as the timestamp difference. The latter can occur with opus DTX which
   // has timestamp gaps of 400ms which exceeds REDs timestamp delta field size.
   for (; it != redundant_encodings_.end(); it++) {
     if (bytes_available < kRedHeaderLength + it->first.encoded_bytes) {
       break;
     }
     if (it->first.encoded_bytes == 0) {
       break;
     }
     if (rtp_timestamp - it->first.encoded_timestamp >= kRedMaxTimestampDelta) {
       break;
     }
     bytes_available -= kRedHeaderLength + it->first.encoded_bytes;
     header_length_bytes += kRedHeaderLength;
   }

   // Allocate room for RFC 2198 header.
   encoded->SetSize(header_length_bytes);

   // Iterate backwards and append the data.
   size_t header_offset = 0;
   while (it-- != redundant_encodings_.begin()) {
     encoded->AppendData(it->second);

     const uint32_t timestamp_delta =
         info.encoded_timestamp - it->first.encoded_timestamp;
     encoded->data()[header_offset] = it->first.payload_type | 0x80;
     rtc::SetBE16(static_cast<uint8_t*>(encoded->data()) + header_offset + 1,
                  (timestamp_delta << 2) | (it->first.encoded_bytes >> 8));
     encoded->data()[header_offset + 3] = it->first.encoded_bytes & 0xff;
     header_offset += kRedHeaderLength;
     info.redundant.push_back(it->first);
   }

   // `info` will be implicitly cast to an EncodedInfoLeaf struct, effectively
   // discarding the (empty) vector of redundant information. This is
   // intentional.
   if (header_length_bytes > kRedHeaderLength) {
     info.redundant.push_back(info);
     RTC_DCHECK_EQ(info.speech,
                   info.redundant[info.redundant.size() - 1].speech);
   }

   encoded->AppendData(primary_encoded_);
   RTC_DCHECK_EQ(header_offset, header_length_bytes - 1);
   encoded->data()[header_offset] = info.payload_type;

   // Shift the redundant encodings.
   auto rit = redundant_encodings_.rbegin();
   for (auto next = std::next(rit); next != redundant_encodings_.rend();
        rit++, next = std::next(rit)) {
     rit->first = next->first;
     rit->second.SetData(next->second);
   }
   it = redundant_encodings_.begin();
   if (it != redundant_encodings_.end()) {
     it->first = info;
     it->second.SetData(primary_encoded_);
   }

   // Update main EncodedInfo.
   info.payload_type = red_payload_type_;
   info.encoded_bytes = encoded->size();
   return info;
 }

 void AudioEncoderCopyRed::Reset() {
   speech_encoder_->Reset();
   auto number_of_redundant_encodings = redundant_encodings_.size();
   redundant_encodings_.clear();
   for (size_t i = 0; i < number_of_redundant_encodings; i++) {
     std::pair<EncodedInfo, rtc::Buffer> redundant;
     redundant.second.EnsureCapacity(kAudioMaxRtpPacketLen);
     redundant_encodings_.push_front(std::move(redundant));
   }
 }

 bool AudioEncoderCopyRed::SetFec(bool enable) {
   return speech_encoder_->SetFec(enable);
 }

 bool AudioEncoderCopyRed::SetDtx(bool enable) {
   return speech_encoder_->SetDtx(enable);
 }

 bool AudioEncoderCopyRed::GetDtx() const {
   return speech_encoder_->GetDtx();
 }

 bool AudioEncoderCopyRed::SetApplication(Application application) {
   return speech_encoder_->SetApplication(application);
 }

 void AudioEncoderCopyRed::SetMaxPlaybackRate(int frequency_hz) {
   speech_encoder_->SetMaxPlaybackRate(frequency_hz);
 }

 bool AudioEncoderCopyRed::EnableAudioNetworkAdaptor(
     const std::string& config_string,
     RtcEventLog* event_log) {
   return speech_encoder_->EnableAudioNetworkAdaptor(config_string, event_log);
 }

 void AudioEncoderCopyRed::DisableAudioNetworkAdaptor() {
   speech_encoder_->DisableAudioNetworkAdaptor();
 }

 void AudioEncoderCopyRed::OnReceivedUplinkPacketLossFraction(
     float uplink_packet_loss_fraction) {
   speech_encoder_->OnReceivedUplinkPacketLossFraction(
       uplink_packet_loss_fraction);
 }

 void AudioEncoderCopyRed::OnReceivedUplinkBandwidth(
     int target_audio_bitrate_bps,
     absl::optional<int64_t> bwe_period_ms) {
   speech_encoder_->OnReceivedUplinkBandwidth(target_audio_bitrate_bps,
                                              bwe_period_ms);
 }

 void AudioEncoderCopyRed::OnReceivedUplinkAllocation(
     BitrateAllocationUpdate update) {
   speech_encoder_->OnReceivedUplinkAllocation(update);
 }

 absl::optional<std::pair<TimeDelta, TimeDelta>>
 AudioEncoderCopyRed::GetFrameLengthRange() const {
   return speech_encoder_->GetFrameLengthRange();
 }

 void AudioEncoderCopyRed::OnReceivedRtt(int rtt_ms) {
   speech_encoder_->OnReceivedRtt(rtt_ms);
 }

 void AudioEncoderCopyRed::OnReceivedOverhead(size_t overhead_bytes_per_packet) {
   max_packet_length_ = kAudioMaxRtpPacketLen - overhead_bytes_per_packet;
   return speech_encoder_->OnReceivedOverhead(overhead_bytes_per_packet);
 }

 void AudioEncoderCopyRed::SetReceiverFrameLengthRange(int min_frame_length_ms,
                                                       int max_frame_length_ms) {
   return speech_encoder_->SetReceiverFrameLengthRange(min_frame_length_ms,
                                                       max_frame_length_ms);
 }

 ANAStats AudioEncoderCopyRed::GetANAStats() const {
   return speech_encoder_->GetANAStats();
 }

 rtc::ArrayView<std::unique_ptr<AudioEncoder>>
 AudioEncoderCopyRed::ReclaimContainedEncoders() {
   return rtc::ArrayView<std::unique_ptr<AudioEncoder>>(&speech_encoder_, 1);
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2014 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/audio_coding/codecs/red/audio_encoder_copy_red.h"

	#include <string.h>

	#include <utility>
	#include <vector>

	#include "absl/strings/string_view.h"
	#include "rtc_base/byte_order.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/logging.h"

	namespace webrtc {
	static constexpr const int kRedMaxPacketSize =
	1 << 10; // RED packets must be less than 1024 bytes to fit the 10 bit
	// block length.
	static constexpr const size_t kRedMaxTimestampDelta =
	1 << 14; // RED packets can encode a timestamp delta of 14 bits.
	static constexpr const size_t kAudioMaxRtpPacketLen =
	1200; // The typical MTU is 1200 bytes.

	static constexpr size_t kRedHeaderLength = 4; // 4 bytes RED header.
	static constexpr size_t kRedLastHeaderLength =
	1; // reduced size for last RED header.

	static constexpr size_t kRedNumberOfRedundantEncodings =
	1; // The level of redundancy we support.

	AudioEncoderCopyRed::Config::Config() = default;
	AudioEncoderCopyRed::Config::Config(Config&&) = default;
	AudioEncoderCopyRed::Config::~Config() = default;

	size_t GetMaxRedundancyFromFieldTrial(const FieldTrialsView& field_trials) {
	const std::string red_trial =
	field_trials.Lookup("WebRTC-Audio-Red-For-Opus");
	size_t redundancy = 0;
	if (sscanf(red_trial.c_str(), "Enabled-%zu", &redundancy) != 1 \|\|
	redundancy > 9) {
	return kRedNumberOfRedundantEncodings;
	}
	return redundancy;
	}

	AudioEncoderCopyRed::AudioEncoderCopyRed(Config&& config,
	const FieldTrialsView& field_trials)
	: speech_encoder_(std::move(config.speech_encoder)),
	primary_encoded_(0, kAudioMaxRtpPacketLen),
	max_packet_length_(kAudioMaxRtpPacketLen),
	red_payload_type_(config.payload_type) {
	RTC_CHECK(speech_encoder_) << "Speech encoder not provided.";

	auto number_of_redundant_encodings =
	GetMaxRedundancyFromFieldTrial(field_trials);
	for (size_t i = 0; i < number_of_redundant_encodings; i++) {
	std::pair<EncodedInfo, rtc::Buffer> redundant;
	redundant.second.EnsureCapacity(kAudioMaxRtpPacketLen);
	redundant_encodings_.push_front(std::move(redundant));
	}
	}

	AudioEncoderCopyRed::~AudioEncoderCopyRed() = default;

	int AudioEncoderCopyRed::SampleRateHz() const {
	return speech_encoder_->SampleRateHz();
	}

	size_t AudioEncoderCopyRed::NumChannels() const {
	return speech_encoder_->NumChannels();
	}

	int AudioEncoderCopyRed::RtpTimestampRateHz() const {
	return speech_encoder_->RtpTimestampRateHz();
	}

	size_t AudioEncoderCopyRed::Num10MsFramesInNextPacket() const {
	return speech_encoder_->Num10MsFramesInNextPacket();
	}

	size_t AudioEncoderCopyRed::Max10MsFramesInAPacket() const {
	return speech_encoder_->Max10MsFramesInAPacket();
	}

	int AudioEncoderCopyRed::GetTargetBitrate() const {
	return speech_encoder_->GetTargetBitrate();
	}

	AudioEncoder::EncodedInfo AudioEncoderCopyRed::EncodeImpl(
	uint32_t rtp_timestamp,
	rtc::ArrayView<const int16_t> audio,
	rtc::Buffer* encoded) {
	primary_encoded_.Clear();
	EncodedInfo info =
	speech_encoder_->Encode(rtp_timestamp, audio, &primary_encoded_);
	RTC_CHECK(info.redundant.empty()) << "Cannot use nested redundant encoders.";
	RTC_DCHECK_EQ(primary_encoded_.size(), info.encoded_bytes);

	if (info.encoded_bytes == 0) {
	return info;
	}
	if (info.encoded_bytes >= kRedMaxPacketSize) {
	// Fallback to the primary encoding if the encoded size is more than
	// what RED can encode as redundancy (1024 bytes). This can happen with
	// Opus stereo at the highest bitrate which consumes up to 1276 bytes.
	encoded->AppendData(primary_encoded_);
	return info;
	}
	RTC_DCHECK_GT(max_packet_length_, info.encoded_bytes);

	size_t header_length_bytes = kRedLastHeaderLength;
	size_t bytes_available = max_packet_length_ - info.encoded_bytes;
	auto it = redundant_encodings_.begin();

	// Determine how much redundancy we can fit into our packet by
	// iterating forward. This is determined both by the length as well
	// as the timestamp difference. The latter can occur with opus DTX which
	// has timestamp gaps of 400ms which exceeds REDs timestamp delta field size.
	for (; it != redundant_encodings_.end(); it++) {
	if (bytes_available < kRedHeaderLength + it->first.encoded_bytes) {
	break;
	}
	if (it->first.encoded_bytes == 0) {
	break;
	}
	if (rtp_timestamp - it->first.encoded_timestamp >= kRedMaxTimestampDelta) {
	break;
	}
	bytes_available -= kRedHeaderLength + it->first.encoded_bytes;
	header_length_bytes += kRedHeaderLength;
	}

	// Allocate room for RFC 2198 header.
	encoded->SetSize(header_length_bytes);

	// Iterate backwards and append the data.
	size_t header_offset = 0;
	while (it-- != redundant_encodings_.begin()) {
	encoded->AppendData(it->second);

	const uint32_t timestamp_delta =
	info.encoded_timestamp - it->first.encoded_timestamp;
	encoded->data()[header_offset] = it->first.payload_type \| 0x80;
	rtc::SetBE16(static_cast<uint8_t*>(encoded->data()) + header_offset + 1,
	(timestamp_delta << 2) \| (it->first.encoded_bytes >> 8));
	encoded->data()[header_offset + 3] = it->first.encoded_bytes & 0xff;
	header_offset += kRedHeaderLength;
	info.redundant.push_back(it->first);
	}

	// `info` will be implicitly cast to an EncodedInfoLeaf struct, effectively
	// discarding the (empty) vector of redundant information. This is
	// intentional.
	if (header_length_bytes > kRedHeaderLength) {
	info.redundant.push_back(info);
	RTC_DCHECK_EQ(info.speech,
	info.redundant[info.redundant.size() - 1].speech);
	}

	encoded->AppendData(primary_encoded_);
	RTC_DCHECK_EQ(header_offset, header_length_bytes - 1);
	encoded->data()[header_offset] = info.payload_type;

	// Shift the redundant encodings.
	auto rit = redundant_encodings_.rbegin();
	for (auto next = std::next(rit); next != redundant_encodings_.rend();
	rit++, next = std::next(rit)) {
	rit->first = next->first;
	rit->second.SetData(next->second);
	}
	it = redundant_encodings_.begin();
	if (it != redundant_encodings_.end()) {
	it->first = info;
	it->second.SetData(primary_encoded_);
	}

	// Update main EncodedInfo.
	info.payload_type = red_payload_type_;
	info.encoded_bytes = encoded->size();
	return info;
	}

	void AudioEncoderCopyRed::Reset() {
	speech_encoder_->Reset();
	auto number_of_redundant_encodings = redundant_encodings_.size();
	redundant_encodings_.clear();
	for (size_t i = 0; i < number_of_redundant_encodings; i++) {
	std::pair<EncodedInfo, rtc::Buffer> redundant;
	redundant.second.EnsureCapacity(kAudioMaxRtpPacketLen);
	redundant_encodings_.push_front(std::move(redundant));
	}
	}

	bool AudioEncoderCopyRed::SetFec(bool enable) {
	return speech_encoder_->SetFec(enable);
	}

	bool AudioEncoderCopyRed::SetDtx(bool enable) {
	return speech_encoder_->SetDtx(enable);
	}

	bool AudioEncoderCopyRed::GetDtx() const {
	return speech_encoder_->GetDtx();
	}

	bool AudioEncoderCopyRed::SetApplication(Application application) {
	return speech_encoder_->SetApplication(application);
	}

	void AudioEncoderCopyRed::SetMaxPlaybackRate(int frequency_hz) {
	speech_encoder_->SetMaxPlaybackRate(frequency_hz);
	}

	bool AudioEncoderCopyRed::EnableAudioNetworkAdaptor(
	const std::string& config_string,
	RtcEventLog* event_log) {
	return speech_encoder_->EnableAudioNetworkAdaptor(config_string, event_log);
	}

	void AudioEncoderCopyRed::DisableAudioNetworkAdaptor() {
	speech_encoder_->DisableAudioNetworkAdaptor();
	}

	void AudioEncoderCopyRed::OnReceivedUplinkPacketLossFraction(
	float uplink_packet_loss_fraction) {
	speech_encoder_->OnReceivedUplinkPacketLossFraction(
	uplink_packet_loss_fraction);
	}

	void AudioEncoderCopyRed::OnReceivedUplinkBandwidth(
	int target_audio_bitrate_bps,
	absl::optional<int64_t> bwe_period_ms) {
	speech_encoder_->OnReceivedUplinkBandwidth(target_audio_bitrate_bps,
	bwe_period_ms);
	}

	void AudioEncoderCopyRed::OnReceivedUplinkAllocation(
	BitrateAllocationUpdate update) {
	speech_encoder_->OnReceivedUplinkAllocation(update);
	}

	absl::optional<std::pair<TimeDelta, TimeDelta>>
	AudioEncoderCopyRed::GetFrameLengthRange() const {
	return speech_encoder_->GetFrameLengthRange();
	}

	void AudioEncoderCopyRed::OnReceivedRtt(int rtt_ms) {
	speech_encoder_->OnReceivedRtt(rtt_ms);
	}

	void AudioEncoderCopyRed::OnReceivedOverhead(size_t overhead_bytes_per_packet) {
	max_packet_length_ = kAudioMaxRtpPacketLen - overhead_bytes_per_packet;
	return speech_encoder_->OnReceivedOverhead(overhead_bytes_per_packet);
	}

	void AudioEncoderCopyRed::SetReceiverFrameLengthRange(int min_frame_length_ms,
	int max_frame_length_ms) {
	return speech_encoder_->SetReceiverFrameLengthRange(min_frame_length_ms,
	max_frame_length_ms);
	}

	ANAStats AudioEncoderCopyRed::GetANAStats() const {
	return speech_encoder_->GetANAStats();
	}

	rtc::ArrayView<std::unique_ptr<AudioEncoder>>
	AudioEncoderCopyRed::ReclaimContainedEncoders() {
	return rtc::ArrayView<std::unique_ptr<AudioEncoder>>(&speech_encoder_, 1);
	}

	} // namespace webrtc