// modules/audio_coding/neteq/decision_logic.h - src.git - Git at Google

 /*
  *  Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_
 #define MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_

 #include <memory>

 #include "modules/audio_coding/neteq/defines.h"
 #include "modules/audio_coding/neteq/include/neteq.h"
 #include "modules/audio_coding/neteq/tick_timer.h"
 #include "rtc_base/constructormagic.h"

 namespace webrtc {

 // Forward declarations. These types are only used through pointers and
 // references in this header, so their full definitions are not needed here.
 class BufferLevelFilter;
 class DecoderDatabase;
 class DelayManager;
 class Expand;
 class PacketBuffer;
 class SyncBuffer;
 struct Packet;

 // This is the class for the decision tree implementation. GetDecision() is
 // the main entry point; it returns the operation that should be done next.
 // NOTE(review): the collaborators handed to the constructor are stored as raw
 // pointers/references; they appear to be non-owning and would then have to
 // outlive this object -- confirm against the implementation file.
 class DecisionLogic final {
  public:
   // Static factory function. Takes exactly the same arguments as the
   // constructor below.
   // NOTE(review): ownership of the returned raw pointer is presumably passed
   // to the caller -- confirm against the implementation file.
   static DecisionLogic* Create(int fs_hz,
                                size_t output_size_samples,
                                bool disallow_time_stretching,
                                DecoderDatabase* decoder_database,
                                const PacketBuffer& packet_buffer,
                                DelayManager* delay_manager,
                                BufferLevelFilter* buffer_level_filter,
                                const TickTimer* tick_timer);

   // Limit referred to by ReinitAfterExpands().
   static const int kReinitAfterExpands = 100;
   // Limit that MaxWaitForPacket() compares |num_consecutive_expands_| to.
   static const int kMaxWaitForPacket = 10;

   // Constructor.
   DecisionLogic(int fs_hz,
                 size_t output_size_samples,
                 bool disallow_time_stretching,
                 DecoderDatabase* decoder_database,
                 const PacketBuffer& packet_buffer,
                 DelayManager* delay_manager,
                 BufferLevelFilter* buffer_level_filter,
                 const TickTimer* tick_timer);

   ~DecisionLogic();

   // Resets object to a clean state.
   void Reset();

   // Resets parts of the state. Typically done when switching codecs.
   void SoftReset();

   // Sets the sample rate and the output block size.
   void SetSampleRate(int fs_hz, size_t output_size_samples);

   // Returns the operation that should be done next. |sync_buffer| and |expand|
   // are provided for reference. |decoder_frame_length| is the number of samples
   // obtained from the last decoded frame. If there is a packet available, it
   // should be supplied in |next_packet|; otherwise it should be nullptr. The
   // mode resulting from the last call to NetEqImpl::GetAudio is supplied in
   // |prev_mode|. If there is a DTMF event to play, |play_dtmf| should be set to
   // true. |generated_noise_samples| is, judging by its name, the amount of
   // noise generated so far (TODO: confirm against the caller). The output
   // variable |reset_decoder| will be set to true if a reset is required;
   // otherwise it is left unchanged (i.e., it can remain true if it was true
   // before the call).
   Operations GetDecision(const SyncBuffer& sync_buffer,
                          const Expand& expand,
                          size_t decoder_frame_length,
                          const Packet* next_packet,
                          Modes prev_mode,
                          bool play_dtmf,
                          size_t generated_noise_samples,
                          bool* reset_decoder);

   // These methods test the |cng_state_| for different conditions.
   bool CngRfc3389On() const { return cng_state_ == kCngRfc3389On; }
   bool CngOff() const { return cng_state_ == kCngOff; }

   // Resets the |cng_state_| to kCngOff.
   void SetCngOff() { cng_state_ = kCngOff; }

   // Reports back to DecisionLogic whether the decision to do expand remains or
   // not. Note that this is necessary, since an expand decision can be changed
   // to kNormal in NetEqImpl::GetDecision if there is still enough data in the
   // sync buffer.
   void ExpandDecision(Operations operation);

   // Adds |value| to |sample_memory_|.
   void AddSampleMemory(int32_t value) { sample_memory_ += value; }

   // Accessors and mutators.
   void set_sample_memory(int32_t value) { sample_memory_ = value; }
   size_t noise_fast_forward() const { return noise_fast_forward_; }
   size_t packet_length_samples() const { return packet_length_samples_; }
   void set_packet_length_samples(size_t value) {
     packet_length_samples_ = value;
   }
   void set_prev_time_scale(bool value) { prev_time_scale_ = value; }

  private:
   // The value 5 sets maximum time-stretch rate to about 100 ms/s.
   static const int kMinTimescaleInterval = 5;

   enum CngState { kCngOff, kCngRfc3389On, kCngInternalOn };

   // Updates the |buffer_level_filter_| with the current buffer level
   // |buffer_size_packets|.
   void FilterBufferLevel(size_t buffer_size_packets, Modes prev_mode);

   // Returns the operation given that the next available packet is a comfort
   // noise payload (RFC 3389 only, not codec-internal).
   Operations CngOperation(Modes prev_mode,
                           uint32_t target_timestamp,
                           uint32_t available_timestamp,
                           size_t generated_noise_samples);

   // Returns the operation given that no packets are available (except maybe
   // a DTMF event, flagged by setting |play_dtmf| true).
   Operations NoPacket(bool play_dtmf);

   // Returns the operation to do given that the expected packet is available.
   Operations ExpectedPacketAvailable(Modes prev_mode, bool play_dtmf);

   // Returns the operation to do given that the expected packet is not
   // available, but a packet further into the future is at hand.
   Operations FuturePacketAvailable(const SyncBuffer& sync_buffer,
                                    const Expand& expand,
                                    size_t decoder_frame_length,
                                    Modes prev_mode,
                                    uint32_t target_timestamp,
                                    uint32_t available_timestamp,
                                    bool play_dtmf,
                                    size_t generated_noise_samples);

   // Checks if enough time has elapsed since the last successful timescale
   // operation was done (i.e., accelerate or preemptive expand). When no
   // countdown object exists, time-scaling is reported as allowed.
   bool TimescaleAllowed() const {
     return !timescale_countdown_ || timescale_countdown_->Finished();
   }

   // Checks if the current (filtered) buffer level is under the target level.
   bool UnderTargetLevel() const;

   // Checks if |timestamp_leap| is so long into the future that a reset due
   // to exceeding kReinitAfterExpands will be done.
   bool ReinitAfterExpands(uint32_t timestamp_leap) const;

   // Checks if we still have not done enough expands to cover the distance from
   // the last decoded packet to the next available packet, the distance being
   // conveyed in |timestamp_leap|.
   bool PacketTooEarly(uint32_t timestamp_leap) const;

   // Checks if num_consecutive_expands_ >= kMaxWaitForPacket.
   bool MaxWaitForPacket() const;

   DecoderDatabase* decoder_database_;
   const PacketBuffer& packet_buffer_;
   DelayManager* delay_manager_;
   BufferLevelFilter* buffer_level_filter_;
   const TickTimer* tick_timer_;
   // The scalar state below carries default member initializers (like
   // |noise_fast_forward_| already did) so that no member is ever left
   // indeterminate; values set by the constructor take precedence.
   int fs_mult_ = 0;
   size_t output_size_samples_ = 0;
   CngState cng_state_ = kCngOff;  // Remember if comfort noise is interrupted
                                   // by other event (e.g., DTMF).
   size_t noise_fast_forward_ = 0;
   size_t packet_length_samples_ = 0;
   int sample_memory_ = 0;
   bool prev_time_scale_ = false;
   bool disallow_time_stretching_;
   std::unique_ptr<TickTimer::Countdown> timescale_countdown_;
   int num_consecutive_expands_ = 0;
   const bool postpone_decoding_after_expand_;

   RTC_DISALLOW_COPY_AND_ASSIGN(DecisionLogic);
 };

 }  // namespace webrtc
 #endif  // MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_
	/*
	* Copyright (c) 2013 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#ifndef MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_
	#define MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_

	#include "modules/audio_coding/neteq/defines.h"
	#include "modules/audio_coding/neteq/include/neteq.h"
	#include "modules/audio_coding/neteq/tick_timer.h"
	#include "rtc_base/constructormagic.h"

	namespace webrtc {

	// Forward declarations. These types are only used through pointers and
	// references in this header, so their full definitions are not needed here.
	class BufferLevelFilter;
	class DecoderDatabase;
	class DelayManager;
	class Expand;
	class PacketBuffer;
	class SyncBuffer;
	struct Packet;

	// This is the class for the decision tree implementation. GetDecision() is
	// the main entry point; it returns the operation that should be done next.
	// NOTE(review): the collaborators handed to the constructor are stored as raw
	// pointers/references; they appear to be non-owning and would then have to
	// outlive this object -- confirm against the implementation file.
	class DecisionLogic final {
	 public:
	  // Static factory function. Takes exactly the same arguments as the
	  // constructor below.
	  // NOTE(review): ownership of the returned raw pointer is presumably passed
	  // to the caller -- confirm against the implementation file.
	  static DecisionLogic* Create(int fs_hz,
	                               size_t output_size_samples,
	                               bool disallow_time_stretching,
	                               DecoderDatabase* decoder_database,
	                               const PacketBuffer& packet_buffer,
	                               DelayManager* delay_manager,
	                               BufferLevelFilter* buffer_level_filter,
	                               const TickTimer* tick_timer);

	  // Limit referred to by ReinitAfterExpands().
	  static const int kReinitAfterExpands = 100;
	  // Limit that MaxWaitForPacket() compares |num_consecutive_expands_| to.
	  static const int kMaxWaitForPacket = 10;

	  // Constructor.
	  DecisionLogic(int fs_hz,
	                size_t output_size_samples,
	                bool disallow_time_stretching,
	                DecoderDatabase* decoder_database,
	                const PacketBuffer& packet_buffer,
	                DelayManager* delay_manager,
	                BufferLevelFilter* buffer_level_filter,
	                const TickTimer* tick_timer);

	  ~DecisionLogic();

	  // Resets object to a clean state.
	  void Reset();

	  // Resets parts of the state. Typically done when switching codecs.
	  void SoftReset();

	  // Sets the sample rate and the output block size.
	  void SetSampleRate(int fs_hz, size_t output_size_samples);

	  // Returns the operation that should be done next. |sync_buffer| and |expand|
	  // are provided for reference. |decoder_frame_length| is the number of samples
	  // obtained from the last decoded frame. If there is a packet available, it
	  // should be supplied in |next_packet|; otherwise it should be nullptr. The
	  // mode resulting from the last call to NetEqImpl::GetAudio is supplied in
	  // |prev_mode|. If there is a DTMF event to play, |play_dtmf| should be set to
	  // true. |generated_noise_samples| is, judging by its name, the amount of
	  // noise generated so far (TODO: confirm against the caller). The output
	  // variable |reset_decoder| will be set to true if a reset is required;
	  // otherwise it is left unchanged (i.e., it can remain true if it was true
	  // before the call).
	  Operations GetDecision(const SyncBuffer& sync_buffer,
	                         const Expand& expand,
	                         size_t decoder_frame_length,
	                         const Packet* next_packet,
	                         Modes prev_mode,
	                         bool play_dtmf,
	                         size_t generated_noise_samples,
	                         bool* reset_decoder);

	  // These methods test the |cng_state_| for different conditions.
	  bool CngRfc3389On() const { return cng_state_ == kCngRfc3389On; }
	  bool CngOff() const { return cng_state_ == kCngOff; }

	  // Resets the |cng_state_| to kCngOff.
	  void SetCngOff() { cng_state_ = kCngOff; }

	  // Reports back to DecisionLogic whether the decision to do expand remains or
	  // not. Note that this is necessary, since an expand decision can be changed
	  // to kNormal in NetEqImpl::GetDecision if there is still enough data in the
	  // sync buffer.
	  void ExpandDecision(Operations operation);

	  // Adds |value| to |sample_memory_|.
	  void AddSampleMemory(int32_t value) { sample_memory_ += value; }

	  // Accessors and mutators.
	  void set_sample_memory(int32_t value) { sample_memory_ = value; }
	  size_t noise_fast_forward() const { return noise_fast_forward_; }
	  size_t packet_length_samples() const { return packet_length_samples_; }
	  void set_packet_length_samples(size_t value) {
	    packet_length_samples_ = value;
	  }
	  void set_prev_time_scale(bool value) { prev_time_scale_ = value; }

	 private:
	  // The value 5 sets maximum time-stretch rate to about 100 ms/s.
	  static const int kMinTimescaleInterval = 5;

	  enum CngState { kCngOff, kCngRfc3389On, kCngInternalOn };

	  // Updates the |buffer_level_filter_| with the current buffer level
	  // |buffer_size_packets|.
	  void FilterBufferLevel(size_t buffer_size_packets, Modes prev_mode);

	  // Returns the operation given that the next available packet is a comfort
	  // noise payload (RFC 3389 only, not codec-internal).
	  Operations CngOperation(Modes prev_mode,
	                          uint32_t target_timestamp,
	                          uint32_t available_timestamp,
	                          size_t generated_noise_samples);

	  // Returns the operation given that no packets are available (except maybe
	  // a DTMF event, flagged by setting |play_dtmf| true).
	  Operations NoPacket(bool play_dtmf);

	  // Returns the operation to do given that the expected packet is available.
	  Operations ExpectedPacketAvailable(Modes prev_mode, bool play_dtmf);

	  // Returns the operation to do given that the expected packet is not
	  // available, but a packet further into the future is at hand.
	  Operations FuturePacketAvailable(const SyncBuffer& sync_buffer,
	                                   const Expand& expand,
	                                   size_t decoder_frame_length,
	                                   Modes prev_mode,
	                                   uint32_t target_timestamp,
	                                   uint32_t available_timestamp,
	                                   bool play_dtmf,
	                                   size_t generated_noise_samples);

	  // Checks if enough time has elapsed since the last successful timescale
	  // operation was done (i.e., accelerate or preemptive expand). When no
	  // countdown object exists, time-scaling is reported as allowed.
	  bool TimescaleAllowed() const {
	    return !timescale_countdown_ || timescale_countdown_->Finished();
	  }

	  // Checks if the current (filtered) buffer level is under the target level.
	  bool UnderTargetLevel() const;

	  // Checks if |timestamp_leap| is so long into the future that a reset due
	  // to exceeding kReinitAfterExpands will be done.
	  bool ReinitAfterExpands(uint32_t timestamp_leap) const;

	  // Checks if we still have not done enough expands to cover the distance from
	  // the last decoded packet to the next available packet, the distance being
	  // conveyed in |timestamp_leap|.
	  bool PacketTooEarly(uint32_t timestamp_leap) const;

	  // Checks if num_consecutive_expands_ >= kMaxWaitForPacket.
	  bool MaxWaitForPacket() const;

	  DecoderDatabase* decoder_database_;
	  const PacketBuffer& packet_buffer_;
	  DelayManager* delay_manager_;
	  BufferLevelFilter* buffer_level_filter_;
	  const TickTimer* tick_timer_;
	  // The scalar state below carries default member initializers (like
	  // |noise_fast_forward_| already did) so that no member is ever left
	  // indeterminate; values set by the constructor take precedence.
	  int fs_mult_ = 0;
	  size_t output_size_samples_ = 0;
	  CngState cng_state_ = kCngOff;  // Remember if comfort noise is interrupted
	                                  // by other event (e.g., DTMF).
	  size_t noise_fast_forward_ = 0;
	  size_t packet_length_samples_ = 0;
	  int sample_memory_ = 0;
	  bool prev_time_scale_ = false;
	  bool disallow_time_stretching_;
	  std::unique_ptr<TickTimer::Countdown> timescale_countdown_;
	  int num_consecutive_expands_ = 0;
	  const bool postpone_decoding_after_expand_;

	  RTC_DISALLOW_COPY_AND_ASSIGN(DecisionLogic);
	};

	} // namespace webrtc
	#endif // MODULES_AUDIO_CODING_NETEQ_DECISION_LOGIC_H_