webrtc/modules/audio_coding/main/source/acm_generic_codec.h - src - Git at Google

 /*
  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef WEBRTC_MODULES_AUDIO_CODING_MAIN_SOURCE_ACM_GENERIC_CODEC_H_
 #define WEBRTC_MODULES_AUDIO_CODING_MAIN_SOURCE_ACM_GENERIC_CODEC_H_

 #include "webrtc/modules/audio_coding/main/interface/audio_coding_module_typedefs.h"
 #include "webrtc/modules/audio_coding/main/source/acm_common_defs.h"
 #include "webrtc/modules/audio_coding/neteq/interface/webrtc_neteq.h"
 #include "webrtc/system_wrappers/interface/rw_lock_wrapper.h"
 #include "webrtc/system_wrappers/interface/trace.h"

 // NOTE(review): presumably the largest supported codec frame length expressed
 // in 10 ms blocks (i.e. 60 ms) -- confirm against its uses in the .cc files.
 #define MAX_FRAME_SIZE_10MSEC 6

 // forward declaration
 struct WebRtcVadInst;
 struct WebRtcCngEncInst;

 namespace webrtc {

 // forward declaration
 struct CodecInst;
 class ACMNetEQ;

 class ACMGenericCodec {
  public:
   ///////////////////////////////////////////////////////////////////////////
   // Constructor of the class
   //
   ACMGenericCodec();

   ///////////////////////////////////////////////////////////////////////////
   // Destructor of the class.
   //
   virtual ~ACMGenericCodec();

   ///////////////////////////////////////////////////////////////////////////
   // ACMGenericCodec* CreateInstance();
   // The function will be used for FEC. It is not implemented yet.
   //
   virtual ACMGenericCodec* CreateInstance() = 0;

   ///////////////////////////////////////////////////////////////////////////
   // int16_t Encode()
   // The function is called to perform an encoding of the audio stored in
   // audio buffer. An encoding is performed only if enough audio, i.e. equal
   // to the frame-size of the codec, exist. The audio frame will be processed
   // by VAD and CN/DTX if required. There are few different cases.
   //
   // A) Neither VAD nor DTX is active; the frame is encoded by the encoder.
   //
   // B) VAD is enabled but not DTX; in this case the audio is processed by VAD
   //    and encoded by the encoder. The "*encoding_type" will be either
   //    "kActiveNormalEncoded" or "kPassiveNormalEncoded" if the frame is
   //    active or passive, respectively.
   //
   // C) DTX is enabled; if the codec has internal VAD/DTX we just encode the
   //    frame by the encoder. Otherwise, the frame is passed through VAD and
   //    if identified as passive, then it will be processed by CN/DTX. If the
   //    frame is active it will be encoded by the encoder.
   //
   // This function acquires the appropriate locks and calls EncodeSafe() for
   // the actual processing.
   //
   // Outputs:
   //   -bitstream          : a buffer where bit-stream will be written to.
   //   -bitstream_len_byte : contains the length of the bit-stream in
   //                         bytes.
   //   -timestamp          : contains the RTP timestamp, this is the
   //                         sampling time of the first sample encoded
   //                         (measured in number of samples).
   //   -encoding_type      : contains the type of encoding applied on the
   //                         audio samples. The alternatives are
   //                         (c.f. acm_common_defs.h)
   //                         -kNoEncoding:
   //                            there was not enough data to encode, or
   //                            some error has happened so that we could
   //                            not do encoding.
   //                         -kActiveNormalEncoded:
   //                            the audio frame is active and encoded by
   //                            the given codec.
   //                         -kPassiveNormalEncoded:
   //                            the audio frame is passive but coded with
   //                            the given codec (NO DTX).
   //                         -kPassiveDTXWB:
   //                            The audio frame is passive and used
   //                            wide-band CN to encode.
   //                         -kPassiveDTXNB:
   //                            The audio frame is passive and used
   //                            narrow-band CN to encode.
   //
   // Return value:
   //   -1 if an error occurred, otherwise the length of the bit-stream in
   //      bytes.
   //
   int16_t Encode(uint8_t* bitstream,
                  int16_t* bitstream_len_byte,
                  uint32_t* timestamp,
                  WebRtcACMEncodingType* encoding_type);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t Decode()
   // This function is used to decode a given bit-stream, without engaging
   // NetEQ.
   //
   // This function acquires the appropriate locks and calls DecodeSafe() for
   // the actual processing. Please note that this is not functional yet.
   //
   // Inputs:
   //   -bitstream         : a buffer where bit-stream will be read.
   //   -bitstream_len_byte : the length of the bit-stream in bytes.
   //
   // Outputs:
   //   -audio              : pointer to a buffer where the audio will be
   //                         written.
   //   -audio_samples      : number of audio samples out of decoding the given
   //                         bit-stream.
   //   -speech_type        : speech type (for future use).
   //
   // Return value:
   //   -1 if failed to decode,
   //    0 if succeeded.
   //
   int16_t Decode(uint8_t* bitstream,
                  int16_t bitstream_len_byte,
                  int16_t* audio,
                  int16_t* audio_samples,
                  int8_t* speech_type);

   ///////////////////////////////////////////////////////////////////////////
   // void SplitStereoPacket()
   // This function is used to split stereo payloads into left and right
   // channels. Codecs which have stereo support have their own implementation
   // of the function; the default implementation below does nothing.
   //
   // Input/Output:
   //   -payload             : a vector with the received payload data.
   //                          The function will reorder the data so that
   //                          first half holds the left channel data, and the
   //                          second half the right channel data.
   //   -payload_length      : length of payload in bytes. Will be changed to
   //                          twice the input in case of true stereo, where
   //                          we simply copy the data and return it both for
   //                          left channel and right channel decoding.
   //
   virtual void SplitStereoPacket(uint8_t* /* payload */,
                                  int32_t* /* payload_length */) {}

   ///////////////////////////////////////////////////////////////////////////
   // bool EncoderInitialized();
   //
   // Return value:
   //   True if the encoder is successfully initialized,
   //   false otherwise.
   //
   bool EncoderInitialized();

   ///////////////////////////////////////////////////////////////////////////
   // bool DecoderInitialized();
   //
   // Return value:
   //   True if the decoder is successfully initialized,
   //   false otherwise.
   //
   bool DecoderInitialized();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t EncoderParams()
   // It is called to get encoder parameters. It will call
   // EncoderParamsSafe() in turn.
   //
   // Output:
   //   -enc_params         : a buffer where the encoder parameters are
   //                         written to. If the encoder is not
   //                         initialized this buffer is filled with
   //                         invalid values
   // Return value:
   //   -1 if the encoder is not initialized,
   //    0 otherwise.
   //
   int16_t EncoderParams(WebRtcACMCodecParams *enc_params);

   ///////////////////////////////////////////////////////////////////////////
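   // bool DecoderParams(...)
   // It is called to get decoder parameters. It will call DecoderParamsSafe()
   // in turn.
   //
   // Input:
   //   -payload_type       : payload type of the decoder whose parameters are
   //                         requested (presumably; confirm against the
   //                         implementation).
   //
   // Output:
   //   -dec_params         : a buffer where the decoder parameters are
   //                         written to. If the decoder is not initialized
   //                         this buffer is filled with invalid values
   //
   // Return value:
   //   The function returns bool, not the -1/0 codes used elsewhere in this
   //   class. NOTE(review): presumably true if the parameters were written and
   //   false if the decoder is not initialized -- confirm against the
   //   implementation.
   //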
   bool DecoderParams(WebRtcACMCodecParams *dec_params,
                      const uint8_t payload_type);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InitEncoder(...)
   // This function is called to initialize the encoder with the given
   // parameters.
   //
   // Input:
   //   -codec_params        : parameters of encoder.
   //   -force_initialization: if false the initialization is invoked only if
   //                          the encoder is not initialized. If true the
   //                          encoder is forced to (re)initialize.
   //
   // Return value:
   //   0 if could initialize successfully,
   //  -1 if failed to initialize.
   //
   //
   int16_t InitEncoder(WebRtcACMCodecParams* codec_params,
                       bool force_initialization);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InitDecoder()
   // This function is called to initialize the decoder with the given
   // parameters. (c.f. acm_common_defs.h & common_types.h for the
   // definition of the structure)
   //
   // Input:
   //   -codec_params        : parameters of decoder.
   //   -force_initialization: if false the initialization is invoked only
   //                          if the decoder is not initialized. If true
   //                          the decoder is forced to (re)initialize.
   //
   // Return value:
   //   0 if could initialize successfully,
   //  -1 if failed to initialize.
   //
   //
   int16_t InitDecoder(WebRtcACMCodecParams* codec_params,
                       bool force_initialization);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t RegisterInNetEq(...)
   // This function is called to register the decoder in NetEq, with the given
   // payload type.
   //
   // Inputs:
   //   -neteq              : pointer to NetEq Instance
   //   -codec_inst         : instance with the settings of the codec
   //
   // Return values
   //   -1 if failed to register,
   //    0 if successfully registered.
   //
   int32_t RegisterInNetEq(ACMNetEQ* neteq, const CodecInst& codec_inst);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t Add10MsData(...)
   // This function is called to add 10 ms of audio to the audio buffer of
   // the codec.
   //
   // Inputs:
   //   -timestamp          : the timestamp of the 10 ms audio. the timestamp
   //                         is the sampling time of the
   //                         first sample measured in number of samples.
   //   -data               : a buffer that contains the audio. The codec
   //                         expects to get the audio in correct sampling
   //                         frequency
   //   -length             : the length of the audio buffer
   //   -audio_channel      : 0 for mono, 1 for stereo (not supported yet)
   //
   // Return values:
   //   -1 if failed
   //    0 otherwise.
   //
   int32_t Add10MsData(const uint32_t timestamp,
                       const int16_t* data,
                       const uint16_t length,
                       const uint8_t audio_channel);

   ///////////////////////////////////////////////////////////////////////////
   // uint32_t NoMissedSamples()
   // This function returns the number of samples which are overwritten in
   // the audio buffer. The audio samples are overwritten if the input audio
   // buffer is full, but Add10MsData() is called. (We might remove this
   // function if it is not used)
   //
   // Return Value:
   //   Number of samples which are overwritten.
   //
   uint32_t NoMissedSamples() const;

   ///////////////////////////////////////////////////////////////////////////
   // void ResetNoMissedSamples()
   // This function resets the number of overwritten samples to zero.
   // (We might remove this function if we remove NoMissedSamples())
   //
   void ResetNoMissedSamples();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t SetBitRate()
   // The function is called to set the encoding rate.
   //
   // Input:
   //   -bitrate_bps        : encoding rate in bits per second
   //
   // Return value:
   //   -1 if failed to set the rate, due to invalid input or given
   //      codec is not rate-adjustable.
   //    0 if the rate is adjusted successfully
   //
   int16_t SetBitRate(const int32_t bitrate_bps);

   ///////////////////////////////////////////////////////////////////////////
   // DestructEncoderInst()
   // This API is used in conferencing. It will free the memory that is pointed
   // by |ptr_inst|. |ptr_inst| is a pointer to encoder instance, created and
   // filled up by calling EncoderInst(...).
   //
   // Inputs:
   //   -ptr_inst            : pointer to an encoder instance to be deleted.
   //
   //
   void DestructEncoderInst(void* ptr_inst);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t AudioBuffer()
   // This is used when synchronization of codecs is required. There are cases
   // where the audio buffers of two codecs have to be synched. By calling this
   // function one can get the audio buffer and other related parameters, such
   // as timestamps...
   //
   // Output:
   //   -audio_buff         : a pointer to WebRtcACMAudioBuff where the audio
   //                         buffer of this codec will be written to.
   //
   // Return value:
   //   -1 if fails to copy the audio buffer,
   //    0 if succeeded.
   //
   int16_t AudioBuffer(WebRtcACMAudioBuff& audio_buff);

   ///////////////////////////////////////////////////////////////////////////
   // uint32_t EarliestTimestamp()
   // Returns the timestamp of the first 10 ms in audio buffer. This is used
   // to identify if a synchronization of two encoders is required.
   //
   // Return value:
   //   timestamp of the first 10 ms audio in the audio buffer.
   //
   uint32_t EarliestTimestamp() const;

   ///////////////////////////////////////////////////////////////////////////
   // int16_t SetAudioBuffer()
   // This function is called to set the audio buffer and the associated
   // parameters to a given value.
   //
   // Return value:
   //   -1 if fails to copy the audio buffer,
   //    0 if succeeded.
   //
   int16_t SetAudioBuffer(WebRtcACMAudioBuff& audio_buff);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t SetVAD()
   // This is called to set VAD & DTX. If the codec has internal DTX that will
   // be used. If DTX is enabled and the codec does not have internal DTX,
   // WebRtc-VAD will be used to decide if the frame is active. If DTX is
   // disabled but VAD is enabled, the audio is passed through VAD to label it
   // as active or passive, but the frame is encoded normally. However the
   // bit-stream is labeled properly so that ACM::Process() can use this
   // information. In case of failure, the previous states of the VAD & DTX
   // are kept.
   //
   // Inputs:
   //   -enable_dtx         : if true DTX will be enabled otherwise the DTX is
   //                         disabled. If codec has internal DTX that will be
   //                         used, otherwise WebRtc-CNG is used. In the latter
   //                         case VAD is automatically activated.
   //   -enable_vad         : if true WebRtc-VAD is enabled, otherwise VAD is
   //                         disabled, except for the case that DTX is enabled
   //                         but codec doesn't have internal DTX. In this case
   //                         VAD is enabled regardless of the value of
   //                         |enable_vad|.
   //   -mode               : this specifies the aggressiveness of VAD.
   //
   // Return value
   //   -1 if failed to set DTX & VAD as specified,
   //    0 if succeeded.
   //
   int16_t SetVAD(const bool enable_dtx = true,
                  const bool enable_vad = false,
                  const ACMVADMode mode = VADNormal);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t ReplaceInternalDTX()
   // This is called to replace the codec internal DTX with WebRtc DTX.
   // This is only valid for G729 where the user has possibility to replace
   // AnnexB with WebRtc DTX. For other codecs this function has no effect.
   //
   // Input:
   //   -replace_internal_dtx : if true the internal DTX is replaced with WebRtc.
   //
   // Return value
   //   -1 if failed to replace internal DTX,
   //    0 if succeeded.
   //
   int32_t ReplaceInternalDTX(const bool replace_internal_dtx);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t IsInternalDTXReplaced()
   // This is called to check if the codec internal DTX is replaced by WebRtc
   // DTX. This is only valid for G729 where the user has possibility to replace
   // AnnexB with WebRtc DTX. For other codecs this function has no effect.
   //
   // Output:
   //   -internal_dtx_replaced: if true the internal DTX is replaced with WebRtc.
   //
   // Return value
   //   -1 if failed to check
   //    0 if succeeded.
   //
   int32_t IsInternalDTXReplaced(bool* internal_dtx_replaced);

   ///////////////////////////////////////////////////////////////////////////
   // void SetNetEqDecodeLock()
   // Hands the NetEq lock over to the codec by storing the given pointer in
   // |neteq_decode_lock_|.
   //
   // Input:
   //   -neteq_decode_lock  : pointer to the lock associated with NetEQ of ACM.
   //
   void SetNetEqDecodeLock(RWLockWrapper* neteq_decode_lock) {
     this->neteq_decode_lock_ = neteq_decode_lock;
   }

   ///////////////////////////////////////////////////////////////////////////
   // bool HasInternalDTX()
   // Reports whether this codec comes with its own (internal) DTX, as
   // recorded in |has_internal_dtx_|.
   //
   // Return value:
   //   true if the codec has an internal DTX, e.g. G729,
   //   false otherwise.
   //
   bool HasInternalDTX() const { return has_internal_dtx_; }

   ///////////////////////////////////////////////////////////////////////////
   // int32_t GetEstimatedBandwidth()
   // Used to get decoder estimated bandwidth. Only iSAC will provide a value.
   //
   //
   // Return value:
   //   -1 if fails to get decoder estimated bandwidth,
   //    >0 estimated bandwidth in bits/sec.
   //
   int32_t GetEstimatedBandwidth();

   ///////////////////////////////////////////////////////////////////////////
   // int32_t SetEstimatedBandwidth()
   // Used to set estimated bandwidth sent out of band from other side. Only
   // iSAC will have use for the value.
   //
   // Input:
   //       -estimated_bandwidth:    estimated bandwidth in bits/sec
   //
   // Return value:
   //   -1 if fails to set estimated bandwidth,
   //    0 on success.
   //
   int32_t SetEstimatedBandwidth(int32_t estimated_bandwidth);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t GetRedPayload()
   // Used to get codec specific RED payload (if such is implemented).
   // Currently only done in iSAC.
   //
   // Outputs:
   //   -red_payload       : a pointer to the data for RED payload.
   //   -payload_bytes     : number of bytes in RED payload.
   //
   // Return value:
   //   -1 if fails to get codec specific RED,
   //    0 if succeeded.
   //
   int32_t GetRedPayload(uint8_t* red_payload,
                         int16_t* payload_bytes);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t ResetEncoder()
   // By calling this function you would re-initialize the encoder with the
   // current parameters. All the settings, e.g. VAD/DTX, frame-size... should
   // remain unchanged. (In case of iSAC we don't want to lose BWE history.)
   //
   // Return value
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t ResetEncoder();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t ResetDecoder()
   // By calling this function you would re-initialize the decoder with the
   // current parameters.
   //
   // Return value
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t ResetDecoder(int16_t payload_type);

   ///////////////////////////////////////////////////////////////////////////
   // void DestructEncoder()
   // This function is called to delete the encoder instance, if possible, to
   // have a fresh start. For codecs where encoder and decoder share the same
   // instance we cannot delete the encoder and instead we will initialize the
   // encoder. We also delete VAD and DTX if they have been created.
   //
   void DestructEncoder();

   ///////////////////////////////////////////////////////////////////////////
   // void DestructDecoder()
   // This function is called to delete the decoder instance, if possible, to
   // have a fresh start. For codecs where encoder and decoder share the same
   // instance we cannot delete the decoder and instead we will initialize the
   // decoder. Before deleting decoder instance it has to be removed from the
   // NetEq list.
   //
   void DestructDecoder();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t SamplesLeftToEncode()
   // Returns the number of samples required to be able to do encoding.
   //
   // Return value:
   //   Number of samples.
   //
   int16_t SamplesLeftToEncode();

   ///////////////////////////////////////////////////////////////////////////
   // uint32_t LastEncodedTimestamp()
   // Returns the timestamp of the last frame it encoded.
   //
   // Return value:
   //   Timestamp.
   //
   uint32_t LastEncodedTimestamp() const;

   ///////////////////////////////////////////////////////////////////////////
   // SetUniqueID()
   // Set a unique ID for the codec to be used for tracing and debugging
   //
   // Input
   //   -id                 : A number to identify the codec.
   //
   void SetUniqueID(const uint32_t id);

   ///////////////////////////////////////////////////////////////////////////
   // IsAudioBufferFresh()
   // Specifies whether audio has ever been injected into this codec.
   //
   // Return value
   //   -true; no audio has been fed into this codec yet.
   //   -false; audio has already been fed to the codec.
   //
   bool IsAudioBufferFresh() const;

   ///////////////////////////////////////////////////////////////////////////
   // UpdateDecoderSampFreq()
   // For most of the codecs this function does nothing. It must be
   // implemented for those codecs where one codec instance serves as the
   // decoder for different flavors of the codec. One example is iSAC. There,
   // iSAC 16 kHz and iSAC 32 kHz are treated as two different codecs with
   // different payload types, however, there is only one iSAC instance to
   // decode. The reason for that is we would like to decode and encode with
   // the same codec instance for bandwidth estimator to work.
   //
   // Each time that we receive a new payload type, we call this function to
   // prepare the decoder associated with the new payload. Normally, decoders
   // don't have to do anything. For iSAC the decoder has to change its
   // sampling rate. The input parameter specifies the current flavor of the
   // codec in codec database. For instance, if we just got a SWB payload then
   // the input parameter is ACMCodecDB::isacswb.
   //
   // Input:
   //   -codec_id           : the ID of the codec associated with the
   //                         payload type that we just received.
   //
   // Return value:
   //    0 if succeeded in updating the decoder.
   //   -1 if failed to update.
   //
   // The default implementation below ignores |codec_id| and returns 0.
   //
   virtual int16_t UpdateDecoderSampFreq(int16_t /* codec_id */) {
     return 0;
   }

   ///////////////////////////////////////////////////////////////////////////
   // UpdateEncoderSampFreq()
   // Call this function to update the encoder sampling frequency. This
   // is for codecs where one payload-name supports several encoder sampling
   // frequencies. Otherwise, to change the sampling frequency we need to
   // register new codec. ACM will consider that as registration of a new
   // codec, not a change in parameter. For iSAC, switching from WB to SWB
   // is treated as a change in parameter. Therefore, we need this function.
   //
   // Input:
   //   -samp_freq_hz        : encoder sampling frequency.
   //
   // Return value:
   //   -1 if failed, or if this is meaningless for the given codec.
   //    0 if succeeded.
   //
   virtual int16_t UpdateEncoderSampFreq(
       uint16_t samp_freq_hz);

   ///////////////////////////////////////////////////////////////////////////
   // EncoderSampFreq()
   // Get the sampling frequency that the encoder (WebRtc wrapper) expects.
   //
   // Output:
   //   -samp_freq_hz       : sampling frequency, in Hertz, which the encoder
   //                         should be fed with.
   //
   // Return value:
   //   -1 if failed to output sampling rate.
   //    0 if the sample rate is returned successfully.
   //
   virtual int16_t EncoderSampFreq(uint16_t& samp_freq_hz);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t ConfigISACBandwidthEstimator()
   // Call this function to configure the bandwidth estimator of ISAC.
   // During the adaptation of bit-rate, iSAC automatically adjusts the
   // frame-size (either 30 or 60 ms) to save on RTP header. The initial
   // frame-size can be specified by the first argument. The configuration also
   // regards the initial estimate of bandwidths. The estimator starts from
   // this point and converges to the actual bottleneck. This is given by the
   // second parameter. Furthermore, it is also possible to control the
   // adaptation of frame-size. This is specified by the last parameter.
   //
   // Input:
   //   -init_frame_size_msec: initial frame-size in milliseconds. For iSAC-wb
   //                         30 ms and 60 ms (default) are acceptable values,
   //                         and for iSAC-swb 30 ms is the only acceptable
   //                         value. Zero indicates default value.
   //   -init_rate_bps      : initial estimate of the bandwidth. Values
   //                         between 10000 and 58000 are acceptable.
   //   -enforce_frame_size : if true, the frame-size will not be adapted.
   //
   // Return value:
   //   -1 if failed to configure the bandwidth estimator,
   //    0 if the configuration was successfully applied.
   //
   virtual int32_t ConfigISACBandwidthEstimator(
       const uint8_t init_frame_size_msec,
       const uint16_t init_rate_bps,
       const bool enforce_frame_size);

   ///////////////////////////////////////////////////////////////////////////
   // SetISACMaxPayloadSize()
   // Set the maximum payload size of iSAC packets. No iSAC payload,
   // regardless of its frame-size, may exceed the given limit. For
   // an iSAC payload of size B bits and frame-size T sec we have;
   // (B < max_payload_len_bytes * 8) and (B/T < max_rate_bit_per_sec), c.f.
   // SetISACMaxRate().
   //
   // Input:
   //   -max_payload_len_bytes : maximum payload size in bytes.
   //
   // Return value:
   //   -1 if failed to set the maximum  payload-size.
   //    0 if the given length is set successfully.
   //
   virtual int32_t SetISACMaxPayloadSize(
       const uint16_t max_payload_len_bytes);

   ///////////////////////////////////////////////////////////////////////////
   // SetISACMaxRate()
   // Set the maximum instantaneous rate of iSAC. For a payload of B bits
   // with a frame-size of T sec the instantaneous rate is B/T bits per
   // second. Therefore, (B/T < max_rate_bit_per_sec) and
   // (B < max_payload_len_bytes * 8) are always satisfied for iSAC payloads,
   // c.f SetISACMaxPayloadSize().
   //
   // Input:
   //   -max_rate_bps       : maximum instantaneous bit-rate given in bits/sec.
   //
   // Return value:
   //   -1 if failed to set the maximum rate.
   //    0 if the maximum rate is set successfully.
   //
   virtual int32_t SetISACMaxRate(const uint32_t max_rate_bps);

   ///////////////////////////////////////////////////////////////////////////
   // SaveDecoderParam()
   // Save the parameters of decoder.
   //
   // Input:
   //   -codec_params       : pointer to a structure where the parameters of
   //                         decoder are stored in.
   //
   void SaveDecoderParam(const WebRtcACMCodecParams* codec_params);

   ///////////////////////////////////////////////////////////////////////////
   // int32_t FrameSize()
   // Returns the current value of |frame_len_smpl_|.
   // NOTE(review): presumably the codec frame length in samples -- confirm
   // against where |frame_len_smpl_| is assigned.
   //
   // The accessor only reads a member, so it is const-qualified to be callable
   // through const pointers/references, in line with HasInternalDTX().
   //
   // Return value:
   //   The stored frame length.
   //
   int32_t FrameSize() const {
     return frame_len_smpl_;
   }

   void SetIsMaster(bool is_master);

   ///////////////////////////////////////////////////////////////////////////
   // REDPayloadISAC()
   // This is an iSAC-specific function. The function is called to get RED
   // payload from a default-encoder.
   //
   // Inputs:
   //   -isac_rate          : the target rate of the main payload. A RED
   //                         payload is generated according to the rate of
   //                         main payload. Note that we are not specifying the
   //                         rate of RED payload, but the main payload.
   //   -isac_bw_estimate   : bandwidth information should be inserted in
   //                         RED payload.
   //
   // Output:
   //   -payload            : pointer to a buffer where the RED payload will
   //                         be written to.
   //   -payload_len_bytes  : a place-holder to write the length of the RED
   //                         payload in Bytes.
   //
   // Return value:
   //   -1 if an error occurs, otherwise the length of the payload (in Bytes)
   //   is returned.
   //
   virtual int16_t REDPayloadISAC(const int32_t isac_rate,
                                  const int16_t isac_bw_estimate,
                                  uint8_t* payload,
                                  int16_t* payload_len_bytes);

   ///////////////////////////////////////////////////////////////////////////
   // IsTrueStereoCodec()
   // Call to see if current encoder is a true stereo codec. This function
   // should be overridden by codecs which are true stereo codecs; the default
   // implementation below returns false.
   //
   // Return value:
   //   -true  if stereo codec
   //   -false if not stereo codec.
   //
   virtual bool IsTrueStereoCodec() {
     return false;
   }

   ///////////////////////////////////////////////////////////////////////////
   // HasFrameToEncode()
   // Returns true if there is enough audio buffered for encoding, such that
   // calling Encode() will return a payload.
   //
   bool HasFrameToEncode() const;

  protected:
   ///////////////////////////////////////////////////////////////////////////
   // All the functions with FunctionNameSafe(...) contain the actual
   // implementation of FunctionName(...). FunctionName() acquires an
   // appropriate lock and calls FunctionNameSafe() to do the actual work.
   // Therefore, for the description of functionality, input/output arguments
   // and return value we refer to FunctionName()
   //

   ///////////////////////////////////////////////////////////////////////////
   // See Decode() for the description of function, input(s)/output(s) and
   // return value.
   //
   virtual int16_t DecodeSafe(uint8_t* bitstream,
                              int16_t bitstream_len_byte,
                              int16_t* audio,
                              int16_t* audio_samples,
                              int8_t* speech_type) = 0;

   ///////////////////////////////////////////////////////////////////////////
   // See Add10MsData() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Declared virtual (not pure), so the base class supplies a version for
   // codecs that do not override it.
   //
   virtual int32_t Add10MsDataSafe(const uint32_t timestamp,
                                   const int16_t* data,
                                   const uint16_t length,
                                   const uint8_t audio_channel);

   ///////////////////////////////////////////////////////////////////////////
   // See RegisterInNetEq() for the description of function,
   // input(s)/output(s) and return value.
   //
   // Pure virtual: every codec-specific subclass has to implement it.
   // |codec_def| is taken by non-const reference, |codec_inst| by const
   // reference.
   //
   virtual int32_t CodecDef(WebRtcNetEQ_CodecDef& codec_def,
                            const CodecInst& codec_inst) = 0;

   ///////////////////////////////////////////////////////////////////////////
   // See EncoderParams() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Not virtual: the same implementation is used for every codec.
   //
   int16_t EncoderParamsSafe(WebRtcACMCodecParams *enc_params);

   ///////////////////////////////////////////////////////////////////////////
   // See DecoderParams() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Note:
   // Any class where a single instance handles several flavors of the same
   // codec, and therefore has several payload types associated with that
   // instance, has to implement this function.
   //
   // Currently only iSAC is implementing it. A single iSAC instance is
   // used for decoding both WB & SWB streams. At any one moment both WB & SWB
   // can be registered as receive codecs. Hence two payloads are associated
   // with a single codec instance.
   //
   virtual bool DecoderParamsSafe(WebRtcACMCodecParams *dec_params,
                                  const uint8_t payload_type);

   ///////////////////////////////////////////////////////////////////////////
   // See ResetEncoder() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Not virtual: the same implementation is used for every codec.
   //
   int16_t ResetEncoderSafe();

   ///////////////////////////////////////////////////////////////////////////
   // See InitEncoder() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Not virtual: the codec-specific part of the initialization is done by
   // InternalInitEncoder(), which is documented as being called from here.
   //
   int16_t InitEncoderSafe(WebRtcACMCodecParams *codec_params,
                           bool force_initialization);

   ///////////////////////////////////////////////////////////////////////////
   // See InitDecoder() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Not virtual: the codec-specific part of the initialization is done by
   // InternalInitDecoder(), which is documented as being called from here.
   //
   int16_t InitDecoderSafe(WebRtcACMCodecParams *codec_params,
                           bool force_initialization);

   ///////////////////////////////////////////////////////////////////////////
   // See ResetDecoder() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Not virtual: the same implementation is used for every codec.
   //
   int16_t ResetDecoderSafe(int16_t payload_type);

   ///////////////////////////////////////////////////////////////////////////
   // See DestructEncoder() for the description of function,
   // input(s)/output(s) and return value.
   //
   // Pure virtual: every codec-specific subclass has to implement it.
   //
   virtual void DestructEncoderSafe() = 0;

   ///////////////////////////////////////////////////////////////////////////
   // See DestructDecoder() for the description of function,
   // input(s)/output(s) and return value.
   //
   // Pure virtual: every codec-specific subclass has to implement it.
   //
   virtual void DestructDecoderSafe() = 0;

   ///////////////////////////////////////////////////////////////////////////
   // See SetBitRate() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Any codec that can change the bit-rate has to implement this. The
   // method is virtual but not pure, so the base class supplies a version
   // for codecs that do not override it.
   //
   virtual int16_t SetBitRateSafe(const int32_t bitrate_bps);

   ///////////////////////////////////////////////////////////////////////////
   // See GetEstimatedBandwidth() for the description of function,
   // input(s)/output(s) and return value.
   //
   // Declared virtual (not pure), so the base class supplies a version for
   // codecs that do not override it.
   //
   virtual int32_t GetEstimatedBandwidthSafe();

   ///////////////////////////////////////////////////////////////////////////
   // See SetEstimatedBandwidth() for the description of function,
   // input(s)/output(s) and return value.
   //
   // Declared virtual (not pure), so the base class supplies a version for
   // codecs that do not override it.
   //
   virtual int32_t SetEstimatedBandwidthSafe(
       int32_t estimated_bandwidth);

   ///////////////////////////////////////////////////////////////////////////
   // See GetRedPayload() for the description of function, input(s)/output(s)
   // and return value.
   //
   // Declared virtual (not pure), so the base class supplies a version for
   // codecs that do not override it.
   //
   virtual int32_t GetRedPayloadSafe(uint8_t* red_payload,
                                     int16_t* payload_bytes);

   ///////////////////////////////////////////////////////////////////////////
   // See SetVAD() for the description of function, input(s)/output(s) and
   // return value.
   //
   // Default arguments: enable_dtx = true, enable_vad = false and
   // mode = VADNormal, so a call without arguments requests DTX only.
   //
   int16_t SetVADSafe(const bool enable_dtx = true,
                      const bool enable_vad = false,
                      const ACMVADMode mode = VADNormal);

   ///////////////////////////////////////////////////////////////////////////
   // See ReplaceInternalDTX() for the description of function, input and
   // return value.
   //
   // Declared virtual (not pure), so the base class supplies a version for
   // codecs that do not override it.
   //
   virtual int32_t ReplaceInternalDTXSafe(const bool replace_internal_dtx);

   ///////////////////////////////////////////////////////////////////////////
   // See IsInternalDTXReplaced() for the description of function, input and
   // return value.
   //
   // Declared virtual (not pure), so the base class supplies a version for
   // codecs that do not override it. |internal_dtx_replaced| is a non-const
   // pointer, presumably where the answer is written -- confirm against
   // IsInternalDTXReplaced().
   //
   virtual int32_t IsInternalDTXReplacedSafe(bool* internal_dtx_replaced);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t CreateEncoder()
   // Creates the encoder instance. Not virtual: the same implementation is
   // used for every codec.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t CreateEncoder();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t CreateDecoder()
   // Creates the decoder instance. Not virtual: the same implementation is
   // used for every codec.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t CreateDecoder();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t EnableVAD();
   // Enables VAD with the given mode. The VAD instance will be created if
   // it does not exist.
   //
   // Input:
   //   -mode               : VAD mode c.f. audio_coding_module_typedefs.h for
   //                         the options.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t EnableVAD(ACMVADMode mode);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t DisableVAD()
   // Disables VAD. Not virtual: the same implementation is used for every
   // codec.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t DisableVAD();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t EnableDTX()
   // Enables DTX. This method should be overridden for codecs which have
   // internal DTX.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t EnableDTX();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t DisableDTX()
   // Disables usage of DTX. This method should be overridden for codecs which
   // have internal DTX.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t DisableDTX();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InternalEncode()
   // This is a codec-specific function called in EncodeSafe() to actually
   // encode a frame of audio. Pure virtual: every codec-specific subclass
   // has to implement it.
   //
   // Outputs:
   //   -bitstream          : pointer to a buffer where the bit-stream is
   //                         written to.
   //   -bitstream_len_byte : the length of the bit-stream in bytes,
   //                         a negative value indicates error.
   //
   // Return value:
   //   -1 if failed,
   //   otherwise the length of the bit-stream is returned.
   //
   virtual int16_t InternalEncode(uint8_t* bitstream,
                                  int16_t* bitstream_len_byte) = 0;

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InternalInitEncoder()
   // This is a codec-specific function called in InitEncoderSafe(). It has to
   // do all codec-specific operations to initialize the encoder given the
   // encoder parameters. Pure virtual: every codec-specific subclass has to
   // implement it.
   //
   // Input:
   //   -codec_params       : pointer to a structure that contains parameters to
   //                         initialize encoder.
   //                         Set codec_params->codec_inst.rate to -1 for
   //                         iSAC to operate in adaptive mode.
   //                         (TODO: if frame-length is -1 frame-length will be
   //                         automatically adjusted, otherwise, given
   //                         frame-length is forced)
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t InternalInitEncoder(
       WebRtcACMCodecParams *codec_params) = 0;

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InternalInitDecoder()
   // This is a codec-specific function called in InitDecoderSafe(). It has to
   // do all codec-specific operations to initialize the decoder given the
   // decoder parameters. Pure virtual: every codec-specific subclass has to
   // implement it.
   //
   // Input:
   //   -codec_params       : pointer to a structure that contains parameters to
   //                         initialize decoder.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t InternalInitDecoder(
       WebRtcACMCodecParams *codec_params) = 0;

   ///////////////////////////////////////////////////////////////////////////
   // void IncreaseNoMissedSamples()
   // This method is called to increase the count of samples that are
   // overwritten in the audio buffer.
   //
   // Input:
   //   -num_samples        : the number of overwritten samples is incremented
   //                         by this value.
   //
   // Return value: none (the method is declared void).
   //
   void IncreaseNoMissedSamples(const int16_t num_samples);

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InternalCreateEncoder()
   // This is a codec-specific method called in CreateEncoderSafe(). It is
   // supposed to perform all codec-specific operations to create the encoder
   // instance. Pure virtual: every codec-specific subclass has to implement
   // it.
   //
   // NOTE(review): no CreateEncoderSafe() is declared next to this method;
   // the caller is presumably CreateEncoder() -- confirm in the .cc file.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t InternalCreateEncoder() = 0;

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InternalCreateDecoder()
   // This is a codec-specific method called in CreateDecoderSafe(). It is
   // supposed to perform all codec-specific operations to create the decoder
   // instance. Pure virtual: every codec-specific subclass has to implement
   // it.
   //
   // NOTE(review): no CreateDecoderSafe() is declared next to this method;
   // the caller is presumably CreateDecoder() -- confirm in the .cc file.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t InternalCreateDecoder() = 0;

   ///////////////////////////////////////////////////////////////////////////
   // void InternalDestructEncoderInst()
   // This is a codec-specific method, used in conferencing, called from
   // DestructEncoderInst(). The input argument is a pointer to the encoder
   // instance (the codec instance for codecs where encoder and decoder share
   // the same instance). This method is called to free the memory that
   // |ptr_inst| is pointing to. Pure virtual: every codec-specific subclass
   // has to implement it.
   //
   // Input:
   //   -ptr_inst           : pointer to encoder instance.
   //
   // Return value: none (the method is declared void, so failure cannot be
   // reported through a return code).
   //
   virtual void InternalDestructEncoderInst(void* ptr_inst) = 0;

   ///////////////////////////////////////////////////////////////////////////
   // int16_t InternalResetEncoder()
   // This method is called to reset the states of the encoder. However, the
   // current parameters, e.g. frame-length, should remain as they are. For
   // most of the codecs a re-initialization of the encoder is what needs to
   // be done. But for iSAC we like to keep the BWE history so we cannot
   // re-initialize. As soon as such an API is implemented in iSAC this method
   // has to be overridden in ACMISAC class.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   virtual int16_t InternalResetEncoder();

   ///////////////////////////////////////////////////////////////////////////
   // int16_t ProcessFrameVADDTX()
   // This function is called when a full frame of audio is available. It will
   // break the audio frame into blocks such that each block could be processed
   // by VAD & CN/DTX. If a frame is divided into two blocks then there are two
   // cases. First, the first block is active: the second block will not be
   // processed by CN/DTX but only by VAD, and the function returns to the
   // caller with "*samples_processed" set to zero. There, the audio frame will
   // be encoded by the encoder. Second, the first block is inactive and is
   // processed by CN/DTX: then we stop processing the next block and return to
   // the caller, which is EncodeSafe(), with "*samples_processed" equal to the
   // number of samples in the first block.
   //
   // Output:
   //   -bitstream          : pointer to a buffer where DTX frame, if
   //                         generated, will be written to.
   //   -bitstream_len_byte : contains the length of bit-stream in bytes, if
   //                         generated. Zero if no bit-stream is generated.
   //   -samples_processed  : contains the number of samples that CN has
   //                         actually processed. Those samples processed by
   //                         CN will not be encoded by the encoder. If it
   //                         contains zero, it means that the frame has been
   //                         identified as active by VAD. Note that
   //                         "*samples_processed" might be non-zero while
   //                         "*bitstream_len_byte" is zero.
   //
   // Return value:
   //   -1 if failed,
   //    0 if succeeded.
   //
   int16_t ProcessFrameVADDTX(uint8_t* bitstream,
                              int16_t* bitstream_len_byte,
                              int16_t* samples_processed);

   ///////////////////////////////////////////////////////////////////////////
   // CanChangeEncodingParam()
   // Check if the codec parameters can be changed. In conferencing normally
   // codec parameters cannot be changed. The exception is bit-rate of isac.
   //
   // Input:
   //   -codec_inst         : codec settings to check, taken by non-const
   //                         reference (presumably the requested new
   //                         parameters -- confirm against the callers).
   //
   // Return value:
   //   -true  if codec parameters are allowed to change.
   //   -false otherwise.
   //
   virtual bool CanChangeEncodingParam(CodecInst& codec_inst);

   ///////////////////////////////////////////////////////////////////////////
   // CurrentRate()
   // Reports the current encoding (target) rate of the encoder. Codecs which
   // automatically change their target rate, iSAC being one example, should
   // override this method. The base implementation is a no-op: it leaves the
   // argument untouched.
   //
   // Output:
   //   -rate_bps           : the current target rate of the codec.
   //
   virtual void CurrentRate(int32_t& /* rate_bps */) {}

   ///////////////////////////////////////////////////////////////////////////
   // void SaveDecoderParamSafe()
   // NOTE(review): undocumented in the original. Going by the
   // FunctionNameSafe() convention of this class, this is presumably the
   // implementation behind SaveDecoderParam() -- confirm in the .cc file.
   // Declared virtual (not pure), so codecs may override it.
   //
   // Input:
   //   -codec_params       : pointer to the decoder parameters; taken as
   //                         pointer-to-const, so the pointee is not modified
   //                         through it.
   //
   virtual void SaveDecoderParamSafe(const WebRtcACMCodecParams* codec_params);

   // &in_audio_[in_audio_ix_write_] always points to where new audio can be
   // written to.
   int16_t in_audio_ix_write_;

   // &in_audio_[in_audio_ix_read_] points to where audio has to be read from.
   int16_t in_audio_ix_read_;

   // Presumably the write index into in_timestamp_, mirroring
   // in_audio_ix_write_ -- TODO confirm against the implementation.
   int16_t in_timestamp_ix_write_;

   // Where the audio is stored before encoding.
   // To save memory the following buffer can be allocated
   // dynamically for 80 ms depending on the sampling frequency
   // of the codec.
   int16_t* in_audio_;
   uint32_t* in_timestamp_;

   int16_t frame_len_smpl_;
   uint16_t num_channels_;

   // This will point to a static database of the supported codecs
   int16_t codec_id_;

   // This accounts for the number of samples that were not encoded.
   // The case is rare: samples are missed either due to an overwrite
   // at the input buffer or due to an encoding error.
   uint32_t num_missed_samples_;

   // True if the encoder instance has been created; decoder_exist_ is
   // presumably the decoder counterpart.
   bool encoder_exist_;
   bool decoder_exist_;
   // True if the encoder instance has been initialized; decoder_initialized_
   // is presumably the decoder counterpart.
   bool encoder_initialized_;
   bool decoder_initialized_;

   bool registered_in_neteq_;

   // VAD/DTX
   bool has_internal_dtx_;
   WebRtcVadInst* ptr_vad_inst_;
   bool vad_enabled_;
   ACMVADMode vad_mode_;
   // Holds MAX_FRAME_SIZE_10MSEC entries (presumably one VAD decision per
   // 10 ms block of a frame -- TODO confirm).
   int16_t vad_label_[MAX_FRAME_SIZE_10MSEC];
   bool dtx_enabled_;
   WebRtcCngEncInst* ptr_dtx_inst_;
   uint8_t num_lpc_params_;
   bool sent_cn_previous_;
   bool is_master_;
   int16_t prev_frame_cng_;

   WebRtcACMCodecParams encoder_params_;
   WebRtcACMCodecParams decoder_params_;

   // Used as a global lock for all available decoders
   // so that no decoder is used when NetEQ decodes.
   RWLockWrapper* neteq_decode_lock_;
   // Used to lock wrapper internal data
   // such as buffers and state variables.
   // This is a reference member, so it has to be bound in the constructor's
   // initializer list and cannot be re-seated afterwards.
   RWLockWrapper& codec_wrapper_lock_;

   uint32_t last_encoded_timestamp_;
   uint32_t last_timestamp_;
   bool is_audio_buff_fresh_;
   uint32_t unique_id_;
 };

 }  // namespace webrtc

 #endif  // WEBRTC_MODULES_AUDIO_CODING_MAIN_SOURCE_ACM_GENERIC_CODEC_H_