| /* |
| * Copyright (c) 2012 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #ifndef MODULES_AUDIO_CODING_INCLUDE_AUDIO_CODING_MODULE_H_ |
| #define MODULES_AUDIO_CODING_INCLUDE_AUDIO_CODING_MODULE_H_ |
| |
| #include <memory> |
| #include <string> |
| #include <utility> |
| #include <vector> |
| |
| #include "absl/types/optional.h" |
| #include "api/audio_codecs/audio_decoder_factory.h" |
| #include "api/audio_codecs/audio_encoder.h" |
| #include "api/function_view.h" |
| #include "api/neteq/neteq.h" |
| #include "api/neteq/neteq_factory.h" |
| #include "modules/audio_coding/include/audio_coding_module_typedefs.h" |
| #include "system_wrappers/include/clock.h" |
| |
| namespace webrtc { |
| |
| // forward declarations |
| class AudioDecoder; |
| class AudioEncoder; |
| class AudioFrame; |
| struct RTPHeader; |
| |
| #define WEBRTC_10MS_PCM_AUDIO 960 // 16 bits super wideband 48 kHz |
| |
| // Callback class used for sending data ready to be packetized |
| class AudioPacketizationCallback { |
| public: |
| virtual ~AudioPacketizationCallback() {} |
| |
| virtual int32_t SendData(AudioFrameType frame_type, |
| uint8_t payload_type, |
| uint32_t timestamp, |
| const uint8_t* payload_data, |
| size_t payload_len_bytes, |
| int64_t absolute_capture_timestamp_ms) { |
| // TODO(bugs.webrtc.org/10739): Deprecate the old SendData and make this one |
| // pure virtual. |
| RTC_NOTREACHED() << "This method must be overridden, or not used."; |
| return -1; |
| } |
| virtual int32_t SendData(AudioFrameType frame_type, |
| uint8_t payload_type, |
| uint32_t timestamp, |
| const uint8_t* payload_data, |
| size_t payload_len_bytes) { |
| return SendData(frame_type, payload_type, timestamp, payload_data, |
| payload_len_bytes, 0); |
| } |
| }; |
| |
| // Callback class used for reporting VAD decision |
| class ACMVADCallback { |
| public: |
| virtual ~ACMVADCallback() {} |
| |
| virtual int32_t InFrameType(AudioFrameType frame_type) = 0; |
| }; |
| |
| class AudioCodingModule { |
| protected: |
| AudioCodingModule() {} |
| |
| public: |
| struct Config { |
| explicit Config( |
| rtc::scoped_refptr<AudioDecoderFactory> decoder_factory = nullptr); |
| Config(const Config&); |
| ~Config(); |
| |
| NetEq::Config neteq_config; |
| Clock* clock; |
| rtc::scoped_refptr<AudioDecoderFactory> decoder_factory; |
| NetEqFactory* neteq_factory = nullptr; |
| }; |
| |
| static AudioCodingModule* Create(const Config& config); |
| virtual ~AudioCodingModule() = default; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // Sender |
| // |
| |
| // |modifier| is called exactly once with one argument: a pointer to the |
| // unique_ptr that holds the current encoder (which is null if there is no |
| // current encoder). For the duration of the call, |modifier| has exclusive |
| // access to the unique_ptr; it may call the encoder, steal the encoder and |
| // replace it with another encoder or with nullptr, etc. |
| virtual void ModifyEncoder( |
| rtc::FunctionView<void(std::unique_ptr<AudioEncoder>*)> modifier) = 0; |
| |
| // Utility method for simply replacing the existing encoder with a new one. |
| void SetEncoder(std::unique_ptr<AudioEncoder> new_encoder) { |
| ModifyEncoder([&](std::unique_ptr<AudioEncoder>* encoder) { |
| *encoder = std::move(new_encoder); |
| }); |
| } |
| |
| // int32_t RegisterTransportCallback() |
| // Register a transport callback which will be called to deliver |
| // the encoded buffers whenever Process() is called and a |
| // bit-stream is ready. |
| // |
| // Input: |
| // -transport : pointer to the callback class |
| // transport->SendData() is called whenever |
| // Process() is called and bit-stream is ready |
| // to deliver. |
| // |
| // Return value: |
| // -1 if the transport callback could not be registered |
| // 0 if registration is successful. |
| // |
| virtual int32_t RegisterTransportCallback( |
| AudioPacketizationCallback* transport) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int32_t Add10MsData() |
| // Add 10MS of raw (PCM) audio data and encode it. If the sampling |
| // frequency of the audio does not match the sampling frequency of the |
| // current encoder ACM will resample the audio. If an encoded packet was |
| // produced, it will be delivered via the callback object registered using |
| // RegisterTransportCallback, and the return value from this function will |
| // be the number of bytes encoded. |
| // |
| // Input: |
| // -audio_frame : the input audio frame, containing raw audio |
| // sampling frequency etc. |
| // |
| // Return value: |
| // >= 0 number of bytes encoded. |
| // -1 some error occurred. |
| // |
| virtual int32_t Add10MsData(const AudioFrame& audio_frame) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int SetPacketLossRate() |
| // Sets expected packet loss rate for encoding. Some encoders provide packet |
| // loss gnostic encoding to make stream less sensitive to packet losses, |
| // through e.g., FEC. No effects on codecs that do not provide such encoding. |
| // |
| // Input: |
| // -packet_loss_rate : expected packet loss rate (0 -- 100 inclusive). |
| // |
| // Return value |
| // -1 if failed to set packet loss rate, |
| // 0 if succeeded. |
| // |
| // This is only used in test code that rely on old ACM APIs. |
| // TODO(minyue): Remove it when possible. |
| virtual int SetPacketLossRate(int packet_loss_rate) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // (VAD) Voice Activity Detection |
| // |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int32_t RegisterVADCallback() |
| // Call this method to register a callback function which is called |
| // any time that ACM encounters an empty frame. That is a frame which is |
| // recognized inactive. Depending on the codec WebRtc VAD or internal codec |
| // VAD is employed to identify a frame as active/inactive. |
| // |
| // Input: |
| // -vad_callback : pointer to a callback function. |
| // |
| // Return value: |
| // -1 if failed to register the callback function. |
| // 0 if the callback function is registered successfully. |
| // |
| virtual int32_t RegisterVADCallback(ACMVADCallback* vad_callback) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // Receiver |
| // |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int32_t InitializeReceiver() |
| // Any decoder-related state of ACM will be initialized to the |
| // same state when ACM is created. This will not interrupt or |
| // effect encoding functionality of ACM. ACM would lose all the |
| // decoding-related settings by calling this function. |
| // For instance, all registered codecs are deleted and have to be |
| // registered again. |
| // |
| // Return value: |
| // -1 if failed to initialize, |
| // 0 if succeeded. |
| // |
| virtual int32_t InitializeReceiver() = 0; |
| |
| // Replace any existing decoders with the given payload type -> decoder map. |
| virtual void SetReceiveCodecs( |
| const std::map<int, SdpAudioFormat>& codecs) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int32_t IncomingPacket() |
| // Call this function to insert a parsed RTP packet into ACM. |
| // |
| // Inputs: |
| // -incoming_payload : received payload. |
| // -payload_len_bytes : the length of payload in bytes. |
| // -rtp_info : the relevant information retrieved from RTP |
| // header. |
| // |
| // Return value: |
| // -1 if failed to push in the payload |
| // 0 if payload is successfully pushed in. |
| // |
| virtual int32_t IncomingPacket(const uint8_t* incoming_payload, |
| const size_t payload_len_bytes, |
| const RTPHeader& rtp_header) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int32_t PlayoutData10Ms( |
| // Get 10 milliseconds of raw audio data for playout, at the given sampling |
| // frequency. ACM will perform a resampling if required. |
| // |
| // Input: |
| // -desired_freq_hz : the desired sampling frequency, in Hertz, of the |
| // output audio. If set to -1, the function returns |
| // the audio at the current sampling frequency. |
| // |
| // Output: |
| // -audio_frame : output audio frame which contains raw audio data |
| // and other relevant parameters. |
| // -muted : if true, the sample data in audio_frame is not |
| // populated, and must be interpreted as all zero. |
| // |
| // Return value: |
| // -1 if the function fails, |
| // 0 if the function succeeds. |
| // |
| virtual int32_t PlayoutData10Ms(int32_t desired_freq_hz, |
| AudioFrame* audio_frame, |
| bool* muted) = 0; |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // statistics |
| // |
| |
| /////////////////////////////////////////////////////////////////////////// |
| // int32_t GetNetworkStatistics() |
| // Get network statistics. Note that the internal statistics of NetEq are |
| // reset by this call. |
| // |
| // Input: |
| // -network_statistics : a structure that contains network statistics. |
| // |
| // Return value: |
| // -1 if failed to set the network statistics, |
| // 0 if statistics are set successfully. |
| // |
| virtual int32_t GetNetworkStatistics( |
| NetworkStatistics* network_statistics) = 0; |
| |
| virtual ANAStats GetANAStats() const = 0; |
| }; |
| |
| } // namespace webrtc |
| |
| #endif // MODULES_AUDIO_CODING_INCLUDE_AUDIO_CODING_MODULE_H_ |