| /* |
| * Copyright (c) 2014 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #include "webrtc/modules/audio_coding/codecs/g722/audio_encoder_g722.h" |
| |
| #include <algorithm> |
| |
| #include <limits> |
| #include "webrtc/common_types.h" |
| #include "webrtc/modules/audio_coding/codecs/g722/g722_interface.h" |
| #include "webrtc/rtc_base/checks.h" |
| #include "webrtc/rtc_base/safe_conversions.h" |
| #include "webrtc/rtc_base/string_to_number.h" |
| |
| namespace webrtc { |
| |
| namespace { |
| |
| const size_t kSampleRateHz = 16000; |
| |
| AudioEncoderG722Config CreateConfig(const CodecInst& codec_inst) { |
| AudioEncoderG722Config config; |
| config.num_channels = rtc::dchecked_cast<int>(codec_inst.channels); |
| config.frame_size_ms = codec_inst.pacsize / 16; |
| return config; |
| } |
| |
| } // namespace |
| |
| rtc::Optional<AudioEncoderG722Config> AudioEncoderG722Impl::SdpToConfig( |
| const SdpAudioFormat& format) { |
| if (STR_CASE_CMP(format.name.c_str(), "g722") != 0 || |
| format.clockrate_hz != 8000) { |
| return rtc::Optional<AudioEncoderG722Config>(); |
| } |
| |
| AudioEncoderG722Config config; |
| config.num_channels = rtc::dchecked_cast<int>(format.num_channels); |
| auto ptime_iter = format.parameters.find("ptime"); |
| if (ptime_iter != format.parameters.end()) { |
| auto ptime = rtc::StringToNumber<int>(ptime_iter->second); |
| if (ptime && *ptime > 0) { |
| const int whole_packets = *ptime / 10; |
| config.frame_size_ms = std::max(10, std::min(whole_packets * 10, 60)); |
| } |
| } |
| return config.IsOk() ? rtc::Optional<AudioEncoderG722Config>(config) |
| : rtc::Optional<AudioEncoderG722Config>(); |
| } |
| |
| AudioEncoderG722Impl::AudioEncoderG722Impl(const AudioEncoderG722Config& config, |
| int payload_type) |
| : num_channels_(config.num_channels), |
| payload_type_(payload_type), |
| num_10ms_frames_per_packet_( |
| static_cast<size_t>(config.frame_size_ms / 10)), |
| num_10ms_frames_buffered_(0), |
| first_timestamp_in_buffer_(0), |
| encoders_(new EncoderState[num_channels_]), |
| interleave_buffer_(2 * num_channels_) { |
| RTC_CHECK(config.IsOk()); |
| const size_t samples_per_channel = |
| kSampleRateHz / 100 * num_10ms_frames_per_packet_; |
| for (size_t i = 0; i < num_channels_; ++i) { |
| encoders_[i].speech_buffer.reset(new int16_t[samples_per_channel]); |
| encoders_[i].encoded_buffer.SetSize(samples_per_channel / 2); |
| } |
| Reset(); |
| } |
| |
| AudioEncoderG722Impl::AudioEncoderG722Impl(const CodecInst& codec_inst) |
| : AudioEncoderG722Impl(CreateConfig(codec_inst), codec_inst.pltype) {} |
| |
| AudioEncoderG722Impl::AudioEncoderG722Impl(int payload_type, |
| const SdpAudioFormat& format) |
| : AudioEncoderG722Impl(*SdpToConfig(format), payload_type) {} |
| |
| AudioEncoderG722Impl::~AudioEncoderG722Impl() = default; |
| |
| rtc::Optional<AudioCodecInfo> AudioEncoderG722Impl::QueryAudioEncoder( |
| const SdpAudioFormat& format) { |
| if (STR_CASE_CMP(format.name.c_str(), GetPayloadName()) == 0) { |
| const auto config_opt = SdpToConfig(format); |
| if (format.clockrate_hz == 8000 && config_opt) { |
| RTC_DCHECK(config_opt->IsOk()); |
| return rtc::Optional<AudioCodecInfo>( |
| {rtc::dchecked_cast<int>(kSampleRateHz), |
| rtc::dchecked_cast<size_t>(config_opt->num_channels), 64000}); |
| } |
| } |
| return rtc::Optional<AudioCodecInfo>(); |
| } |
| |
| int AudioEncoderG722Impl::SampleRateHz() const { |
| return kSampleRateHz; |
| } |
| |
| size_t AudioEncoderG722Impl::NumChannels() const { |
| return num_channels_; |
| } |
| |
| int AudioEncoderG722Impl::RtpTimestampRateHz() const { |
| // The RTP timestamp rate for G.722 is 8000 Hz, even though it is a 16 kHz |
| // codec. |
| return kSampleRateHz / 2; |
| } |
| |
| size_t AudioEncoderG722Impl::Num10MsFramesInNextPacket() const { |
| return num_10ms_frames_per_packet_; |
| } |
| |
| size_t AudioEncoderG722Impl::Max10MsFramesInAPacket() const { |
| return num_10ms_frames_per_packet_; |
| } |
| |
| int AudioEncoderG722Impl::GetTargetBitrate() const { |
| // 4 bits/sample, 16000 samples/s/channel. |
| return static_cast<int>(64000 * NumChannels()); |
| } |
| |
| void AudioEncoderG722Impl::Reset() { |
| num_10ms_frames_buffered_ = 0; |
| for (size_t i = 0; i < num_channels_; ++i) |
| RTC_CHECK_EQ(0, WebRtcG722_EncoderInit(encoders_[i].encoder)); |
| } |
| |
| AudioEncoder::EncodedInfo AudioEncoderG722Impl::EncodeImpl( |
| uint32_t rtp_timestamp, |
| rtc::ArrayView<const int16_t> audio, |
| rtc::Buffer* encoded) { |
| if (num_10ms_frames_buffered_ == 0) |
| first_timestamp_in_buffer_ = rtp_timestamp; |
| |
| // Deinterleave samples and save them in each channel's buffer. |
| const size_t start = kSampleRateHz / 100 * num_10ms_frames_buffered_; |
| for (size_t i = 0; i < kSampleRateHz / 100; ++i) |
| for (size_t j = 0; j < num_channels_; ++j) |
| encoders_[j].speech_buffer[start + i] = audio[i * num_channels_ + j]; |
| |
| // If we don't yet have enough samples for a packet, we're done for now. |
| if (++num_10ms_frames_buffered_ < num_10ms_frames_per_packet_) { |
| return EncodedInfo(); |
| } |
| |
| // Encode each channel separately. |
| RTC_CHECK_EQ(num_10ms_frames_buffered_, num_10ms_frames_per_packet_); |
| num_10ms_frames_buffered_ = 0; |
| const size_t samples_per_channel = SamplesPerChannel(); |
| for (size_t i = 0; i < num_channels_; ++i) { |
| const size_t bytes_encoded = WebRtcG722_Encode( |
| encoders_[i].encoder, encoders_[i].speech_buffer.get(), |
| samples_per_channel, encoders_[i].encoded_buffer.data()); |
| RTC_CHECK_EQ(bytes_encoded, samples_per_channel / 2); |
| } |
| |
| const size_t bytes_to_encode = samples_per_channel / 2 * num_channels_; |
| EncodedInfo info; |
| info.encoded_bytes = encoded->AppendData( |
| bytes_to_encode, [&] (rtc::ArrayView<uint8_t> encoded) { |
| // Interleave the encoded bytes of the different channels. Each separate |
| // channel and the interleaved stream encodes two samples per byte, most |
| // significant half first. |
| for (size_t i = 0; i < samples_per_channel / 2; ++i) { |
| for (size_t j = 0; j < num_channels_; ++j) { |
| uint8_t two_samples = encoders_[j].encoded_buffer.data()[i]; |
| interleave_buffer_.data()[j] = two_samples >> 4; |
| interleave_buffer_.data()[num_channels_ + j] = two_samples & 0xf; |
| } |
| for (size_t j = 0; j < num_channels_; ++j) |
| encoded[i * num_channels_ + j] = |
| interleave_buffer_.data()[2 * j] << 4 | |
| interleave_buffer_.data()[2 * j + 1]; |
| } |
| |
| return bytes_to_encode; |
| }); |
| info.encoded_timestamp = first_timestamp_in_buffer_; |
| info.payload_type = payload_type_; |
| info.encoder_type = CodecType::kG722; |
| return info; |
| } |
| |
| AudioEncoderG722Impl::EncoderState::EncoderState() { |
| RTC_CHECK_EQ(0, WebRtcG722_CreateEncoder(&encoder)); |
| } |
| |
| AudioEncoderG722Impl::EncoderState::~EncoderState() { |
| RTC_CHECK_EQ(0, WebRtcG722_FreeEncoder(encoder)); |
| } |
| |
| size_t AudioEncoderG722Impl::SamplesPerChannel() const { |
| return kSampleRateHz / 100 * num_10ms_frames_per_packet_; |
| } |
| |
| } // namespace webrtc |