|  | /* | 
|  | *  Copyright (c) 2011 The WebRTC project authors. All Rights Reserved. | 
|  | * | 
|  | *  Use of this source code is governed by a BSD-style license | 
|  | *  that can be found in the LICENSE file in the root of the source | 
|  | *  tree. An additional intellectual property rights grant can be found | 
|  | *  in the file PATENTS.  All contributing project authors may | 
|  | *  be found in the AUTHORS file in the root of the source tree. | 
|  | */ | 
|  |  | 
|  | #include "modules/video_coding/decoding_state.h" | 
|  |  | 
|  | #include "common_video/h264/h264_common.h" | 
|  | #include "modules/include/module_common_types.h" | 
|  | #include "modules/video_coding/frame_buffer.h" | 
|  | #include "modules/video_coding/jitter_buffer_common.h" | 
|  | #include "modules/video_coding/packet.h" | 
|  | #include "rtc_base/logging.h" | 
|  |  | 
|  | namespace webrtc { | 
|  |  | 
|  | VCMDecodingState::VCMDecodingState() | 
|  | : sequence_num_(0), | 
|  | time_stamp_(0), | 
|  | picture_id_(kNoPictureId), | 
|  | temporal_id_(kNoTemporalIdx), | 
|  | tl0_pic_id_(kNoTl0PicIdx), | 
|  | full_sync_(true), | 
|  | in_initial_state_(true) { | 
|  | memset(frame_decoded_, 0, sizeof(frame_decoded_)); | 
|  | } | 
|  |  | 
|  | VCMDecodingState::~VCMDecodingState() {} | 
|  |  | 
|  | void VCMDecodingState::Reset() { | 
|  | // TODO(mikhal): Verify - not always would want to reset the sync | 
|  | sequence_num_ = 0; | 
|  | time_stamp_ = 0; | 
|  | picture_id_ = kNoPictureId; | 
|  | temporal_id_ = kNoTemporalIdx; | 
|  | tl0_pic_id_ = kNoTl0PicIdx; | 
|  | full_sync_ = true; | 
|  | in_initial_state_ = true; | 
|  | memset(frame_decoded_, 0, sizeof(frame_decoded_)); | 
|  | received_sps_.clear(); | 
|  | received_pps_.clear(); | 
|  | } | 
|  |  | 
|  | uint32_t VCMDecodingState::time_stamp() const { | 
|  | return time_stamp_; | 
|  | } | 
|  |  | 
|  | uint16_t VCMDecodingState::sequence_num() const { | 
|  | return sequence_num_; | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::IsOldFrame(const VCMFrameBuffer* frame) const { | 
|  | assert(frame != NULL); | 
|  | if (in_initial_state_) | 
|  | return false; | 
|  | return !IsNewerTimestamp(frame->Timestamp(), time_stamp_); | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::IsOldPacket(const VCMPacket* packet) const { | 
|  | assert(packet != NULL); | 
|  | if (in_initial_state_) | 
|  | return false; | 
|  | return !IsNewerTimestamp(packet->timestamp, time_stamp_); | 
|  | } | 
|  |  | 
|  | void VCMDecodingState::SetState(const VCMFrameBuffer* frame) { | 
|  | assert(frame != NULL && frame->GetHighSeqNum() >= 0); | 
|  | if (!UsingFlexibleMode(frame)) | 
|  | UpdateSyncState(frame); | 
|  | sequence_num_ = static_cast<uint16_t>(frame->GetHighSeqNum()); | 
|  | time_stamp_ = frame->Timestamp(); | 
|  | picture_id_ = frame->PictureId(); | 
|  | temporal_id_ = frame->TemporalId(); | 
|  | tl0_pic_id_ = frame->Tl0PicId(); | 
|  |  | 
|  | for (const NaluInfo& nalu : frame->GetNaluInfos()) { | 
|  | if (nalu.type == H264::NaluType::kPps) { | 
|  | if (nalu.pps_id < 0) { | 
|  | RTC_LOG(LS_WARNING) << "Received pps without pps id."; | 
|  | } else if (nalu.sps_id < 0) { | 
|  | RTC_LOG(LS_WARNING) << "Received pps without sps id."; | 
|  | } else { | 
|  | received_pps_[nalu.pps_id] = nalu.sps_id; | 
|  | } | 
|  | } else if (nalu.type == H264::NaluType::kSps) { | 
|  | if (nalu.sps_id < 0) { | 
|  | RTC_LOG(LS_WARNING) << "Received sps without sps id."; | 
|  | } else { | 
|  | received_sps_.insert(nalu.sps_id); | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | if (UsingFlexibleMode(frame)) { | 
|  | uint16_t frame_index = picture_id_ % kFrameDecodedLength; | 
|  | if (in_initial_state_) { | 
|  | frame_decoded_cleared_to_ = frame_index; | 
|  | } else if (frame->FrameType() == VideoFrameType::kVideoFrameKey) { | 
|  | memset(frame_decoded_, 0, sizeof(frame_decoded_)); | 
|  | frame_decoded_cleared_to_ = frame_index; | 
|  | } else { | 
|  | if (AheadOfFramesDecodedClearedTo(frame_index)) { | 
|  | while (frame_decoded_cleared_to_ != frame_index) { | 
|  | frame_decoded_cleared_to_ = | 
|  | (frame_decoded_cleared_to_ + 1) % kFrameDecodedLength; | 
|  | frame_decoded_[frame_decoded_cleared_to_] = false; | 
|  | } | 
|  | } | 
|  | } | 
|  | frame_decoded_[frame_index] = true; | 
|  | } | 
|  |  | 
|  | in_initial_state_ = false; | 
|  | } | 
|  |  | 
|  | void VCMDecodingState::CopyFrom(const VCMDecodingState& state) { | 
|  | sequence_num_ = state.sequence_num_; | 
|  | time_stamp_ = state.time_stamp_; | 
|  | picture_id_ = state.picture_id_; | 
|  | temporal_id_ = state.temporal_id_; | 
|  | tl0_pic_id_ = state.tl0_pic_id_; | 
|  | full_sync_ = state.full_sync_; | 
|  | in_initial_state_ = state.in_initial_state_; | 
|  | frame_decoded_cleared_to_ = state.frame_decoded_cleared_to_; | 
|  | memcpy(frame_decoded_, state.frame_decoded_, sizeof(frame_decoded_)); | 
|  | received_sps_ = state.received_sps_; | 
|  | received_pps_ = state.received_pps_; | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::UpdateEmptyFrame(const VCMFrameBuffer* frame) { | 
|  | bool empty_packet = frame->GetHighSeqNum() == frame->GetLowSeqNum(); | 
|  | if (in_initial_state_ && empty_packet) { | 
|  | // Drop empty packets as long as we are in the initial state. | 
|  | return true; | 
|  | } | 
|  | if ((empty_packet && ContinuousSeqNum(frame->GetHighSeqNum())) || | 
|  | ContinuousFrame(frame)) { | 
|  | // Continuous empty packets or continuous frames can be dropped if we | 
|  | // advance the sequence number. | 
|  | sequence_num_ = frame->GetHighSeqNum(); | 
|  | time_stamp_ = frame->Timestamp(); | 
|  | return true; | 
|  | } | 
|  | return false; | 
|  | } | 
|  |  | 
|  | void VCMDecodingState::UpdateOldPacket(const VCMPacket* packet) { | 
|  | assert(packet != NULL); | 
|  | if (packet->timestamp == time_stamp_) { | 
|  | // Late packet belonging to the last decoded frame - make sure we update the | 
|  | // last decoded sequence number. | 
|  | sequence_num_ = LatestSequenceNumber(packet->seqNum, sequence_num_); | 
|  | } | 
|  | } | 
|  |  | 
|  | void VCMDecodingState::SetSeqNum(uint16_t new_seq_num) { | 
|  | sequence_num_ = new_seq_num; | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::in_initial_state() const { | 
|  | return in_initial_state_; | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::full_sync() const { | 
|  | return full_sync_; | 
|  | } | 
|  |  | 
|  | void VCMDecodingState::UpdateSyncState(const VCMFrameBuffer* frame) { | 
|  | if (in_initial_state_) | 
|  | return; | 
|  | if (frame->TemporalId() == kNoTemporalIdx || | 
|  | frame->Tl0PicId() == kNoTl0PicIdx) { | 
|  | full_sync_ = true; | 
|  | } else if (frame->FrameType() == VideoFrameType::kVideoFrameKey || | 
|  | frame->LayerSync()) { | 
|  | full_sync_ = true; | 
|  | } else if (full_sync_) { | 
|  | // Verify that we are still in sync. | 
|  | // Sync will be broken if continuity is true for layers but not for the | 
|  | // other methods (PictureId and SeqNum). | 
|  | if (UsingPictureId(frame)) { | 
|  | // First check for a valid tl0PicId. | 
|  | if (frame->Tl0PicId() - tl0_pic_id_ > 1) { | 
|  | full_sync_ = false; | 
|  | } else { | 
|  | full_sync_ = ContinuousPictureId(frame->PictureId()); | 
|  | } | 
|  | } else { | 
|  | full_sync_ = | 
|  | ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum())); | 
|  | } | 
|  | } | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::ContinuousFrame(const VCMFrameBuffer* frame) const { | 
|  | // Check continuity based on the following hierarchy: | 
|  | // - Temporal layers (stop here if out of sync). | 
|  | // - Picture Id when available. | 
|  | // - Sequence numbers. | 
|  | // Return true when in initial state. | 
|  | // Note that when a method is not applicable it will return false. | 
|  | assert(frame != NULL); | 
|  | // A key frame is always considered continuous as it doesn't refer to any | 
|  | // frames and therefore won't introduce any errors even if prior frames are | 
|  | // missing. | 
|  | if (frame->FrameType() == VideoFrameType::kVideoFrameKey && | 
|  | HaveSpsAndPps(frame->GetNaluInfos())) { | 
|  | return true; | 
|  | } | 
|  | // When in the initial state we always require a key frame to start decoding. | 
|  | if (in_initial_state_) | 
|  | return false; | 
|  | if (ContinuousLayer(frame->TemporalId(), frame->Tl0PicId())) | 
|  | return true; | 
|  | // tl0picId is either not used, or should remain unchanged. | 
|  | if (frame->Tl0PicId() != tl0_pic_id_) | 
|  | return false; | 
|  | // Base layers are not continuous or temporal layers are inactive. | 
|  | // In the presence of temporal layers, check for Picture ID/sequence number | 
|  | // continuity if sync can be restored by this frame. | 
|  | if (!full_sync_ && !frame->LayerSync()) | 
|  | return false; | 
|  | if (UsingPictureId(frame)) { | 
|  | if (UsingFlexibleMode(frame)) { | 
|  | return ContinuousFrameRefs(frame); | 
|  | } else { | 
|  | return ContinuousPictureId(frame->PictureId()); | 
|  | } | 
|  | } else { | 
|  | return ContinuousSeqNum(static_cast<uint16_t>(frame->GetLowSeqNum())) && | 
|  | HaveSpsAndPps(frame->GetNaluInfos()); | 
|  | } | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::ContinuousPictureId(int picture_id) const { | 
|  | int next_picture_id = picture_id_ + 1; | 
|  | if (picture_id < picture_id_) { | 
|  | // Wrap | 
|  | if (picture_id_ >= 0x80) { | 
|  | // 15 bits used for picture id | 
|  | return ((next_picture_id & 0x7FFF) == picture_id); | 
|  | } else { | 
|  | // 7 bits used for picture id | 
|  | return ((next_picture_id & 0x7F) == picture_id); | 
|  | } | 
|  | } | 
|  | // No wrap | 
|  | return (next_picture_id == picture_id); | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::ContinuousSeqNum(uint16_t seq_num) const { | 
|  | return seq_num == static_cast<uint16_t>(sequence_num_ + 1); | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::ContinuousLayer(int temporal_id, int tl0_pic_id) const { | 
|  | // First, check if applicable. | 
|  | if (temporal_id == kNoTemporalIdx || tl0_pic_id == kNoTl0PicIdx) | 
|  | return false; | 
|  | // If this is the first frame to use temporal layers, make sure we start | 
|  | // from base. | 
|  | else if (tl0_pic_id_ == kNoTl0PicIdx && temporal_id_ == kNoTemporalIdx && | 
|  | temporal_id == 0) | 
|  | return true; | 
|  |  | 
|  | // Current implementation: Look for base layer continuity. | 
|  | if (temporal_id != 0) | 
|  | return false; | 
|  | return (static_cast<uint8_t>(tl0_pic_id_ + 1) == tl0_pic_id); | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::ContinuousFrameRefs(const VCMFrameBuffer* frame) const { | 
|  | uint8_t num_refs = frame->CodecSpecific()->codecSpecific.VP9.num_ref_pics; | 
|  | for (uint8_t r = 0; r < num_refs; ++r) { | 
|  | uint16_t frame_ref = frame->PictureId() - | 
|  | frame->CodecSpecific()->codecSpecific.VP9.p_diff[r]; | 
|  | uint16_t frame_index = frame_ref % kFrameDecodedLength; | 
|  | if (AheadOfFramesDecodedClearedTo(frame_index) || | 
|  | !frame_decoded_[frame_index]) { | 
|  | return false; | 
|  | } | 
|  | } | 
|  | return true; | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::UsingPictureId(const VCMFrameBuffer* frame) const { | 
|  | return (frame->PictureId() != kNoPictureId && picture_id_ != kNoPictureId); | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::UsingFlexibleMode(const VCMFrameBuffer* frame) const { | 
|  | bool is_flexible_mode = | 
|  | frame->CodecSpecific()->codecType == kVideoCodecVP9 && | 
|  | frame->CodecSpecific()->codecSpecific.VP9.flexible_mode; | 
|  | if (is_flexible_mode && frame->PictureId() == kNoPictureId) { | 
|  | RTC_LOG(LS_WARNING) << "Frame is marked as using flexible mode but no" | 
|  | << "picture id is set."; | 
|  | return false; | 
|  | } | 
|  | return is_flexible_mode; | 
|  | } | 
|  |  | 
|  | // TODO(philipel): change how check work, this check practially | 
|  | // limits the max p_diff to 64. | 
|  | bool VCMDecodingState::AheadOfFramesDecodedClearedTo(uint16_t index) const { | 
|  | // No way of knowing for sure if we are actually ahead of | 
|  | // frame_decoded_cleared_to_. We just make the assumption | 
|  | // that we are not trying to reference back to a very old | 
|  | // index, but instead are referencing a newer index. | 
|  | uint16_t diff = | 
|  | index > frame_decoded_cleared_to_ | 
|  | ? kFrameDecodedLength - (index - frame_decoded_cleared_to_) | 
|  | : frame_decoded_cleared_to_ - index; | 
|  | return diff > kFrameDecodedLength / 2; | 
|  | } | 
|  |  | 
|  | bool VCMDecodingState::HaveSpsAndPps(const std::vector<NaluInfo>& nalus) const { | 
|  | std::set<int> new_sps; | 
|  | std::map<int, int> new_pps; | 
|  | for (const NaluInfo& nalu : nalus) { | 
|  | // Check if this nalu actually contains sps/pps information or dependencies. | 
|  | if (nalu.sps_id == -1 && nalu.pps_id == -1) | 
|  | continue; | 
|  | switch (nalu.type) { | 
|  | case H264::NaluType::kPps: | 
|  | if (nalu.pps_id < 0) { | 
|  | RTC_LOG(LS_WARNING) << "Received pps without pps id."; | 
|  | } else if (nalu.sps_id < 0) { | 
|  | RTC_LOG(LS_WARNING) << "Received pps without sps id."; | 
|  | } else { | 
|  | new_pps[nalu.pps_id] = nalu.sps_id; | 
|  | } | 
|  | break; | 
|  | case H264::NaluType::kSps: | 
|  | if (nalu.sps_id < 0) { | 
|  | RTC_LOG(LS_WARNING) << "Received sps without sps id."; | 
|  | } else { | 
|  | new_sps.insert(nalu.sps_id); | 
|  | } | 
|  | break; | 
|  | default: { | 
|  | int needed_sps = -1; | 
|  | auto pps_it = new_pps.find(nalu.pps_id); | 
|  | if (pps_it != new_pps.end()) { | 
|  | needed_sps = pps_it->second; | 
|  | } else { | 
|  | auto pps_it2 = received_pps_.find(nalu.pps_id); | 
|  | if (pps_it2 == received_pps_.end()) { | 
|  | return false; | 
|  | } | 
|  | needed_sps = pps_it2->second; | 
|  | } | 
|  | if (new_sps.find(needed_sps) == new_sps.end() && | 
|  | received_sps_.find(needed_sps) == received_sps_.end()) { | 
|  | return false; | 
|  | } | 
|  | break; | 
|  | } | 
|  | } | 
|  | } | 
|  | return true; | 
|  | } | 
|  |  | 
|  | }  // namespace webrtc |