modules/video_coding/h264_packet_buffer.cc - src.git - Git at Google

 /*
  *  Copyright (c) 2021 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "modules/video_coding/h264_packet_buffer.h"

 #include <algorithm>
 #include <cstdint>
 #include <utility>
 #include <vector>

 #include "api/array_view.h"
 #include "api/rtp_packet_info.h"
 #include "api/video/video_frame_type.h"
 #include "common_video/h264/h264_common.h"
 #include "modules/rtp_rtcp/source/rtp_header_extensions.h"
 #include "modules/rtp_rtcp/source/rtp_packet_received.h"
 #include "modules/rtp_rtcp/source/rtp_video_header.h"
 #include "modules/video_coding/codecs/h264/include/h264_globals.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/copy_on_write_buffer.h"
 #include "rtc_base/logging.h"
 #include "rtc_base/numerics/sequence_number_util.h"

 namespace webrtc {
 namespace {
 int64_t EuclideanMod(int64_t n, int64_t div) {
   RTC_DCHECK_GT(div, 0);
   return (n %= div) < 0 ? n + div : n;
 }

 rtc::ArrayView<const NaluInfo> GetNaluInfos(
     const RTPVideoHeaderH264& h264_header) {
   if (h264_header.nalus_length > kMaxNalusPerPacket) {
     return {};
   }

   return rtc::MakeArrayView(h264_header.nalus, h264_header.nalus_length);
 }

 bool IsFirstPacketOfFragment(const RTPVideoHeaderH264& h264_header) {
   return h264_header.nalus_length > 0;
 }

 bool BeginningOfIdr(const H264PacketBuffer::Packet& packet) {
   const auto& h264_header =
       absl::get<RTPVideoHeaderH264>(packet.video_header.video_type_header);
   const bool contains_idr_nalu =
       absl::c_any_of(GetNaluInfos(h264_header), [](const auto& nalu_info) {
         return nalu_info.type == H264::NaluType::kIdr;
       });
   switch (h264_header.packetization_type) {
     case kH264StapA:
     case kH264SingleNalu: {
       return contains_idr_nalu;
     }
     case kH264FuA: {
       return contains_idr_nalu && IsFirstPacketOfFragment(h264_header);
     }
   }
 }

 bool HasSps(const H264PacketBuffer::Packet& packet) {
   auto& h264_header =
       absl::get<RTPVideoHeaderH264>(packet.video_header.video_type_header);
   return absl::c_any_of(GetNaluInfos(h264_header), [](const auto& nalu_info) {
     return nalu_info.type == H264::NaluType::kSps;
   });
 }

 // TODO(bugs.webrtc.org/13157): Update the H264 depacketizer so we don't have to
 //                              fiddle with the payload at this point.
 rtc::CopyOnWriteBuffer FixVideoPayload(rtc::ArrayView<const uint8_t> payload,
                                        const RTPVideoHeader& video_header) {
   constexpr uint8_t kStartCode[] = {0, 0, 0, 1};

   const auto& h264_header =
       absl::get<RTPVideoHeaderH264>(video_header.video_type_header);

   rtc::CopyOnWriteBuffer result;
   switch (h264_header.packetization_type) {
     case kH264StapA: {
       const uint8_t* payload_end = payload.data() + payload.size();
       const uint8_t* nalu_ptr = payload.data() + 1;
       while (nalu_ptr < payload_end - 1) {
         // The first two bytes describe the length of the segment, where a
         // segment is the nalu type plus nalu payload.
         uint16_t segment_length = nalu_ptr[0] << 8 | nalu_ptr[1];
         nalu_ptr += 2;

         if (nalu_ptr + segment_length <= payload_end) {
           result.AppendData(kStartCode);
           result.AppendData(nalu_ptr, segment_length);
         }
         nalu_ptr += segment_length;
       }
       return result;
     }

     case kH264FuA: {
       if (IsFirstPacketOfFragment(h264_header)) {
         result.AppendData(kStartCode);
       }
       result.AppendData(payload);
       return result;
     }

     case kH264SingleNalu: {
       result.AppendData(kStartCode);
       result.AppendData(payload);
       return result;
     }
   }

   RTC_DCHECK_NOTREACHED();
   return result;
 }

 }  // namespace

 H264PacketBuffer::H264PacketBuffer(bool idr_only_keyframes_allowed)
     : idr_only_keyframes_allowed_(idr_only_keyframes_allowed) {}

 H264PacketBuffer::InsertResult H264PacketBuffer::InsertPacket(
     std::unique_ptr<Packet> packet) {
   RTC_DCHECK(packet->video_header.codec == kVideoCodecH264);

   InsertResult result;
   if (!absl::holds_alternative<RTPVideoHeaderH264>(
           packet->video_header.video_type_header)) {
     return result;
   }

   int64_t unwrapped_seq_num = seq_num_unwrapper_.Unwrap(packet->seq_num);
   auto& packet_slot = GetPacket(unwrapped_seq_num);
   if (packet_slot != nullptr &&
       AheadOrAt(packet_slot->timestamp, packet->timestamp)) {
     // The incoming `packet` is old or a duplicate.
     return result;
   } else {
     packet_slot = std::move(packet);
   }

   result.packets = FindFrames(unwrapped_seq_num);
   return result;
 }

 std::unique_ptr<H264PacketBuffer::Packet>& H264PacketBuffer::GetPacket(
     int64_t unwrapped_seq_num) {
   return buffer_[EuclideanMod(unwrapped_seq_num, kBufferSize)];
 }

 bool H264PacketBuffer::BeginningOfStream(
     const H264PacketBuffer::Packet& packet) const {
   return HasSps(packet) ||
          (idr_only_keyframes_allowed_ && BeginningOfIdr(packet));
 }

 std::vector<std::unique_ptr<H264PacketBuffer::Packet>>
 H264PacketBuffer::FindFrames(int64_t unwrapped_seq_num) {
   std::vector<std::unique_ptr<Packet>> found_frames;

   Packet* packet = GetPacket(unwrapped_seq_num).get();
   RTC_CHECK(packet != nullptr);

   // Check if the packet is continuous or the beginning of a new coded video
   // sequence.
   if (unwrapped_seq_num - 1 != last_continuous_unwrapped_seq_num_) {
     if (unwrapped_seq_num <= last_continuous_unwrapped_seq_num_ ||
         !BeginningOfStream(*packet)) {
       return found_frames;
     }

     last_continuous_unwrapped_seq_num_ = unwrapped_seq_num;
   }

   for (int64_t seq_num = unwrapped_seq_num;
        seq_num < unwrapped_seq_num + kBufferSize;) {
     RTC_DCHECK_GE(seq_num, *last_continuous_unwrapped_seq_num_);

     // Packets that were never assembled into a completed frame will stay in
     // the 'buffer_'. Check that the `packet` sequence number match the expected
     // unwrapped sequence number.
     if (static_cast<uint16_t>(seq_num) != packet->seq_num) {
       return found_frames;
     }

     last_continuous_unwrapped_seq_num_ = seq_num;
     // Last packet of the frame, try to assemble the frame.
     if (packet->marker_bit) {
       uint32_t rtp_timestamp = packet->timestamp;

       // Iterate backwards to find where the frame starts.
       for (int64_t seq_num_start = seq_num;
            seq_num_start > seq_num - kBufferSize; --seq_num_start) {
         auto& prev_packet = GetPacket(seq_num_start - 1);

         if (prev_packet == nullptr || prev_packet->timestamp != rtp_timestamp) {
           if (MaybeAssembleFrame(seq_num_start, seq_num, found_frames)) {
             // Frame was assembled, continue to look for more frames.
             break;
           } else {
             // Frame was not assembled, no subsequent frame will be continuous.
             return found_frames;
           }
         }
       }
     }

     seq_num++;
     packet = GetPacket(seq_num).get();
     if (packet == nullptr) {
       return found_frames;
     }
   }

   return found_frames;
 }

 bool H264PacketBuffer::MaybeAssembleFrame(
     int64_t start_seq_num_unwrapped,
     int64_t end_sequence_number_unwrapped,
     std::vector<std::unique_ptr<Packet>>& frames) {
   bool has_sps = false;
   bool has_pps = false;
   bool has_idr = false;

   int width = -1;
   int height = -1;

   for (int64_t seq_num = start_seq_num_unwrapped;
        seq_num <= end_sequence_number_unwrapped; ++seq_num) {
     const auto& packet = GetPacket(seq_num);
     const auto& h264_header =
         absl::get<RTPVideoHeaderH264>(packet->video_header.video_type_header);
     for (const auto& nalu : GetNaluInfos(h264_header)) {
       has_idr |= nalu.type == H264::NaluType::kIdr;
       has_sps |= nalu.type == H264::NaluType::kSps;
       has_pps |= nalu.type == H264::NaluType::kPps;
     }

     width = std::max<int>(packet->video_header.width, width);
     height = std::max<int>(packet->video_header.height, height);
   }

   if (has_idr) {
     if (!idr_only_keyframes_allowed_ && (!has_sps || !has_pps)) {
       return false;
     }
   }

   for (int64_t seq_num = start_seq_num_unwrapped;
        seq_num <= end_sequence_number_unwrapped; ++seq_num) {
     auto& packet = GetPacket(seq_num);

     packet->video_header.is_first_packet_in_frame =
         (seq_num == start_seq_num_unwrapped);
     packet->video_header.is_last_packet_in_frame =
         (seq_num == end_sequence_number_unwrapped);

     if (packet->video_header.is_first_packet_in_frame) {
       if (width > 0 && height > 0) {
         packet->video_header.width = width;
         packet->video_header.height = height;
       }

       packet->video_header.frame_type = has_idr
                                             ? VideoFrameType::kVideoFrameKey
                                             : VideoFrameType::kVideoFrameDelta;
     }

     packet->video_payload =
         FixVideoPayload(packet->video_payload, packet->video_header);

     frames.push_back(std::move(packet));
   }

   return true;
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2021 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "modules/video_coding/h264_packet_buffer.h"

	#include <algorithm>
	#include <cstdint>
	#include <utility>
	#include <vector>

	#include "api/array_view.h"
	#include "api/rtp_packet_info.h"
	#include "api/video/video_frame_type.h"
	#include "common_video/h264/h264_common.h"
	#include "modules/rtp_rtcp/source/rtp_header_extensions.h"
	#include "modules/rtp_rtcp/source/rtp_packet_received.h"
	#include "modules/rtp_rtcp/source/rtp_video_header.h"
	#include "modules/video_coding/codecs/h264/include/h264_globals.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/copy_on_write_buffer.h"
	#include "rtc_base/logging.h"
	#include "rtc_base/numerics/sequence_number_util.h"

	namespace webrtc {
	namespace {
	int64_t EuclideanMod(int64_t n, int64_t div) {
	RTC_DCHECK_GT(div, 0);
	return (n %= div) < 0 ? n + div : n;
	}

	rtc::ArrayView<const NaluInfo> GetNaluInfos(
	const RTPVideoHeaderH264& h264_header) {
	if (h264_header.nalus_length > kMaxNalusPerPacket) {
	return {};
	}

	return rtc::MakeArrayView(h264_header.nalus, h264_header.nalus_length);
	}

	bool IsFirstPacketOfFragment(const RTPVideoHeaderH264& h264_header) {
	return h264_header.nalus_length > 0;
	}

	bool BeginningOfIdr(const H264PacketBuffer::Packet& packet) {
	const auto& h264_header =
	absl::get<RTPVideoHeaderH264>(packet.video_header.video_type_header);
	const bool contains_idr_nalu =
	absl::c_any_of(GetNaluInfos(h264_header), [](const auto& nalu_info) {
	return nalu_info.type == H264::NaluType::kIdr;
	});
	switch (h264_header.packetization_type) {
	case kH264StapA:
	case kH264SingleNalu: {
	return contains_idr_nalu;
	}
	case kH264FuA: {
	return contains_idr_nalu && IsFirstPacketOfFragment(h264_header);
	}
	}
	}

	bool HasSps(const H264PacketBuffer::Packet& packet) {
	auto& h264_header =
	absl::get<RTPVideoHeaderH264>(packet.video_header.video_type_header);
	return absl::c_any_of(GetNaluInfos(h264_header), [](const auto& nalu_info) {
	return nalu_info.type == H264::NaluType::kSps;
	});
	}

	// TODO(bugs.webrtc.org/13157): Update the H264 depacketizer so we don't have to
	// fiddle with the payload at this point.
	rtc::CopyOnWriteBuffer FixVideoPayload(rtc::ArrayView<const uint8_t> payload,
	const RTPVideoHeader& video_header) {
	constexpr uint8_t kStartCode[] = {0, 0, 0, 1};

	const auto& h264_header =
	absl::get<RTPVideoHeaderH264>(video_header.video_type_header);

	rtc::CopyOnWriteBuffer result;
	switch (h264_header.packetization_type) {
	case kH264StapA: {
	const uint8_t* payload_end = payload.data() + payload.size();
	const uint8_t* nalu_ptr = payload.data() + 1;
	while (nalu_ptr < payload_end - 1) {
	// The first two bytes describe the length of the segment, where a
	// segment is the nalu type plus nalu payload.
	uint16_t segment_length = nalu_ptr[0] << 8 \| nalu_ptr[1];
	nalu_ptr += 2;

	if (nalu_ptr + segment_length <= payload_end) {
	result.AppendData(kStartCode);
	result.AppendData(nalu_ptr, segment_length);
	}
	nalu_ptr += segment_length;
	}
	return result;
	}

	case kH264FuA: {
	if (IsFirstPacketOfFragment(h264_header)) {
	result.AppendData(kStartCode);
	}
	result.AppendData(payload);
	return result;
	}

	case kH264SingleNalu: {
	result.AppendData(kStartCode);
	result.AppendData(payload);
	return result;
	}
	}

	RTC_DCHECK_NOTREACHED();
	return result;
	}

	} // namespace

	H264PacketBuffer::H264PacketBuffer(bool idr_only_keyframes_allowed)
	: idr_only_keyframes_allowed_(idr_only_keyframes_allowed) {}

	H264PacketBuffer::InsertResult H264PacketBuffer::InsertPacket(
	std::unique_ptr<Packet> packet) {
	RTC_DCHECK(packet->video_header.codec == kVideoCodecH264);

	InsertResult result;
	if (!absl::holds_alternative<RTPVideoHeaderH264>(
	packet->video_header.video_type_header)) {
	return result;
	}

	int64_t unwrapped_seq_num = seq_num_unwrapper_.Unwrap(packet->seq_num);
	auto& packet_slot = GetPacket(unwrapped_seq_num);
	if (packet_slot != nullptr &&
	AheadOrAt(packet_slot->timestamp, packet->timestamp)) {
	// The incoming `packet` is old or a duplicate.
	return result;
	} else {
	packet_slot = std::move(packet);
	}

	result.packets = FindFrames(unwrapped_seq_num);
	return result;
	}

	std::unique_ptr<H264PacketBuffer::Packet>& H264PacketBuffer::GetPacket(
	int64_t unwrapped_seq_num) {
	return buffer_[EuclideanMod(unwrapped_seq_num, kBufferSize)];
	}

	bool H264PacketBuffer::BeginningOfStream(
	const H264PacketBuffer::Packet& packet) const {
	return HasSps(packet) \|\|
	(idr_only_keyframes_allowed_ && BeginningOfIdr(packet));
	}

	std::vector<std::unique_ptr<H264PacketBuffer::Packet>>
	H264PacketBuffer::FindFrames(int64_t unwrapped_seq_num) {
	std::vector<std::unique_ptr<Packet>> found_frames;

	Packet* packet = GetPacket(unwrapped_seq_num).get();
	RTC_CHECK(packet != nullptr);

	// Check if the packet is continuous or the beginning of a new coded video
	// sequence.
	if (unwrapped_seq_num - 1 != last_continuous_unwrapped_seq_num_) {
	if (unwrapped_seq_num <= last_continuous_unwrapped_seq_num_ \|\|
	!BeginningOfStream(*packet)) {
	return found_frames;
	}

	last_continuous_unwrapped_seq_num_ = unwrapped_seq_num;
	}

	for (int64_t seq_num = unwrapped_seq_num;
	seq_num < unwrapped_seq_num + kBufferSize;) {
	RTC_DCHECK_GE(seq_num, *last_continuous_unwrapped_seq_num_);

	// Packets that were never assembled into a completed frame will stay in
	// the 'buffer_'. Check that the `packet` sequence number match the expected
	// unwrapped sequence number.
	if (static_cast<uint16_t>(seq_num) != packet->seq_num) {
	return found_frames;
	}

	last_continuous_unwrapped_seq_num_ = seq_num;
	// Last packet of the frame, try to assemble the frame.
	if (packet->marker_bit) {
	uint32_t rtp_timestamp = packet->timestamp;

	// Iterate backwards to find where the frame starts.
	for (int64_t seq_num_start = seq_num;
	seq_num_start > seq_num - kBufferSize; --seq_num_start) {
	auto& prev_packet = GetPacket(seq_num_start - 1);

	if (prev_packet == nullptr \|\| prev_packet->timestamp != rtp_timestamp) {
	if (MaybeAssembleFrame(seq_num_start, seq_num, found_frames)) {
	// Frame was assembled, continue to look for more frames.
	break;
	} else {
	// Frame was not assembled, no subsequent frame will be continuous.
	return found_frames;
	}
	}
	}
	}

	seq_num++;
	packet = GetPacket(seq_num).get();
	if (packet == nullptr) {
	return found_frames;
	}
	}

	return found_frames;
	}

	bool H264PacketBuffer::MaybeAssembleFrame(
	int64_t start_seq_num_unwrapped,
	int64_t end_sequence_number_unwrapped,
	std::vector<std::unique_ptr<Packet>>& frames) {
	bool has_sps = false;
	bool has_pps = false;
	bool has_idr = false;

	int width = -1;
	int height = -1;

	for (int64_t seq_num = start_seq_num_unwrapped;
	seq_num <= end_sequence_number_unwrapped; ++seq_num) {
	const auto& packet = GetPacket(seq_num);
	const auto& h264_header =
	absl::get<RTPVideoHeaderH264>(packet->video_header.video_type_header);
	for (const auto& nalu : GetNaluInfos(h264_header)) {
	has_idr \|= nalu.type == H264::NaluType::kIdr;
	has_sps \|= nalu.type == H264::NaluType::kSps;
	has_pps \|= nalu.type == H264::NaluType::kPps;
	}

	width = std::max<int>(packet->video_header.width, width);
	height = std::max<int>(packet->video_header.height, height);
	}

	if (has_idr) {
	if (!idr_only_keyframes_allowed_ && (!has_sps \|\| !has_pps)) {
	return false;
	}
	}

	for (int64_t seq_num = start_seq_num_unwrapped;
	seq_num <= end_sequence_number_unwrapped; ++seq_num) {
	auto& packet = GetPacket(seq_num);

	packet->video_header.is_first_packet_in_frame =
	(seq_num == start_seq_num_unwrapped);
	packet->video_header.is_last_packet_in_frame =
	(seq_num == end_sequence_number_unwrapped);

	if (packet->video_header.is_first_packet_in_frame) {
	if (width > 0 && height > 0) {
	packet->video_header.width = width;
	packet->video_header.height = height;
	}

	packet->video_header.frame_type = has_idr
	? VideoFrameType::kVideoFrameKey
	: VideoFrameType::kVideoFrameDelta;
	}

	packet->video_payload =
	FixVideoPayload(packet->video_payload, packet->video_header);

	frames.push_back(std::move(packet));
	}

	return true;
	}

	} // namespace webrtc