| /* |
| * Copyright (c) 2014 The WebRTC project authors. All Rights Reserved. |
| * |
| * Use of this source code is governed by a BSD-style license |
| * that can be found in the LICENSE file in the root of the source |
| * tree. An additional intellectual property rights grant can be found |
| * in the file PATENTS. All contributing project authors may |
| * be found in the AUTHORS file in the root of the source tree. |
| */ |
| |
| #include "modules/rtp_rtcp/source/rtp_format_h264.h" |
| |
| #include <string.h> |
| #include <memory> |
| #include <utility> |
| #include <vector> |
| |
| #include "common_video/h264/h264_common.h" |
| #include "common_video/h264/pps_parser.h" |
| #include "common_video/h264/sps_parser.h" |
| #include "common_video/h264/sps_vui_rewriter.h" |
| #include "modules/include/module_common_types.h" |
| #include "modules/rtp_rtcp/source/byte_io.h" |
| #include "modules/rtp_rtcp/source/rtp_packet_to_send.h" |
| #include "rtc_base/checks.h" |
| #include "rtc_base/logging.h" |
| #include "rtc_base/system/fallthrough.h" |
| #include "system_wrappers/include/metrics.h" |
| |
| namespace webrtc { |
| namespace { |
| |
| static const size_t kNalHeaderSize = 1; |
| static const size_t kFuAHeaderSize = 2; |
| static const size_t kLengthFieldSize = 2; |
| static const size_t kStapAHeaderSize = kNalHeaderSize + kLengthFieldSize; |
| |
| static const char* kSpsValidHistogramName = "WebRTC.Video.H264.SpsValid"; |
| enum SpsValidEvent { |
| kReceivedSpsPocOk = 0, |
| kReceivedSpsVuiOk = 1, |
| kReceivedSpsRewritten = 2, |
| kReceivedSpsParseFailure = 3, |
| kSentSpsPocOk = 4, |
| kSentSpsVuiOk = 5, |
| kSentSpsRewritten = 6, |
| kSentSpsParseFailure = 7, |
| kSpsRewrittenMax = 8 |
| }; |
| |
| // Bit masks for FU (A and B) indicators. |
| enum NalDefs : uint8_t { kFBit = 0x80, kNriMask = 0x60, kTypeMask = 0x1F }; |
| |
| // Bit masks for FU (A and B) headers. |
| enum FuDefs : uint8_t { kSBit = 0x80, kEBit = 0x40, kRBit = 0x20 }; |
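
// For reference, the FU-A payload begins with two header octets (RFC 6184,
// section 5.8):
//   FU indicator:  F (1 bit) | NRI (2 bits) | Type (5 bits, 28 for FU-A)
//   FU header:     S (1 bit) | E (1 bit) | R (1 bit) | Type (5 bits, the
//                  original NAL unit type)
// F and NRI are copied from the original NAL unit header; S and E mark the
// first and last fragment of the fragmented NAL unit.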
| |
| // TODO(pbos): Avoid parsing this here as well as inside the jitter buffer. |
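// A STAP-A payload consists of the one-byte STAP-A NAL header followed by one
// or more aggregation units, each a 16-bit big-endian NALU size and the NALU
// itself (RFC 6184, section 5.7). |nalu_ptr| is expected to point just past
// the STAP-A NAL header, i.e. at the first size field; the returned offsets
// point at each NALU and are relative to the start of the full payload
// (including the STAP-A NAL header).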
| bool ParseStapAStartOffsets(const uint8_t* nalu_ptr, |
| size_t length_remaining, |
| std::vector<size_t>* offsets) { |
| size_t offset = 0; |
| while (length_remaining > 0) { |
    // Buffer doesn't have room for an additional NALU length field.
| if (length_remaining < sizeof(uint16_t)) |
| return false; |
| uint16_t nalu_size = ByteReader<uint16_t>::ReadBigEndian(nalu_ptr); |
| nalu_ptr += sizeof(uint16_t); |
| length_remaining -= sizeof(uint16_t); |
| if (nalu_size > length_remaining) |
| return false; |
| nalu_ptr += nalu_size; |
| length_remaining -= nalu_size; |
| |
| offsets->push_back(offset + kStapAHeaderSize); |
| offset += kLengthFieldSize + nalu_size; |
| } |
| return true; |
| } |
| |
| } // namespace |
| |
| RtpPacketizerH264::RtpPacketizerH264(size_t max_payload_len, |
| size_t last_packet_reduction_len, |
| H264PacketizationMode packetization_mode) |
| : max_payload_len_(max_payload_len), |
| last_packet_reduction_len_(last_packet_reduction_len), |
| num_packets_left_(0), |
| packetization_mode_(packetization_mode) { |
| // Guard against uninitialized memory in packetization_mode. |
| RTC_CHECK(packetization_mode == H264PacketizationMode::NonInterleaved || |
| packetization_mode == H264PacketizationMode::SingleNalUnit); |
| RTC_CHECK_GT(max_payload_len, last_packet_reduction_len); |
| } |
| |
RtpPacketizerH264::~RtpPacketizerH264() {}
| |
| RtpPacketizerH264::Fragment::~Fragment() = default; |
| |
| RtpPacketizerH264::Fragment::Fragment(const uint8_t* buffer, size_t length) |
| : buffer(buffer), length(length) {} |
| RtpPacketizerH264::Fragment::Fragment(const Fragment& fragment) |
| : buffer(fragment.buffer), length(fragment.length) {} |
| |
| size_t RtpPacketizerH264::SetPayloadData( |
| const uint8_t* payload_data, |
| size_t payload_size, |
| const RTPFragmentationHeader* fragmentation) { |
| RTC_DCHECK(packets_.empty()); |
| RTC_DCHECK(input_fragments_.empty()); |
| RTC_DCHECK(fragmentation); |
| for (int i = 0; i < fragmentation->fragmentationVectorSize; ++i) { |
| const uint8_t* buffer = |
| &payload_data[fragmentation->fragmentationOffset[i]]; |
| size_t length = fragmentation->fragmentationLength[i]; |
| |
| bool updated_sps = false; |
| H264::NaluType nalu_type = H264::ParseNaluType(buffer[0]); |
| if (nalu_type == H264::NaluType::kSps) { |
      // Check if the stream uses picture order count type 0, and if so
      // rewrite it to enable faster decoding. Streams in that format incur
      // additional delay because decode order is allowed to differ from
      // render order. The mechanism used is to rewrite (edit or add) the
      // SPS's VUI to contain restrictions on the maximum number of reordered
      // pictures. This reduces latency significantly, though it still adds
      // about a frame of latency to decoding.
      // Note that we do this rewriting both here (send side, in order to
      // protect legacy receive clients) and below in
      // RtpDepacketizerH264::ProcessStapAOrSingleNalu (receive side, in order
      // to protect us from unknown or legacy send clients).
| |
| absl::optional<SpsParser::SpsState> sps; |
| |
| std::unique_ptr<rtc::Buffer> output_buffer(new rtc::Buffer()); |
| // Add the type header to the output buffer first, so that the rewriter |
| // can append modified payload on top of that. |
| output_buffer->AppendData(buffer[0]); |
| SpsVuiRewriter::ParseResult result = SpsVuiRewriter::ParseAndRewriteSps( |
| buffer + H264::kNaluTypeSize, length - H264::kNaluTypeSize, &sps, |
| output_buffer.get()); |
| |
| switch (result) { |
| case SpsVuiRewriter::ParseResult::kVuiRewritten: |
| input_fragments_.push_back( |
| Fragment(output_buffer->data(), output_buffer->size())); |
| input_fragments_.rbegin()->tmp_buffer = std::move(output_buffer); |
| updated_sps = true; |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kSentSpsRewritten, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| case SpsVuiRewriter::ParseResult::kPocOk: |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kSentSpsPocOk, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| case SpsVuiRewriter::ParseResult::kVuiOk: |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kSentSpsVuiOk, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| case SpsVuiRewriter::ParseResult::kFailure: |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kSentSpsParseFailure, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| } |
| } |
| |
| if (!updated_sps) |
| input_fragments_.push_back(Fragment(buffer, length)); |
| } |
| if (!GeneratePackets()) { |
    // If we failed to generate all the packets, discard the already generated
    // ones, in case the caller ignores the return value and still tries to
    // call NextPacket().
| num_packets_left_ = 0; |
| while (!packets_.empty()) { |
| packets_.pop(); |
| } |
| return 0; |
| } |
| return num_packets_left_; |
| } |
| |
| bool RtpPacketizerH264::GeneratePackets() { |
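  // Turn each input fragment (one NAL unit) into one or more packets. In
  // SingleNalUnit mode every NAL unit becomes its own packet. In
  // NonInterleaved mode, NAL units that fit within |max_payload_len_| are
  // aggregated into STAP-A packets while larger NAL units are split into
  // FU-A fragments.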
| for (size_t i = 0; i < input_fragments_.size();) { |
| switch (packetization_mode_) { |
| case H264PacketizationMode::SingleNalUnit: |
| if (!PacketizeSingleNalu(i)) |
| return false; |
| ++i; |
| break; |
| case H264PacketizationMode::NonInterleaved: |
| size_t fragment_len = input_fragments_[i].length; |
| if (i + 1 == input_fragments_.size()) { |
          // Pretend that the last fragment is larger instead of making the
          // last packet smaller.
| fragment_len += last_packet_reduction_len_; |
| } |
| if (fragment_len > max_payload_len_) { |
| PacketizeFuA(i); |
| ++i; |
| } else { |
| i = PacketizeStapA(i); |
| } |
| break; |
| } |
| } |
| return true; |
| } |
| |
| void RtpPacketizerH264::PacketizeFuA(size_t fragment_index) { |
| // Fragment payload into packets (FU-A). |
| // Strip out the original header and leave room for the FU-A header. |
| const Fragment& fragment = input_fragments_[fragment_index]; |
| bool is_last_fragment = fragment_index + 1 == input_fragments_.size(); |
| size_t payload_left = fragment.length - kNalHeaderSize; |
| size_t offset = kNalHeaderSize; |
| size_t per_packet_capacity = max_payload_len_ - kFuAHeaderSize; |
| |
  // Instead of making the last packet smaller, we pretend that all packets
  // are the same size and account for additional virtual payload in the last
  // packet.
| size_t extra_len = is_last_fragment ? last_packet_reduction_len_ : 0; |
| |
  // Integer division rounding up: the minimal number of packets needed to
  // fit all real and virtual payload.
| size_t num_packets = (payload_left + extra_len + (per_packet_capacity - 1)) / |
| per_packet_capacity; |
| // Bytes per packet. Average rounded down. |
| size_t payload_per_packet = (payload_left + extra_len) / num_packets; |
  // We make the first few packets one byte smaller than the rest,
  // e.g. 14 bytes split into 4 packets becomes 3+3+4+4.
| size_t num_larger_packets = (payload_left + extra_len) % num_packets; |
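  // With the example above: payload_left = 14, extra_len = 0 and
  // per_packet_capacity = 4 give num_packets = 4, payload_per_packet = 3 and
  // num_larger_packets = 2, producing packet sizes 3, 3, 4 and 4.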
| |
| num_packets_left_ += num_packets; |
| while (payload_left > 0) { |
| // Increase payload per packet at the right time. |
| if (num_packets == num_larger_packets) |
| ++payload_per_packet; |
| size_t packet_length = payload_per_packet; |
| if (payload_left <= packet_length) { // Last portion of the payload |
| packet_length = payload_left; |
      // The virtual payload (reserved for extensions in the last packet) may
      // account for one additional packet, so together with the last real
      // payload packet at most 2 packets may remain at this point.
| RTC_DCHECK_LE(num_packets, 2); |
| if (num_packets == 2) { |
        // The whole payload fits in the first num_packets-1 packets, but an
        // extra packet is needed for the virtual payload. Leave at least one
        // byte of real data for the last packet.
| --packet_length; |
| } |
| } |
| RTC_CHECK_GT(packet_length, 0); |
| packets_.push(PacketUnit(Fragment(fragment.buffer + offset, packet_length), |
| offset - kNalHeaderSize == 0, |
| payload_left == packet_length, false, |
| fragment.buffer[0])); |
| offset += packet_length; |
| payload_left -= packet_length; |
| --num_packets; |
| } |
| RTC_CHECK_EQ(0, payload_left); |
| } |
| |
| size_t RtpPacketizerH264::PacketizeStapA(size_t fragment_index) { |
| // Aggregate fragments into one packet (STAP-A). |
| size_t payload_size_left = max_payload_len_; |
| int aggregated_fragments = 0; |
| size_t fragment_headers_length = 0; |
| const Fragment* fragment = &input_fragments_[fragment_index]; |
| RTC_CHECK_GE(payload_size_left, fragment->length); |
| ++num_packets_left_; |
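  // A STAP-A packet adds a one-byte STAP-A NAL header plus a two-byte length
  // field per aggregated NAL unit. |fragment_headers_length| tracks the extra
  // header bytes that aggregating the next fragment would require; it is zero
  // for the first fragment because a packet holding a single NAL unit is sent
  // as a single NALU packet without aggregation headers.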
| while (payload_size_left >= fragment->length + fragment_headers_length && |
| (fragment_index + 1 < input_fragments_.size() || |
| payload_size_left >= fragment->length + fragment_headers_length + |
| last_packet_reduction_len_)) { |
| RTC_CHECK_GT(fragment->length, 0); |
| packets_.push(PacketUnit(*fragment, aggregated_fragments == 0, false, true, |
| fragment->buffer[0])); |
| payload_size_left -= fragment->length; |
| payload_size_left -= fragment_headers_length; |
| |
| fragment_headers_length = kLengthFieldSize; |
| // If we are going to try to aggregate more fragments into this packet |
| // we need to add the STAP-A NALU header and a length field for the first |
| // NALU of this packet. |
| if (aggregated_fragments == 0) |
| fragment_headers_length += kNalHeaderSize + kLengthFieldSize; |
| ++aggregated_fragments; |
| |
| // Next fragment. |
| ++fragment_index; |
| if (fragment_index == input_fragments_.size()) |
| break; |
| fragment = &input_fragments_[fragment_index]; |
| } |
| RTC_CHECK_GT(aggregated_fragments, 0); |
| packets_.back().last_fragment = true; |
| return fragment_index; |
| } |
| |
| bool RtpPacketizerH264::PacketizeSingleNalu(size_t fragment_index) { |
| // Add a single NALU to the queue, no aggregation. |
| size_t payload_size_left = max_payload_len_; |
| if (fragment_index + 1 == input_fragments_.size()) |
| payload_size_left -= last_packet_reduction_len_; |
| const Fragment* fragment = &input_fragments_[fragment_index]; |
| if (payload_size_left < fragment->length) { |
| RTC_LOG(LS_ERROR) << "Failed to fit a fragment to packet in SingleNalu " |
| "packetization mode. Payload size left " |
| << payload_size_left << ", fragment length " |
| << fragment->length << ", packet capacity " |
| << max_payload_len_; |
| return false; |
| } |
| RTC_CHECK_GT(fragment->length, 0u); |
| packets_.push(PacketUnit(*fragment, true /* first */, true /* last */, |
| false /* aggregated */, fragment->buffer[0])); |
| ++num_packets_left_; |
| return true; |
| } |
| |
| bool RtpPacketizerH264::NextPacket(RtpPacketToSend* rtp_packet) { |
| RTC_DCHECK(rtp_packet); |
| if (packets_.empty()) { |
| return false; |
| } |
| |
| PacketUnit packet = packets_.front(); |
| if (packet.first_fragment && packet.last_fragment) { |
| // Single NAL unit packet. |
| size_t bytes_to_send = packet.source_fragment.length; |
| uint8_t* buffer = rtp_packet->AllocatePayload(bytes_to_send); |
| memcpy(buffer, packet.source_fragment.buffer, bytes_to_send); |
| packets_.pop(); |
| input_fragments_.pop_front(); |
| } else if (packet.aggregated) { |
| RTC_CHECK(H264PacketizationMode::NonInterleaved == packetization_mode_); |
| bool is_last_packet = num_packets_left_ == 1; |
| NextAggregatePacket(rtp_packet, is_last_packet); |
| } else { |
| RTC_CHECK(H264PacketizationMode::NonInterleaved == packetization_mode_); |
| NextFragmentPacket(rtp_packet); |
| } |
| RTC_DCHECK_LE(rtp_packet->payload_size(), max_payload_len_); |
| if (packets_.empty()) { |
| RTC_DCHECK_LE(rtp_packet->payload_size(), |
| max_payload_len_ - last_packet_reduction_len_); |
| } |
| rtp_packet->SetMarker(packets_.empty()); |
| --num_packets_left_; |
| return true; |
| } |
| |
| void RtpPacketizerH264::NextAggregatePacket(RtpPacketToSend* rtp_packet, |
| bool last) { |
| uint8_t* buffer = rtp_packet->AllocatePayload( |
| last ? max_payload_len_ - last_packet_reduction_len_ : max_payload_len_); |
| RTC_DCHECK(buffer); |
| PacketUnit* packet = &packets_.front(); |
| RTC_CHECK(packet->first_fragment); |
| // STAP-A NALU header. |
| buffer[0] = (packet->header & (kFBit | kNriMask)) | H264::NaluType::kStapA; |
| size_t index = kNalHeaderSize; |
| bool is_last_fragment = packet->last_fragment; |
| while (packet->aggregated) { |
| const Fragment& fragment = packet->source_fragment; |
| // Add NAL unit length field. |
| ByteWriter<uint16_t>::WriteBigEndian(&buffer[index], fragment.length); |
| index += kLengthFieldSize; |
| // Add NAL unit. |
| memcpy(&buffer[index], fragment.buffer, fragment.length); |
| index += fragment.length; |
| packets_.pop(); |
| input_fragments_.pop_front(); |
| if (is_last_fragment) |
| break; |
| packet = &packets_.front(); |
| is_last_fragment = packet->last_fragment; |
| } |
| RTC_CHECK(is_last_fragment); |
| rtp_packet->SetPayloadSize(index); |
| } |
| |
| void RtpPacketizerH264::NextFragmentPacket(RtpPacketToSend* rtp_packet) { |
| PacketUnit* packet = &packets_.front(); |
| // NAL unit fragmented over multiple packets (FU-A). |
  // We do not send the original NALU header; its information is carried by
  // the FU indicator and FU header instead.
| uint8_t fu_indicator = |
| (packet->header & (kFBit | kNriMask)) | H264::NaluType::kFuA; |
| uint8_t fu_header = 0; |
| |
| // S | E | R | 5 bit type. |
| fu_header |= (packet->first_fragment ? kSBit : 0); |
| fu_header |= (packet->last_fragment ? kEBit : 0); |
| uint8_t type = packet->header & kTypeMask; |
| fu_header |= type; |
| const Fragment& fragment = packet->source_fragment; |
| uint8_t* buffer = |
| rtp_packet->AllocatePayload(kFuAHeaderSize + fragment.length); |
| buffer[0] = fu_indicator; |
| buffer[1] = fu_header; |
| memcpy(buffer + kFuAHeaderSize, fragment.buffer, fragment.length); |
| if (packet->last_fragment) |
| input_fragments_.pop_front(); |
| packets_.pop(); |
| } |
| |
| std::string RtpPacketizerH264::ToString() { |
| return "RtpPacketizerH264"; |
| } |
| |
| RtpDepacketizerH264::RtpDepacketizerH264() : offset_(0), length_(0) {} |
| RtpDepacketizerH264::~RtpDepacketizerH264() {} |
| |
| bool RtpDepacketizerH264::Parse(ParsedPayload* parsed_payload, |
| const uint8_t* payload_data, |
| size_t payload_data_length) { |
| RTC_CHECK(parsed_payload != nullptr); |
| if (payload_data_length == 0) { |
| RTC_LOG(LS_ERROR) << "Empty payload."; |
| return false; |
| } |
| |
| offset_ = 0; |
| length_ = payload_data_length; |
| modified_buffer_.reset(); |
| |
| uint8_t nal_type = payload_data[0] & kTypeMask; |
| parsed_payload->type.Video.codecHeader.H264.nalus_length = 0; |
| if (nal_type == H264::NaluType::kFuA) { |
| // Fragmented NAL units (FU-A). |
| if (!ParseFuaNalu(parsed_payload, payload_data)) |
| return false; |
| } else { |
    // We handle STAP-A and single NALUs the same way here. The jitter buffer
    // will depacketize the STAP-A into NAL units later.
| // TODO(sprang): Parse STAP-A offsets here and store in fragmentation vec. |
| if (!ProcessStapAOrSingleNalu(parsed_payload, payload_data)) |
| return false; |
| } |
| |
| const uint8_t* payload = |
| modified_buffer_ ? modified_buffer_->data() : payload_data; |
| |
| parsed_payload->payload = payload + offset_; |
| parsed_payload->payload_length = length_; |
| return true; |
| } |
| |
| bool RtpDepacketizerH264::ProcessStapAOrSingleNalu( |
| ParsedPayload* parsed_payload, |
| const uint8_t* payload_data) { |
| parsed_payload->type.Video.width = 0; |
| parsed_payload->type.Video.height = 0; |
| parsed_payload->type.Video.codec = kVideoCodecH264; |
| parsed_payload->type.Video.is_first_packet_in_frame = true; |
| RTPVideoHeaderH264* h264_header = |
| &parsed_payload->type.Video.codecHeader.H264; |
| |
| const uint8_t* nalu_start = payload_data + kNalHeaderSize; |
| const size_t nalu_length = length_ - kNalHeaderSize; |
| uint8_t nal_type = payload_data[0] & kTypeMask; |
| std::vector<size_t> nalu_start_offsets; |
| if (nal_type == H264::NaluType::kStapA) { |
| // Skip the StapA header (StapA NAL type + length). |
| if (length_ <= kStapAHeaderSize) { |
| RTC_LOG(LS_ERROR) << "StapA header truncated."; |
| return false; |
| } |
| |
| if (!ParseStapAStartOffsets(nalu_start, nalu_length, &nalu_start_offsets)) { |
| RTC_LOG(LS_ERROR) << "StapA packet with incorrect NALU packet lengths."; |
| return false; |
| } |
| |
| h264_header->packetization_type = kH264StapA; |
| nal_type = payload_data[kStapAHeaderSize] & kTypeMask; |
| } else { |
| h264_header->packetization_type = kH264SingleNalu; |
| nalu_start_offsets.push_back(0); |
| } |
| h264_header->nalu_type = nal_type; |
| parsed_payload->frame_type = kVideoFrameDelta; |
| |
| nalu_start_offsets.push_back(length_ + kLengthFieldSize); // End offset. |
| for (size_t i = 0; i < nalu_start_offsets.size() - 1; ++i) { |
| size_t start_offset = nalu_start_offsets[i]; |
    // The end offset is actually the start offset of the next unit, excluding
    // its length field, so remove that from this unit's length.
| size_t end_offset = nalu_start_offsets[i + 1] - kLengthFieldSize; |
| if (end_offset - start_offset < H264::kNaluTypeSize) { |
| RTC_LOG(LS_ERROR) << "STAP-A packet too short"; |
| return false; |
| } |
| |
| NaluInfo nalu; |
| nalu.type = payload_data[start_offset] & kTypeMask; |
| nalu.sps_id = -1; |
| nalu.pps_id = -1; |
| start_offset += H264::kNaluTypeSize; |
| |
| switch (nalu.type) { |
| case H264::NaluType::kSps: { |
        // Check if VUI is present in the SPS and if it needs to be modified
        // to avoid excessive decoder latency.
| |
| // Copy any previous data first (likely just the first header). |
| std::unique_ptr<rtc::Buffer> output_buffer(new rtc::Buffer()); |
| if (start_offset) |
| output_buffer->AppendData(payload_data, start_offset); |
| |
| absl::optional<SpsParser::SpsState> sps; |
| |
| SpsVuiRewriter::ParseResult result = SpsVuiRewriter::ParseAndRewriteSps( |
| &payload_data[start_offset], end_offset - start_offset, &sps, |
| output_buffer.get()); |
| switch (result) { |
| case SpsVuiRewriter::ParseResult::kVuiRewritten: |
| if (modified_buffer_) { |
| RTC_LOG(LS_WARNING) |
| << "More than one H264 SPS NAL units needing " |
| "rewriting found within a single STAP-A packet. " |
| "Keeping the first and rewriting the last."; |
| } |
| |
| // Rewrite length field to new SPS size. |
| if (h264_header->packetization_type == kH264StapA) { |
| size_t length_field_offset = |
| start_offset - (H264::kNaluTypeSize + kLengthFieldSize); |
| // Stap-A Length includes payload data and type header. |
| size_t rewritten_size = |
| output_buffer->size() - start_offset + H264::kNaluTypeSize; |
| ByteWriter<uint16_t>::WriteBigEndian( |
| &(*output_buffer)[length_field_offset], rewritten_size); |
| } |
| |
| // Append rest of packet. |
| output_buffer->AppendData( |
| &payload_data[end_offset], |
| nalu_length + kNalHeaderSize - end_offset); |
| |
| modified_buffer_ = std::move(output_buffer); |
| length_ = modified_buffer_->size(); |
| |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kReceivedSpsRewritten, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| case SpsVuiRewriter::ParseResult::kPocOk: |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kReceivedSpsPocOk, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| case SpsVuiRewriter::ParseResult::kVuiOk: |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kReceivedSpsVuiOk, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| case SpsVuiRewriter::ParseResult::kFailure: |
| RTC_HISTOGRAM_ENUMERATION(kSpsValidHistogramName, |
| SpsValidEvent::kReceivedSpsParseFailure, |
| SpsValidEvent::kSpsRewrittenMax); |
| break; |
| } |
| |
| if (sps) { |
| parsed_payload->type.Video.width = sps->width; |
| parsed_payload->type.Video.height = sps->height; |
| nalu.sps_id = sps->id; |
| } else { |
| RTC_LOG(LS_WARNING) << "Failed to parse SPS id from SPS slice."; |
| } |
| parsed_payload->frame_type = kVideoFrameKey; |
| break; |
| } |
| case H264::NaluType::kPps: { |
| uint32_t pps_id; |
| uint32_t sps_id; |
| if (PpsParser::ParsePpsIds(&payload_data[start_offset], |
| end_offset - start_offset, &pps_id, |
| &sps_id)) { |
| nalu.pps_id = pps_id; |
| nalu.sps_id = sps_id; |
| } else { |
| RTC_LOG(LS_WARNING) |
| << "Failed to parse PPS id and SPS id from PPS slice."; |
| } |
| break; |
| } |
| case H264::NaluType::kIdr: |
| parsed_payload->frame_type = kVideoFrameKey; |
| RTC_FALLTHROUGH(); |
| case H264::NaluType::kSlice: { |
| absl::optional<uint32_t> pps_id = PpsParser::ParsePpsIdFromSlice( |
| &payload_data[start_offset], end_offset - start_offset); |
| if (pps_id) { |
| nalu.pps_id = *pps_id; |
| } else { |
| RTC_LOG(LS_WARNING) << "Failed to parse PPS id from slice of type: " |
| << static_cast<int>(nalu.type); |
| } |
| break; |
| } |
      // The NAL unit types below don't contain SPS or PPS ids.
| case H264::NaluType::kAud: |
| case H264::NaluType::kEndOfSequence: |
| case H264::NaluType::kEndOfStream: |
| case H264::NaluType::kFiller: |
| case H264::NaluType::kSei: |
| break; |
| case H264::NaluType::kStapA: |
| case H264::NaluType::kFuA: |
| RTC_LOG(LS_WARNING) << "Unexpected STAP-A or FU-A received."; |
| return false; |
| } |
| RTPVideoHeaderH264* h264 = &parsed_payload->type.Video.codecHeader.H264; |
| if (h264->nalus_length == kMaxNalusPerPacket) { |
| RTC_LOG(LS_WARNING) |
| << "Received packet containing more than " << kMaxNalusPerPacket |
| << " NAL units. Will not keep track sps and pps ids for all of them."; |
| } else { |
| h264->nalus[h264->nalus_length++] = nalu; |
| } |
| } |
| |
| return true; |
| } |
| |
| bool RtpDepacketizerH264::ParseFuaNalu( |
| RtpDepacketizer::ParsedPayload* parsed_payload, |
| const uint8_t* payload_data) { |
| if (length_ < kFuAHeaderSize) { |
| RTC_LOG(LS_ERROR) << "FU-A NAL units truncated."; |
| return false; |
| } |
| uint8_t fnri = payload_data[0] & (kFBit | kNriMask); |
| uint8_t original_nal_type = payload_data[1] & kTypeMask; |
| bool first_fragment = (payload_data[1] & kSBit) > 0; |
| NaluInfo nalu; |
| nalu.type = original_nal_type; |
| nalu.sps_id = -1; |
| nalu.pps_id = -1; |
| if (first_fragment) { |
| offset_ = 0; |
| length_ -= kNalHeaderSize; |
| absl::optional<uint32_t> pps_id = PpsParser::ParsePpsIdFromSlice( |
| payload_data + 2 * kNalHeaderSize, length_ - kNalHeaderSize); |
| if (pps_id) { |
| nalu.pps_id = *pps_id; |
| } else { |
| RTC_LOG(LS_WARNING) |
| << "Failed to parse PPS from first fragment of FU-A NAL " |
| "unit with original type: " |
| << static_cast<int>(nalu.type); |
| } |
| uint8_t original_nal_header = fnri | original_nal_type; |
| modified_buffer_.reset(new rtc::Buffer()); |
| modified_buffer_->AppendData(payload_data + kNalHeaderSize, length_); |
| (*modified_buffer_)[0] = original_nal_header; |
| } else { |
| offset_ = kFuAHeaderSize; |
| length_ -= kFuAHeaderSize; |
| } |
| |
| if (original_nal_type == H264::NaluType::kIdr) { |
| parsed_payload->frame_type = kVideoFrameKey; |
| } else { |
| parsed_payload->frame_type = kVideoFrameDelta; |
| } |
| parsed_payload->type.Video.width = 0; |
| parsed_payload->type.Video.height = 0; |
| parsed_payload->type.Video.codec = kVideoCodecH264; |
| parsed_payload->type.Video.is_first_packet_in_frame = first_fragment; |
| RTPVideoHeaderH264* h264 = &parsed_payload->type.Video.codecHeader.H264; |
| h264->packetization_type = kH264FuA; |
| h264->nalu_type = original_nal_type; |
| if (first_fragment) { |
| h264->nalus[h264->nalus_length] = nalu; |
| h264->nalus_length = 1; |
| } |
| return true; |
| } |
| |
| } // namespace webrtc |