modules/video_coding/codecs/av1/scalability_structure_l3t3.cc - src - Git at Google

 /*
  *  Copyright (c) 2020 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */
 #include "modules/video_coding/codecs/av1/scalability_structure_l3t3.h"

 #include <utility>
 #include <vector>

 #include "absl/base/macros.h"
 #include "absl/types/optional.h"
 #include "api/transport/rtp/dependency_descriptor.h"
 #include "rtc_base/logging.h"

 namespace webrtc {
 namespace {

 // Short aliases for the DecodeTargetIndication enumerators; they keep the
 // table below compact.
 constexpr auto kNotPresent = DecodeTargetIndication::kNotPresent;
 constexpr auto kDiscardable = DecodeTargetIndication::kDiscardable;
 constexpr auto kSwitch = DecodeTargetIndication::kSwitch;
 constexpr auto kRequired = DecodeTargetIndication::kRequired;

 // Decode target indications for every frame configuration of this structure.
 // Rows are indexed by `LayerFrameConfig::Id()`: OnEncodeDone() looks up
 // `kDtis[config.Id()]`, and NextFrameConfig() assigns ids 0-2 to the key-frame
 // pattern and ids 3-11 to the delta-frame patterns. Every row has nine
 // entries, one per decode target, laid out as three groups of three that are
 // labelled S0, S1 and S2 (presumably T0, T1, T2 within each group - confirm
 // against the Dtis strings in DependencyStructure()).
 constexpr DecodeTargetIndication kDtis[12][9] = {
     // Id 0: Key, S0
     {kSwitch, kSwitch, kSwitch,   // S0
      kSwitch, kSwitch, kSwitch,   // S1
      kSwitch, kSwitch, kSwitch},  // S2
     // Id 1: Key, S1
     {kNotPresent, kNotPresent, kNotPresent,  // S0
      kSwitch, kSwitch, kSwitch,              // S1
      kSwitch, kSwitch, kSwitch},             // S2
     // Id 2: Key, S2
     {kNotPresent, kNotPresent, kNotPresent,  // S0
      kNotPresent, kNotPresent, kNotPresent,  // S1
      kSwitch, kSwitch, kSwitch},             // S2
     // Id 3: Delta, S0T2
     {kNotPresent, kNotPresent, kDiscardable,  // S0
      kNotPresent, kNotPresent, kRequired,     // S1
      kNotPresent, kNotPresent, kRequired},    // S2
     // Id 4: Delta, S1T2
     {kNotPresent, kNotPresent, kNotPresent,   // S0
      kNotPresent, kNotPresent, kDiscardable,  // S1
      kNotPresent, kNotPresent, kRequired},    // S2
     // Id 5: Delta, S2T2
     {kNotPresent, kNotPresent, kNotPresent,    // S0
      kNotPresent, kNotPresent, kNotPresent,    // S1
      kNotPresent, kNotPresent, kDiscardable},  // S2
     // Id 6: Delta, S0T1
     {kNotPresent, kDiscardable, kSwitch,  // S0
      kNotPresent, kRequired, kRequired,   // S1
      kNotPresent, kRequired, kRequired},  // S2
     // Id 7: Delta, S1T1
     {kNotPresent, kNotPresent, kNotPresent,  // S0
      kNotPresent, kDiscardable, kSwitch,     // S1
      kNotPresent, kRequired, kRequired},     // S2
     // Id 8: Delta, S2T1
     {kNotPresent, kNotPresent, kNotPresent,  // S0
      kNotPresent, kNotPresent, kNotPresent,  // S1
      kNotPresent, kDiscardable, kSwitch},    // S2
     // Id 9: Delta, S0T0
     {kSwitch, kSwitch, kSwitch,         // S0
      kRequired, kRequired, kRequired,   // S1
      kRequired, kRequired, kRequired},  // S2
     // Id 10: Delta, S1T0
     {kNotPresent, kNotPresent, kNotPresent,  // S0
      kSwitch, kSwitch, kSwitch,              // S1
      kRequired, kRequired, kRequired},       // S2
     // Id 11: Delta, S2T0
     {kNotPresent, kNotPresent, kNotPresent,  // S0
      kNotPresent, kNotPresent, kNotPresent,  // S1
      kSwitch, kSwitch, kSwitch},             // S2
 };

 }  // namespace

 // Out-of-line destructor definition; the compiler-generated body is used.
 ScalabilityStructureL3T3::~ScalabilityStructureL3T3() = default;

 // Reports the layer layout of this structure: three spatial layers and three
 // temporal layers. Scaling factors are set explicitly for spatial layers 0
 // (1/4) and 1 (1/2); the entry for layer 2 is not assigned here.
 ScalableVideoController::StreamLayersConfig
 ScalabilityStructureL3T3::StreamConfig() const {
   // {numerator, denominator} of the scaling factor for spatial layers 0 and 1.
   constexpr int kScaling[2][2] = {{1, 4}, {1, 2}};

   StreamLayersConfig layers;
   layers.num_spatial_layers = 3;
   layers.num_temporal_layers = 3;
   for (int sid = 0; sid < 2; ++sid) {
     layers.scaling_factor_num[sid] = kScaling[sid][0];
     layers.scaling_factor_den[sid] = kScaling[sid][1];
   }
   return layers;
 }

 // Builds the FrameDependencyStructure advertised for this scalability mode:
 // 9 decode targets, 3 chains and 15 frame dependency templates.
 FrameDependencyStructure ScalabilityStructureL3T3::DependencyStructure() const {
   FrameDependencyStructure structure;
   structure.num_decode_targets = 9;
   structure.num_chains = 3;
   // Decode targets 0-2 are protected by chain 0, 3-5 by chain 1 and 6-8 by
   // chain 2 (presumably one chain per spatial layer - confirm).
   structure.decode_target_protected_by_chain = {0, 0, 0, 1, 1, 1, 2, 2, 2};
   auto& t = structure.templates;
   t.resize(15);
   // Templates are shown in the order frames following them appear in the
   // stream, but in `structure.templates` array templates are sorted by
   // (`spatial_id`, `temporal_id`) since that is a dependency descriptor
   // requirement. Indexes are written in hex for nicer alignment.
   // The first three lines describe the key-frame temporal unit; the S0
   // template there is the only one without FrameDiffs.
   t[0x1].S(0).T(0).Dtis("SSSSSSSSS").ChainDiffs({0, 0, 0});
   t[0x6].S(1).T(0).Dtis("---SSSSSS").ChainDiffs({1, 1, 1}).FrameDiffs({1});
   t[0xB].S(2).T(0).Dtis("------SSS").ChainDiffs({2, 1, 1}).FrameDiffs({1});
   // T2 templates (first set).
   t[0x3].S(0).T(2).Dtis("--D--R--R").ChainDiffs({3, 2, 1}).FrameDiffs({3});
   t[0x8].S(1).T(2).Dtis("-----D--R").ChainDiffs({4, 3, 2}).FrameDiffs({3, 1});
   t[0xD].S(2).T(2).Dtis("--------D").ChainDiffs({5, 4, 3}).FrameDiffs({3, 1});
   // T1 templates.
   t[0x2].S(0).T(1).Dtis("-DS-RR-RR").ChainDiffs({6, 5, 4}).FrameDiffs({6});
   t[0x7].S(1).T(1).Dtis("----DS-RR").ChainDiffs({7, 6, 5}).FrameDiffs({6, 1});
   t[0xC].S(2).T(1).Dtis("-------DS").ChainDiffs({8, 7, 6}).FrameDiffs({6, 1});
   // T2 templates (second set): same Dtis and FrameDiffs as the first set but
   // larger ChainDiffs.
   t[0x4].S(0).T(2).Dtis("--D--R--R").ChainDiffs({9, 8, 7}).FrameDiffs({3});
   t[0x9].S(1).T(2).Dtis("-----D--R").ChainDiffs({10, 9, 8}).FrameDiffs({3, 1});
   t[0xE].S(2).T(2).Dtis("--------D").ChainDiffs({11, 10, 9}).FrameDiffs({3, 1});
   // T0 delta templates.
   t[0x0].S(0).T(0).Dtis("SSSRRRRRR").ChainDiffs({12, 11, 10}).FrameDiffs({12});
   t[0x5].S(1).T(0).Dtis("---SSSRRR").ChainDiffs({1, 1, 1}).FrameDiffs({12, 1});
   t[0xA].S(2).T(0).Dtis("------SSS").ChainDiffs({2, 1, 1}).FrameDiffs({12, 1});
   return structure;
 }

 // Returns the configuration of a key frame: id 0, spatial layer 0, temporal
 // layer 0, flagged as a key frame and updating buffer 0.
 ScalableVideoController::LayerFrameConfig
 ScalabilityStructureL3T3::KeyFrameConfig() const {
   LayerFrameConfig key_frame;
   key_frame.Id(0).S(0).T(0).Keyframe().Update(0);
   return key_frame;
 }

 // Returns the three layer-frame configurations (one per spatial layer, in
 // order S0, S1, S2) for the next temporal unit and advances `next_pattern_`.
 // When `restart` is true the pattern is first reset to the key-frame pattern.
 // The patterns follow each other as
 //   kKeyFrame -> kDeltaFrameT2A -> kDeltaFrameT1 -> kDeltaFrameT2B ->
 //   kDeltaFrameT0 -> kDeltaFrameT2A -> ...
 std::vector<ScalableVideoController::LayerFrameConfig>
 ScalabilityStructureL3T3::NextFrameConfig(bool restart) {
   if (restart) {
     next_pattern_ = kKeyFrame;
   }
   std::vector<LayerFrameConfig> config(3);

   // Name each of the 8 buffers used by this structure after the layer of the
   // frame that the buffer keeps.
   static constexpr int kS0T0 = 0;
   static constexpr int kS1T0 = 1;
   static constexpr int kS2T0 = 2;
   static constexpr int kS0T1 = 3;
   static constexpr int kS1T1 = 4;
   static constexpr int kS2T1 = 5;
   static constexpr int kS0T2 = 6;
   static constexpr int kS1T2 = 7;
   switch (next_pattern_) {
     case kKeyFrame:
       // S0 is a key frame; S1 and S2 reference only the T0 buffer of the
       // spatial layer directly below. All three store into their T0 buffer.
       config[0].Id(0).S(0).T(0).Keyframe().Update(kS0T0);
       config[1].Id(1).S(1).T(0).Update(kS1T0).Reference(kS0T0);
       config[2].Id(2).S(2).T(0).Update(kS2T0).Reference(kS1T0);
       next_pattern_ = kDeltaFrameT2A;
       break;
     case kDeltaFrameT2A:
       // T2 frames that reference the T0 buffer of their own spatial layer
       // (S1 and S2 also reference the T2 buffer of the layer below). The S2
       // frame is not stored in any buffer.
       config[0].Id(3).S(0).T(2).Reference(kS0T0).Update(kS0T2);
       config[1].Id(4).S(1).T(2).Reference(kS1T0).Reference(kS0T2).Update(kS1T2);
       config[2].Id(5).S(2).T(2).Reference(kS2T0).Reference(kS1T2);
       next_pattern_ = kDeltaFrameT1;
       break;
     case kDeltaFrameT1:
       // T1 frames reference the T0 buffer of their own spatial layer (S1 and
       // S2 also reference the T1 buffer of the layer below) and are stored in
       // the T1 buffers.
       config[0].Id(6).S(0).T(1).Reference(kS0T0).Update(kS0T1);
       config[1].Id(7).S(1).T(1).Reference(kS1T0).Reference(kS0T1).Update(kS1T1);
       config[2].Id(8).S(2).T(1).Reference(kS2T0).Reference(kS1T1).Update(kS2T1);
       next_pattern_ = kDeltaFrameT2B;
       break;
     case kDeltaFrameT2B:
       // Same ids (3-5) as kDeltaFrameT2A, but the own-layer reference is the
       // T1 buffer instead of the T0 buffer.
       config[0].Id(3).S(0).T(2).Reference(kS0T1).Update(kS0T2);
       config[1].Id(4).S(1).T(2).Reference(kS1T1).Reference(kS0T2).Update(kS1T2);
       config[2].Id(5).S(2).T(2).Reference(kS2T1).Reference(kS1T2);
       next_pattern_ = kDeltaFrameT0;
       break;
     case kDeltaFrameT0:
       // T0 delta frames reference and overwrite the T0 buffer of their own
       // spatial layer; S1 and S2 additionally reference the T0 buffer of the
       // layer below. The cycle then continues with kDeltaFrameT2A.
       config[0].Id(9).S(0).T(0).ReferenceAndUpdate(kS0T0);
       config[1].Id(10).S(1).T(0).ReferenceAndUpdate(kS1T0).Reference(kS0T0);
       config[2].Id(11).S(2).T(0).ReferenceAndUpdate(kS2T0).Reference(kS1T0);
       next_pattern_ = kDeltaFrameT2A;
       break;
   }
   return config;
 }

 // Translates the configuration of an encoded layer frame into the
 // GenericFrameInfo that describes it. A key frame reported under a non-zero
 // id is treated as an unrequested key frame and replaced by a key-frame
 // configuration (id 0, S0, T0) that updates all eight buffers. Returns an
 // empty optional when the id does not index a row of `kDtis`.
 absl::optional<GenericFrameInfo> ScalabilityStructureL3T3::OnEncodeDone(
     LayerFrameConfig config) {
   const bool unrequested_key_frame = config.IsKeyframe() && config.Id() != 0;
   if (unrequested_key_frame) {
     // Encoder generated a key frame without asking to.
     if (config.SpatialId() > 0) {
       RTC_LOG(LS_WARNING) << "Unexpected spatial id " << config.SpatialId()
                           << " for key frame.";
     }
     LayerFrameConfig key_frame;
     key_frame.Keyframe().Id(0).S(0).T(0);
     for (int buffer = 0; buffer < 8; ++buffer) {
       key_frame.Update(buffer);
     }
     config = key_frame;
   }

   absl::optional<GenericFrameInfo> info;
   const int id = config.Id();
   constexpr int kNumConfigIds = int{ABSL_ARRAYSIZE(kDtis)};
   if (id < 0 || id >= kNumConfigIds) {
     RTC_LOG(LS_ERROR) << "Unexpected config id " << id;
     return info;
   }

   info.emplace();
   info->spatial_id = config.SpatialId();
   info->temporal_id = config.TemporalId();
   info->encoder_buffers = config.Buffers();
   const auto& dtis = kDtis[id];
   info->decode_target_indications.assign(std::begin(dtis), std::end(dtis));

   // Only T0 frames belong to chains: an S0 frame is part of all three chains,
   // an S1 frame of chains 1 and 2, and an S2 frame of chain 2 only.
   const bool on_t0 = config.TemporalId() == 0;
   info->part_of_chain = {on_t0 && config.SpatialId() == 0,
                          on_t0 && config.SpatialId() <= 1, on_t0};
   return info;
 }

 }  // namespace webrtc
	/*
	* Copyright (c) 2020 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/
	#include "modules/video_coding/codecs/av1/scalability_structure_l3t3.h"

	#include <utility>
	#include <vector>

	#include "absl/base/macros.h"
	#include "absl/types/optional.h"
	#include "api/transport/rtp/dependency_descriptor.h"
	#include "rtc_base/logging.h"

	namespace webrtc {
	namespace {

	// Short aliases for the DecodeTargetIndication enumerators; they keep the
	// table below compact.
	constexpr auto kNotPresent = DecodeTargetIndication::kNotPresent;
	constexpr auto kDiscardable = DecodeTargetIndication::kDiscardable;
	constexpr auto kSwitch = DecodeTargetIndication::kSwitch;
	constexpr auto kRequired = DecodeTargetIndication::kRequired;

	// Decode target indications for every frame configuration of this structure.
	// Rows are indexed by `LayerFrameConfig::Id()`: OnEncodeDone() looks up
	// `kDtis[config.Id()]`, and NextFrameConfig() assigns ids 0-2 to the key-frame
	// pattern and ids 3-11 to the delta-frame patterns. Every row has nine
	// entries, one per decode target, laid out as three groups of three that are
	// labelled S0, S1 and S2 (presumably T0, T1, T2 within each group - confirm
	// against the Dtis strings in DependencyStructure()).
	constexpr DecodeTargetIndication kDtis[12][9] = {
	// Id 0: Key, S0
	{kSwitch, kSwitch, kSwitch, // S0
	kSwitch, kSwitch, kSwitch, // S1
	kSwitch, kSwitch, kSwitch}, // S2
	// Id 1: Key, S1
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kSwitch, kSwitch, kSwitch, // S1
	kSwitch, kSwitch, kSwitch}, // S2
	// Id 2: Key, S2
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kNotPresent, kNotPresent, kNotPresent, // S1
	kSwitch, kSwitch, kSwitch}, // S2
	// Id 3: Delta, S0T2
	{kNotPresent, kNotPresent, kDiscardable, // S0
	kNotPresent, kNotPresent, kRequired, // S1
	kNotPresent, kNotPresent, kRequired}, // S2
	// Id 4: Delta, S1T2
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kNotPresent, kNotPresent, kDiscardable, // S1
	kNotPresent, kNotPresent, kRequired}, // S2
	// Id 5: Delta, S2T2
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kNotPresent, kNotPresent, kNotPresent, // S1
	kNotPresent, kNotPresent, kDiscardable}, // S2
	// Id 6: Delta, S0T1
	{kNotPresent, kDiscardable, kSwitch, // S0
	kNotPresent, kRequired, kRequired, // S1
	kNotPresent, kRequired, kRequired}, // S2
	// Id 7: Delta, S1T1
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kNotPresent, kDiscardable, kSwitch, // S1
	kNotPresent, kRequired, kRequired}, // S2
	// Id 8: Delta, S2T1
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kNotPresent, kNotPresent, kNotPresent, // S1
	kNotPresent, kDiscardable, kSwitch}, // S2
	// Id 9: Delta, S0T0
	{kSwitch, kSwitch, kSwitch, // S0
	kRequired, kRequired, kRequired, // S1
	kRequired, kRequired, kRequired}, // S2
	// Id 10: Delta, S1T0
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kSwitch, kSwitch, kSwitch, // S1
	kRequired, kRequired, kRequired}, // S2
	// Id 11: Delta, S2T0
	{kNotPresent, kNotPresent, kNotPresent, // S0
	kNotPresent, kNotPresent, kNotPresent, // S1
	kSwitch, kSwitch, kSwitch}, // S2
	};

	} // namespace

	// Out-of-line destructor definition; the compiler-generated body is used.
	ScalabilityStructureL3T3::~ScalabilityStructureL3T3() = default;

	// Reports the layer layout of this structure: three spatial layers and three
	// temporal layers. Scaling factors are set explicitly for spatial layers 0
	// (1/4) and 1 (1/2); the entry for layer 2 is not assigned here.
	ScalableVideoController::StreamLayersConfig
	ScalabilityStructureL3T3::StreamConfig() const {
		// {numerator, denominator} of the scaling factor for spatial layers 0 and 1.
		constexpr int kScaling[2][2] = {{1, 4}, {1, 2}};

		StreamLayersConfig layers;
		layers.num_spatial_layers = 3;
		layers.num_temporal_layers = 3;
		for (int sid = 0; sid < 2; ++sid) {
			layers.scaling_factor_num[sid] = kScaling[sid][0];
			layers.scaling_factor_den[sid] = kScaling[sid][1];
		}
		return layers;
	}

	// Builds the FrameDependencyStructure advertised for this scalability mode:
	// 9 decode targets, 3 chains and 15 frame dependency templates.
	FrameDependencyStructure ScalabilityStructureL3T3::DependencyStructure() const {
	FrameDependencyStructure structure;
	structure.num_decode_targets = 9;
	structure.num_chains = 3;
	// Decode targets 0-2 are protected by chain 0, 3-5 by chain 1 and 6-8 by
	// chain 2 (presumably one chain per spatial layer - confirm).
	structure.decode_target_protected_by_chain = {0, 0, 0, 1, 1, 1, 2, 2, 2};
	auto& t = structure.templates;
	t.resize(15);
	// Templates are shown in the order frames following them appear in the
	// stream, but in `structure.templates` array templates are sorted by
	// (`spatial_id`, `temporal_id`) since that is a dependency descriptor
	// requirement. Indexes are written in hex for nicer alignment.
	// The first three lines describe the key-frame temporal unit; the S0
	// template there is the only one without FrameDiffs.
	t[0x1].S(0).T(0).Dtis("SSSSSSSSS").ChainDiffs({0, 0, 0});
	t[0x6].S(1).T(0).Dtis("---SSSSSS").ChainDiffs({1, 1, 1}).FrameDiffs({1});
	t[0xB].S(2).T(0).Dtis("------SSS").ChainDiffs({2, 1, 1}).FrameDiffs({1});
	// T2 templates (first set).
	t[0x3].S(0).T(2).Dtis("--D--R--R").ChainDiffs({3, 2, 1}).FrameDiffs({3});
	t[0x8].S(1).T(2).Dtis("-----D--R").ChainDiffs({4, 3, 2}).FrameDiffs({3, 1});
	t[0xD].S(2).T(2).Dtis("--------D").ChainDiffs({5, 4, 3}).FrameDiffs({3, 1});
	// T1 templates.
	t[0x2].S(0).T(1).Dtis("-DS-RR-RR").ChainDiffs({6, 5, 4}).FrameDiffs({6});
	t[0x7].S(1).T(1).Dtis("----DS-RR").ChainDiffs({7, 6, 5}).FrameDiffs({6, 1});
	t[0xC].S(2).T(1).Dtis("-------DS").ChainDiffs({8, 7, 6}).FrameDiffs({6, 1});
	// T2 templates (second set): same Dtis and FrameDiffs as the first set but
	// larger ChainDiffs.
	t[0x4].S(0).T(2).Dtis("--D--R--R").ChainDiffs({9, 8, 7}).FrameDiffs({3});
	t[0x9].S(1).T(2).Dtis("-----D--R").ChainDiffs({10, 9, 8}).FrameDiffs({3, 1});
	t[0xE].S(2).T(2).Dtis("--------D").ChainDiffs({11, 10, 9}).FrameDiffs({3, 1});
	// T0 delta templates.
	t[0x0].S(0).T(0).Dtis("SSSRRRRRR").ChainDiffs({12, 11, 10}).FrameDiffs({12});
	t[0x5].S(1).T(0).Dtis("---SSSRRR").ChainDiffs({1, 1, 1}).FrameDiffs({12, 1});
	t[0xA].S(2).T(0).Dtis("------SSS").ChainDiffs({2, 1, 1}).FrameDiffs({12, 1});
	return structure;
	}

	// Returns the configuration of a key frame: id 0, spatial layer 0, temporal
	// layer 0, flagged as a key frame and updating buffer 0.
	ScalableVideoController::LayerFrameConfig
	ScalabilityStructureL3T3::KeyFrameConfig() const {
		LayerFrameConfig key_frame;
		key_frame.Id(0).S(0).T(0).Keyframe().Update(0);
		return key_frame;
	}

	// Returns the three layer-frame configurations (one per spatial layer, in
	// order S0, S1, S2) for the next temporal unit and advances `next_pattern_`.
	// When `restart` is true the pattern is first reset to the key-frame pattern.
	// The patterns follow each other as
	//   kKeyFrame -> kDeltaFrameT2A -> kDeltaFrameT1 -> kDeltaFrameT2B ->
	//   kDeltaFrameT0 -> kDeltaFrameT2A -> ...
	std::vector<ScalableVideoController::LayerFrameConfig>
	ScalabilityStructureL3T3::NextFrameConfig(bool restart) {
	if (restart) {
	next_pattern_ = kKeyFrame;
	}
	std::vector<LayerFrameConfig> config(3);

	// Name each of the 8 buffers used by this structure after the layer of the
	// frame that the buffer keeps.
	static constexpr int kS0T0 = 0;
	static constexpr int kS1T0 = 1;
	static constexpr int kS2T0 = 2;
	static constexpr int kS0T1 = 3;
	static constexpr int kS1T1 = 4;
	static constexpr int kS2T1 = 5;
	static constexpr int kS0T2 = 6;
	static constexpr int kS1T2 = 7;
	switch (next_pattern_) {
	case kKeyFrame:
	// S0 is a key frame; S1 and S2 reference only the T0 buffer of the
	// spatial layer directly below. All three store into their T0 buffer.
	config[0].Id(0).S(0).T(0).Keyframe().Update(kS0T0);
	config[1].Id(1).S(1).T(0).Update(kS1T0).Reference(kS0T0);
	config[2].Id(2).S(2).T(0).Update(kS2T0).Reference(kS1T0);
	next_pattern_ = kDeltaFrameT2A;
	break;
	case kDeltaFrameT2A:
	// T2 frames that reference the T0 buffer of their own spatial layer
	// (S1 and S2 also reference the T2 buffer of the layer below). The S2
	// frame is not stored in any buffer.
	config[0].Id(3).S(0).T(2).Reference(kS0T0).Update(kS0T2);
	config[1].Id(4).S(1).T(2).Reference(kS1T0).Reference(kS0T2).Update(kS1T2);
	config[2].Id(5).S(2).T(2).Reference(kS2T0).Reference(kS1T2);
	next_pattern_ = kDeltaFrameT1;
	break;
	case kDeltaFrameT1:
	// T1 frames reference the T0 buffer of their own spatial layer (S1 and
	// S2 also reference the T1 buffer of the layer below) and are stored in
	// the T1 buffers.
	config[0].Id(6).S(0).T(1).Reference(kS0T0).Update(kS0T1);
	config[1].Id(7).S(1).T(1).Reference(kS1T0).Reference(kS0T1).Update(kS1T1);
	config[2].Id(8).S(2).T(1).Reference(kS2T0).Reference(kS1T1).Update(kS2T1);
	next_pattern_ = kDeltaFrameT2B;
	break;
	case kDeltaFrameT2B:
	// Same ids (3-5) as kDeltaFrameT2A, but the own-layer reference is the
	// T1 buffer instead of the T0 buffer.
	config[0].Id(3).S(0).T(2).Reference(kS0T1).Update(kS0T2);
	config[1].Id(4).S(1).T(2).Reference(kS1T1).Reference(kS0T2).Update(kS1T2);
	config[2].Id(5).S(2).T(2).Reference(kS2T1).Reference(kS1T2);
	next_pattern_ = kDeltaFrameT0;
	break;
	case kDeltaFrameT0:
	// T0 delta frames reference and overwrite the T0 buffer of their own
	// spatial layer; S1 and S2 additionally reference the T0 buffer of the
	// layer below. The cycle then continues with kDeltaFrameT2A.
	config[0].Id(9).S(0).T(0).ReferenceAndUpdate(kS0T0);
	config[1].Id(10).S(1).T(0).ReferenceAndUpdate(kS1T0).Reference(kS0T0);
	config[2].Id(11).S(2).T(0).ReferenceAndUpdate(kS2T0).Reference(kS1T0);
	next_pattern_ = kDeltaFrameT2A;
	break;
	}
	return config;
	}

	// Translates the configuration of an encoded layer frame into the
	// GenericFrameInfo that describes it.
	//
	// A key frame reported under a non-zero id is treated as a key frame the
	// encoder produced without being asked to: `config` is replaced by a
	// key-frame configuration (id 0, S0, T0) that updates all eight buffers, and
	// a warning is logged if the frame was reported for a spatial layer above 0.
	//
	// Returns an empty optional (and logs an error) when the id does not index a
	// row of `kDtis`.
	absl::optional<GenericFrameInfo> ScalabilityStructureL3T3::OnEncodeDone(
			LayerFrameConfig config) {
		if (config.IsKeyframe() && config.Id() != 0) {
			// Encoder generated a key frame without asking to.
			if (config.SpatialId() > 0) {
				RTC_LOG(LS_WARNING) << "Unexpected spatial id " << config.SpatialId()
														<< " for key frame.";
			}
			config = LayerFrameConfig()
									 .Keyframe()
									 .Id(0)
									 .S(0)
									 .T(0)
									 .Update(0)
									 .Update(1)
									 .Update(2)
									 .Update(3)
									 .Update(4)
									 .Update(5)
									 .Update(6)
									 .Update(7);
		}

		absl::optional<GenericFrameInfo> frame_info;
		// Reject ids that would index outside of the kDtis table.
		if (config.Id() < 0 || config.Id() >= int{ABSL_ARRAYSIZE(kDtis)}) {
			RTC_LOG(LS_ERROR) << "Unexpected config id " << config.Id();
			return frame_info;
		}
		frame_info.emplace();
		frame_info->spatial_id = config.SpatialId();
		frame_info->temporal_id = config.TemporalId();
		frame_info->encoder_buffers = config.Buffers();
		frame_info->decode_target_indications.assign(std::begin(kDtis[config.Id()]),
																								 std::end(kDtis[config.Id()]));
		// Only T0 frames belong to chains: an S0 frame is part of all three
		// chains, an S1 frame of chains 1 and 2, and an S2 frame of chain 2 only.
		if (config.TemporalId() == 0) {
			frame_info->part_of_chain = {config.SpatialId() == 0,
																	 config.SpatialId() <= 1, true};
		} else {
			frame_info->part_of_chain = {false, false, false};
		}
		return frame_info;
	}

	} // namespace webrtc