media/base/videoadapter.cc - src - Git at Google

 /*
  *  Copyright (c) 2010 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #include "media/base/videoadapter.h"

 #include <algorithm>
 #include <cmath>
 #include <cstdlib>
 #include <limits>
 #include <utility>

 #include "absl/types/optional.h"
 #include "media/base/mediaconstants.h"
 #include "media/base/videocommon.h"
 #include "rtc_base/arraysize.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/logging.h"

 namespace {
 // A rational scale factor, numerator / denominator, applied to each dimension
 // of a frame.
 struct Fraction {
   int numerator;
   int denominator;

   // Returns the number of output pixels obtained when both the width and the
   // height of an input with |input_pixels| pixels are scaled by
   // numerator / denominator. The intermediate products are computed in 64 bits
   // so that numerator^2 * input_pixels cannot overflow an int.
   int scale_pixel_count(int input_pixels) const {
     const int64_t scaled_numerator =
         static_cast<int64_t>(numerator) * numerator * input_pixels;
     const int64_t squared_denominator =
         static_cast<int64_t>(denominator) * denominator;
     return static_cast<int>(scaled_numerator / squared_denominator);
   }
 };

 // Aligns |value_to_round| to a multiple of |multiple|. The next multiple at or
 // above the value is preferred; if that would exceed |max_value|, the largest
 // multiple that does not exceed |max_value| is returned instead.
 int roundUp(int value_to_round, int multiple, int max_value) {
   const int block_count = (value_to_round + multiple - 1) / multiple;
   const int aligned_up = block_count * multiple;
   if (aligned_up <= max_value)
     return aligned_up;

   // Rounding up overshoots the limit, so fall back to rounding the limit down.
   return max_value / multiple * multiple;
 }

 // Picks the downscale factor that brings |input_pixels| as close as possible
 // to |target_pixels| while keeping the result at or below |max_pixels|. The
 // input is never scaled up: 1/1 is returned when it already fits the target.
 Fraction FindScale(int input_pixels, int target_pixels, int max_pixels) {
   // A non-positive target, or a max below the target, is a caller error.
   RTC_DCHECK_GT(target_pixels, 0);
   RTC_DCHECK_GT(max_pixels, 0);
   RTC_DCHECK_GE(max_pixels, target_pixels);

   // Upscaling is never wanted.
   if (input_pixels <= target_pixels)
     return Fraction{1, 1};

   Fraction candidate{1, 1};
   Fraction closest{1, 1};
   // Smallest absolute distance between an accepted output size and the
   // target. The unscaled input only competes when it is within |max_pixels|.
   int smallest_diff = input_pixels <= max_pixels
                           ? std::abs(input_pixels - target_pixels)
                           : std::numeric_limits<int>::max();

   // Step down by alternating factors of 3/4 and 2/3, which yields fractions
   // that scale efficiently. Starting from 1280x720 the sequence is
   // (3/4) => 960x540, (1/2) => 640x360, (3/8) => 480x270,
   // (1/4) => 320x180, (3/16) => 240x135, (1/8) => 160x90.
   while (candidate.scale_pixel_count(input_pixels) > target_pixels) {
     const bool can_take_two_thirds =
         candidate.numerator % 3 == 0 && candidate.denominator % 2 == 0;
     if (can_take_two_thirds) {
       // Equivalent to multiplying the fraction by 2/3.
       candidate.numerator /= 3;
       candidate.denominator /= 2;
     } else {
       // Equivalent to multiplying the fraction by 3/4.
       candidate.numerator *= 3;
       candidate.denominator *= 4;
     }

     const int scaled_pixels = candidate.scale_pixel_count(input_pixels);
     if (scaled_pixels > max_pixels)
       continue;  // Still above the hard limit; not an acceptable result.

     const int diff = std::abs(target_pixels - scaled_pixels);
     if (diff < smallest_diff) {
       smallest_diff = diff;
       closest = candidate;
     }
   }

   return closest;
 }
 }  // namespace

 namespace cricket {

 // Constructs an adapter whose frame counters and previous output dimensions
 // start at zero. |required_resolution_alignment| is stored and later used as
 // the multiple that cropped and output dimensions are aligned to. The
 // resolution and framerate requests start at the maximum int value, i.e. no
 // restriction has been requested yet.
 VideoAdapter::VideoAdapter(int required_resolution_alignment)
     : frames_in_(0),
       frames_out_(0),
       frames_scaled_(0),
       adaption_changes_(0),
       previous_width_(0),
       previous_height_(0),
       required_resolution_alignment_(required_resolution_alignment),
       resolution_request_target_pixel_count_(std::numeric_limits<int>::max()),
       resolution_request_max_pixel_count_(std::numeric_limits<int>::max()),
       max_framerate_request_(std::numeric_limits<int>::max()) {}

 // Default constructor: delegates with a required resolution alignment of 1.
 VideoAdapter::VideoAdapter() : VideoAdapter(1) {}

 // Nothing to release explicitly; members clean up after themselves.
 VideoAdapter::~VideoAdapter() = default;

 // Decides whether the frame stamped |in_timestamp_ns| should be kept (true)
 // or dropped (false) in order to honour the requested frame interval.
 bool VideoAdapter::KeepFrame(int64_t in_timestamp_ns) {
   rtc::CritScope cs(&critical_section_);
   // A non-positive framerate request means every frame is dropped.
   if (max_framerate_request_ <= 0)
     return false;

   // The effective interval is the longer of the one in the requested format
   // (if any) and the one implied by the framerate request. When no framerate
   // has been requested the member holds maxint and the division rounds to 0.
   const int64_t format_interval_ns =
       requested_format_ ? requested_format_->interval : 0;
   const int64_t min_interval_ns = std::max<int64_t>(
       format_interval_ns, rtc::kNumNanosecsPerSec / max_framerate_request_);

   // No positive interval: frame rate throttling is not enabled.
   if (min_interval_ns <= 0)
     return true;

   if (next_frame_timestamp_ns_) {
     // Positive while the next output is still due in the future.
     const int64_t ns_until_due = *next_frame_timestamp_ns_ - in_timestamp_ns;
     const bool within_expected_range =
         std::abs(ns_until_due) < 2 * min_interval_ns;

     if (within_expected_range) {
       // Too early for another output frame: drop this one.
       if (ns_until_due > 0)
         return false;
       // Due now: emit the frame and schedule the following one.
       *next_frame_timestamp_ns_ += min_interval_ns;
       return true;
     }
   }

   // Either this is the first timestamp or it is far outside the expected
   // range, so restart the schedule. The first target is only half an interval
   // away, which favours keeping frames when timestamps jitter.
   next_frame_timestamp_ns_ = in_timestamp_ns + min_interval_ns / 2;
   return true;
 }

 bool VideoAdapter::AdaptFrameResolution(int in_width,
                                         int in_height,
                                         int64_t in_timestamp_ns,
                                         int* cropped_width,
                                         int* cropped_height,
                                         int* out_width,
                                         int* out_height) {
   rtc::CritScope cs(&critical_section_);
   ++frames_in_;

   // The max output pixel count is the minimum of the requests from
   // OnOutputFormatRequest and OnResolutionRequest.
   int max_pixel_count = resolution_request_max_pixel_count_;
   if (requested_format_) {
     max_pixel_count = std::min(
         max_pixel_count, requested_format_->width * requested_format_->height);
   }
   int target_pixel_count =
       std::min(resolution_request_target_pixel_count_, max_pixel_count);

   // Drop the input frame if necessary.
   if (max_pixel_count <= 0 || !KeepFrame(in_timestamp_ns)) {
     // Show VAdapt log every 90 frames dropped. (3 seconds)
     if ((frames_in_ - frames_out_) % 90 == 0) {
       // TODO(fbarchard): Reduce to LS_VERBOSE when adapter info is not needed
       // in default calls.
       RTC_LOG(LS_INFO) << "VAdapt Drop Frame: scaled " << frames_scaled_
                        << " / out " << frames_out_ << " / in " << frames_in_
                        << " Changes: " << adaption_changes_
                        << " Input: " << in_width << "x" << in_height
                        << " timestamp: " << in_timestamp_ns << " Output: i"
                        << (requested_format_ ? requested_format_->interval : 0);
     }

     // Drop frame.
     return false;
   }

   // Calculate how the input should be cropped.
   if (!requested_format_ ||
       requested_format_->width == 0 || requested_format_->height == 0) {
     *cropped_width = in_width;
     *cropped_height = in_height;
   } else {
     // Adjust |requested_format_| orientation to match input.
     if ((in_width > in_height) !=
         (requested_format_->width > requested_format_->height)) {
       std::swap(requested_format_->width, requested_format_->height);
     }
     const float requested_aspect =
         requested_format_->width /
         static_cast<float>(requested_format_->height);
     *cropped_width =
         std::min(in_width, static_cast<int>(in_height * requested_aspect));
     *cropped_height =
         std::min(in_height, static_cast<int>(in_width / requested_aspect));
   }
   const Fraction scale = FindScale((*cropped_width) * (*cropped_height),
                                    target_pixel_count, max_pixel_count);
   // Adjust cropping slightly to get even integer output size and a perfect
   // scale factor. Make sure the resulting dimensions are aligned correctly
   // to be nice to hardware encoders.
   *cropped_width =
       roundUp(*cropped_width,
               scale.denominator * required_resolution_alignment_, in_width);
   *cropped_height =
       roundUp(*cropped_height,
               scale.denominator * required_resolution_alignment_, in_height);
   RTC_DCHECK_EQ(0, *cropped_width % scale.denominator);
   RTC_DCHECK_EQ(0, *cropped_height % scale.denominator);

   // Calculate final output size.
   *out_width = *cropped_width / scale.denominator * scale.numerator;
   *out_height = *cropped_height / scale.denominator * scale.numerator;
   RTC_DCHECK_EQ(0, *out_width % required_resolution_alignment_);
   RTC_DCHECK_EQ(0, *out_height % required_resolution_alignment_);

   ++frames_out_;
   if (scale.numerator != scale.denominator)
     ++frames_scaled_;

   if (previous_width_ && (previous_width_ != *out_width ||
                           previous_height_ != *out_height)) {
     ++adaption_changes_;
     RTC_LOG(LS_INFO) << "Frame size changed: scaled " << frames_scaled_
                      << " / out " << frames_out_ << " / in " << frames_in_
                      << " Changes: " << adaption_changes_
                      << " Input: " << in_width << "x" << in_height
                      << " Scale: " << scale.numerator << "/"
                      << scale.denominator << " Output: " << *out_width << "x"
                      << *out_height << " i"
                      << (requested_format_ ? requested_format_->interval : 0);
   }

   previous_width_ = *out_width;
   previous_height_ = *out_height;

   return true;
 }

 // Stores the requested output |format| (or clears it when |format| is empty)
 // and discards the frame-rate schedule so that it restarts on the next frame.
 void VideoAdapter::OnOutputFormatRequest(
     const absl::optional<VideoFormat>& format) {
   rtc::CritScope cs(&critical_section_);
   next_frame_timestamp_ns_.reset();
   requested_format_ = format;
 }

 // Records a new resolution / framerate request. When |target_pixel_count| is
 // empty, the target falls back to the stored maximum pixel count.
 void VideoAdapter::OnResolutionFramerateRequest(
     const absl::optional<int>& target_pixel_count,
     int max_pixel_count,
     int max_framerate_fps) {
   rtc::CritScope cs(&critical_section_);
   max_framerate_request_ = max_framerate_fps;
   resolution_request_max_pixel_count_ = max_pixel_count;
   resolution_request_target_pixel_count_ =
       target_pixel_count.has_value() ? *target_pixel_count
                                      : resolution_request_max_pixel_count_;
 }

 }  // namespace cricket
	/*
	* Copyright (c) 2010 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#include "media/base/videoadapter.h"

	#include <algorithm>
	#include <cmath>
	#include <cstdlib>
	#include <limits>
	#include <utility>

	#include "absl/types/optional.h"
	#include "media/base/mediaconstants.h"
	#include "media/base/videocommon.h"
	#include "rtc_base/arraysize.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/logging.h"

	namespace {
	// A rational scale factor, numerator / denominator, applied to each dimension
	// of a frame.
	struct Fraction {
	  int numerator;
	  int denominator;

	  // Returns the number of output pixels obtained when both the width and the
	  // height of an input with |input_pixels| pixels are scaled by
	  // numerator / denominator. The intermediate products are computed in 64
	  // bits so that numerator^2 * input_pixels cannot overflow an int.
	  int scale_pixel_count(int input_pixels) const {
	    const int64_t scaled_numerator =
	        static_cast<int64_t>(numerator) * numerator * input_pixels;
	    const int64_t squared_denominator =
	        static_cast<int64_t>(denominator) * denominator;
	    return static_cast<int>(scaled_numerator / squared_denominator);
	  }
	};

	// Aligns |value_to_round| to a multiple of |multiple|. The next multiple at or
	// above the value is preferred; if that would exceed |max_value|, the largest
	// multiple that does not exceed |max_value| is returned instead.
	int roundUp(int value_to_round, int multiple, int max_value) {
	  const int block_count = (value_to_round + multiple - 1) / multiple;
	  const int aligned_up = block_count * multiple;
	  if (aligned_up <= max_value)
	    return aligned_up;

	  // Rounding up overshoots the limit, so fall back to rounding the limit down.
	  return max_value / multiple * multiple;
	}

	// Picks the downscale factor that brings |input_pixels| as close as possible
	// to |target_pixels| while keeping the result at or below |max_pixels|. The
	// input is never scaled up: 1/1 is returned when it already fits the target.
	Fraction FindScale(int input_pixels, int target_pixels, int max_pixels) {
	  // A non-positive target, or a max below the target, is a caller error.
	  RTC_DCHECK_GT(target_pixels, 0);
	  RTC_DCHECK_GT(max_pixels, 0);
	  RTC_DCHECK_GE(max_pixels, target_pixels);

	  // Upscaling is never wanted.
	  if (input_pixels <= target_pixels)
	    return Fraction{1, 1};

	  Fraction candidate{1, 1};
	  Fraction closest{1, 1};
	  // Smallest absolute distance between an accepted output size and the
	  // target. The unscaled input only competes when it is within |max_pixels|.
	  int smallest_diff = input_pixels <= max_pixels
	                          ? std::abs(input_pixels - target_pixels)
	                          : std::numeric_limits<int>::max();

	  // Step down by alternating factors of 3/4 and 2/3, which yields fractions
	  // that scale efficiently. Starting from 1280x720 the sequence is
	  // (3/4) => 960x540, (1/2) => 640x360, (3/8) => 480x270,
	  // (1/4) => 320x180, (3/16) => 240x135, (1/8) => 160x90.
	  while (candidate.scale_pixel_count(input_pixels) > target_pixels) {
	    const bool can_take_two_thirds =
	        candidate.numerator % 3 == 0 && candidate.denominator % 2 == 0;
	    if (can_take_two_thirds) {
	      // Equivalent to multiplying the fraction by 2/3.
	      candidate.numerator /= 3;
	      candidate.denominator /= 2;
	    } else {
	      // Equivalent to multiplying the fraction by 3/4.
	      candidate.numerator *= 3;
	      candidate.denominator *= 4;
	    }

	    const int scaled_pixels = candidate.scale_pixel_count(input_pixels);
	    if (scaled_pixels > max_pixels)
	      continue;  // Still above the hard limit; not an acceptable result.

	    const int diff = std::abs(target_pixels - scaled_pixels);
	    if (diff < smallest_diff) {
	      smallest_diff = diff;
	      closest = candidate;
	    }
	  }

	  return closest;
	}
	} // namespace

	namespace cricket {

	// Constructs an adapter whose frame counters and previous output dimensions
	// start at zero. |required_resolution_alignment| is stored and later used as
	// the multiple that cropped and output dimensions are aligned to. The
	// resolution and framerate requests start at the maximum int value, i.e. no
	// restriction has been requested yet.
	VideoAdapter::VideoAdapter(int required_resolution_alignment)
	: frames_in_(0),
	frames_out_(0),
	frames_scaled_(0),
	adaption_changes_(0),
	previous_width_(0),
	previous_height_(0),
	required_resolution_alignment_(required_resolution_alignment),
	resolution_request_target_pixel_count_(std::numeric_limits<int>::max()),
	resolution_request_max_pixel_count_(std::numeric_limits<int>::max()),
	max_framerate_request_(std::numeric_limits<int>::max()) {}

	// Default constructor: delegates with a required resolution alignment of 1.
	VideoAdapter::VideoAdapter() : VideoAdapter(1) {}

	// Nothing to release explicitly; members clean up after themselves.
	VideoAdapter::~VideoAdapter() = default;

	// Decides whether the frame stamped |in_timestamp_ns| should be kept (true)
	// or dropped (false) in order to honour the requested frame interval.
	bool VideoAdapter::KeepFrame(int64_t in_timestamp_ns) {
	  rtc::CritScope cs(&critical_section_);
	  // A non-positive framerate request means every frame is dropped.
	  if (max_framerate_request_ <= 0)
	    return false;

	  // The effective interval is the longer of the one in the requested format
	  // (if any) and the one implied by the framerate request. When no framerate
	  // has been requested the member holds maxint and the division rounds to 0.
	  const int64_t format_interval_ns =
	      requested_format_ ? requested_format_->interval : 0;
	  const int64_t min_interval_ns = std::max<int64_t>(
	      format_interval_ns, rtc::kNumNanosecsPerSec / max_framerate_request_);

	  // No positive interval: frame rate throttling is not enabled.
	  if (min_interval_ns <= 0)
	    return true;

	  if (next_frame_timestamp_ns_) {
	    // Positive while the next output is still due in the future.
	    const int64_t ns_until_due = *next_frame_timestamp_ns_ - in_timestamp_ns;
	    const bool within_expected_range =
	        std::abs(ns_until_due) < 2 * min_interval_ns;

	    if (within_expected_range) {
	      // Too early for another output frame: drop this one.
	      if (ns_until_due > 0)
	        return false;
	      // Due now: emit the frame and schedule the following one.
	      *next_frame_timestamp_ns_ += min_interval_ns;
	      return true;
	    }
	  }

	  // Either this is the first timestamp or it is far outside the expected
	  // range, so restart the schedule. The first target is only half an interval
	  // away, which favours keeping frames when timestamps jitter.
	  next_frame_timestamp_ns_ = in_timestamp_ns + min_interval_ns / 2;
	  return true;
	}

	bool VideoAdapter::AdaptFrameResolution(int in_width,
	int in_height,
	int64_t in_timestamp_ns,
	int* cropped_width,
	int* cropped_height,
	int* out_width,
	int* out_height) {
	rtc::CritScope cs(&critical_section_);
	++frames_in_;

	// The max output pixel count is the minimum of the requests from
	// OnOutputFormatRequest and OnResolutionRequest.
	int max_pixel_count = resolution_request_max_pixel_count_;
	if (requested_format_) {
	max_pixel_count = std::min(
	max_pixel_count, requested_format_->width * requested_format_->height);
	}
	int target_pixel_count =
	std::min(resolution_request_target_pixel_count_, max_pixel_count);

	// Drop the input frame if necessary.
	if (max_pixel_count <= 0 \|\| !KeepFrame(in_timestamp_ns)) {
	// Show VAdapt log every 90 frames dropped. (3 seconds)
	if ((frames_in_ - frames_out_) % 90 == 0) {
	// TODO(fbarchard): Reduce to LS_VERBOSE when adapter info is not needed
	// in default calls.
	RTC_LOG(LS_INFO) << "VAdapt Drop Frame: scaled " << frames_scaled_
	<< " / out " << frames_out_ << " / in " << frames_in_
	<< " Changes: " << adaption_changes_
	<< " Input: " << in_width << "x" << in_height
	<< " timestamp: " << in_timestamp_ns << " Output: i"
	<< (requested_format_ ? requested_format_->interval : 0);
	}

	// Drop frame.
	return false;
	}

	// Calculate how the input should be cropped.
	if (!requested_format_ \|\|
	requested_format_->width == 0 \|\| requested_format_->height == 0) {
	*cropped_width = in_width;
	*cropped_height = in_height;
	} else {
	// Adjust \|requested_format_\| orientation to match input.
	if ((in_width > in_height) !=
	(requested_format_->width > requested_format_->height)) {
	std::swap(requested_format_->width, requested_format_->height);
	}
	const float requested_aspect =
	requested_format_->width /
	static_cast<float>(requested_format_->height);
	*cropped_width =
	std::min(in_width, static_cast<int>(in_height * requested_aspect));
	*cropped_height =
	std::min(in_height, static_cast<int>(in_width / requested_aspect));
	}
	const Fraction scale = FindScale((cropped_width) (*cropped_height),
	target_pixel_count, max_pixel_count);
	// Adjust cropping slightly to get even integer output size and a perfect
	// scale factor. Make sure the resulting dimensions are aligned correctly
	// to be nice to hardware encoders.
	*cropped_width =
	roundUp(*cropped_width,
	scale.denominator * required_resolution_alignment_, in_width);
	*cropped_height =
	roundUp(*cropped_height,
	scale.denominator * required_resolution_alignment_, in_height);
	RTC_DCHECK_EQ(0, *cropped_width % scale.denominator);
	RTC_DCHECK_EQ(0, *cropped_height % scale.denominator);

	// Calculate final output size.
	out_width = cropped_width / scale.denominator * scale.numerator;
	out_height = cropped_height / scale.denominator * scale.numerator;
	RTC_DCHECK_EQ(0, *out_width % required_resolution_alignment_);
	RTC_DCHECK_EQ(0, *out_height % required_resolution_alignment_);

	++frames_out_;
	if (scale.numerator != scale.denominator)
	++frames_scaled_;

	if (previous_width_ && (previous_width_ != *out_width \|\|
	previous_height_ != *out_height)) {
	++adaption_changes_;
	RTC_LOG(LS_INFO) << "Frame size changed: scaled " << frames_scaled_
	<< " / out " << frames_out_ << " / in " << frames_in_
	<< " Changes: " << adaption_changes_
	<< " Input: " << in_width << "x" << in_height
	<< " Scale: " << scale.numerator << "/"
	<< scale.denominator << " Output: " << *out_width << "x"
	<< *out_height << " i"
	<< (requested_format_ ? requested_format_->interval : 0);
	}

	previous_width_ = *out_width;
	previous_height_ = *out_height;

	return true;
	}

	// Stores the requested output |format| (or clears it when |format| is empty)
	// and discards the frame-rate schedule so that it restarts on the next frame.
	void VideoAdapter::OnOutputFormatRequest(
	    const absl::optional<VideoFormat>& format) {
	  rtc::CritScope cs(&critical_section_);
	  next_frame_timestamp_ns_.reset();
	  requested_format_ = format;
	}

	// Records a new resolution / framerate request. When |target_pixel_count| is
	// empty, the target falls back to the stored maximum pixel count.
	void VideoAdapter::OnResolutionFramerateRequest(
	    const absl::optional<int>& target_pixel_count,
	    int max_pixel_count,
	    int max_framerate_fps) {
	  rtc::CritScope cs(&critical_section_);
	  max_framerate_request_ = max_framerate_fps;
	  resolution_request_max_pixel_count_ = max_pixel_count;
	  resolution_request_target_pixel_count_ =
	      target_pixel_count.has_value() ? *target_pixel_count
	                                     : resolution_request_max_pixel_count_;
	}

	} // namespace cricket