modules/video_coding/codecs/test/videoprocessor.h - src/webrtc - Git at Google

 /*
  *  Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef WEBRTC_MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_
 #define WEBRTC_MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_

 #include <memory>
 #include <string>
 #include <vector>

 #include "webrtc/api/video/video_frame.h"
 #include "webrtc/common_video/libyuv/include/webrtc_libyuv.h"
 #include "webrtc/modules/video_coding/codecs/test/packet_manipulator.h"
 #include "webrtc/modules/video_coding/codecs/test/stats.h"
 #include "webrtc/modules/video_coding/include/video_codec_interface.h"
 #include "webrtc/modules/video_coding/utility/ivf_file_writer.h"
 #include "webrtc/modules/video_coding/utility/vp8_header_parser.h"
 #include "webrtc/modules/video_coding/utility/vp9_uncompressed_header_parser.h"
 #include "webrtc/rtc_base/buffer.h"
 #include "webrtc/rtc_base/checks.h"
 #include "webrtc/test/testsupport/frame_reader.h"
 #include "webrtc/test/testsupport/frame_writer.h"

 namespace webrtc {

 class VideoBitrateAllocator;

 namespace test {

 // Defines which frame types shall be excluded from packet loss and when.
 enum ExcludeFrameTypes {
   // Will exclude the first keyframe in the video sequence from packet loss.
   // Following keyframes will be targeted for packet loss.
   kExcludeOnlyFirstKeyFrame,
   // Exclude all keyframes from packet loss, no matter where in the video
   // sequence they occur.
   kExcludeAllKeyFrames
 };

 // Returns a string representation of the enum value.
 const char* ExcludeFrameTypesToStr(ExcludeFrameTypes e);

 // Test configuration for a test run.
 struct TestConfig {
   // Name of the test. This is purely metadata and does not affect the test.
   std::string name;

   // More detailed description of the test. This is purely metadata and does
   // not affect the test.
   std::string description;

   // Number of this test. Useful if multiple runs of the same test with
   // different configurations shall be managed.
   int test_number = 0;

   // File to process. This must be a video file in the YUV format.
   std::string input_filename;

   // File to write to during processing for the test. Will be a video file
   // in the YUV format.
   std::string output_filename;

   // Path to the directory where encoded files will be put
   // (absolute or relative to the executable).
   std::string output_dir = "out";

   // Configurations related to networking.
   NetworkingConfig networking_config;

   // Decides how the packet loss simulations shall exclude certain frames
   // from packet loss.
   ExcludeFrameTypes exclude_frame_types = kExcludeOnlyFirstKeyFrame;

   // The length of a single frame of the input video file. This value is
   // calculated out of the width and height according to the video format
   // specification. Must be set before processing.
   size_t frame_length_in_bytes = 0;

   // Force the encoder and decoder to use a single core for processing.
   // Using a single core is necessary to get a deterministic behavior for the
   // encoded frames - using multiple cores will produce different encoded frames
   // since multiple cores are competing to consume the byte budget for each
   // frame in parallel.
   // If set to false, the maximum number of available cores will be used.
   bool use_single_core = false;

   // If set to a value >0 this setting forces the encoder to create a keyframe
   // every Nth frame. Note that the encoder may create a keyframe in other
   // locations in addition to the interval that is set using this parameter.
   // Forcing key frames may also affect encoder planning optimizations in
   // a negative way, since it will suddenly be forced to produce an expensive
   // key frame.
   int keyframe_interval = 0;

   // The codec settings to use for the test (target bitrate, video size,
   // framerate and so on). This struct must be created and filled in using
   // the VideoCodingModule::Codec() method.
   webrtc::VideoCodec* codec_settings = nullptr;

   // If printing of information to stdout shall be performed during processing.
   bool verbose = true;
 };

 // Handles encoding/decoding of video using the VideoEncoder/VideoDecoder
 // interfaces. This is done in a sequential manner in order to be able to
 // measure times properly.
 // The class processes a frame at the time for the configured input file.
 // It maintains state of where in the source input file the processing is at.
 //
 // Regarding packet loss: Note that keyframes are excluded (first or all
 // depending on the ExcludeFrameTypes setting). This is because if key frames
 // would be altered, all the following delta frames would be pretty much
 // worthless. VP8 has an error-resilience feature that makes it able to handle
 // packet loss in key non-first keyframes, which is why only the first is
 // excluded by default.
 // Packet loss in such important frames is handled on a higher level in the
 // Video Engine, where signaling would request a retransmit of the lost packets,
 // since they're so important.
 //
 // Note this class is not thread safe in any way and is meant for simple testing
 // purposes.
 class VideoProcessor {
  public:
   virtual ~VideoProcessor() {}

   // Sets up callbacks and initializes the encoder and decoder.
   virtual void Init() = 0;

   // Processes a single frame. Returns true as long as there's more frames
   // available in the source clip.
   // |frame_number| must be an integer >= 0.
   virtual bool ProcessFrame(int frame_number) = 0;

   // Updates the encoder with the target |bit_rate| and the |frame_rate|.
   virtual void SetRates(int bit_rate, int frame_rate) = 0;

   // Return the size of the encoded frame in bytes. Dropped frames by the
   // encoder are regarded as zero size.
   virtual size_t EncodedFrameSize(int frame_number) = 0;

   // Return the encoded frame type (key or delta).
   virtual FrameType EncodedFrameType(int frame_number) = 0;

   // Return the qp used by encoder.
   virtual int GetQpFromEncoder(int frame_number) = 0;

   // Return the qp from the qp parser.
   virtual int GetQpFromBitstream(int frame_number) = 0;

   // Return the number of dropped frames.
   virtual int NumberDroppedFrames() = 0;

   // Return the number of spatial resizes.
   virtual int NumberSpatialResizes() = 0;
 };

 class VideoProcessorImpl : public VideoProcessor {
  public:
   VideoProcessorImpl(webrtc::VideoEncoder* encoder,
                      webrtc::VideoDecoder* decoder,
                      FrameReader* analysis_frame_reader,
                      FrameWriter* analysis_frame_writer,
                      PacketManipulator* packet_manipulator,
                      const TestConfig& config,
                      Stats* stats,
                      FrameWriter* source_frame_writer,
                      IvfFileWriter* encoded_frame_writer,
                      FrameWriter* decoded_frame_writer);
   virtual ~VideoProcessorImpl();
   void Init() override;
   bool ProcessFrame(int frame_number) override;

  private:
   // Container that holds per-frame information that needs to be stored between
   // calls to Encode and Decode, as well as the corresponding callbacks. It is
   // not directly used for statistics -- for that, test::FrameStatistic is used.
   struct FrameInfo {
     FrameInfo()
         : timestamp(0),
           encode_start_ns(0),
           decode_start_ns(0),
           encoded_frame_size(0),
           encoded_frame_type(kVideoFrameDelta),
           decoded_width(0),
           decoded_height(0),
           manipulated_length(0),
           qp_encoder(0),
           qp_bitstream(0) {}

     uint32_t timestamp;
     int64_t encode_start_ns;
     int64_t decode_start_ns;
     size_t encoded_frame_size;
     FrameType encoded_frame_type;
     int decoded_width;
     int decoded_height;
     size_t manipulated_length;
     int qp_encoder;
     int qp_bitstream;
   };

   // Callback class required to implement according to the VideoEncoder API.
   class VideoProcessorEncodeCompleteCallback
       : public webrtc::EncodedImageCallback {
    public:
     explicit VideoProcessorEncodeCompleteCallback(VideoProcessorImpl* vp)
         : video_processor_(vp) {}
     Result OnEncodedImage(
         const webrtc::EncodedImage& encoded_image,
         const webrtc::CodecSpecificInfo* codec_specific_info,
         const webrtc::RTPFragmentationHeader* fragmentation) override {
       // Forward to parent class.
       RTC_CHECK(codec_specific_info);
       video_processor_->FrameEncoded(codec_specific_info->codecType,
                                      encoded_image, fragmentation);
       return Result(Result::OK, 0);
     }

    private:
     VideoProcessorImpl* const video_processor_;
   };

   // Callback class required to implement according to the VideoDecoder API.
   class VideoProcessorDecodeCompleteCallback
       : public webrtc::DecodedImageCallback {
    public:
     explicit VideoProcessorDecodeCompleteCallback(VideoProcessorImpl* vp)
         : video_processor_(vp) {}
     int32_t Decoded(webrtc::VideoFrame& image) override {
       // Forward to parent class.
       video_processor_->FrameDecoded(image);
       return 0;
     }
     int32_t Decoded(webrtc::VideoFrame& image,
                     int64_t decode_time_ms) override {
       return Decoded(image);
     }
     void Decoded(webrtc::VideoFrame& image,
                  rtc::Optional<int32_t> decode_time_ms,
                  rtc::Optional<uint8_t> qp) override {
       Decoded(image,
               decode_time_ms ? static_cast<int32_t>(*decode_time_ms) : -1);
     }

    private:
     VideoProcessorImpl* const video_processor_;
   };

   // Invoked by the callback when a frame has completed encoding.
   void FrameEncoded(webrtc::VideoCodecType codec,
                     const webrtc::EncodedImage& encodedImage,
                     const webrtc::RTPFragmentationHeader* fragmentation);

   // Invoked by the callback when a frame has completed decoding.
   void FrameDecoded(const webrtc::VideoFrame& image);

   // Updates the encoder with the target bit rate and the frame rate.
   void SetRates(int bit_rate, int frame_rate) override;

   // Return the size of the encoded frame in bytes.
   size_t EncodedFrameSize(int frame_number) override;

   // Return the encoded frame type (key or delta).
   FrameType EncodedFrameType(int frame_number) override;

   // Return the qp used by encoder.
   int GetQpFromEncoder(int frame_number) override;

   // Return the qp from the qp parser.
   int GetQpFromBitstream(int frame_number) override;

   // Return the number of dropped frames.
   int NumberDroppedFrames() override;

   // Return the number of spatial resizes.
   int NumberSpatialResizes() override;

   webrtc::VideoEncoder* const encoder_;
   webrtc::VideoDecoder* const decoder_;
   const std::unique_ptr<VideoBitrateAllocator> bitrate_allocator_;

   // Adapters for the codec callbacks.
   const std::unique_ptr<EncodedImageCallback> encode_callback_;
   const std::unique_ptr<DecodedImageCallback> decode_callback_;

   PacketManipulator* const packet_manipulator_;
   const TestConfig& config_;

   // These (mandatory) file manipulators are used for, e.g., objective PSNR and
   // SSIM calculations at the end of a test run.
   FrameReader* const analysis_frame_reader_;
   FrameWriter* const analysis_frame_writer_;

   // These (optional) file writers are used for persistently storing the output
   // of the coding pipeline at different stages: pre encode (source), post
   // encode (encoded), and post decode (decoded). The purpose is to give the
   // experimenter an option to subjectively evaluate the quality of the
   // encoding, given the test settings. Each frame writer is enabled by being
   // non-null.
   FrameWriter* const source_frame_writer_;
   IvfFileWriter* const encoded_frame_writer_;
   FrameWriter* const decoded_frame_writer_;

   bool initialized_;

   // Frame metadata for all frames that have been added through a call to
   // ProcessFrames(). We need to store this metadata over the course of the
   // test run, to support pipelining HW codecs.
   std::vector<FrameInfo> frame_infos_;
   int last_encoded_frame_num_;
   int last_decoded_frame_num_;

   // Keep track of if we have excluded the first key frame from packet loss.
   bool first_key_frame_has_been_excluded_;

   // Keep track of the last successfully decoded frame, since we write that
   // frame to disk when decoding fails.
   rtc::Buffer last_decoded_frame_buffer_;

   // Statistics.
   Stats* stats_;
   int num_dropped_frames_;
   int num_spatial_resizes_;
 };

 }  // namespace test
 }  // namespace webrtc

 #endif  // WEBRTC_MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_
	/*
	* Copyright (c) 2012 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#ifndef WEBRTC_MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_
	#define WEBRTC_MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_

	#include <memory>
	#include <string>
	#include <vector>

	#include "webrtc/api/video/video_frame.h"
	#include "webrtc/common_video/libyuv/include/webrtc_libyuv.h"
	#include "webrtc/modules/video_coding/codecs/test/packet_manipulator.h"
	#include "webrtc/modules/video_coding/codecs/test/stats.h"
	#include "webrtc/modules/video_coding/include/video_codec_interface.h"
	#include "webrtc/modules/video_coding/utility/ivf_file_writer.h"
	#include "webrtc/modules/video_coding/utility/vp8_header_parser.h"
	#include "webrtc/modules/video_coding/utility/vp9_uncompressed_header_parser.h"
	#include "webrtc/rtc_base/buffer.h"
	#include "webrtc/rtc_base/checks.h"
	#include "webrtc/test/testsupport/frame_reader.h"
	#include "webrtc/test/testsupport/frame_writer.h"

	namespace webrtc {

	class VideoBitrateAllocator;

	namespace test {

	// Defines which frame types shall be excluded from packet loss and when.
	enum ExcludeFrameTypes {
	// Will exclude the first keyframe in the video sequence from packet loss.
	// Following keyframes will be targeted for packet loss.
	kExcludeOnlyFirstKeyFrame,
	// Exclude all keyframes from packet loss, no matter where in the video
	// sequence they occur.
	kExcludeAllKeyFrames
	};

	// Returns a string representation of the enum value.
	const char* ExcludeFrameTypesToStr(ExcludeFrameTypes e);

	// Test configuration for a test run.
	struct TestConfig {
	// Name of the test. This is purely metadata and does not affect the test.
	std::string name;

	// More detailed description of the test. This is purely metadata and does
	// not affect the test.
	std::string description;

	// Number of this test. Useful if multiple runs of the same test with
	// different configurations shall be managed.
	int test_number = 0;

	// File to process. This must be a video file in the YUV format.
	std::string input_filename;

	// File to write to during processing for the test. Will be a video file
	// in the YUV format.
	std::string output_filename;

	// Path to the directory where encoded files will be put
	// (absolute or relative to the executable).
	std::string output_dir = "out";

	// Configurations related to networking.
	NetworkingConfig networking_config;

	// Decides how the packet loss simulations shall exclude certain frames
	// from packet loss.
	ExcludeFrameTypes exclude_frame_types = kExcludeOnlyFirstKeyFrame;

	// The length of a single frame of the input video file. This value is
	// calculated out of the width and height according to the video format
	// specification. Must be set before processing.
	size_t frame_length_in_bytes = 0;

	// Force the encoder and decoder to use a single core for processing.
	// Using a single core is necessary to get a deterministic behavior for the
	// encoded frames - using multiple cores will produce different encoded frames
	// since multiple cores are competing to consume the byte budget for each
	// frame in parallel.
	// If set to false, the maximum number of available cores will be used.
	bool use_single_core = false;

	// If set to a value >0 this setting forces the encoder to create a keyframe
	// every Nth frame. Note that the encoder may create a keyframe in other
	// locations in addition to the interval that is set using this parameter.
	// Forcing key frames may also affect encoder planning optimizations in
	// a negative way, since it will suddenly be forced to produce an expensive
	// key frame.
	int keyframe_interval = 0;

	// The codec settings to use for the test (target bitrate, video size,
	// framerate and so on). This struct must be created and filled in using
	// the VideoCodingModule::Codec() method.
	webrtc::VideoCodec* codec_settings = nullptr;

	// If printing of information to stdout shall be performed during processing.
	bool verbose = true;
	};

	// Handles encoding/decoding of video using the VideoEncoder/VideoDecoder
	// interfaces. This is done in a sequential manner in order to be able to
	// measure times properly.
	// The class processes a frame at the time for the configured input file.
	// It maintains state of where in the source input file the processing is at.
	//
	// Regarding packet loss: Note that keyframes are excluded (first or all
	// depending on the ExcludeFrameTypes setting). This is because if key frames
	// would be altered, all the following delta frames would be pretty much
	// worthless. VP8 has an error-resilience feature that makes it able to handle
	// packet loss in key non-first keyframes, which is why only the first is
	// excluded by default.
	// Packet loss in such important frames is handled on a higher level in the
	// Video Engine, where signaling would request a retransmit of the lost packets,
	// since they're so important.
	//
	// Note this class is not thread safe in any way and is meant for simple testing
	// purposes.
	class VideoProcessor {
	public:
	virtual ~VideoProcessor() {}

	// Sets up callbacks and initializes the encoder and decoder.
	virtual void Init() = 0;

	// Processes a single frame. Returns true as long as there's more frames
	// available in the source clip.
	// \|frame_number\| must be an integer >= 0.
	virtual bool ProcessFrame(int frame_number) = 0;

	// Updates the encoder with the target \|bit_rate\| and the \|frame_rate\|.
	virtual void SetRates(int bit_rate, int frame_rate) = 0;

	// Return the size of the encoded frame in bytes. Dropped frames by the
	// encoder are regarded as zero size.
	virtual size_t EncodedFrameSize(int frame_number) = 0;

	// Return the encoded frame type (key or delta).
	virtual FrameType EncodedFrameType(int frame_number) = 0;

	// Return the qp used by encoder.
	virtual int GetQpFromEncoder(int frame_number) = 0;

	// Return the qp from the qp parser.
	virtual int GetQpFromBitstream(int frame_number) = 0;

	// Return the number of dropped frames.
	virtual int NumberDroppedFrames() = 0;

	// Return the number of spatial resizes.
	virtual int NumberSpatialResizes() = 0;
	};

	class VideoProcessorImpl : public VideoProcessor {
	public:
	VideoProcessorImpl(webrtc::VideoEncoder* encoder,
	webrtc::VideoDecoder* decoder,
	FrameReader* analysis_frame_reader,
	FrameWriter* analysis_frame_writer,
	PacketManipulator* packet_manipulator,
	const TestConfig& config,
	Stats* stats,
	FrameWriter* source_frame_writer,
	IvfFileWriter* encoded_frame_writer,
	FrameWriter* decoded_frame_writer);
	virtual ~VideoProcessorImpl();
	void Init() override;
	bool ProcessFrame(int frame_number) override;

	private:
	// Container that holds per-frame information that needs to be stored between
	// calls to Encode and Decode, as well as the corresponding callbacks. It is
	// not directly used for statistics -- for that, test::FrameStatistic is used.
	struct FrameInfo {
	FrameInfo()
	: timestamp(0),
	encode_start_ns(0),
	decode_start_ns(0),
	encoded_frame_size(0),
	encoded_frame_type(kVideoFrameDelta),
	decoded_width(0),
	decoded_height(0),
	manipulated_length(0),
	qp_encoder(0),
	qp_bitstream(0) {}

	uint32_t timestamp;
	int64_t encode_start_ns;
	int64_t decode_start_ns;
	size_t encoded_frame_size;
	FrameType encoded_frame_type;
	int decoded_width;
	int decoded_height;
	size_t manipulated_length;
	int qp_encoder;
	int qp_bitstream;
	};

	// Callback class required to implement according to the VideoEncoder API.
	class VideoProcessorEncodeCompleteCallback
	: public webrtc::EncodedImageCallback {
	public:
	explicit VideoProcessorEncodeCompleteCallback(VideoProcessorImpl* vp)
	: video_processor_(vp) {}
	Result OnEncodedImage(
	const webrtc::EncodedImage& encoded_image,
	const webrtc::CodecSpecificInfo* codec_specific_info,
	const webrtc::RTPFragmentationHeader* fragmentation) override {
	// Forward to parent class.
	RTC_CHECK(codec_specific_info);
	video_processor_->FrameEncoded(codec_specific_info->codecType,
	encoded_image, fragmentation);
	return Result(Result::OK, 0);
	}

	private:
	VideoProcessorImpl* const video_processor_;
	};

	// Callback class required to implement according to the VideoDecoder API.
	class VideoProcessorDecodeCompleteCallback
	: public webrtc::DecodedImageCallback {
	public:
	explicit VideoProcessorDecodeCompleteCallback(VideoProcessorImpl* vp)
	: video_processor_(vp) {}
	int32_t Decoded(webrtc::VideoFrame& image) override {
	// Forward to parent class.
	video_processor_->FrameDecoded(image);
	return 0;
	}
	int32_t Decoded(webrtc::VideoFrame& image,
	int64_t decode_time_ms) override {
	return Decoded(image);
	}
	void Decoded(webrtc::VideoFrame& image,
	rtc::Optional<int32_t> decode_time_ms,
	rtc::Optional<uint8_t> qp) override {
	Decoded(image,
	decode_time_ms ? static_cast<int32_t>(*decode_time_ms) : -1);
	}

	private:
	VideoProcessorImpl* const video_processor_;
	};

	// Invoked by the callback when a frame has completed encoding.
	void FrameEncoded(webrtc::VideoCodecType codec,
	const webrtc::EncodedImage& encodedImage,
	const webrtc::RTPFragmentationHeader* fragmentation);

	// Invoked by the callback when a frame has completed decoding.
	void FrameDecoded(const webrtc::VideoFrame& image);

	// Updates the encoder with the target bit rate and the frame rate.
	void SetRates(int bit_rate, int frame_rate) override;

	// Return the size of the encoded frame in bytes.
	size_t EncodedFrameSize(int frame_number) override;

	// Return the encoded frame type (key or delta).
	FrameType EncodedFrameType(int frame_number) override;

	// Return the qp used by encoder.
	int GetQpFromEncoder(int frame_number) override;

	// Return the qp from the qp parser.
	int GetQpFromBitstream(int frame_number) override;

	// Return the number of dropped frames.
	int NumberDroppedFrames() override;

	// Return the number of spatial resizes.
	int NumberSpatialResizes() override;

	webrtc::VideoEncoder* const encoder_;
	webrtc::VideoDecoder* const decoder_;
	const std::unique_ptr<VideoBitrateAllocator> bitrate_allocator_;

	// Adapters for the codec callbacks.
	const std::unique_ptr<EncodedImageCallback> encode_callback_;
	const std::unique_ptr<DecodedImageCallback> decode_callback_;

	PacketManipulator* const packet_manipulator_;
	const TestConfig& config_;

	// These (mandatory) file manipulators are used for, e.g., objective PSNR and
	// SSIM calculations at the end of a test run.
	FrameReader* const analysis_frame_reader_;
	FrameWriter* const analysis_frame_writer_;

	// These (optional) file writers are used for persistently storing the output
	// of the coding pipeline at different stages: pre encode (source), post
	// encode (encoded), and post decode (decoded). The purpose is to give the
	// experimenter an option to subjectively evaluate the quality of the
	// encoding, given the test settings. Each frame writer is enabled by being
	// non-null.
	FrameWriter* const source_frame_writer_;
	IvfFileWriter* const encoded_frame_writer_;
	FrameWriter* const decoded_frame_writer_;

	bool initialized_;

	// Frame metadata for all frames that have been added through a call to
	// ProcessFrames(). We need to store this metadata over the course of the
	// test run, to support pipelining HW codecs.
	std::vector<FrameInfo> frame_infos_;
	int last_encoded_frame_num_;
	int last_decoded_frame_num_;

	// Keep track of if we have excluded the first key frame from packet loss.
	bool first_key_frame_has_been_excluded_;

	// Keep track of the last successfully decoded frame, since we write that
	// frame to disk when decoding fails.
	rtc::Buffer last_decoded_frame_buffer_;

	// Statistics.
	Stats* stats_;
	int num_dropped_frames_;
	int num_spatial_resizes_;
	};

	} // namespace test
	} // namespace webrtc

	#endif // WEBRTC_MODULES_VIDEO_CODING_CODECS_TEST_VIDEOPROCESSOR_H_