api/rtp_headers.h - src - Git at Google

 /*
  *  Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
  *
  *  Use of this source code is governed by a BSD-style license
  *  that can be found in the LICENSE file in the root of the source
  *  tree. An additional intellectual property rights grant can be found
  *  in the file PATENTS.  All contributing project authors may
  *  be found in the AUTHORS file in the root of the source tree.
  */

 #ifndef API_RTP_HEADERS_H_
 #define API_RTP_HEADERS_H_

 #include <stddef.h>
 #include <stdint.h>

 #include <optional>
 #include <string>

 #include "api/units/timestamp.h"
 #include "api/video/color_space.h"
 #include "api/video/video_content_type.h"
 #include "api/video/video_rotation.h"
 #include "api/video/video_timing.h"
 #include "rtc_base/checks.h"
 #include "rtc_base/system/rtc_export.h"

 namespace webrtc {

 struct FeedbackRequest {
   // Determines whether the recv delta as specified in
   // https://tools.ietf.org/html/draft-holmer-rmcat-transport-wide-cc-extensions-01
   // should be included.
   bool include_timestamps;
   // Include feedback of received packets in the range [sequence_number -
   // sequence_count + 1, sequence_number]. That is, no feedback will be sent if
   // sequence_count is zero.
   int sequence_count;
 };

 // The Absolute Capture Time extension is used to stamp RTP packets with a NTP
 // timestamp showing when the first audio or video frame in a packet was
 // originally captured. The intent of this extension is to provide a way to
 // accomplish audio-to-video synchronization when RTCP-terminating intermediate
 // systems (e.g. mixers) are involved. See:
 // http://www.webrtc.org/experiments/rtp-hdrext/abs-capture-time
 struct AbsoluteCaptureTime {
   // Absolute capture timestamp is the NTP timestamp of when the first frame in
   // a packet was originally captured. This timestamp MUST be based on the same
   // clock as the clock used to generate NTP timestamps for RTCP sender reports
   // on the capture system.
   //
   // It’s not always possible to do an NTP clock readout at the exact moment of
   // when a media frame is captured. A capture system MAY postpone the readout
   // until a more convenient time. A capture system SHOULD have known delays
   // (e.g. from hardware buffers) subtracted from the readout to make the final
   // timestamp as close to the actual capture time as possible.
   //
   // This field is encoded as a 64-bit unsigned fixed-point number with the high
   // 32 bits for the timestamp in seconds and low 32 bits for the fractional
   // part. This is also known as the UQ32.32 format and is what the RTP
   // specification defines as the canonical format to represent NTP timestamps.
   uint64_t absolute_capture_timestamp;

   // Estimated capture clock offset is the sender’s estimate of the offset
   // between its own NTP clock and the capture system’s NTP clock. The sender is
   // here defined as the system that owns the NTP clock used to generate the NTP
   // timestamps for the RTCP sender reports on this stream. The sender system is
   // typically either the capture system or a mixer.
   //
   // This field is encoded as a 64-bit two’s complement signed fixed-point
   // number with the high 32 bits for the seconds and low 32 bits for the
   // fractional part. It’s intended to make it easy for a receiver, that knows
   // how to estimate the sender system’s NTP clock, to also estimate the capture
   // system’s NTP clock:
   //
   //   Capture NTP Clock = Sender NTP Clock + Capture Clock Offset
   std::optional<int64_t> estimated_capture_clock_offset;
 };

 // The audio level extension is used to indicate the voice activity and the
 // audio level of the payload in the RTP stream. See:
 // https://tools.ietf.org/html/rfc6464#section-3.
 class AudioLevel {
  public:
   AudioLevel();
   AudioLevel(bool voice_activity, int audio_level);
   AudioLevel(const AudioLevel& other) = default;
   AudioLevel& operator=(const AudioLevel& other) = default;

   // Flag indicating whether the encoder believes the audio packet contains
   // voice activity.
   bool voice_activity() const { return voice_activity_; }

   // Audio level in -dBov. Values range from 0 to 127, representing 0 to -127
   // dBov. 127 represents digital silence.
   int level() const { return audio_level_; }

  private:
   bool voice_activity_;
   int audio_level_;
 };

 inline bool operator==(const AbsoluteCaptureTime& lhs,
                        const AbsoluteCaptureTime& rhs) {
   return (lhs.absolute_capture_timestamp == rhs.absolute_capture_timestamp) &&
          (lhs.estimated_capture_clock_offset ==
           rhs.estimated_capture_clock_offset);
 }

 inline bool operator!=(const AbsoluteCaptureTime& lhs,
                        const AbsoluteCaptureTime& rhs) {
   return !(lhs == rhs);
 }

 struct RTPHeaderExtension {
   RTPHeaderExtension();
   RTPHeaderExtension(const RTPHeaderExtension& other);
   RTPHeaderExtension& operator=(const RTPHeaderExtension& other);

   static constexpr int kAbsSendTimeFraction = 18;

   Timestamp GetAbsoluteSendTimestamp() const {
     RTC_DCHECK(hasAbsoluteSendTime);
     RTC_DCHECK(absoluteSendTime < (1ul << 24));
     return Timestamp::Micros((absoluteSendTime * 1000000ll) /
                              (1 << kAbsSendTimeFraction));
   }

   bool hasTransmissionTimeOffset;
   int32_t transmissionTimeOffset;
   bool hasAbsoluteSendTime;
   uint32_t absoluteSendTime;
   std::optional<AbsoluteCaptureTime> absolute_capture_time;
   bool hasTransportSequenceNumber;
   uint16_t transportSequenceNumber;
   std::optional<FeedbackRequest> feedback_request;

   // Audio Level includes both level in dBov and voiced/unvoiced bit. See:
   // https://tools.ietf.org/html/rfc6464#section-3
   std::optional<AudioLevel> audio_level() const { return audio_level_; }

   void set_audio_level(std::optional<AudioLevel> audio_level) {
     audio_level_ = audio_level;
   }

   // For Coordination of Video Orientation. See
   // http://www.etsi.org/deliver/etsi_ts/126100_126199/126114/12.07.00_60/
   // ts_126114v120700p.pdf
   bool hasVideoRotation;
   VideoRotation videoRotation;

   // TODO(ilnik): Refactor this and one above to be std::optional() and remove
   // a corresponding bool flag.
   bool hasVideoContentType;
   VideoContentType videoContentType;

   bool has_video_timing;
   VideoSendTiming video_timing;

   VideoPlayoutDelay playout_delay;

   // For identification of a stream when ssrc is not signaled. See
   // https://tools.ietf.org/html/rfc8852
   std::string stream_id;
   std::string repaired_stream_id;

   // For identifying the media section used to interpret this RTP packet. See
   // https://tools.ietf.org/html/rfc8843
   std::string mid;

   std::optional<ColorSpace> color_space;

  private:
   std::optional<AudioLevel> audio_level_;
 };

 enum { kRtpCsrcSize = 15 };  // RFC 3550 page 13

 struct RTC_EXPORT RTPHeader {
   RTPHeader();
   RTPHeader(const RTPHeader& other);
   RTPHeader& operator=(const RTPHeader& other);

   bool markerBit;
   uint8_t payloadType;
   uint16_t sequenceNumber;
   uint32_t timestamp;
   uint32_t ssrc;
   uint8_t numCSRCs;
   uint32_t arrOfCSRCs[kRtpCsrcSize];
   size_t paddingLength;
   size_t headerLength;
   RTPHeaderExtension extension;
 };

 // RTCP mode to use. Compound mode is described by RFC 4585 and reduced-size
 // RTCP mode is described by RFC 5506.
 enum class RtcpMode { kOff, kCompound, kReducedSize };

 enum NetworkState {
   kNetworkUp,
   kNetworkDown,
 };

 }  // namespace webrtc

 #endif  // API_RTP_HEADERS_H_
	/*
	* Copyright (c) 2017 The WebRTC project authors. All Rights Reserved.
	*
	* Use of this source code is governed by a BSD-style license
	* that can be found in the LICENSE file in the root of the source
	* tree. An additional intellectual property rights grant can be found
	* in the file PATENTS. All contributing project authors may
	* be found in the AUTHORS file in the root of the source tree.
	*/

	#ifndef API_RTP_HEADERS_H_
	#define API_RTP_HEADERS_H_

	#include <stddef.h>
	#include <stdint.h>

	#include <optional>
	#include <string>

	#include "api/units/timestamp.h"
	#include "api/video/color_space.h"
	#include "api/video/video_content_type.h"
	#include "api/video/video_rotation.h"
	#include "api/video/video_timing.h"
	#include "rtc_base/checks.h"
	#include "rtc_base/system/rtc_export.h"

	namespace webrtc {

	struct FeedbackRequest {
	// Determines whether the recv delta as specified in
	// https://tools.ietf.org/html/draft-holmer-rmcat-transport-wide-cc-extensions-01
	// should be included.
	bool include_timestamps;
	// Include feedback of received packets in the range [sequence_number -
	// sequence_count + 1, sequence_number]. That is, no feedback will be sent if
	// sequence_count is zero.
	int sequence_count;
	};

	// The Absolute Capture Time extension is used to stamp RTP packets with a NTP
	// timestamp showing when the first audio or video frame in a packet was
	// originally captured. The intent of this extension is to provide a way to
	// accomplish audio-to-video synchronization when RTCP-terminating intermediate
	// systems (e.g. mixers) are involved. See:
	// http://www.webrtc.org/experiments/rtp-hdrext/abs-capture-time
	struct AbsoluteCaptureTime {
	// Absolute capture timestamp is the NTP timestamp of when the first frame in
	// a packet was originally captured. This timestamp MUST be based on the same
	// clock as the clock used to generate NTP timestamps for RTCP sender reports
	// on the capture system.
	//
	// It’s not always possible to do an NTP clock readout at the exact moment of
	// when a media frame is captured. A capture system MAY postpone the readout
	// until a more convenient time. A capture system SHOULD have known delays
	// (e.g. from hardware buffers) subtracted from the readout to make the final
	// timestamp as close to the actual capture time as possible.
	//
	// This field is encoded as a 64-bit unsigned fixed-point number with the high
	// 32 bits for the timestamp in seconds and low 32 bits for the fractional
	// part. This is also known as the UQ32.32 format and is what the RTP
	// specification defines as the canonical format to represent NTP timestamps.
	uint64_t absolute_capture_timestamp;

	// Estimated capture clock offset is the sender’s estimate of the offset
	// between its own NTP clock and the capture system’s NTP clock. The sender is
	// here defined as the system that owns the NTP clock used to generate the NTP
	// timestamps for the RTCP sender reports on this stream. The sender system is
	// typically either the capture system or a mixer.
	//
	// This field is encoded as a 64-bit two’s complement signed fixed-point
	// number with the high 32 bits for the seconds and low 32 bits for the
	// fractional part. It’s intended to make it easy for a receiver, that knows
	// how to estimate the sender system’s NTP clock, to also estimate the capture
	// system’s NTP clock:
	//
	// Capture NTP Clock = Sender NTP Clock + Capture Clock Offset
	std::optional<int64_t> estimated_capture_clock_offset;
	};

	// The audio level extension is used to indicate the voice activity and the
	// audio level of the payload in the RTP stream. See:
	// https://tools.ietf.org/html/rfc6464#section-3.
	class AudioLevel {
	public:
	AudioLevel();
	AudioLevel(bool voice_activity, int audio_level);
	AudioLevel(const AudioLevel& other) = default;
	AudioLevel& operator=(const AudioLevel& other) = default;

	// Flag indicating whether the encoder believes the audio packet contains
	// voice activity.
	bool voice_activity() const { return voice_activity_; }

	// Audio level in -dBov. Values range from 0 to 127, representing 0 to -127
	// dBov. 127 represents digital silence.
	int level() const { return audio_level_; }

	private:
	bool voice_activity_;
	int audio_level_;
	};

	inline bool operator==(const AbsoluteCaptureTime& lhs,
	const AbsoluteCaptureTime& rhs) {
	return (lhs.absolute_capture_timestamp == rhs.absolute_capture_timestamp) &&
	(lhs.estimated_capture_clock_offset ==
	rhs.estimated_capture_clock_offset);
	}

	inline bool operator!=(const AbsoluteCaptureTime& lhs,
	const AbsoluteCaptureTime& rhs) {
	return !(lhs == rhs);
	}

	struct RTPHeaderExtension {
	RTPHeaderExtension();
	RTPHeaderExtension(const RTPHeaderExtension& other);
	RTPHeaderExtension& operator=(const RTPHeaderExtension& other);

	static constexpr int kAbsSendTimeFraction = 18;

	Timestamp GetAbsoluteSendTimestamp() const {
	RTC_DCHECK(hasAbsoluteSendTime);
	RTC_DCHECK(absoluteSendTime < (1ul << 24));
	return Timestamp::Micros((absoluteSendTime * 1000000ll) /
	(1 << kAbsSendTimeFraction));
	}

	bool hasTransmissionTimeOffset;
	int32_t transmissionTimeOffset;
	bool hasAbsoluteSendTime;
	uint32_t absoluteSendTime;
	std::optional<AbsoluteCaptureTime> absolute_capture_time;
	bool hasTransportSequenceNumber;
	uint16_t transportSequenceNumber;
	std::optional<FeedbackRequest> feedback_request;

	// Audio Level includes both level in dBov and voiced/unvoiced bit. See:
	// https://tools.ietf.org/html/rfc6464#section-3
	std::optional<AudioLevel> audio_level() const { return audio_level_; }

	void set_audio_level(std::optional<AudioLevel> audio_level) {
	audio_level_ = audio_level;
	}

	// For Coordination of Video Orientation. See
	// http://www.etsi.org/deliver/etsi_ts/126100_126199/126114/12.07.00_60/
	// ts_126114v120700p.pdf
	bool hasVideoRotation;
	VideoRotation videoRotation;

	// TODO(ilnik): Refactor this and one above to be std::optional() and remove
	// a corresponding bool flag.
	bool hasVideoContentType;
	VideoContentType videoContentType;

	bool has_video_timing;
	VideoSendTiming video_timing;

	VideoPlayoutDelay playout_delay;

	// For identification of a stream when ssrc is not signaled. See
	// https://tools.ietf.org/html/rfc8852
	std::string stream_id;
	std::string repaired_stream_id;

	// For identifying the media section used to interpret this RTP packet. See
	// https://tools.ietf.org/html/rfc8843
	std::string mid;

	std::optional<ColorSpace> color_space;

	private:
	std::optional<AudioLevel> audio_level_;
	};

	enum { kRtpCsrcSize = 15 }; // RFC 3550 page 13

	struct RTC_EXPORT RTPHeader {
	RTPHeader();
	RTPHeader(const RTPHeader& other);
	RTPHeader& operator=(const RTPHeader& other);

	bool markerBit;
	uint8_t payloadType;
	uint16_t sequenceNumber;
	uint32_t timestamp;
	uint32_t ssrc;
	uint8_t numCSRCs;
	uint32_t arrOfCSRCs[kRtpCsrcSize];
	size_t paddingLength;
	size_t headerLength;
	RTPHeaderExtension extension;
	};

	// RTCP mode to use. Compound mode is described by RFC 4585 and reduced-size
	// RTCP mode is described by RFC 5506.
	enum class RtcpMode { kOff, kCompound, kReducedSize };

	enum NetworkState {
	kNetworkUp,
	kNetworkDown,
	};

	} // namespace webrtc

	#endif // API_RTP_HEADERS_H_