blob: 9d336739e40014b9a7a73258bc721f7e44767c69 [file] [log] [blame]
/*
 * Copyright 2012 The WebRTC project authors. All Rights Reserved.
 *
 * Use of this source code is governed by a BSD-style license
 * that can be found in the LICENSE file in the root of the source
 * tree. An additional intellectual property rights grant can be found
 * in the file PATENTS. All contributing project authors may
 * be found in the AUTHORS file in the root of the source tree.
 */
10
// This file contains interfaces for MediaStream, MediaTrack and MediaSource.
// These interfaces are used for implementing MediaStream and MediaTrack as
// defined in http://dev.w3.org/2011/webrtc/editor/webrtc.html#stream-api. These
// interfaces must be used only with PeerConnection.
henrike@webrtc.org28e20752013-07-10 00:45:3615
Steve Anton10542f22019-01-11 17:11:0016#ifndef API_MEDIA_STREAM_INTERFACE_H_
17#define API_MEDIA_STREAM_INTERFACE_H_
henrike@webrtc.org28e20752013-07-10 00:45:3618
#include <stddef.h>
#include <stdint.h>

#include <string>
#include <vector>

#include "absl/types/optional.h"
#include "api/audio_options.h"
#include "api/scoped_refptr.h"
#include "api/video/recordable_encoded_frame.h"
#include "api/video/video_frame.h"
#include "api/video/video_sink_interface.h"
#include "api/video/video_source_interface.h"
#include "api/video_track_source_constraints.h"
#include "modules/audio_processing/include/audio_processing_statistics.h"
#include "rtc_base/checks.h"
#include "rtc_base/ref_count.h"
#include "rtc_base/system/rtc_export.h"
henrike@webrtc.org28e20752013-07-10 00:45:3635
henrike@webrtc.org28e20752013-07-10 00:45:3636namespace webrtc {
37
// Generic observer interface.
//
// Implementers override OnChanged() to be told that something changed; the
// callback itself carries no information about what changed.
class ObserverInterface {
 public:
  // Change notification callback. Must be implemented by every observer.
  virtual void OnChanged() = 0;

 protected:
  // Protected so that observers cannot be deleted through a pointer to this
  // interface.
  virtual ~ObserverInterface() = default;
};
46
47class NotifierInterface {
48 public:
49 virtual void RegisterObserver(ObserverInterface* observer) = 0;
50 virtual void UnregisterObserver(ObserverInterface* observer) = 0;
51
52 virtual ~NotifierInterface() {}
53};
54
deadbeefb10f32f2017-02-08 09:38:2155// Base class for sources. A MediaStreamTrack has an underlying source that
56// provides media. A source can be shared by multiple tracks.
Mirko Bonadei66e76792019-04-02 09:33:5957class RTC_EXPORT MediaSourceInterface : public rtc::RefCountInterface,
58 public NotifierInterface {
henrike@webrtc.org28e20752013-07-10 00:45:3659 public:
Yves Gerey665174f2018-06-19 13:03:0560 enum SourceState { kInitializing, kLive, kEnded, kMuted };
henrike@webrtc.org28e20752013-07-10 00:45:3661
62 virtual SourceState state() const = 0;
63
tommi6eca7e32015-12-15 12:27:1164 virtual bool remote() const = 0;
65
henrike@webrtc.org28e20752013-07-10 00:45:3666 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:3167 ~MediaSourceInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:3668};
69
deadbeefb10f32f2017-02-08 09:38:2170// C++ version of MediaStreamTrack.
71// See: https://www.w3.org/TR/mediacapture-streams/#mediastreamtrack
Mirko Bonadei66e76792019-04-02 09:33:5972class RTC_EXPORT MediaStreamTrackInterface : public rtc::RefCountInterface,
73 public NotifierInterface {
henrike@webrtc.org28e20752013-07-10 00:45:3674 public:
75 enum TrackState {
perkjc8f952d2016-03-23 07:33:5676 kLive,
77 kEnded,
henrike@webrtc.org28e20752013-07-10 00:45:3678 };
79
Niels Möller6dcd4dc2019-08-26 08:45:2880 static const char* const kAudioKind;
81 static const char* const kVideoKind;
deadbeeffac06552015-11-25 19:26:0182
nissefcc640f2016-04-01 08:10:4283 // The kind() method must return kAudioKind only if the object is a
84 // subclass of AudioTrackInterface, and kVideoKind only if the
85 // object is a subclass of VideoTrackInterface. It is typically used
86 // to protect a static_cast<> to the corresponding subclass.
henrike@webrtc.org28e20752013-07-10 00:45:3687 virtual std::string kind() const = 0;
deadbeefb10f32f2017-02-08 09:38:2188
89 // Track identifier.
henrike@webrtc.org28e20752013-07-10 00:45:3690 virtual std::string id() const = 0;
deadbeefb10f32f2017-02-08 09:38:2191
92 // A disabled track will produce silence (if audio) or black frames (if
93 // video). Can be disabled and re-enabled.
henrike@webrtc.org28e20752013-07-10 00:45:3694 virtual bool enabled() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:3695 virtual bool set_enabled(bool enable) = 0;
fischman@webrtc.org32001ef2013-08-12 23:26:2196
deadbeefb10f32f2017-02-08 09:38:2197 // Live or ended. A track will never be live again after becoming ended.
98 virtual TrackState state() const = 0;
99
fischman@webrtc.org32001ef2013-08-12 23:26:21100 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:31101 ~MediaStreamTrackInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36102};
103
deadbeefb10f32f2017-02-08 09:38:21104// VideoTrackSourceInterface is a reference counted source used for
105// VideoTracks. The same source can be used by multiple VideoTracks.
perkj773be362017-08-01 06:22:01106// VideoTrackSourceInterface is designed to be invoked on the signaling thread
107// except for rtc::VideoSourceInterface<VideoFrame> methods that will be invoked
108// on the worker thread via a VideoTrack. A custom implementation of a source
109// can inherit AdaptedVideoTrackSource instead of directly implementing this
110// interface.
Yves Gerey665174f2018-06-19 13:03:05111class VideoTrackSourceInterface : public MediaSourceInterface,
112 public rtc::VideoSourceInterface<VideoFrame> {
perkja3ede6c2016-03-08 00:27:48113 public:
nissefcc640f2016-04-01 08:10:42114 struct Stats {
115 // Original size of captured frame, before video adaptation.
116 int input_width;
117 int input_height;
118 };
perkja3ede6c2016-03-08 00:27:48119
perkj0d3eef22016-03-09 01:39:17120 // Indicates that parameters suitable for screencasts should be automatically
121 // applied to RtpSenders.
122 // TODO(perkj): Remove these once all known applications have moved to
deadbeefb10f32f2017-02-08 09:38:21123 // explicitly setting suitable parameters for screencasts and don't need this
perkj0d3eef22016-03-09 01:39:17124 // implicit behavior.
125 virtual bool is_screencast() const = 0;
126
Perc0d31e92016-03-31 15:23:39127 // Indicates that the encoder should denoise video before encoding it.
128 // If it is not set, the default configuration is used which is different
129 // depending on video codec.
perkj0d3eef22016-03-09 01:39:17130 // TODO(perkj): Remove this once denoising is done by the source, and not by
131 // the encoder.
Danil Chapovalov0bc58cf2018-06-21 11:32:56132 virtual absl::optional<bool> needs_denoising() const = 0;
perkja3ede6c2016-03-08 00:27:48133
deadbeefb10f32f2017-02-08 09:38:21134 // Returns false if no stats are available, e.g, for a remote source, or a
135 // source which has not seen its first frame yet.
136 //
137 // Implementation should avoid blocking.
nissefcc640f2016-04-01 08:10:42138 virtual bool GetStats(Stats* stats) = 0;
139
Markus Handell9982efa2019-11-21 10:56:50140 // Returns true if encoded output can be enabled in the source.
Markus Handell6efc14b2020-05-05 18:11:13141 virtual bool SupportsEncodedOutput() const = 0;
Markus Handell9982efa2019-11-21 10:56:50142
143 // Reliably cause a key frame to be generated in encoded output.
144 // TODO(bugs.webrtc.org/11115): find optimal naming.
Markus Handell6efc14b2020-05-05 18:11:13145 virtual void GenerateKeyFrame() = 0;
Markus Handell9982efa2019-11-21 10:56:50146
147 // Add an encoded video sink to the source and additionally cause
148 // a key frame to be generated from the source. The sink will be
149 // invoked from a decoder queue.
Markus Handell9982efa2019-11-21 10:56:50150 virtual void AddEncodedSink(
Markus Handell6efc14b2020-05-05 18:11:13151 rtc::VideoSinkInterface<RecordableEncodedFrame>* sink) = 0;
Markus Handell9982efa2019-11-21 10:56:50152
153 // Removes an encoded video sink from the source.
Markus Handell9982efa2019-11-21 10:56:50154 virtual void RemoveEncodedSink(
Markus Handell6efc14b2020-05-05 18:11:13155 rtc::VideoSinkInterface<RecordableEncodedFrame>* sink) = 0;
Markus Handell9982efa2019-11-21 10:56:50156
Markus Handell6fa9e682021-10-13 20:50:53157 // Notify about constraints set on the source. The information eventually gets
158 // routed to attached sinks via VideoSinkInterface<>::OnConstraintsChanged.
159 // The call is expected to happen on the network thread.
160 // TODO(crbug/1255737): make pure virtual once downstream project adapts.
161 virtual void ProcessConstraints(
162 const webrtc::VideoTrackSourceConstraints& constraints) {}
163
perkja3ede6c2016-03-08 00:27:48164 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:31165 ~VideoTrackSourceInterface() override = default;
perkja3ede6c2016-03-08 00:27:48166};
henrike@webrtc.org28e20752013-07-10 00:45:36167
perkj773be362017-08-01 06:22:01168// VideoTrackInterface is designed to be invoked on the signaling thread except
169// for rtc::VideoSourceInterface<VideoFrame> methods that must be invoked
170// on the worker thread.
171// PeerConnectionFactory::CreateVideoTrack can be used for creating a VideoTrack
172// that ensures thread safety and that all methods are called on the right
173// thread.
Mirko Bonadei35214fc2019-09-23 12:54:28174class RTC_EXPORT VideoTrackInterface
175 : public MediaStreamTrackInterface,
176 public rtc::VideoSourceInterface<VideoFrame> {
henrike@webrtc.org28e20752013-07-10 00:45:36177 public:
pbos5214a0a2016-12-16 23:39:11178 // Video track content hint, used to override the source is_screencast
179 // property.
Harald Alvestrandc19ab072018-06-18 06:53:10180 // See https://crbug.com/653531 and https://w3c.github.io/mst-content-hint.
181 enum class ContentHint { kNone, kFluid, kDetailed, kText };
pbos5214a0a2016-12-16 23:39:11182
mbonadei539d1042017-07-10 09:40:49183 // Register a video sink for this track. Used to connect the track to the
184 // underlying video engine.
185 void AddOrUpdateSink(rtc::VideoSinkInterface<VideoFrame>* sink,
186 const rtc::VideoSinkWants& wants) override {}
187 void RemoveSink(rtc::VideoSinkInterface<VideoFrame>* sink) override {}
188
perkja3ede6c2016-03-08 00:27:48189 virtual VideoTrackSourceInterface* GetSource() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36190
Danil Chapovalov2a5ce2b2018-02-07 08:38:31191 virtual ContentHint content_hint() const;
pbos5214a0a2016-12-16 23:39:11192 virtual void set_content_hint(ContentHint hint) {}
193
henrike@webrtc.org28e20752013-07-10 00:45:36194 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:31195 ~VideoTrackInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36196};
197
tommi6eca7e32015-12-15 12:27:11198// Interface for receiving audio data from a AudioTrack.
199class AudioTrackSinkInterface {
200 public:
201 virtual void OnData(const void* audio_data,
202 int bits_per_sample,
203 int sample_rate,
Peter Kasting69558702016-01-13 00:26:35204 size_t number_of_channels,
Minyue Li99d6d812020-01-29 09:25:12205 size_t number_of_frames) {
Artem Titovd3251962021-11-15 15:57:07206 RTC_DCHECK_NOTREACHED() << "This method must be overridden, or not used.";
Minyue Li99d6d812020-01-29 09:25:12207 }
208
Artem Titov0e61fdd2021-07-25 19:50:14209 // In this method, `absolute_capture_timestamp_ms`, when available, is
Minyue Li99d6d812020-01-29 09:25:12210 // supposed to deliver the timestamp when this audio frame was originally
211 // captured. This timestamp MUST be based on the same clock as
212 // rtc::TimeMillis().
213 virtual void OnData(const void* audio_data,
214 int bits_per_sample,
215 int sample_rate,
216 size_t number_of_channels,
217 size_t number_of_frames,
218 absl::optional<int64_t> absolute_capture_timestamp_ms) {
219 // TODO(bugs.webrtc.org/10739): Deprecate the old OnData and make this one
220 // pure virtual.
221 return OnData(audio_data, bits_per_sample, sample_rate, number_of_channels,
222 number_of_frames);
223 }
tommi6eca7e32015-12-15 12:27:11224
Gustaf Ullberg46ea5d72020-12-15 14:12:16225 // Returns the number of channels encoded by the sink. This can be less than
226 // the number_of_channels if down-mixing occur. A value of -1 means an unknown
227 // number.
228 virtual int NumPreferredChannels() const { return -1; }
229
tommi6eca7e32015-12-15 12:27:11230 protected:
231 virtual ~AudioTrackSinkInterface() {}
232};
233
henrike@webrtc.org28e20752013-07-10 00:45:36234// AudioSourceInterface is a reference counted source used for AudioTracks.
deadbeefb10f32f2017-02-08 09:38:21235// The same source can be used by multiple AudioTracks.
Mirko Bonadei66e76792019-04-02 09:33:59236class RTC_EXPORT AudioSourceInterface : public MediaSourceInterface {
wu@webrtc.orgb9a088b2014-02-13 23:18:49237 public:
238 class AudioObserver {
239 public:
240 virtual void OnSetVolume(double volume) = 0;
241
242 protected:
243 virtual ~AudioObserver() {}
244 };
245
deadbeefb10f32f2017-02-08 09:38:21246 // TODO(deadbeef): Makes all the interfaces pure virtual after they're
247 // implemented in chromium.
248
Artem Titov0e61fdd2021-07-25 19:50:14249 // Sets the volume of the source. `volume` is in the range of [0, 10].
Tommif888bb52015-12-12 00:37:01250 // TODO(tommi): This method should be on the track and ideally volume should
251 // be applied in the track in a way that does not affect clones of the track.
wu@webrtc.orgb9a088b2014-02-13 23:18:49252 virtual void SetVolume(double volume) {}
253
deadbeefb10f32f2017-02-08 09:38:21254 // Registers/unregisters observers to the audio source.
wu@webrtc.orgb9a088b2014-02-13 23:18:49255 virtual void RegisterAudioObserver(AudioObserver* observer) {}
256 virtual void UnregisterAudioObserver(AudioObserver* observer) {}
henrike@webrtc.org28e20752013-07-10 00:45:36257
tommi6eca7e32015-12-15 12:27:11258 // TODO(tommi): Make pure virtual.
259 virtual void AddSink(AudioTrackSinkInterface* sink) {}
260 virtual void RemoveSink(AudioTrackSinkInterface* sink) {}
Piotr (Peter) Slatala95ca6e12018-11-13 15:57:07261
262 // Returns options for the AudioSource.
263 // (for some of the settings this approach is broken, e.g. setting
264 // audio network adaptation on the source is the wrong layer of abstraction).
265 virtual const cricket::AudioOptions options() const;
mallinath@webrtc.org67ee6b92014-02-03 16:57:16266};
267
henrike@webrtc.org40b3b682014-03-03 18:30:11268// Interface of the audio processor used by the audio track to collect
269// statistics.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52270class AudioProcessorInterface : public rtc::RefCountInterface {
henrike@webrtc.org40b3b682014-03-03 18:30:11271 public:
Ivo Creusenae0260962017-11-20 12:07:16272 struct AudioProcessorStatistics {
273 bool typing_noise_detected = false;
Ivo Creusen56d460902017-11-24 16:29:59274 AudioProcessingStats apm_statistics;
Ivo Creusenae0260962017-11-20 12:07:16275 };
henrike@webrtc.org40b3b682014-03-03 18:30:11276
Artem Titov0e61fdd2021-07-25 19:50:14277 // Get audio processor statistics. The `has_remote_tracks` argument should be
Ivo Creusenae0260962017-11-20 12:07:16278 // set if there are active remote tracks (this would usually be true during
279 // a call). If there are no remote tracks some of the stats will not be set by
280 // the AudioProcessor, because they only make sense if there is at least one
281 // remote track.
Sam Zackrisson28127632018-11-01 10:37:15282 virtual AudioProcessorStatistics GetStats(bool has_remote_tracks) = 0;
Ivo Creusenae0260962017-11-20 12:07:16283
henrike@webrtc.org40b3b682014-03-03 18:30:11284 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:31285 ~AudioProcessorInterface() override = default;
henrike@webrtc.org40b3b682014-03-03 18:30:11286};
287
Mirko Bonadei35214fc2019-09-23 12:54:28288class RTC_EXPORT AudioTrackInterface : public MediaStreamTrackInterface {
henrike@webrtc.org28e20752013-07-10 00:45:36289 public:
deadbeefb10f32f2017-02-08 09:38:21290 // TODO(deadbeef): Figure out if the following interface should be const or
291 // not.
Yves Gerey665174f2018-06-19 13:03:05292 virtual AudioSourceInterface* GetSource() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36293
henrike@webrtc.org40b3b682014-03-03 18:30:11294 // Add/Remove a sink that will receive the audio data from the track.
295 virtual void AddSink(AudioTrackSinkInterface* sink) = 0;
296 virtual void RemoveSink(AudioTrackSinkInterface* sink) = 0;
mallinath@webrtc.org67ee6b92014-02-03 16:57:16297
henrike@webrtc.org40b3b682014-03-03 18:30:11298 // Get the signal level from the audio track.
299 // Return true on success, otherwise false.
deadbeefb10f32f2017-02-08 09:38:21300 // TODO(deadbeef): Change the interface to int GetSignalLevel() and pure
301 // virtual after it's implemented in chromium.
Danil Chapovalov2a5ce2b2018-02-07 08:38:31302 virtual bool GetSignalLevel(int* level);
henrike@webrtc.org40b3b682014-03-03 18:30:11303
deadbeef8d60a942017-02-27 22:47:33304 // Get the audio processor used by the audio track. Return null if the track
henrike@webrtc.org40b3b682014-03-03 18:30:11305 // does not have any processor.
deadbeefb10f32f2017-02-08 09:38:21306 // TODO(deadbeef): Make the interface pure virtual.
Danil Chapovalov2a5ce2b2018-02-07 08:38:31307 virtual rtc::scoped_refptr<AudioProcessorInterface> GetAudioProcessor();
henrike@webrtc.org40b3b682014-03-03 18:30:11308
henrike@webrtc.org28e20752013-07-10 00:45:36309 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:31310 ~AudioTrackInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36311};
312
Yves Gerey665174f2018-06-19 13:03:05313typedef std::vector<rtc::scoped_refptr<AudioTrackInterface> > AudioTrackVector;
314typedef std::vector<rtc::scoped_refptr<VideoTrackInterface> > VideoTrackVector;
henrike@webrtc.org28e20752013-07-10 00:45:36315
deadbeefb10f32f2017-02-08 09:38:21316// C++ version of https://www.w3.org/TR/mediacapture-streams/#mediastream.
317//
318// A major difference is that remote audio/video tracks (received by a
319// PeerConnection/RtpReceiver) are not synchronized simply by adding them to
320// the same stream; a session description with the correct "a=msid" attributes
321// must be pushed down.
322//
323// Thus, this interface acts as simply a container for tracks.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52324class MediaStreamInterface : public rtc::RefCountInterface,
henrike@webrtc.org28e20752013-07-10 00:45:36325 public NotifierInterface {
326 public:
Seth Hampson13b8bad2018-03-13 23:05:28327 virtual std::string id() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36328
329 virtual AudioTrackVector GetAudioTracks() = 0;
330 virtual VideoTrackVector GetVideoTracks() = 0;
Yves Gerey665174f2018-06-19 13:03:05331 virtual rtc::scoped_refptr<AudioTrackInterface> FindAudioTrack(
332 const std::string& track_id) = 0;
333 virtual rtc::scoped_refptr<VideoTrackInterface> FindVideoTrack(
334 const std::string& track_id) = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36335
Niels Möllere7cc8832022-01-04 14:20:03336 // Takes ownership of added tracks.
Harald Alvestrand2f7ad282022-04-21 11:35:43337 // Note: Default implementations are for avoiding link time errors in
338 // implementations that mock this API.
339 // TODO(bugs.webrtc.org/13980): Remove default implementations.
340 virtual bool AddTrack(rtc::scoped_refptr<AudioTrackInterface> track) {
341 RTC_CHECK_NOTREACHED();
342 }
343 virtual bool AddTrack(rtc::scoped_refptr<VideoTrackInterface> track) {
344 RTC_CHECK_NOTREACHED();
345 }
346 virtual bool RemoveTrack(rtc::scoped_refptr<AudioTrackInterface> track) {
347 RTC_CHECK_NOTREACHED();
348 }
349 virtual bool RemoveTrack(rtc::scoped_refptr<VideoTrackInterface> track) {
350 RTC_CHECK_NOTREACHED();
351 }
352 // Deprecated: Should use scoped_refptr versions rather than pointers.
353 [[deprecated("Pass a scoped_refptr")]] virtual bool AddTrack(
354 AudioTrackInterface* track) {
355 return AddTrack(rtc::scoped_refptr<AudioTrackInterface>(track));
356 }
357 [[deprecated("Pass a scoped_refptr")]] virtual bool AddTrack(
358 VideoTrackInterface* track) {
359 return AddTrack(rtc::scoped_refptr<VideoTrackInterface>(track));
360 }
361 [[deprecated("Pass a scoped_refptr")]] virtual bool RemoveTrack(
362 AudioTrackInterface* track) {
363 return RemoveTrack(rtc::scoped_refptr<AudioTrackInterface>(track));
364 }
365 [[deprecated("Pass a scoped_refptr")]] virtual bool RemoveTrack(
366 VideoTrackInterface* track) {
367 return RemoveTrack(rtc::scoped_refptr<VideoTrackInterface>(track));
368 }
henrike@webrtc.org28e20752013-07-10 00:45:36369
370 protected:
Danil Chapovalov2a5ce2b2018-02-07 08:38:31371 ~MediaStreamInterface() override = default;
henrike@webrtc.org28e20752013-07-10 00:45:36372};
373
374} // namespace webrtc
375
Steve Anton10542f22019-01-11 17:11:00376#endif // API_MEDIA_STREAM_INTERFACE_H_