blob: 80595e09abec10a82a1aae371add79a08c2d5938 [file] [log] [blame]
henrike@webrtc.org28e20752013-07-10 00:45:36 +00001/*
kjellanderb24317b2016-02-10 07:54:43 -08002 * Copyright 2012 The WebRTC project authors. All Rights Reserved.
henrike@webrtc.org28e20752013-07-10 00:45:36 +00003 *
kjellanderb24317b2016-02-10 07:54:43 -08004 * Use of this source code is governed by a BSD-style license
5 * that can be found in the LICENSE file in the root of the source
6 * tree. An additional intellectual property rights grant can be found
7 * in the file PATENTS. All contributing project authors may
8 * be found in the AUTHORS file in the root of the source tree.
henrike@webrtc.org28e20752013-07-10 00:45:36 +00009 */
10
11// This file contains interfaces for MediaStream, MediaTrack and MediaSource.
12// These interfaces are used for implementing MediaStream and MediaTrack as
13// defined in http://dev.w3.org/2011/webrtc/editor/webrtc.html#stream-api. These
14// interfaces must be used only with PeerConnection. PeerConnectionManager
15// interface provides the factory methods to create MediaStream and MediaTracks.
16
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020017#ifndef API_MEDIASTREAMINTERFACE_H_
18#define API_MEDIASTREAMINTERFACE_H_
henrike@webrtc.org28e20752013-07-10 00:45:36 +000019
pbos9baddf22017-01-02 06:44:41 -080020#include <stddef.h>
21
henrike@webrtc.org28e20752013-07-10 00:45:36 +000022#include <string>
23#include <vector>
24
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020025#include "api/optional.h"
26#include "api/video/video_frame.h"
zhihuang38ede132017-06-15 12:52:32 -070027// TODO(zhihuang): Remove unrelated headers once downstream applications stop
28// relying on them; they were previously transitively included by
29// mediachannel.h, which is no longer a dependency of this file.
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020030#include "media/base/videosinkinterface.h"
31#include "media/base/videosourceinterface.h"
Ivo Creusen56d46092017-11-24 17:29:59 +010032#include "modules/audio_processing/include/audio_processing_statistics.h"
Mirko Bonadei92ea95e2017-09-15 06:47:31 +020033#include "rtc_base/ratetracker.h"
34#include "rtc_base/refcount.h"
35#include "rtc_base/scoped_ref_ptr.h"
36#include "rtc_base/thread.h"
37#include "rtc_base/timeutils.h"
henrike@webrtc.org28e20752013-07-10 00:45:36 +000038
henrike@webrtc.org28e20752013-07-10 00:45:36 +000039namespace webrtc {
40
41// Generic observer interface.
42class ObserverInterface {
43 public:
44 virtual void OnChanged() = 0;
45
46 protected:
47 virtual ~ObserverInterface() {}
48};
49
50class NotifierInterface {
51 public:
52 virtual void RegisterObserver(ObserverInterface* observer) = 0;
53 virtual void UnregisterObserver(ObserverInterface* observer) = 0;
54
55 virtual ~NotifierInterface() {}
56};
57
deadbeefb10f32f2017-02-08 01:38:21 -080058// Base class for sources. A MediaStreamTrack has an underlying source that
59// provides media. A source can be shared by multiple tracks.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +000060class MediaSourceInterface : public rtc::RefCountInterface,
henrike@webrtc.org28e20752013-07-10 00:45:36 +000061 public NotifierInterface {
62 public:
63 enum SourceState {
64 kInitializing,
65 kLive,
66 kEnded,
67 kMuted
68 };
69
70 virtual SourceState state() const = 0;
71
tommi6eca7e32015-12-15 04:27:11 -080072 virtual bool remote() const = 0;
73
henrike@webrtc.org28e20752013-07-10 00:45:36 +000074 protected:
75 virtual ~MediaSourceInterface() {}
76};
77
deadbeefb10f32f2017-02-08 01:38:21 -080078// C++ version of MediaStreamTrack.
79// See: https://www.w3.org/TR/mediacapture-streams/#mediastreamtrack
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +000080class MediaStreamTrackInterface : public rtc::RefCountInterface,
henrike@webrtc.org28e20752013-07-10 00:45:36 +000081 public NotifierInterface {
82 public:
83 enum TrackState {
perkjc8f952d2016-03-23 00:33:56 -070084 kLive,
85 kEnded,
henrike@webrtc.org28e20752013-07-10 00:45:36 +000086 };
87
deadbeeffac06552015-11-25 11:26:01 -080088 static const char kAudioKind[];
89 static const char kVideoKind[];
90
nissefcc640f2016-04-01 01:10:42 -070091 // The kind() method must return kAudioKind only if the object is a
92 // subclass of AudioTrackInterface, and kVideoKind only if the
93 // object is a subclass of VideoTrackInterface. It is typically used
94 // to protect a static_cast<> to the corresponding subclass.
henrike@webrtc.org28e20752013-07-10 00:45:36 +000095 virtual std::string kind() const = 0;
deadbeefb10f32f2017-02-08 01:38:21 -080096
97 // Track identifier.
henrike@webrtc.org28e20752013-07-10 00:45:36 +000098 virtual std::string id() const = 0;
deadbeefb10f32f2017-02-08 01:38:21 -080099
100 // A disabled track will produce silence (if audio) or black frames (if
101 // video). Can be disabled and re-enabled.
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000102 virtual bool enabled() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000103 virtual bool set_enabled(bool enable) = 0;
fischman@webrtc.org32001ef2013-08-12 23:26:21 +0000104
deadbeefb10f32f2017-02-08 01:38:21 -0800105 // Live or ended. A track will never be live again after becoming ended.
106 virtual TrackState state() const = 0;
107
fischman@webrtc.org32001ef2013-08-12 23:26:21 +0000108 protected:
109 virtual ~MediaStreamTrackInterface() {}
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000110};
111
deadbeefb10f32f2017-02-08 01:38:21 -0800112// VideoTrackSourceInterface is a reference counted source used for
113// VideoTracks. The same source can be used by multiple VideoTracks.
perkj773be362017-07-31 23:22:01 -0700114// VideoTrackSourceInterface is designed to be invoked on the signaling thread
115// except for rtc::VideoSourceInterface<VideoFrame> methods that will be invoked
116// on the worker thread via a VideoTrack. A custom implementation of a source
117// can inherit AdaptedVideoTrackSource instead of directly implementing this
118// interface.
perkja3ede6c2016-03-08 01:27:48 +0100119class VideoTrackSourceInterface
120 : public MediaSourceInterface,
nisseacd935b2016-11-11 03:55:13 -0800121 public rtc::VideoSourceInterface<VideoFrame> {
perkja3ede6c2016-03-08 01:27:48 +0100122 public:
nissefcc640f2016-04-01 01:10:42 -0700123 struct Stats {
124 // Original size of captured frame, before video adaptation.
125 int input_width;
126 int input_height;
127 };
perkja3ede6c2016-03-08 01:27:48 +0100128
perkj0d3eef22016-03-09 02:39:17 +0100129 // Indicates that parameters suitable for screencasts should be automatically
130 // applied to RtpSenders.
131 // TODO(perkj): Remove these once all known applications have moved to
deadbeefb10f32f2017-02-08 01:38:21 -0800132 // explicitly setting suitable parameters for screencasts and don't need this
perkj0d3eef22016-03-09 02:39:17 +0100133 // implicit behavior.
134 virtual bool is_screencast() const = 0;
135
Perc0d31e92016-03-31 17:23:39 +0200136 // Indicates that the encoder should denoise video before encoding it.
137 // If it is not set, the default configuration is used which is different
138 // depending on video codec.
perkj0d3eef22016-03-09 02:39:17 +0100139 // TODO(perkj): Remove this once denoising is done by the source, and not by
140 // the encoder.
Perc0d31e92016-03-31 17:23:39 +0200141 virtual rtc::Optional<bool> needs_denoising() const = 0;
perkja3ede6c2016-03-08 01:27:48 +0100142
deadbeefb10f32f2017-02-08 01:38:21 -0800143 // Returns false if no stats are available, e.g, for a remote source, or a
144 // source which has not seen its first frame yet.
145 //
146 // Implementation should avoid blocking.
nissefcc640f2016-04-01 01:10:42 -0700147 virtual bool GetStats(Stats* stats) = 0;
148
perkja3ede6c2016-03-08 01:27:48 +0100149 protected:
150 virtual ~VideoTrackSourceInterface() {}
151};
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000152
perkj773be362017-07-31 23:22:01 -0700153// VideoTrackInterface is designed to be invoked on the signaling thread except
154// for rtc::VideoSourceInterface<VideoFrame> methods that must be invoked
155// on the worker thread.
156// PeerConnectionFactory::CreateVideoTrack can be used for creating a VideoTrack
157// that ensures thread safety and that all methods are called on the right
158// thread.
nissedb25d2e2016-02-26 01:24:58 -0800159class VideoTrackInterface
160 : public MediaStreamTrackInterface,
nisseacd935b2016-11-11 03:55:13 -0800161 public rtc::VideoSourceInterface<VideoFrame> {
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000162 public:
pbos5214a0a2016-12-16 15:39:11 -0800163 // Video track content hint, used to override the source is_screencast
164 // property.
165 // See https://crbug.com/653531 and https://github.com/WICG/mst-content-hint.
166 enum class ContentHint { kNone, kFluid, kDetailed };
167
mbonadei539d1042017-07-10 02:40:49 -0700168 // Register a video sink for this track. Used to connect the track to the
169 // underlying video engine.
170 void AddOrUpdateSink(rtc::VideoSinkInterface<VideoFrame>* sink,
171 const rtc::VideoSinkWants& wants) override {}
172 void RemoveSink(rtc::VideoSinkInterface<VideoFrame>* sink) override {}
173
perkja3ede6c2016-03-08 01:27:48 +0100174 virtual VideoTrackSourceInterface* GetSource() const = 0;
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000175
pbos5214a0a2016-12-16 15:39:11 -0800176 virtual ContentHint content_hint() const { return ContentHint::kNone; }
177 virtual void set_content_hint(ContentHint hint) {}
178
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000179 protected:
180 virtual ~VideoTrackInterface() {}
181};
182
tommi6eca7e32015-12-15 04:27:11 -0800183// Interface for receiving audio data from a AudioTrack.
184class AudioTrackSinkInterface {
185 public:
186 virtual void OnData(const void* audio_data,
187 int bits_per_sample,
188 int sample_rate,
Peter Kasting69558702016-01-12 16:26:35 -0800189 size_t number_of_channels,
tommi6eca7e32015-12-15 04:27:11 -0800190 size_t number_of_frames) = 0;
191
192 protected:
193 virtual ~AudioTrackSinkInterface() {}
194};
195
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000196// AudioSourceInterface is a reference counted source used for AudioTracks.
deadbeefb10f32f2017-02-08 01:38:21 -0800197// The same source can be used by multiple AudioTracks.
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000198class AudioSourceInterface : public MediaSourceInterface {
wu@webrtc.orgb9a088b2014-02-13 23:18:49 +0000199 public:
200 class AudioObserver {
201 public:
202 virtual void OnSetVolume(double volume) = 0;
203
204 protected:
205 virtual ~AudioObserver() {}
206 };
207
deadbeefb10f32f2017-02-08 01:38:21 -0800208 // TODO(deadbeef): Makes all the interfaces pure virtual after they're
209 // implemented in chromium.
210
211 // Sets the volume of the source. |volume| is in the range of [0, 10].
Tommif888bb52015-12-12 01:37:01 +0100212 // TODO(tommi): This method should be on the track and ideally volume should
213 // be applied in the track in a way that does not affect clones of the track.
wu@webrtc.orgb9a088b2014-02-13 23:18:49 +0000214 virtual void SetVolume(double volume) {}
215
deadbeefb10f32f2017-02-08 01:38:21 -0800216 // Registers/unregisters observers to the audio source.
wu@webrtc.orgb9a088b2014-02-13 23:18:49 +0000217 virtual void RegisterAudioObserver(AudioObserver* observer) {}
218 virtual void UnregisterAudioObserver(AudioObserver* observer) {}
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000219
tommi6eca7e32015-12-15 04:27:11 -0800220 // TODO(tommi): Make pure virtual.
221 virtual void AddSink(AudioTrackSinkInterface* sink) {}
222 virtual void RemoveSink(AudioTrackSinkInterface* sink) {}
mallinath@webrtc.org67ee6b92014-02-03 16:57:16 +0000223};
224
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000225// Interface of the audio processor used by the audio track to collect
226// statistics.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000227class AudioProcessorInterface : public rtc::RefCountInterface {
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000228 public:
Ivo Creusenae026092017-11-20 13:07:16 +0100229 // Deprecated, use AudioProcessorStatistics instead.
230 // TODO(ivoc): Remove this when all implementations have switched to the new
231 // GetStats function. See b/67926135.
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000232 struct AudioProcessorStats {
ivoc4e477a12017-01-15 08:29:46 -0800233 AudioProcessorStats()
234 : typing_noise_detected(false),
235 echo_return_loss(0),
236 echo_return_loss_enhancement(0),
237 echo_delay_median_ms(0),
238 echo_delay_std_ms(0),
239 aec_quality_min(0.0),
240 residual_echo_likelihood(0.0f),
241 residual_echo_likelihood_recent_max(0.0f),
242 aec_divergent_filter_fraction(0.0) {}
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000243 ~AudioProcessorStats() {}
244
245 bool typing_noise_detected;
246 int echo_return_loss;
247 int echo_return_loss_enhancement;
248 int echo_delay_median_ms;
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000249 int echo_delay_std_ms;
ivoc8c63a822016-10-21 04:10:03 -0700250 float aec_quality_min;
251 float residual_echo_likelihood;
ivoc4e477a12017-01-15 08:29:46 -0800252 float residual_echo_likelihood_recent_max;
Minyue2a8a78c2016-04-07 16:48:15 +0200253 float aec_divergent_filter_fraction;
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000254 };
Ivo Creusenae026092017-11-20 13:07:16 +0100255 // This struct maintains the optionality of the stats, and will replace the
256 // regular stats struct when all users have been updated.
257 struct AudioProcessorStatistics {
258 bool typing_noise_detected = false;
Ivo Creusen56d46092017-11-24 17:29:59 +0100259 AudioProcessingStats apm_statistics;
Ivo Creusenae026092017-11-20 13:07:16 +0100260 };
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000261
262 // Get audio processor statistics.
263 virtual void GetStats(AudioProcessorStats* stats) = 0;
264
Ivo Creusenae026092017-11-20 13:07:16 +0100265 // Get audio processor statistics. The |has_remote_tracks| argument should be
266 // set if there are active remote tracks (this would usually be true during
267 // a call). If there are no remote tracks some of the stats will not be set by
268 // the AudioProcessor, because they only make sense if there is at least one
269 // remote track.
270 // TODO(ivoc): Make pure virtual when all implementions are updated.
271 virtual AudioProcessorStatistics GetStats(bool has_remote_tracks);
272
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000273 protected:
274 virtual ~AudioProcessorInterface() {}
275};
276
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000277class AudioTrackInterface : public MediaStreamTrackInterface {
278 public:
deadbeefb10f32f2017-02-08 01:38:21 -0800279 // TODO(deadbeef): Figure out if the following interface should be const or
280 // not.
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000281 virtual AudioSourceInterface* GetSource() const = 0;
282
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000283 // Add/Remove a sink that will receive the audio data from the track.
284 virtual void AddSink(AudioTrackSinkInterface* sink) = 0;
285 virtual void RemoveSink(AudioTrackSinkInterface* sink) = 0;
mallinath@webrtc.org67ee6b92014-02-03 16:57:16 +0000286
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000287 // Get the signal level from the audio track.
288 // Return true on success, otherwise false.
deadbeefb10f32f2017-02-08 01:38:21 -0800289 // TODO(deadbeef): Change the interface to int GetSignalLevel() and pure
290 // virtual after it's implemented in chromium.
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000291 virtual bool GetSignalLevel(int* level) { return false; }
292
deadbeef8d60a942017-02-27 14:47:33 -0800293 // Get the audio processor used by the audio track. Return null if the track
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000294 // does not have any processor.
deadbeefb10f32f2017-02-08 01:38:21 -0800295 // TODO(deadbeef): Make the interface pure virtual.
296 virtual rtc::scoped_refptr<AudioProcessorInterface> GetAudioProcessor() {
297 return nullptr;
298 }
henrike@webrtc.org40b3b682014-03-03 18:30:11 +0000299
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000300 protected:
301 virtual ~AudioTrackInterface() {}
302};
303
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000304typedef std::vector<rtc::scoped_refptr<AudioTrackInterface> >
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000305 AudioTrackVector;
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000306typedef std::vector<rtc::scoped_refptr<VideoTrackInterface> >
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000307 VideoTrackVector;
308
deadbeefb10f32f2017-02-08 01:38:21 -0800309// C++ version of https://www.w3.org/TR/mediacapture-streams/#mediastream.
310//
311// A major difference is that remote audio/video tracks (received by a
312// PeerConnection/RtpReceiver) are not synchronized simply by adding them to
313// the same stream; a session description with the correct "a=msid" attributes
314// must be pushed down.
315//
316// Thus, this interface acts as simply a container for tracks.
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000317class MediaStreamInterface : public rtc::RefCountInterface,
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000318 public NotifierInterface {
319 public:
Steve Anton8ffb9c32017-08-31 15:45:38 -0700320 // TODO(steveanton): This could be renamed to id() to match the spec.
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000321 virtual std::string label() const = 0;
322
323 virtual AudioTrackVector GetAudioTracks() = 0;
324 virtual VideoTrackVector GetVideoTracks() = 0;
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000325 virtual rtc::scoped_refptr<AudioTrackInterface>
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000326 FindAudioTrack(const std::string& track_id) = 0;
buildbot@webrtc.orgd4e598d2014-07-29 17:36:52 +0000327 virtual rtc::scoped_refptr<VideoTrackInterface>
henrike@webrtc.org28e20752013-07-10 00:45:36 +0000328 FindVideoTrack(const std::string& track_id) = 0;
329
330 virtual bool AddTrack(AudioTrackInterface* track) = 0;
331 virtual bool AddTrack(VideoTrackInterface* track) = 0;
332 virtual bool RemoveTrack(AudioTrackInterface* track) = 0;
333 virtual bool RemoveTrack(VideoTrackInterface* track) = 0;
334
335 protected:
336 virtual ~MediaStreamInterface() {}
337};
338
339} // namespace webrtc
340
Mirko Bonadei92ea95e2017-09-15 06:47:31 +0200341#endif // API_MEDIASTREAMINTERFACE_H_