1/*
2 * libjingle
3 * Copyright 2010 Google Inc.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions are met:
7 *
8 *  1. Redistributions of source code must retain the above copyright notice,
9 *     this list of conditions and the following disclaimer.
10 *  2. Redistributions in binary form must reproduce the above copyright notice,
11 *     this list of conditions and the following disclaimer in the documentation
12 *     and/or other materials provided with the distribution.
13 *  3. The name of the author may not be used to endorse or promote products
14 *     derived from this software without specific prior written permission.
15 *
16 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
17 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
18 * MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
19 * EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
20 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
21 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
22 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
23 * WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
24 * OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
25 * ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
26 */
27
28// Declaration of abstract class VideoCapturer
29
30#ifndef TALK_MEDIA_BASE_VIDEOCAPTURER_H_
31#define TALK_MEDIA_BASE_VIDEOCAPTURER_H_
32
33#include <algorithm>
34#include <string>
35#include <vector>
36
37#include "talk/media/base/mediachannel.h"
38#include "talk/media/base/videoadapter.h"
39#include "talk/media/base/videocommon.h"
40#include "talk/media/base/videoframefactory.h"
41#include "talk/media/devices/devicemanager.h"
42#include "webrtc/base/basictypes.h"
43#include "webrtc/base/criticalsection.h"
44#include "webrtc/base/messagehandler.h"
45#include "webrtc/base/rollingaccumulator.h"
46#include "webrtc/base/scoped_ptr.h"
47#include "webrtc/base/sigslot.h"
48#include "webrtc/base/thread.h"
49#include "webrtc/base/timing.h"
50
51
52namespace cricket {
53
54// Current state of the capturer.
55// TODO(hellner): CS_NO_DEVICE is an error code not a capture state. Separate
56//                error codes and states.
enum CaptureState {
  // The capturer has been stopped or hasn't started yet.
  CS_STOPPED,
  // The capturer is in the process of starting. Note, it may still fail to
  // start.
  CS_STARTING,
  // The capturer has been started successfully and is now capturing.
  CS_RUNNING,
  // The capturer has been paused.
  CS_PAUSED,
  // The capturer failed to start.
  CS_FAILED,
  // The capturer has no device and consequently failed to start.
  CS_NO_DEVICE,
};
67
68class VideoFrame;
69
70struct CapturedFrame {
71  static const uint32_t kFrameHeaderSize = 40;  // Size from width to data_size.
72  static const uint32_t kUnknownDataSize = 0xFFFFFFFF;
73
74  CapturedFrame();
75
76  // Get the number of bytes of the frame data. If data_size is known, return
77  // it directly. Otherwise, calculate the size based on width, height, and
78  // fourcc. Return true if succeeded.
79  bool GetDataSize(uint32_t* size) const;
80
81  // The width and height of the captured frame could be different from those
82  // of VideoFormat. Once the first frame is captured, the width, height,
83  // fourcc, pixel_width, and pixel_height should keep the same over frames.
84  int width;              // in number of pixels
85  int height;             // in number of pixels
86  uint32_t fourcc;        // compression
87  uint32_t pixel_width;   // width of a pixel, default is 1
88  uint32_t pixel_height;  // height of a pixel, default is 1
89  int64_t time_stamp;  // timestamp of when the frame was captured, in unix
90                       // time with nanosecond units.
91  uint32_t data_size;  // number of bytes of the frame data
92
93  webrtc::VideoRotation rotation; // rotation in degrees of the frame.
94
95  void*  data;          // pointer to the frame data. This object allocates the
96                        // memory or points to an existing memory.
97
98 private:
99  RTC_DISALLOW_COPY_AND_ASSIGN(CapturedFrame);
100};
101
102// VideoCapturer is an abstract class that defines the interfaces for video
103// capturing. The subclasses implement the video capturer for various types of
104// capturers and various platforms.
105//
// The captured frames may need to be adapted (for example, cropping).
// Video adaptation is built in and enabled by default. After a frame has
// been captured from the device, it is sent to the video adapter, then out to
// the encoder.
110//
111// Programming model:
112//   Create an object of a subclass of VideoCapturer
113//   Initialize
114//   SignalStateChange.connect()
115//   SignalFrameCaptured.connect()
116//   Find the capture format for Start() by either calling GetSupportedFormats()
117//   and selecting one of the supported or calling GetBestCaptureFormat().
118//   video_adapter()->OnOutputFormatRequest(desired_encoding_format)
119//   Start()
120//   GetCaptureFormat() optionally
121//   Stop()
122//
123// Assumption:
//   The Start() and Stop() methods are called by a single thread (e.g., the
//   media engine thread). Hence, the VideoCapturer subclasses don't need to be
//   thread safe.
127//
128class VideoCapturer
129    : public sigslot::has_slots<>,
130      public rtc::MessageHandler {
131 public:
132  // All signals are marshalled to |thread| or the creating thread if
133  // none is provided.
134  VideoCapturer();
135  explicit VideoCapturer(rtc::Thread* thread);
136  virtual ~VideoCapturer() {}
137
138  // Gets the id of the underlying device, which is available after the capturer
139  // is initialized. Can be used to determine if two capturers reference the
140  // same device.
141  const std::string& GetId() const { return id_; }
142
143  // Get the capture formats supported by the video capturer. The supported
144  // formats are non empty after the device has been opened successfully.
145  const std::vector<VideoFormat>* GetSupportedFormats() const;
146
147  // Get the best capture format for the desired format. The best format is the
148  // same as one of the supported formats except that the frame interval may be
149  // different. If the application asks for 16x9 and the camera does not support
150  // 16x9 HD or the application asks for 16x10, we find the closest 4x3 and then
151  // crop; Otherwise, we find what the application asks for. Note that we assume
152  // that for HD, the desired format is always 16x9. The subclasses can override
153  // the default implementation.
154  // Parameters
155  //   desired: the input desired format. If desired.fourcc is not kAnyFourcc,
156  //            the best capture format has the exactly same fourcc. Otherwise,
157  //            the best capture format uses a fourcc in GetPreferredFourccs().
158  //   best_format: the output of the best capture format.
159  // Return false if there is no such a best format, that is, the desired format
160  // is not supported.
161  virtual bool GetBestCaptureFormat(const VideoFormat& desired,
162                                    VideoFormat* best_format);
163
164  // TODO(hellner): deprecate (make private) the Start API in favor of this one.
165  //                Also remove CS_STARTING as it is implied by the return
166  //                value of StartCapturing().
167  bool StartCapturing(const VideoFormat& capture_format);
168  // Start the video capturer with the specified capture format.
169  // Parameter
170  //   capture_format: The caller got this parameter by either calling
171  //                   GetSupportedFormats() and selecting one of the supported
172  //                   or calling GetBestCaptureFormat().
173  // Return
174  //   CS_STARTING:  The capturer is trying to start. Success or failure will
175  //                 be notified via the |SignalStateChange| callback.
176  //   CS_RUNNING:   if the capturer is started and capturing.
177  //   CS_PAUSED:    Will never be returned.
178  //   CS_FAILED:    if the capturer failes to start..
179  //   CS_NO_DEVICE: if the capturer has no device and fails to start.
180  virtual CaptureState Start(const VideoFormat& capture_format) = 0;
181  // Sets the desired aspect ratio. If the capturer is capturing at another
182  // aspect ratio it will crop the width or the height so that asked for
183  // aspect ratio is acheived. Note that ratio_w and ratio_h do not need to be
184  // relatively prime.
185  void UpdateAspectRatio(int ratio_w, int ratio_h);
186  void ClearAspectRatio();
187
188  // Get the current capture format, which is set by the Start() call.
189  // Note that the width and height of the captured frames may differ from the
190  // capture format. For example, the capture format is HD but the captured
191  // frames may be smaller than HD.
192  const VideoFormat* GetCaptureFormat() const {
193    return capture_format_.get();
194  }
195
196  // Pause the video capturer.
197  virtual bool Pause(bool paused);
198  // Stop the video capturer.
199  virtual void Stop() = 0;
200  // Check if the video capturer is running.
201  virtual bool IsRunning() = 0;
202  // Restart the video capturer with the new |capture_format|.
203  // Default implementation stops and starts the capturer.
204  virtual bool Restart(const VideoFormat& capture_format);
205  // TODO(thorcarpenter): This behavior of keeping the camera open just to emit
206  // black frames is a total hack and should be fixed.
207  // When muting, produce black frames then pause the camera.
208  // When unmuting, start the camera. Camera starts unmuted.
209  virtual bool MuteToBlackThenPause(bool muted);
210  virtual bool IsMuted() const {
211    return muted_;
212  }
213  CaptureState capture_state() const {
214    return capture_state_;
215  }
216
217  // Tells videocapturer whether to apply the pending rotation. By default, the
218  // rotation is applied and the generated frame is up right. When set to false,
219  // generated frames will carry the rotation information from
220  // SetCaptureRotation. Return value indicates whether this operation succeeds.
221  virtual bool SetApplyRotation(bool enable);
222  virtual bool GetApplyRotation() { return apply_rotation_; }
223
224  // Returns true if the capturer is screencasting. This can be used to
225  // implement screencast specific behavior.
226  virtual bool IsScreencast() const = 0;
227
228  // Caps the VideoCapturer's format according to max_format. It can e.g. be
229  // used to prevent cameras from capturing at a resolution or framerate that
230  // the capturer is capable of but not performing satisfactorily at.
231  // The capping is an upper bound for each component of the capturing format.
232  // The fourcc component is ignored.
233  void ConstrainSupportedFormats(const VideoFormat& max_format);
234
235  void set_enable_camera_list(bool enable_camera_list) {
236    enable_camera_list_ = enable_camera_list;
237  }
238  bool enable_camera_list() {
239    return enable_camera_list_;
240  }
241
242  // Enable scaling to ensure square pixels.
243  void set_square_pixel_aspect_ratio(bool square_pixel_aspect_ratio) {
244    square_pixel_aspect_ratio_ = square_pixel_aspect_ratio;
245  }
246  bool square_pixel_aspect_ratio() {
247    return square_pixel_aspect_ratio_;
248  }
249
250  // Signal all capture state changes that are not a direct result of calling
251  // Start().
252  sigslot::signal2<VideoCapturer*, CaptureState> SignalStateChange;
253  // Frame callbacks are multithreaded to allow disconnect and connect to be
254  // called concurrently. It also ensures that it is safe to call disconnect
255  // at any time which is needed since the signal may be called from an
256  // unmarshalled thread owned by the VideoCapturer.
257  // Signal the captured frame to downstream.
258  sigslot::signal2<VideoCapturer*, const CapturedFrame*,
259                   sigslot::multi_threaded_local> SignalFrameCaptured;
260  // Signal the captured and possibly adapted frame to downstream consumers
261  // such as the encoder.
262  sigslot::signal2<VideoCapturer*, const VideoFrame*,
263                   sigslot::multi_threaded_local> SignalVideoFrame;
264
265  // If true, run video adaptation. By default, video adaptation is enabled
266  // and users must call video_adapter()->OnOutputFormatRequest()
267  // to receive frames.
268  bool enable_video_adapter() const { return enable_video_adapter_; }
269  void set_enable_video_adapter(bool enable_video_adapter) {
270    enable_video_adapter_ = enable_video_adapter;
271  }
272
273  CoordinatedVideoAdapter* video_adapter() { return &video_adapter_; }
274  const CoordinatedVideoAdapter* video_adapter() const {
275    return &video_adapter_;
276  }
277
278  // Takes ownership.
279  void set_frame_factory(VideoFrameFactory* frame_factory);
280
281  // Gets statistics for tracked variables recorded since the last call to
282  // GetStats.  Note that calling GetStats resets any gathered data so it
283  // should be called only periodically to log statistics.
284  void GetStats(VariableInfo<int>* adapt_drop_stats,
285                VariableInfo<int>* effect_drop_stats,
286                VariableInfo<double>* frame_time_stats,
287                VideoFormat* last_captured_frame_format);
288
289 protected:
290  // Callback attached to SignalFrameCaptured where SignalVideoFrames is called.
291  void OnFrameCaptured(VideoCapturer* video_capturer,
292                       const CapturedFrame* captured_frame);
293  void SetCaptureState(CaptureState state);
294
295  // Marshals SignalStateChange onto thread_.
296  void OnMessage(rtc::Message* message);
297
298  // subclasses override this virtual method to provide a vector of fourccs, in
299  // order of preference, that are expected by the media engine.
300  virtual bool GetPreferredFourccs(std::vector<uint32_t>* fourccs) = 0;
301
302  // mutators to set private attributes
303  void SetId(const std::string& id) {
304    id_ = id;
305  }
306
307  void SetCaptureFormat(const VideoFormat* format) {
308    capture_format_.reset(format ? new VideoFormat(*format) : NULL);
309    if (capture_format_) {
310      ASSERT(capture_format_->interval > 0 &&
311             "Capture format expected to have positive interval.");
312      // Video adapter really only cares about capture format interval.
313      video_adapter_.SetInputFormat(*capture_format_);
314    }
315  }
316
317  void SetSupportedFormats(const std::vector<VideoFormat>& formats);
318  VideoFrameFactory* frame_factory() { return frame_factory_.get(); }
319
320 private:
321  void Construct();
322  // Get the distance between the desired format and the supported format.
323  // Return the max distance if they mismatch. See the implementation for
324  // details.
325  int64_t GetFormatDistance(const VideoFormat& desired,
326                            const VideoFormat& supported);
327
328  // Convert captured frame to readable string for LOG messages.
329  std::string ToString(const CapturedFrame* frame) const;
330
331  // Updates filtered_supported_formats_ so that it contains the formats in
332  // supported_formats_ that fulfill all applied restrictions.
333  void UpdateFilteredSupportedFormats();
334  // Returns true if format doesn't fulfill all applied restrictions.
335  bool ShouldFilterFormat(const VideoFormat& format) const;
336
337  void UpdateStats(const CapturedFrame* captured_frame);
338
339  // Helper function to save statistics on the current data from a
340  // RollingAccumulator into stats.
341  template<class T>
342  static void GetVariableSnapshot(
343      const rtc::RollingAccumulator<T>& data,
344      VariableInfo<T>* stats);
345
346  rtc::Thread* thread_;
347  std::string id_;
348  CaptureState capture_state_;
349  rtc::scoped_ptr<VideoFrameFactory> frame_factory_;
350  rtc::scoped_ptr<VideoFormat> capture_format_;
351  std::vector<VideoFormat> supported_formats_;
352  rtc::scoped_ptr<VideoFormat> max_format_;
353  std::vector<VideoFormat> filtered_supported_formats_;
354
355  int ratio_w_;  // View resolution. e.g. 1280 x 720.
356  int ratio_h_;
357  bool enable_camera_list_;
358  bool square_pixel_aspect_ratio_;  // Enable scaling to square pixels.
359  int scaled_width_;  // Current output size from ComputeScale.
360  int scaled_height_;
361  bool muted_;
362  int black_frame_count_down_;
363
364  bool enable_video_adapter_;
365  CoordinatedVideoAdapter video_adapter_;
366
367  rtc::Timing frame_length_time_reporter_;
368  rtc::CriticalSection frame_stats_crit_;
369
370  int adapt_frame_drops_;
371  rtc::RollingAccumulator<int> adapt_frame_drops_data_;
372  double previous_frame_time_;
373  rtc::RollingAccumulator<double> frame_time_data_;
374  // The captured frame format before potential adapation.
375  VideoFormat last_captured_frame_format_;
376
377  // Whether capturer should apply rotation to the frame before signaling it.
378  bool apply_rotation_;
379
380  RTC_DISALLOW_COPY_AND_ASSIGN(VideoCapturer);
381};
382
383}  // namespace cricket
384
385#endif  // TALK_MEDIA_BASE_VIDEOCAPTURER_H_
386