blob: 93e51520d1b98ce40db4f59e10e1f9565cfd0b28 [file] [log] [blame]
// libjingle
// Copyright 2010 Google Inc.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// 1. Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// 2. Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
// 3. The name of the author may not be used to endorse or promote products
// derived from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
// WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
// MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
// EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
// PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
// OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
// WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
// OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
// ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
//
// Declaration of abstract class VideoCapturer
#ifndef TALK_SESSION_PHONE_VIDEOCAPTURER_H_
#define TALK_SESSION_PHONE_VIDEOCAPTURER_H_
#include <string>
#include <vector>
#include "talk/base/basictypes.h"
#include "talk/base/scoped_ptr.h"
#include "talk/base/sigslot.h"
#include "talk/session/phone/devicemanager.h"
#include "talk/session/phone/videocommon.h"
namespace cricket {
// General capturer events.
enum CaptureEvent {
// CE_FAILED = -1
// CE_STARTED = 0
CE_STOPPED = 1,
CE_PAUSED = 2,
CE_RESUMED = 3
};
struct CapturedFrame {
static const uint32 kFrameHeaderSize = 40; // Size from width to data_size.
static const uint32 kUnknownDataSize = 0xFFFFFFFF;
CapturedFrame();
// Get the number of bytes of the frame data. If data_size is known, return
// it directly. Otherwise, calculate the size based on width, height, and
// fourcc. Return true if succeeded.
bool GetDataSize(uint32* size) const;
// The width and height of the captured frame could be different from those
// of VideoFormat. Once the first frame is captured, the width, height,
// fourcc, pixel_width, and pixel_height should keep the same over frames.
int width; // in number of pixels
int height; // in number of pixels
uint32 fourcc; // compression
uint32 pixel_width; // width of a pixel, default is 1
uint32 pixel_height; // height of a pixel, default is 1
int64 elapsed_time; // elapsed time since the creation of the frame
// source (that is, the camera), in nanoseconds.
int64 time_stamp; // timestamp of when the frame was captured, in
// nanoseconds.
uint32 data_size; // number of bytes of the frame data
int rotation; // rotation in degrees of the frame (0, 90, 180, 270)
void* data; // pointer to the frame data. This object allocates the
// memory or points to an existing memory.
private:
DISALLOW_COPY_AND_ASSIGN(CapturedFrame);
};
// VideoCapturer is an abstract class that defines the interfaces for video
// capturing. The subclasses implement the video capturer for various platforms.
//
// The captured frames may need to be adapted (for example, cropping). Such an
// adaptor is out of the scope of VideoCapturer. If the adaptor is needed, it
// acts as the downstream of VideoCapturer, adapts the captured frames, and
// delivers the adapted frames to other components such as the encoder.
//
// Programming model:
// Create and initialize an object of a subclass of VideoCapturer
// SignalStartResult.connect()
// SignalFrameCaptured.connect()
// Find the capture format for Start() by either calling GetSupportedFormats()
// and selecting one of the supported or calling GetBestCaptureFormat().
// Start()
// GetCaptureFormat() optionally
// Stop()
//
// Assumption:
// The Start() and Stop() methods are called by a single thread (that is, the
// media engine thread). Hence, there is no need to make them thread safe.
//
class VideoCapturer {
public:
VideoCapturer() {}
virtual ~VideoCapturer() {}
// Gets the id of the underlying device, which is available after the capturer
// is initialized. Can be used to determine if two capturers reference the
// same device.
const std::string& GetId() const { return id_; }
// Get the capture formats supported by the video capturer. The supported
// formats are available after the device is opened successfully.
// Return NULL if the supported formats are not available.
const std::vector<VideoFormat>* GetSupportedFormats() const {
return supported_formats_.get();
}
// Get the best capture format for the desired format. The best format is the
// same as one of the supported formats except that the frame interval may be
// different. If the application asks for 16x9 and the camera does not support
// 16x9 HD or the application asks for 16x10, we find the closest 4x3 and then
// crop; Otherwise, we find what the application asks for. Note that we assume
// that for HD, the desired format is always 16x9. The subclasses can override
// the default implementation.
// Parameters
// desired: the input desired format. If desired.fourcc is not kAnyFourcc,
// the best capture format has the exactly same fourcc. Otherwise,
// the best capture format uses a fourcc in GetPreferredFourccs().
// best_format: the output of the best capture format.
// Return false if there is no such a best format, that is, the desired format
// is not supported.
virtual bool GetBestCaptureFormat(const VideoFormat& desired,
VideoFormat* best_format);
// Start the video capturer with the specified capture format.
// Parameter
// capture_format: The caller got this parameter by either calling
// GetSupportedFormats() and selecting one of the supported
// or calling GetBestCaptureFormat().
// Return
// CR_SUCCESS: if the capturer starts successfully.
// CR_PENDING: if the capturer is pending to start. SignalStartResult
// below will signal the result after the pending.
// CR_NO_DEVICE: if the capturer has no device and fails to start.
// CR_FAILURE: otherwise.
virtual CaptureResult Start(const VideoFormat& capture_format) = 0;
// Get the current capture format, which is set by the Start() call.
// Note that the width and height of the captured frames may differ from the
// capture format. For example, the capture format is HD but the captured
// frames may be smaller than HD.
const VideoFormat* GetCaptureFormat() const {
return capture_format_.get();
}
// Stop the video capturer.
virtual void Stop() = 0;
// Check if the video capturer is running.
virtual bool IsRunning() = 0;
// Signal the result of Start() if it returned CR_PENDING.
sigslot::signal2<VideoCapturer*, CaptureResult> SignalStartResult;
// Signal the captured frame to downstream.
sigslot::signal2<VideoCapturer*, const CapturedFrame*> SignalFrameCaptured;
// Signals a change in capturer state.
sigslot::signal2<VideoCapturer*, CaptureEvent> SignalCaptureEvent;
protected:
// subclasses override this virtual method to provide a vector of fourccs, in
// order of preference, that are expected by the media engine.
virtual bool GetPreferredFourccs(std::vector<uint32>* fourccs) = 0;
// mutators to set private attributes
void SetId(const std::string& id) {
id_ = id;
}
void SetCaptureFormat(const VideoFormat* format) {
capture_format_.reset(format ? new VideoFormat(*format) : NULL);
}
void SetSupportedFormats(const std::vector<VideoFormat>& formats);
private:
// Check if the specified formats include a format with height no less than
// 720 and aspect ratio 16x9. In such a case, if we open the camera in 4x3 and
// crop to 16x9, the camera or driver may crop from 16x9 to 4x3 and then our
// code crop again from 4x3 to 16x9, which is not good.
static bool Includes16x9HD(const std::vector<VideoFormat>& formats);
// Get the distance between the desired format and the supported format.
// Return the max distance if they mismatch. See the implementation for
// details.
int64 GetFormatDistance(const VideoFormat& desired,
const VideoFormat& supported);
std::string id_;
talk_base::scoped_ptr<VideoFormat> capture_format_;
talk_base::scoped_ptr<std::vector<VideoFormat> > supported_formats_;
DISALLOW_COPY_AND_ASSIGN(VideoCapturer);
};
} // namespace cricket
#endif // TALK_SESSION_PHONE_VIDEOCAPTURER_H_