Home | History | Annotate | Download | only in base
      1 // libjingle
      2 // Copyright 2004 Google Inc.
      3 //
      4 // Redistribution and use in source and binary forms, with or without
      5 // modification, are permitted provided that the following conditions are met:
      6 //
      7 //  1. Redistributions of source code must retain the above copyright notice,
      8 //     this list of conditions and the following disclaimer.
      9 //  2. Redistributions in binary form must reproduce the above copyright notice,
     10 //     this list of conditions and the following disclaimer in the documentation
     11 //     and/or other materials provided with the distribution.
     12 //  3. The name of the author may not be used to endorse or promote products
     13 //     derived from this software without specific prior written permission.
     14 //
     15 // THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR IMPLIED
     16 // WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF
     17 // MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO
     18 // EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
     19 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
     20 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;
     21 // OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY,
     22 // WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR
     23 // OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF
     24 // ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     25 //
     26 // Common definition for video, including fourcc and VideoFormat.
     27 
     28 #ifndef TALK_MEDIA_BASE_VIDEOCOMMON_H_  // NOLINT
     29 #define TALK_MEDIA_BASE_VIDEOCOMMON_H_
     30 
     31 #include <string>
     32 
     33 #include "talk/base/basictypes.h"
     34 #include "talk/base/timeutils.h"
     35 
     36 namespace cricket {
     37 
// Placeholder SSRC used as the video ssrc (see the TODO below for why).
// TODO(janahan): For now, a hard-coded ssrc is used as the video ssrc.
// This is because when the video frame is passed to the mediaprocessor for
// processing, it doesn't have the correct ssrc. Since currently only Tx
// Video processing is supported, this is ok. When we switch over to trigger
// from capturer, this should be fixed and this const removed.
const uint32 kDummyVideoSsrc = 0xFFFFFFFF;
     44 
     45 // Minimum interval is 10k fps.
     46 #define FPS_TO_INTERVAL(fps) \
     47     (fps ? talk_base::kNumNanosecsPerSec / fps : \
     48     talk_base::kNumNanosecsPerSec / 10000)
     49 
     50 //////////////////////////////////////////////////////////////////////////////
     51 // Definition of FourCC codes
     52 //////////////////////////////////////////////////////////////////////////////
     53 // Convert four characters to a FourCC code.
     54 // Needs to be a macro otherwise the OS X compiler complains when the kFormat*
     55 // constants are used in a switch.
     56 #define FOURCC(a, b, c, d) ( \
     57     (static_cast<uint32>(a)) | (static_cast<uint32>(b) << 8) | \
     58     (static_cast<uint32>(c) << 16) | (static_cast<uint32>(d) << 24))
     59 // Some pages discussing FourCC codes:
     60 //   http://www.fourcc.org/yuv.php
     61 //   http://v4l2spec.bytesex.org/spec/book1.htm
     62 //   http://developer.apple.com/quicktime/icefloe/dispatch020.html
     63 //   http://msdn.microsoft.com/library/windows/desktop/dd206750.aspx#nv12
     64 //   http://people.xiph.org/~xiphmont/containers/nut/nut4cc.txt
     65 
     66 // FourCC codes grouped according to implementation efficiency.
     67 // Primary formats should convert in 1 efficient step.
     68 // Secondary formats are converted in 2 steps.
// Auxiliary formats call primary converters.
// FourCC pixel-format identifiers. Each value is built from four characters
// with the FOURCC() macro, except FOURCC_ANY, which is a wildcard.
enum FourCC {
  // 9 Primary YUV formats: 5 planar, 2 biplanar, 2 packed.
  FOURCC_I420 = FOURCC('I', '4', '2', '0'),
  FOURCC_I422 = FOURCC('I', '4', '2', '2'),
  FOURCC_I444 = FOURCC('I', '4', '4', '4'),
  FOURCC_I411 = FOURCC('I', '4', '1', '1'),
  FOURCC_I400 = FOURCC('I', '4', '0', '0'),
  FOURCC_NV21 = FOURCC('N', 'V', '2', '1'),
  FOURCC_NV12 = FOURCC('N', 'V', '1', '2'),
  FOURCC_YUY2 = FOURCC('Y', 'U', 'Y', '2'),
  FOURCC_UYVY = FOURCC('U', 'Y', 'V', 'Y'),

  // 2 Secondary YUV formats: row biplanar.
  FOURCC_M420 = FOURCC('M', '4', '2', '0'),
  FOURCC_Q420 = FOURCC('Q', '4', '2', '0'),

  // 9 Primary RGB formats: 4 32 bpp, 2 24 bpp, 3 16 bpp.
  FOURCC_ARGB = FOURCC('A', 'R', 'G', 'B'),
  FOURCC_BGRA = FOURCC('B', 'G', 'R', 'A'),
  FOURCC_ABGR = FOURCC('A', 'B', 'G', 'R'),
  FOURCC_24BG = FOURCC('2', '4', 'B', 'G'),
  FOURCC_RAW  = FOURCC('r', 'a', 'w', ' '),
  FOURCC_RGBA = FOURCC('R', 'G', 'B', 'A'),
  FOURCC_RGBP = FOURCC('R', 'G', 'B', 'P'),  // bgr565.
  FOURCC_RGBO = FOURCC('R', 'G', 'B', 'O'),  // abgr1555.
  FOURCC_R444 = FOURCC('R', '4', '4', '4'),  // argb4444.

  // 4 Secondary RGB formats: 4 Bayer Patterns.
  FOURCC_RGGB = FOURCC('R', 'G', 'G', 'B'),
  FOURCC_BGGR = FOURCC('B', 'G', 'G', 'R'),
  FOURCC_GRBG = FOURCC('G', 'R', 'B', 'G'),
  FOURCC_GBRG = FOURCC('G', 'B', 'R', 'G'),

  // 1 Primary Compressed YUV format.
  FOURCC_MJPG = FOURCC('M', 'J', 'P', 'G'),

  // 6 Auxiliary YUV variations: 3 with U and V planes swapped, 1 alias, and
  // 2 J-prefixed formats.
  FOURCC_YV12 = FOURCC('Y', 'V', '1', '2'),
  FOURCC_YV16 = FOURCC('Y', 'V', '1', '6'),
  FOURCC_YV24 = FOURCC('Y', 'V', '2', '4'),
  FOURCC_YU12 = FOURCC('Y', 'U', '1', '2'),  // Linux version of I420.
  // NOTE(review): J420/J400 are presumably the JPEG (full-range) variants of
  // I420/I400 -- confirm against the converter implementation.
  FOURCC_J420 = FOURCC('J', '4', '2', '0'),
  FOURCC_J400 = FOURCC('J', '4', '0', '0'),

  // 14 Auxiliary aliases.  CanonicalFourCC() maps these to canonical fourcc.
  FOURCC_IYUV = FOURCC('I', 'Y', 'U', 'V'),  // Alias for I420.
  FOURCC_YU16 = FOURCC('Y', 'U', '1', '6'),  // Alias for I422.
  FOURCC_YU24 = FOURCC('Y', 'U', '2', '4'),  // Alias for I444.
  FOURCC_YUYV = FOURCC('Y', 'U', 'Y', 'V'),  // Alias for YUY2.
  FOURCC_YUVS = FOURCC('y', 'u', 'v', 's'),  // Alias for YUY2 on Mac.
  FOURCC_HDYC = FOURCC('H', 'D', 'Y', 'C'),  // Alias for UYVY.
  FOURCC_2VUY = FOURCC('2', 'v', 'u', 'y'),  // Alias for UYVY on Mac.
  FOURCC_JPEG = FOURCC('J', 'P', 'E', 'G'),  // Alias for MJPG.
  FOURCC_DMB1 = FOURCC('d', 'm', 'b', '1'),  // Alias for MJPG on Mac.
  FOURCC_BA81 = FOURCC('B', 'A', '8', '1'),  // Alias for BGGR.
  FOURCC_RGB3 = FOURCC('R', 'G', 'B', '3'),  // Alias for RAW.
  FOURCC_BGR3 = FOURCC('B', 'G', 'R', '3'),  // Alias for 24BG.
  FOURCC_CM32 = FOURCC(0, 0, 0, 32),  // Alias for BGRA kCMPixelFormat_32ARGB
  FOURCC_CM24 = FOURCC(0, 0, 0, 24),  // Alias for RAW kCMPixelFormat_24RGB

  // 1 Auxiliary compressed YUV format set aside for capturer.
  FOURCC_H264 = FOURCC('H', '2', '6', '4'),

  // Match any fourcc.
  FOURCC_ANY  = 0xFFFFFFFF,
};
    136 
    137 // Converts fourcc aliases into canonical ones.
    138 uint32 CanonicalFourCC(uint32 fourcc);
    139 
    140 // Get FourCC code as a string.
    141 inline std::string GetFourccName(uint32 fourcc) {
    142   std::string name;
    143   name.push_back(static_cast<char>(fourcc & 0xFF));
    144   name.push_back(static_cast<char>((fourcc >> 8) & 0xFF));
    145   name.push_back(static_cast<char>((fourcc >> 16) & 0xFF));
    146   name.push_back(static_cast<char>((fourcc >> 24) & 0xFF));
    147   return name;
    148 }
    149 
// Computes a scaled size that fits in max_pixels while maintaining the
// aspect ratio.
    151 void ComputeScaleMaxPixels(int frame_width, int frame_height, int max_pixels,
    152                            int* scaled_width, int* scaled_height);
    153 
    154 // For low fps, max pixels limit is set to Retina MacBookPro 15" resolution of
    155 // 2880 x 1800 as of 4/18/2013.
    156 // For high fps, maximum pixels limit is set based on common 24" monitor
    157 // resolution of 2048 x 1280 as of 6/13/2013. The Retina resolution is
    158 // therefore reduced to 1440 x 900.
    159 void ComputeScale(int frame_width, int frame_height, int fps,
    160                   int* scaled_width, int* scaled_height);
    161 
    162 // Compute the frame size that conversion should crop to based on aspect ratio.
    163 // Ensures size is multiple of 2 due to I420 and conversion limitations.
    164 void ComputeCrop(int cropped_format_width, int cropped_format_height,
    165                  int frame_width, int frame_height,
    166                  int pixel_width, int pixel_height,
    167                  int rotation,
    168                  int* cropped_width, int* cropped_height);
    169 
// Compute the frame size that gives the pixels a square pixel aspect ratio.
    171 void ComputeScaleToSquarePixels(int in_width, int in_height,
    172                                 int pixel_width, int pixel_height,
    173                                 int* scaled_width, int* scaled_height);
    174 
    175 //////////////////////////////////////////////////////////////////////////////
    176 // Definition of VideoFormat.
    177 //////////////////////////////////////////////////////////////////////////////
    178 
// VideoFormat with Plain Old Data for global variables.
// Holds only the raw fields; it declares no constructors or member functions.
// VideoFormat derives from this struct to add them.
struct VideoFormatPod {
  int width;  // Frame width, in pixels.
  int height;  // Frame height, in pixels.
  int64 interval;  // Frame interval, in nanoseconds.
  uint32 fourcc;  // Color space. FOURCC_ANY means that any color space is OK.
};
    186 
    187 struct VideoFormat : VideoFormatPod {
    188   static const int64 kMinimumInterval =
    189       talk_base::kNumNanosecsPerSec / 10000;  // 10k fps.
    190 
    191   VideoFormat() {
    192     Construct(0, 0, 0, 0);
    193   }
    194 
    195   VideoFormat(int w, int h, int64 interval_ns, uint32 cc) {
    196     Construct(w, h, interval_ns, cc);
    197   }
    198 
    199   explicit VideoFormat(const VideoFormatPod& format) {
    200     Construct(format.width, format.height, format.interval, format.fourcc);
    201   }
    202 
    203   void Construct(int w, int h, int64 interval_ns, uint32 cc) {
    204     width = w;
    205     height = h;
    206     interval = interval_ns;
    207     fourcc = cc;
    208   }
    209 
    210   static int64 FpsToInterval(int fps) {
    211     return fps ? talk_base::kNumNanosecsPerSec / fps : kMinimumInterval;
    212   }
    213 
    214   static int IntervalToFps(int64 interval) {
    215     // Normalize the interval first.
    216     interval = talk_base::_max(interval, kMinimumInterval);
    217     return static_cast<int>(talk_base::kNumNanosecsPerSec / interval);
    218   }
    219 
    220   bool operator==(const VideoFormat& format) const {
    221     return width == format.width && height == format.height &&
    222         interval == format.interval && fourcc == format.fourcc;
    223   }
    224 
    225   bool operator!=(const VideoFormat& format) const {
    226     return !(*this == format);
    227   }
    228 
    229   bool operator<(const VideoFormat& format) const {
    230     return (fourcc < format.fourcc) ||
    231         (fourcc == format.fourcc && width < format.width) ||
    232         (fourcc == format.fourcc && width == format.width &&
    233             height < format.height) ||
    234         (fourcc == format.fourcc && width == format.width &&
    235             height == format.height && interval > format.interval);
    236   }
    237 
    238   int framerate() const { return IntervalToFps(interval); }
    239 
    240   // Check if both width and height are 0.
    241   bool IsSize0x0() const { return 0 == width && 0 == height; }
    242 
    243   // Check if this format is less than another one by comparing the resolution
    244   // and frame rate.
    245   bool IsPixelRateLess(const VideoFormat& format) const {
    246     return width * height * framerate() <
    247         format.width * format.height * format.framerate();
    248   }
    249 
    250   // Get a string presentation in the form of "fourcc width x height x fps"
    251   std::string ToString() const;
    252 };
    253 
    254 }  // namespace cricket
    255 
    256 #endif  // TALK_MEDIA_BASE_VIDEOCOMMON_H_  // NOLINT
    257