Home | History | Annotate | Download | only in examples
      1 /*
      2  *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
      3  *
      4  *  Use of this source code is governed by a BSD-style license
      5  *  that can be found in the LICENSE file in the root of the source
      6  *  tree. An additional intellectual property rights grant can be found
      7  *  in the file PATENTS.  All contributing project authors may
      8  *  be found in the AUTHORS file in the root of the source tree.
      9  */
     10 
     11 
     12 // VP8 Set Active and ROI Maps
     13 // ===========================
     14 //
     15 // This is an example demonstrating how to control the VP8 encoder's
     16 // ROI and Active maps.
     17 //
     18 // ROI (Region of Interest) maps are a way for the application to assign
     19 // each macroblock in the image to a region, and then set quantizer and
     20 // filtering parameters on that image.
     21 //
     22 // Active maps are a way for the application to specify on a
     23 // macroblock-by-macroblock basis whether there is any activity in that
     24 // macroblock.
     25 //
     26 //
     27 // Configuration
     28 // -------------
     29 // An ROI map is set on frame 22. If the width of the image in macroblocks
     30 // is evenly divisible by 4, then the output will appear to have distinct
     31 // columns, where the quantizer, loopfilter, and static threshold differ
     32 // from column to column.
     33 //
     34 // An active map is set on frame 33. If the width of the image in macroblocks
     35 // is evenly divisible by 4, then the output will appear to have distinct
     36 // columns, where one column will have motion and the next will not.
     37 //
     38 // The active map is cleared on frame 44.
     39 //
     40 // Observing The Effects
     41 // ---------------------
     42 // Use the `simple_decoder` example to decode this sample, and observe
     43 // the change in the image at frames 22, 33, and 44.
     44 
     45 #include <stdio.h>
     46 #include <stdlib.h>
     47 #include <string.h>
     48 
     49 #define VPX_CODEC_DISABLE_COMPAT 1
     50 #include "vpx/vp8cx.h"
     51 #include "vpx/vpx_encoder.h"
     52 
     53 #include "./tools_common.h"
     54 #include "./video_writer.h"
     55 
     56 static const char *exec_name;
     57 
     58 void usage_exit() {
     59   fprintf(stderr, "Usage: %s <codec> <width> <height> <infile> <outfile>\n",
     60           exec_name);
     61   exit(EXIT_FAILURE);
     62 }
     63 
     64 static void set_roi_map(const vpx_codec_enc_cfg_t *cfg,
     65                         vpx_codec_ctx_t *codec) {
     66   unsigned int i;
     67   vpx_roi_map_t roi = {0};
     68 
     69   roi.rows = (cfg->g_h + 15) / 16;
     70   roi.cols = (cfg->g_w + 15) / 16;
     71 
     72   roi.delta_q[0] = 0;
     73   roi.delta_q[1] = -2;
     74   roi.delta_q[2] = -4;
     75   roi.delta_q[3] = -6;
     76 
     77   roi.delta_lf[0] = 0;
     78   roi.delta_lf[1] = 1;
     79   roi.delta_lf[2] = 2;
     80   roi.delta_lf[3] = 3;
     81 
     82   roi.static_threshold[0] = 1500;
     83   roi.static_threshold[1] = 1000;
     84   roi.static_threshold[2] = 500;
     85   roi.static_threshold[3] = 0;
     86 
     87   roi.roi_map = (uint8_t *)malloc(roi.rows * roi.cols);
     88   for (i = 0; i < roi.rows * roi.cols; ++i)
     89     roi.roi_map[i] = i % 4;
     90 
     91   if (vpx_codec_control(codec, VP8E_SET_ROI_MAP, &roi))
     92     die_codec(codec, "Failed to set ROI map");
     93 
     94   free(roi.roi_map);
     95 }
     96 
     97 static void set_active_map(const vpx_codec_enc_cfg_t *cfg,
     98                            vpx_codec_ctx_t *codec) {
     99   unsigned int i;
    100   vpx_active_map_t map = {0};
    101 
    102   map.rows = (cfg->g_h + 15) / 16;
    103   map.cols = (cfg->g_w + 15) / 16;
    104 
    105   map.active_map = (uint8_t *)malloc(map.rows * map.cols);
    106   for (i = 0; i < map.rows * map.cols; ++i)
    107     map.active_map[i] = i % 2;
    108 
    109   if (vpx_codec_control(codec, VP8E_SET_ACTIVEMAP, &map))
    110     die_codec(codec, "Failed to set active map");
    111 
    112   free(map.active_map);
    113 }
    114 
    115 static void unset_active_map(const vpx_codec_enc_cfg_t *cfg,
    116                              vpx_codec_ctx_t *codec) {
    117   vpx_active_map_t map = {0};
    118 
    119   map.rows = (cfg->g_h + 15) / 16;
    120   map.cols = (cfg->g_w + 15) / 16;
    121   map.active_map = NULL;
    122 
    123   if (vpx_codec_control(codec, VP8E_SET_ACTIVEMAP, &map))
    124     die_codec(codec, "Failed to set active map");
    125 }
    126 
    127 static void encode_frame(vpx_codec_ctx_t *codec,
    128                          vpx_image_t *img,
    129                          int frame_index,
    130                          VpxVideoWriter *writer) {
    131   vpx_codec_iter_t iter = NULL;
    132   const vpx_codec_cx_pkt_t *pkt = NULL;
    133   const vpx_codec_err_t res = vpx_codec_encode(codec, img, frame_index, 1, 0,
    134                                                VPX_DL_GOOD_QUALITY);
    135   if (res != VPX_CODEC_OK)
    136     die_codec(codec, "Failed to encode frame");
    137 
    138   while ((pkt = vpx_codec_get_cx_data(codec, &iter)) != NULL) {
    139     if (pkt->kind == VPX_CODEC_CX_FRAME_PKT) {
    140       const int keyframe = (pkt->data.frame.flags & VPX_FRAME_IS_KEY) != 0;
    141       if (!vpx_video_writer_write_frame(writer,
    142                                         pkt->data.frame.buf,
    143                                         pkt->data.frame.sz,
    144                                         pkt->data.frame.pts)) {
    145         die_codec(codec, "Failed to write compressed frame");
    146       }
    147 
    148       printf(keyframe ? "K" : ".");
    149       fflush(stdout);
    150     }
    151   }
    152 }
    153 
    154 int main(int argc, char **argv) {
    155   FILE *infile = NULL;
    156   vpx_codec_ctx_t codec = {0};
    157   vpx_codec_enc_cfg_t cfg = {0};
    158   int frame_count = 0;
    159   vpx_image_t raw = {0};
    160   vpx_codec_err_t res;
    161   VpxVideoInfo info = {0};
    162   VpxVideoWriter *writer = NULL;
    163   const VpxInterface *encoder = NULL;
    164   const int fps = 2;        // TODO(dkovalev) add command line argument
    165   const double bits_per_pixel_per_frame = 0.067;
    166 
    167   exec_name = argv[0];
    168 
    169   if (argc != 6)
    170     die("Invalid number of arguments");
    171 
    172   encoder = get_vpx_encoder_by_name(argv[1]);
    173   if (!encoder)
    174     die("Unsupported codec.");
    175 
    176   info.codec_fourcc = encoder->fourcc;
    177   info.frame_width = strtol(argv[2], NULL, 0);
    178   info.frame_height = strtol(argv[3], NULL, 0);
    179   info.time_base.numerator = 1;
    180   info.time_base.denominator = fps;
    181 
    182   if (info.frame_width <= 0 ||
    183       info.frame_height <= 0 ||
    184       (info.frame_width % 2) != 0 ||
    185       (info.frame_height % 2) != 0) {
    186     die("Invalid frame size: %dx%d", info.frame_width, info.frame_height);
    187   }
    188 
    189   if (!vpx_img_alloc(&raw, VPX_IMG_FMT_I420, info.frame_width,
    190                                              info.frame_height, 1)) {
    191     die("Failed to allocate image.");
    192   }
    193 
    194   printf("Using %s\n", vpx_codec_iface_name(encoder->interface()));
    195 
    196   res = vpx_codec_enc_config_default(encoder->interface(), &cfg, 0);
    197   if (res)
    198     die_codec(&codec, "Failed to get default codec config.");
    199 
    200   cfg.g_w = info.frame_width;
    201   cfg.g_h = info.frame_height;
    202   cfg.g_timebase.num = info.time_base.numerator;
    203   cfg.g_timebase.den = info.time_base.denominator;
    204   cfg.rc_target_bitrate = (unsigned int)(bits_per_pixel_per_frame * cfg.g_w *
    205                                          cfg.g_h * fps / 1000);
    206   cfg.g_lag_in_frames = 0;
    207 
    208   writer = vpx_video_writer_open(argv[5], kContainerIVF, &info);
    209   if (!writer)
    210     die("Failed to open %s for writing.", argv[5]);
    211 
    212   if (!(infile = fopen(argv[4], "rb")))
    213     die("Failed to open %s for reading.", argv[4]);
    214 
    215   if (vpx_codec_enc_init(&codec, encoder->interface(), &cfg, 0))
    216     die_codec(&codec, "Failed to initialize encoder");
    217 
    218   while (vpx_img_read(&raw, infile)) {
    219     ++frame_count;
    220 
    221     if (frame_count == 22 && encoder->fourcc == VP8_FOURCC) {
    222       set_roi_map(&cfg, &codec);
    223     } else if (frame_count == 33) {
    224       set_active_map(&cfg, &codec);
    225     } else if (frame_count == 44) {
    226       unset_active_map(&cfg, &codec);
    227     }
    228 
    229     encode_frame(&codec, &raw, frame_count, writer);
    230   }
    231   encode_frame(&codec, NULL, -1, writer);
    232   printf("\n");
    233   fclose(infile);
    234   printf("Processed %d frames.\n", frame_count);
    235 
    236   vpx_img_free(&raw);
    237   if (vpx_codec_destroy(&codec))
    238     die_codec(&codec, "Failed to destroy codec.");
    239 
    240   vpx_video_writer_close(writer);
    241 
    242   return EXIT_SUCCESS;
    243 }
    244