Home | History | Annotate | Download | only in libjpeg-turbo
      1 /*
      2  * jdmainct.c
      3  *
      4  * This file was part of the Independent JPEG Group's software:
      5  * Copyright (C) 1994-1996, Thomas G. Lane.
      6  * libjpeg-turbo Modifications:
      7  * Copyright (C) 2010, 2016, D. R. Commander.
      8  * For conditions of distribution and use, see the accompanying README.ijg
      9  * file.
     10  *
     11  * This file contains the main buffer controller for decompression.
     12  * The main buffer lies between the JPEG decompressor proper and the
     13  * post-processor; it holds downsampled data in the JPEG colorspace.
     14  *
     15  * Note that this code is bypassed in raw-data mode, since the application
     16  * supplies the equivalent of the main buffer in that case.
     17  */
     18 
     19 #include "jinclude.h"
     20 #include "jdmainct.h"
     21 
     22 
     23 /*
     24  * In the current system design, the main buffer need never be a full-image
     25  * buffer; any full-height buffers will be found inside the coefficient or
     26  * postprocessing controllers.  Nonetheless, the main controller is not
     27  * trivial.  Its responsibility is to provide context rows for upsampling/
     28  * rescaling, and doing this in an efficient fashion is a bit tricky.
     29  *
     30  * Postprocessor input data is counted in "row groups".  A row group
     31  * is defined to be (v_samp_factor * DCT_scaled_size / min_DCT_scaled_size)
     32  * sample rows of each component.  (We require DCT_scaled_size values to be
     33  * chosen such that these numbers are integers.  In practice DCT_scaled_size
     34  * values will likely be powers of two, so we actually have the stronger
     35  * condition that DCT_scaled_size / min_DCT_scaled_size is an integer.)
     36  * Upsampling will typically produce max_v_samp_factor pixel rows from each
     37  * row group (times any additional scale factor that the upsampler is
     38  * applying).
     39  *
     40  * The coefficient controller will deliver data to us one iMCU row at a time;
     41  * each iMCU row contains v_samp_factor * DCT_scaled_size sample rows, or
     42  * exactly min_DCT_scaled_size row groups.  (This amount of data corresponds
     43  * to one row of MCUs when the image is fully interleaved.)  Note that the
     44  * number of sample rows varies across components, but the number of row
     45  * groups does not.  Some garbage sample rows may be included in the last iMCU
     46  * row at the bottom of the image.
     47  *
     48  * Depending on the vertical scaling algorithm used, the upsampler may need
     49  * access to the sample row(s) above and below its current input row group.
     50  * The upsampler is required to set need_context_rows TRUE at global selection
     51  * time if so.  When need_context_rows is FALSE, this controller can simply
     52  * obtain one iMCU row at a time from the coefficient controller and dole it
     53  * out as row groups to the postprocessor.
     54  *
     55  * When need_context_rows is TRUE, this controller guarantees that the buffer
     56  * passed to postprocessing contains at least one row group's worth of samples
     57  * above and below the row group(s) being processed.  Note that the context
     58  * rows "above" the first passed row group appear at negative row offsets in
     59  * the passed buffer.  At the top and bottom of the image, the required
     60  * context rows are manufactured by duplicating the first or last real sample
     61  * row; this avoids having special cases in the upsampling inner loops.
     62  *
     63  * The amount of context is fixed at one row group just because that's a
     64  * convenient number for this controller to work with.  The existing
     65  * upsamplers really only need one sample row of context.  An upsampler
     66  * supporting arbitrary output rescaling might wish for more than one row
     67  * group of context when shrinking the image; tough, we don't handle that.
     68  * (This is justified by the assumption that downsizing will be handled mostly
     69  * by adjusting the DCT_scaled_size values, so that the actual scale factor at
     70  * the upsample step needn't be much less than one.)
     71  *
     72  * To provide the desired context, we have to retain the last two row groups
     73  * of one iMCU row while reading in the next iMCU row.  (The last row group
     74  * can't be processed until we have another row group for its below-context,
     75  * and so we have to save the next-to-last group too for its above-context.)
     76  * We could do this most simply by copying data around in our buffer, but
     77  * that'd be very slow.  We can avoid copying any data by creating a rather
     78  * strange pointer structure.  Here's how it works.  We allocate a workspace
     79  * consisting of M+2 row groups (where M = min_DCT_scaled_size is the number
     80  * of row groups per iMCU row).  We create two sets of redundant pointers to
     81  * the workspace.  Labeling the physical row groups 0 to M+1, the synthesized
     82  * pointer lists look like this:
     83  *                   M+1                          M-1
     84  * master pointer --> 0         master pointer --> 0
     85  *                    1                            1
     86  *                   ...                          ...
     87  *                   M-3                          M-3
     88  *                   M-2                           M
     89  *                   M-1                          M+1
     90  *                    M                           M-2
     91  *                   M+1                          M-1
     92  *                    0                            0
     93  * We read alternate iMCU rows using each master pointer; thus the last two
     94  * row groups of the previous iMCU row remain un-overwritten in the workspace.
     95  * The pointer lists are set up so that the required context rows appear to
     96  * be adjacent to the proper places when we pass the pointer lists to the
     97  * upsampler.
     98  *
     99  * The above pictures describe the normal state of the pointer lists.
    100  * At top and bottom of the image, we diddle the pointer lists to duplicate
    101  * the first or last sample row as necessary (this is cheaper than copying
    102  * sample rows around).
    103  *
    104  * This scheme breaks down if M < 2, ie, min_DCT_scaled_size is 1.  In that
    105  * situation each iMCU row provides only one row group so the buffering logic
    106  * must be different (eg, we must read two iMCU rows before we can emit the
    107  * first row group).  For now, we simply do not support providing context
    108  * rows when min_DCT_scaled_size is 1.  That combination seems unlikely to
    109  * be worth providing --- if someone wants a 1/8th-size preview, they probably
    110  * want it quick and dirty, so a context-free upsampler is sufficient.
    111  */
    112 
    113 
    114 /* Forward declarations */
    115 METHODDEF(void) process_data_simple_main(j_decompress_ptr cinfo,
    116                                          JSAMPARRAY output_buf,
    117                                          JDIMENSION *out_row_ctr,
    118                                          JDIMENSION out_rows_avail);
    119 METHODDEF(void) process_data_context_main(j_decompress_ptr cinfo,
    120                                           JSAMPARRAY output_buf,
    121                                           JDIMENSION *out_row_ctr,
    122                                           JDIMENSION out_rows_avail);
    123 #ifdef QUANT_2PASS_SUPPORTED
    124 METHODDEF(void) process_data_crank_post(j_decompress_ptr cinfo,
    125                                         JSAMPARRAY output_buf,
    126                                         JDIMENSION *out_row_ctr,
    127                                         JDIMENSION out_rows_avail);
    128 #endif
    129 
    130 
    131 LOCAL(void)
    132 alloc_funny_pointers(j_decompress_ptr cinfo)
    133 /* Allocate space for the funny pointer lists.
    134  * This is done only once, not once per pass.
    135  */
    136 {
    137   my_main_ptr main_ptr = (my_main_ptr)cinfo->main;
    138   int ci, rgroup;
    139   int M = cinfo->_min_DCT_scaled_size;
    140   jpeg_component_info *compptr;
    141   JSAMPARRAY xbuf;
    142 
    143   /* Get top-level space for component array pointers.
    144    * We alloc both arrays with one call to save a few cycles.
    145    */
    146   main_ptr->xbuffer[0] = (JSAMPIMAGE)
    147     (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
    148                                 cinfo->num_components * 2 * sizeof(JSAMPARRAY));
    149   main_ptr->xbuffer[1] = main_ptr->xbuffer[0] + cinfo->num_components;
    150 
    151   for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
    152        ci++, compptr++) {
    153     rgroup = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
    154       cinfo->_min_DCT_scaled_size; /* height of a row group of component */
    155     /* Get space for pointer lists --- M+4 row groups in each list.
    156      * We alloc both pointer lists with one call to save a few cycles.
    157      */
    158     xbuf = (JSAMPARRAY)
    159       (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
    160                                   2 * (rgroup * (M + 4)) * sizeof(JSAMPROW));
    161     xbuf += rgroup;             /* want one row group at negative offsets */
    162     main_ptr->xbuffer[0][ci] = xbuf;
    163     xbuf += rgroup * (M + 4);
    164     main_ptr->xbuffer[1][ci] = xbuf;
    165   }
    166 }
    167 
    168 
    169 LOCAL(void)
    170 make_funny_pointers(j_decompress_ptr cinfo)
    171 /* Create the funny pointer lists discussed in the comments above.
    172  * The actual workspace is already allocated (in main_ptr->buffer),
    173  * and the space for the pointer lists is allocated too.
    174  * This routine just fills in the curiously ordered lists.
    175  * This will be repeated at the beginning of each pass.
    176  */
    177 {
    178   my_main_ptr main_ptr = (my_main_ptr)cinfo->main;
    179   int ci, i, rgroup;
    180   int M = cinfo->_min_DCT_scaled_size;
    181   jpeg_component_info *compptr;
    182   JSAMPARRAY buf, xbuf0, xbuf1;
    183 
    184   for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
    185        ci++, compptr++) {
    186     rgroup = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
    187       cinfo->_min_DCT_scaled_size; /* height of a row group of component */
    188     xbuf0 = main_ptr->xbuffer[0][ci];
    189     xbuf1 = main_ptr->xbuffer[1][ci];
    190     /* First copy the workspace pointers as-is */
    191     buf = main_ptr->buffer[ci];
    192     for (i = 0; i < rgroup * (M + 2); i++) {
    193       xbuf0[i] = xbuf1[i] = buf[i];
    194     }
    195     /* In the second list, put the last four row groups in swapped order */
    196     for (i = 0; i < rgroup * 2; i++) {
    197       xbuf1[rgroup * (M - 2) + i] = buf[rgroup * M + i];
    198       xbuf1[rgroup * M + i] = buf[rgroup * (M - 2) + i];
    199     }
    200     /* The wraparound pointers at top and bottom will be filled later
    201      * (see set_wraparound_pointers, below).  Initially we want the "above"
    202      * pointers to duplicate the first actual data line.  This only needs
    203      * to happen in xbuffer[0].
    204      */
    205     for (i = 0; i < rgroup; i++) {
    206       xbuf0[i - rgroup] = xbuf0[0];
    207     }
    208   }
    209 }
    210 
    211 
    212 LOCAL(void)
    213 set_bottom_pointers(j_decompress_ptr cinfo)
    214 /* Change the pointer lists to duplicate the last sample row at the bottom
    215  * of the image.  whichptr indicates which xbuffer holds the final iMCU row.
    216  * Also sets rowgroups_avail to indicate number of nondummy row groups in row.
    217  */
    218 {
    219   my_main_ptr main_ptr = (my_main_ptr)cinfo->main;
    220   int ci, i, rgroup, iMCUheight, rows_left;
    221   jpeg_component_info *compptr;
    222   JSAMPARRAY xbuf;
    223 
    224   for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
    225        ci++, compptr++) {
    226     /* Count sample rows in one iMCU row and in one row group */
    227     iMCUheight = compptr->v_samp_factor * compptr->_DCT_scaled_size;
    228     rgroup = iMCUheight / cinfo->_min_DCT_scaled_size;
    229     /* Count nondummy sample rows remaining for this component */
    230     rows_left = (int)(compptr->downsampled_height % (JDIMENSION)iMCUheight);
    231     if (rows_left == 0) rows_left = iMCUheight;
    232     /* Count nondummy row groups.  Should get same answer for each component,
    233      * so we need only do it once.
    234      */
    235     if (ci == 0) {
    236       main_ptr->rowgroups_avail = (JDIMENSION)((rows_left - 1) / rgroup + 1);
    237     }
    238     /* Duplicate the last real sample row rgroup*2 times; this pads out the
    239      * last partial rowgroup and ensures at least one full rowgroup of context.
    240      */
    241     xbuf = main_ptr->xbuffer[main_ptr->whichptr][ci];
    242     for (i = 0; i < rgroup * 2; i++) {
    243       xbuf[rows_left + i] = xbuf[rows_left - 1];
    244     }
    245   }
    246 }
    247 
    248 
    249 /*
    250  * Initialize for a processing pass.
    251  */
    252 
    253 METHODDEF(void)
    254 start_pass_main(j_decompress_ptr cinfo, J_BUF_MODE pass_mode)
    255 {
    256   my_main_ptr main_ptr = (my_main_ptr)cinfo->main;
    257 
    258   switch (pass_mode) {
    259   case JBUF_PASS_THRU:
    260     if (cinfo->upsample->need_context_rows) {
    261       main_ptr->pub.process_data = process_data_context_main;
    262       make_funny_pointers(cinfo); /* Create the xbuffer[] lists */
    263       main_ptr->whichptr = 0;   /* Read first iMCU row into xbuffer[0] */
    264       main_ptr->context_state = CTX_PREPARE_FOR_IMCU;
    265       main_ptr->iMCU_row_ctr = 0;
    266     } else {
    267       /* Simple case with no context needed */
    268       main_ptr->pub.process_data = process_data_simple_main;
    269     }
    270     main_ptr->buffer_full = FALSE;      /* Mark buffer empty */
    271     main_ptr->rowgroup_ctr = 0;
    272     break;
    273 #ifdef QUANT_2PASS_SUPPORTED
    274   case JBUF_CRANK_DEST:
    275     /* For last pass of 2-pass quantization, just crank the postprocessor */
    276     main_ptr->pub.process_data = process_data_crank_post;
    277     break;
    278 #endif
    279   default:
    280     ERREXIT(cinfo, JERR_BAD_BUFFER_MODE);
    281     break;
    282   }
    283 }
    284 
    285 
    286 /*
    287  * Process some data.
    288  * This handles the simple case where no context is required.
    289  */
    290 
    291 METHODDEF(void)
    292 process_data_simple_main(j_decompress_ptr cinfo, JSAMPARRAY output_buf,
    293                          JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail)
    294 {
    295   my_main_ptr main_ptr = (my_main_ptr)cinfo->main;
    296   JDIMENSION rowgroups_avail;
    297 
    298   /* Read input data if we haven't filled the main buffer yet */
    299   if (!main_ptr->buffer_full) {
    300     if (!(*cinfo->coef->decompress_data) (cinfo, main_ptr->buffer))
    301       return;                   /* suspension forced, can do nothing more */
    302     main_ptr->buffer_full = TRUE;       /* OK, we have an iMCU row to work with */
    303   }
    304 
    305   /* There are always min_DCT_scaled_size row groups in an iMCU row. */
    306   rowgroups_avail = (JDIMENSION)cinfo->_min_DCT_scaled_size;
    307   /* Note: at the bottom of the image, we may pass extra garbage row groups
    308    * to the postprocessor.  The postprocessor has to check for bottom
    309    * of image anyway (at row resolution), so no point in us doing it too.
    310    */
    311 
    312   /* Feed the postprocessor */
    313   (*cinfo->post->post_process_data) (cinfo, main_ptr->buffer,
    314                                      &main_ptr->rowgroup_ctr, rowgroups_avail,
    315                                      output_buf, out_row_ctr, out_rows_avail);
    316 
    317   /* Has postprocessor consumed all the data yet? If so, mark buffer empty */
    318   if (main_ptr->rowgroup_ctr >= rowgroups_avail) {
    319     main_ptr->buffer_full = FALSE;
    320     main_ptr->rowgroup_ctr = 0;
    321   }
    322 }
    323 
    324 
    325 /*
    326  * Process some data.
    327  * This handles the case where context rows must be provided.
    328  */
    329 
    330 METHODDEF(void)
    331 process_data_context_main(j_decompress_ptr cinfo, JSAMPARRAY output_buf,
    332                           JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail)
    333 {
    334   my_main_ptr main_ptr = (my_main_ptr)cinfo->main;
    335 
    336   /* Read input data if we haven't filled the main buffer yet */
    337   if (!main_ptr->buffer_full) {
    338     if (!(*cinfo->coef->decompress_data) (cinfo,
    339                                           main_ptr->xbuffer[main_ptr->whichptr]))
    340       return;                   /* suspension forced, can do nothing more */
    341     main_ptr->buffer_full = TRUE;       /* OK, we have an iMCU row to work with */
    342     main_ptr->iMCU_row_ctr++;   /* count rows received */
    343   }
    344 
    345   /* Postprocessor typically will not swallow all the input data it is handed
    346    * in one call (due to filling the output buffer first).  Must be prepared
    347    * to exit and restart.  This switch lets us keep track of how far we got.
    348    * Note that each case falls through to the next on successful completion.
    349    */
    350   switch (main_ptr->context_state) {
    351   case CTX_POSTPONED_ROW:
    352     /* Call postprocessor using previously set pointers for postponed row */
    353     (*cinfo->post->post_process_data) (cinfo,
    354                                        main_ptr->xbuffer[main_ptr->whichptr],
    355                                        &main_ptr->rowgroup_ctr,
    356                                        main_ptr->rowgroups_avail, output_buf,
    357                                        out_row_ctr, out_rows_avail);
    358     if (main_ptr->rowgroup_ctr < main_ptr->rowgroups_avail)
    359       return;                   /* Need to suspend */
    360     main_ptr->context_state = CTX_PREPARE_FOR_IMCU;
    361     if (*out_row_ctr >= out_rows_avail)
    362       return;                   /* Postprocessor exactly filled output buf */
    363     /*FALLTHROUGH*/
    364   case CTX_PREPARE_FOR_IMCU:
    365     /* Prepare to process first M-1 row groups of this iMCU row */
    366     main_ptr->rowgroup_ctr = 0;
    367     main_ptr->rowgroups_avail = (JDIMENSION)(cinfo->_min_DCT_scaled_size - 1);
    368     /* Check for bottom of image: if so, tweak pointers to "duplicate"
    369      * the last sample row, and adjust rowgroups_avail to ignore padding rows.
    370      */
    371     if (main_ptr->iMCU_row_ctr == cinfo->total_iMCU_rows)
    372       set_bottom_pointers(cinfo);
    373     main_ptr->context_state = CTX_PROCESS_IMCU;
    374     /*FALLTHROUGH*/
    375   case CTX_PROCESS_IMCU:
    376     /* Call postprocessor using previously set pointers */
    377     (*cinfo->post->post_process_data) (cinfo,
    378                                        main_ptr->xbuffer[main_ptr->whichptr],
    379                                        &main_ptr->rowgroup_ctr,
    380                                        main_ptr->rowgroups_avail, output_buf,
    381                                        out_row_ctr, out_rows_avail);
    382     if (main_ptr->rowgroup_ctr < main_ptr->rowgroups_avail)
    383       return;                   /* Need to suspend */
    384     /* After the first iMCU, change wraparound pointers to normal state */
    385     if (main_ptr->iMCU_row_ctr == 1)
    386       set_wraparound_pointers(cinfo);
    387     /* Prepare to load new iMCU row using other xbuffer list */
    388     main_ptr->whichptr ^= 1;    /* 0=>1 or 1=>0 */
    389     main_ptr->buffer_full = FALSE;
    390     /* Still need to process last row group of this iMCU row, */
    391     /* which is saved at index M+1 of the other xbuffer */
    392     main_ptr->rowgroup_ctr = (JDIMENSION)(cinfo->_min_DCT_scaled_size + 1);
    393     main_ptr->rowgroups_avail = (JDIMENSION)(cinfo->_min_DCT_scaled_size + 2);
    394     main_ptr->context_state = CTX_POSTPONED_ROW;
    395   }
    396 }
    397 
    398 
    399 /*
    400  * Process some data.
    401  * Final pass of two-pass quantization: just call the postprocessor.
    402  * Source data will be the postprocessor controller's internal buffer.
    403  */
    404 
    405 #ifdef QUANT_2PASS_SUPPORTED
    406 
    407 METHODDEF(void)
    408 process_data_crank_post(j_decompress_ptr cinfo, JSAMPARRAY output_buf,
    409                         JDIMENSION *out_row_ctr, JDIMENSION out_rows_avail)
    410 {
    411   (*cinfo->post->post_process_data) (cinfo, (JSAMPIMAGE)NULL,
    412                                      (JDIMENSION *)NULL, (JDIMENSION)0,
    413                                      output_buf, out_row_ctr, out_rows_avail);
    414 }
    415 
    416 #endif /* QUANT_2PASS_SUPPORTED */
    417 
    418 
    419 /*
    420  * Initialize main buffer controller.
    421  */
    422 
    423 GLOBAL(void)
    424 jinit_d_main_controller(j_decompress_ptr cinfo, boolean need_full_buffer)
    425 {
    426   my_main_ptr main_ptr;
    427   int ci, rgroup, ngroups;
    428   jpeg_component_info *compptr;
    429 
    430   main_ptr = (my_main_ptr)
    431     (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
    432                                 sizeof(my_main_controller));
    433   cinfo->main = (struct jpeg_d_main_controller *)main_ptr;
    434   main_ptr->pub.start_pass = start_pass_main;
    435 
    436   if (need_full_buffer)         /* shouldn't happen */
    437     ERREXIT(cinfo, JERR_BAD_BUFFER_MODE);
    438 
    439   /* Allocate the workspace.
    440    * ngroups is the number of row groups we need.
    441    */
    442   if (cinfo->upsample->need_context_rows) {
    443     if (cinfo->_min_DCT_scaled_size < 2) /* unsupported, see comments above */
    444       ERREXIT(cinfo, JERR_NOTIMPL);
    445     alloc_funny_pointers(cinfo); /* Alloc space for xbuffer[] lists */
    446     ngroups = cinfo->_min_DCT_scaled_size + 2;
    447   } else {
    448     ngroups = cinfo->_min_DCT_scaled_size;
    449   }
    450 
    451   for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
    452        ci++, compptr++) {
    453     rgroup = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
    454       cinfo->_min_DCT_scaled_size; /* height of a row group of component */
    455     main_ptr->buffer[ci] = (*cinfo->mem->alloc_sarray)
    456                         ((j_common_ptr)cinfo, JPOOL_IMAGE,
    457                          compptr->width_in_blocks * compptr->_DCT_scaled_size,
    458                          (JDIMENSION)(rgroup * ngroups));
    459   }
    460 }
    461