Home | History | Annotate | Download | only in jpeg
      1 /*
      2  * jddctmgr.c
      3  *
      4  * Copyright (C) 1994-1996, Thomas G. Lane.
      5  * This file is part of the Independent JPEG Group's software.
      6  * For conditions of distribution and use, see the accompanying README file.
      7  *
      8  * This file contains the inverse-DCT management logic.
      9  * This code selects a particular IDCT implementation to be used,
     10  * and it performs related housekeeping chores.  No code in this file
     11  * is executed per IDCT step, only during output pass setup.
     12  *
     13  * Note that the IDCT routines are responsible for performing coefficient
     14  * dequantization as well as the IDCT proper.  This module sets up the
     15  * dequantization multiplier table needed by the IDCT routine.
     16  */
     17 
     18 #define JPEG_INTERNALS
     19 #include "jinclude.h"
     20 #include "jpeglib.h"
     21 #include "jdct.h"		/* Private declarations for DCT subsystem */
     22 
     23 #ifdef ANDROID_ARMV6_IDCT
     24   #undef ANDROID_ARMV6_IDCT
     25   #ifdef __arm__
     26     #include <machine/cpu-features.h>
     27     #if __ARM_ARCH__ >= 6
     28       #define ANDROID_ARMV6_IDCT
     29     #else
     30       #warning "ANDROID_ARMV6_IDCT is disabled"
     31     #endif
     32   #endif
     33 #endif
     34 
     35 #ifdef NV_ARM_NEON
     36 #include "jsimd_neon.h"
     37 #endif
     38 
     39 #ifdef ANDROID_ARMV6_IDCT
     40 
     41 /* Intentionally declare the prototype with arguments of primitive types instead
     42  * of type-defined ones. This will at least generate some warnings if jmorecfg.h
     43  * is changed and becomes incompatible with the assembly code.
     44  */
     45 extern void armv6_idct(short *coefs, int *quans, unsigned char **rows, int col);
     46 
     47 void jpeg_idct_armv6 (j_decompress_ptr cinfo, jpeg_component_info * compptr,
     48 		 JCOEFPTR coef_block,
     49 		 JSAMPARRAY output_buf, JDIMENSION output_col)
     50 {
     51   IFAST_MULT_TYPE *dct_table = (IFAST_MULT_TYPE *)compptr->dct_table;
     52   armv6_idct(coef_block, dct_table, output_buf, output_col);
     53 }
     54 
     55 #endif
     56 
     57 #ifdef ANDROID_INTELSSE2_IDCT
     58 extern short __attribute__((aligned(16))) quantptrSSE[DCTSIZE2];
     59 extern void jpeg_idct_intelsse (j_decompress_ptr cinfo, jpeg_component_info * compptr,
     60 		JCOEFPTR coef_block,
     61 		JSAMPARRAY output_buf, JDIMENSION output_col);
     62 #endif
     63 
     64 #ifdef ANDROID_MIPS_IDCT
     65 extern void jpeg_idct_mips(j_decompress_ptr, jpeg_component_info *, JCOEFPTR, JSAMPARRAY, JDIMENSION);
     66 #endif
     67 
     68 /*
     69  * The decompressor input side (jdinput.c) saves away the appropriate
     70  * quantization table for each component at the start of the first scan
     71  * involving that component.  (This is necessary in order to correctly
     72  * decode files that reuse Q-table slots.)
     73  * When we are ready to make an output pass, the saved Q-table is converted
     74  * to a multiplier table that will actually be used by the IDCT routine.
     75  * The multiplier table contents are IDCT-method-dependent.  To support
     76  * application changes in IDCT method between scans, we can remake the
     77  * multiplier tables if necessary.
     78  * In buffered-image mode, the first output pass may occur before any data
     79  * has been seen for some components, and thus before their Q-tables have
     80  * been saved away.  To handle this case, multiplier tables are preset
     81  * to zeroes; the result of the IDCT will be a neutral gray level.
     82  */
     83 
     84 
     85 /* Private subobject for this module */
     86 
     87 typedef struct {
     88   struct jpeg_inverse_dct pub;	/* public fields */
     89 
     90   /* This array contains the IDCT method code that each multiplier table
     91    * is currently set up for, or -1 if it's not yet set up.
     92    * The actual multiplier tables are pointed to by dct_table in the
     93    * per-component comp_info structures.
     94    */
     95   int cur_method[MAX_COMPONENTS];
     96 } my_idct_controller;
     97 
     98 typedef my_idct_controller * my_idct_ptr;
     99 
    100 
    101 /* Allocated multiplier tables: big enough for any supported variant */
    102 
    103 typedef union {
    104   ISLOW_MULT_TYPE islow_array[DCTSIZE2];
    105 #ifdef DCT_IFAST_SUPPORTED
    106   IFAST_MULT_TYPE ifast_array[DCTSIZE2];
    107 #endif
    108 #ifdef DCT_FLOAT_SUPPORTED
    109   FLOAT_MULT_TYPE float_array[DCTSIZE2];
    110 #endif
    111 } multiplier_table;
    112 
    113 
    114 /* The current scaled-IDCT routines require ISLOW-style multiplier tables,
    115  * so be sure to compile that code if either ISLOW or SCALING is requested.
    116  */
    117 #ifdef DCT_ISLOW_SUPPORTED
    118 #define PROVIDE_ISLOW_TABLES
    119 #else
    120 #ifdef IDCT_SCALING_SUPPORTED
    121 #define PROVIDE_ISLOW_TABLES
    122 #endif
    123 #endif
    124 
    125 
    126 /*
    127  * Prepare for an output pass.
    128  * Here we select the proper IDCT routine for each component and build
    129  * a matching multiplier table.
    130  */
    131 
    132 METHODDEF(void)
    133 start_pass (j_decompress_ptr cinfo)
    134 {
    135   my_idct_ptr idct = (my_idct_ptr) cinfo->idct;
    136   int ci, i;
    137   jpeg_component_info *compptr;
    138   int method = 0;
    139   inverse_DCT_method_ptr method_ptr = NULL;
    140   JQUANT_TBL * qtbl;
    141 
    142   for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
    143        ci++, compptr++) {
    144     /* Select the proper IDCT routine for this component's scaling */
    145     switch (compptr->DCT_scaled_size) {
    146 #ifdef IDCT_SCALING_SUPPORTED
    147     case 1:
    148       method_ptr = jpeg_idct_1x1;
    149       method = JDCT_ISLOW;	/* jidctred uses islow-style table */
    150       break;
    151     case 2:
    152 #if defined(NV_ARM_NEON) && defined(__ARM_HAVE_NEON)
    153       if (cap_neon_idct_2x2()) {
    154         method_ptr = jsimd_idct_2x2;
    155       } else {
    156         method_ptr = jpeg_idct_2x2;
    157       }
    158 #else
    159       method_ptr = jpeg_idct_2x2;
    160 #endif
    161       method = JDCT_ISLOW;	/* jidctred uses islow-style table */
    162       break;
    163     case 4:
    164 #if defined(NV_ARM_NEON) && defined(__ARM_HAVE_NEON)
    165 	  if (cap_neon_idct_4x4()) {
    166         method_ptr = jsimd_idct_4x4;
    167       } else {
    168         method_ptr = jpeg_idct_4x4;
    169       }
    170 #else
    171       method_ptr = jpeg_idct_4x4;
    172 #endif
    173       method = JDCT_ISLOW;	/* jidctred uses islow-style table */
    174       break;
    175 #endif
    176     case DCTSIZE:
    177       switch (cinfo->dct_method) {
    178 #ifdef ANDROID_ARMV6_IDCT
    179       case JDCT_ISLOW:
    180       case JDCT_IFAST:
    181 	method_ptr = jpeg_idct_armv6;
    182 	method = JDCT_IFAST;
    183 	break;
    184 #else /* ANDROID_ARMV6_IDCT */
    185 #ifdef ANDROID_INTELSSE2_IDCT
    186       case JDCT_ISLOW:
    187       case JDCT_IFAST:
    188 	method_ptr = jpeg_idct_intelsse;
    189 	method = JDCT_ISLOW; /* Use quant table of ISLOW.*/
    190 	break;
    191 #else /* ANDROID_INTELSSE2_IDCT */
    192 #ifdef ANDROID_MIPS_IDCT
    193       case JDCT_ISLOW:
    194       case JDCT_IFAST:
    195 	method_ptr = jpeg_idct_mips;
    196 	method = JDCT_IFAST;
    197 	break;
    198 #else /* ANDROID_MIPS_IDCT */
    199 #ifdef DCT_ISLOW_SUPPORTED
    200       case JDCT_ISLOW:
    201 	method_ptr = jpeg_idct_islow;
    202 	method = JDCT_ISLOW;
    203 	break;
    204 #endif
    205 #ifdef DCT_IFAST_SUPPORTED
    206       case JDCT_IFAST:
    207 #if defined(NV_ARM_NEON) && defined(__ARM_HAVE_NEON)
    208         if (cap_neon_idct_ifast()) {
    209           method_ptr = jsimd_idct_ifast;
    210         } else {
    211           method_ptr = jpeg_idct_ifast;
    212         }
    213 #else
    214         method_ptr = jpeg_idct_ifast;
    215 #endif
    216 	method = JDCT_IFAST;
    217 	break;
    218 #endif
    219 #endif /* ANDROID_MIPS_IDCT */
    220 #endif /* ANDROID_INTELSSE2_IDCT*/
    221 #endif /* ANDROID_ARMV6_IDCT */
    222 #ifdef DCT_FLOAT_SUPPORTED
    223       case JDCT_FLOAT:
    224 	method_ptr = jpeg_idct_float;
    225 	method = JDCT_FLOAT;
    226 	break;
    227 #endif
    228       default:
    229 	ERREXIT(cinfo, JERR_NOT_COMPILED);
    230 	break;
    231       }
    232       break;
    233     default:
    234       ERREXIT1(cinfo, JERR_BAD_DCTSIZE, compptr->DCT_scaled_size);
    235       break;
    236     }
    237     idct->pub.inverse_DCT[ci] = method_ptr;
    238     /* Create multiplier table from quant table.
    239      * However, we can skip this if the component is uninteresting
    240      * or if we already built the table.  Also, if no quant table
    241      * has yet been saved for the component, we leave the
    242      * multiplier table all-zero; we'll be reading zeroes from the
    243      * coefficient controller's buffer anyway.
    244      */
    245     if (! compptr->component_needed || idct->cur_method[ci] == method)
    246       continue;
    247     qtbl = compptr->quant_table;
    248     if (qtbl == NULL)		/* happens if no data yet for component */
    249       continue;
    250     idct->cur_method[ci] = method;
    251     switch (method) {
    252 #ifdef PROVIDE_ISLOW_TABLES
    253     case JDCT_ISLOW:
    254       {
    255 	/* For LL&M IDCT method, multipliers are equal to raw quantization
    256 	 * coefficients, but are stored as ints to ensure access efficiency.
    257 	 */
    258 	ISLOW_MULT_TYPE * ismtbl = (ISLOW_MULT_TYPE *) compptr->dct_table;
    259 	for (i = 0; i < DCTSIZE2; i++) {
    260 	  ismtbl[i] = (ISLOW_MULT_TYPE) qtbl->quantval[i];
    261 	}
    262       }
    263       break;
    264 #endif
    265 #ifdef DCT_IFAST_SUPPORTED
    266     case JDCT_IFAST:
    267       {
    268 	/* For AA&N IDCT method, multipliers are equal to quantization
    269 	 * coefficients scaled by scalefactor[row]*scalefactor[col], where
    270 	 *   scalefactor[0] = 1
    271 	 *   scalefactor[k] = cos(k*PI/16) * sqrt(2)    for k=1..7
    272 	 * For integer operation, the multiplier table is to be scaled by
    273 	 * IFAST_SCALE_BITS.
    274 	 */
    275 	IFAST_MULT_TYPE * ifmtbl = (IFAST_MULT_TYPE *) compptr->dct_table;
    276 #ifdef ANDROID_ARMV6_IDCT
    277 	/* Precomputed values scaled up by 15 bits. */
    278 	static const unsigned short scales[DCTSIZE2] = {
    279 	  32768, 45451, 42813, 38531, 32768, 25746, 17734,  9041,
    280 	  45451, 63042, 59384, 53444, 45451, 35710, 24598, 12540,
    281 	  42813, 59384, 55938, 50343, 42813, 33638, 23170, 11812,
    282 	  38531, 53444, 50343, 45308, 38531, 30274, 20853, 10631,
    283 	  32768, 45451, 42813, 38531, 32768, 25746, 17734,  9041,
    284 	  25746, 35710, 33638, 30274, 25746, 20228, 13933,  7103,
    285 	  17734, 24598, 23170, 20853, 17734, 13933,  9598,  4893,
    286 	   9041, 12540, 11812, 10631,  9041,  7103,  4893,  2494,
    287 	};
    288 	/* Inverse map of [7, 5, 1, 3, 0, 2, 4, 6]. */
    289 	static const char orders[DCTSIZE] = {4, 2, 5, 3, 6, 1, 7, 0};
    290 	/* Reorder the columns after transposing. */
    291 	for (i = 0; i < DCTSIZE2; ++i) {
    292 	  int j = ((i & 7) << 3) + orders[i >> 3];
    293 	  ifmtbl[j] = (qtbl->quantval[i] * scales[i] + 2) >> 2;
    294 	}
    295 #else /* ANDROID_ARMV6_IDCT */
    296 
    297 #define CONST_BITS 14
    298 	static const INT16 aanscales[DCTSIZE2] = {
    299 	  /* precomputed values scaled up by 14 bits */
    300 	  16384, 22725, 21407, 19266, 16384, 12873,  8867,  4520,
    301 	  22725, 31521, 29692, 26722, 22725, 17855, 12299,  6270,
    302 	  21407, 29692, 27969, 25172, 21407, 16819, 11585,  5906,
    303 	  19266, 26722, 25172, 22654, 19266, 15137, 10426,  5315,
    304 	  16384, 22725, 21407, 19266, 16384, 12873,  8867,  4520,
    305 	  12873, 17855, 16819, 15137, 12873, 10114,  6967,  3552,
    306 	   8867, 12299, 11585, 10426,  8867,  6967,  4799,  2446,
    307 	   4520,  6270,  5906,  5315,  4520,  3552,  2446,  1247
    308 	};
    309 	SHIFT_TEMPS
    310 
    311 	for (i = 0; i < DCTSIZE2; i++) {
    312 	  ifmtbl[i] = (IFAST_MULT_TYPE)
    313 	    DESCALE(MULTIPLY16V16((INT32) qtbl->quantval[i],
    314 				  (INT32) aanscales[i]),
    315 		    CONST_BITS-IFAST_SCALE_BITS);
    316 	}
    317 #endif /* ANDROID_ARMV6_IDCT */
    318       }
    319       break;
    320 #endif
    321 #ifdef DCT_FLOAT_SUPPORTED
    322     case JDCT_FLOAT:
    323       {
    324 	/* For float AA&N IDCT method, multipliers are equal to quantization
    325 	 * coefficients scaled by scalefactor[row]*scalefactor[col], where
    326 	 *   scalefactor[0] = 1
    327 	 *   scalefactor[k] = cos(k*PI/16) * sqrt(2)    for k=1..7
    328 	 */
    329 	FLOAT_MULT_TYPE * fmtbl = (FLOAT_MULT_TYPE *) compptr->dct_table;
    330 	int row, col;
    331 	static const double aanscalefactor[DCTSIZE] = {
    332 	  1.0, 1.387039845, 1.306562965, 1.175875602,
    333 	  1.0, 0.785694958, 0.541196100, 0.275899379
    334 	};
    335 
    336 	i = 0;
    337 	for (row = 0; row < DCTSIZE; row++) {
    338 	  for (col = 0; col < DCTSIZE; col++) {
    339 	    fmtbl[i] = (FLOAT_MULT_TYPE)
    340 	      ((double) qtbl->quantval[i] *
    341 	       aanscalefactor[row] * aanscalefactor[col]);
    342 	    i++;
    343 	  }
    344 	}
    345       }
    346       break;
    347 #endif
    348     default:
    349       ERREXIT(cinfo, JERR_NOT_COMPILED);
    350       break;
    351     }
    352   }
    353 }
    354 
    355 
    356 /*
    357  * Initialize IDCT manager.
    358  */
    359 
    360 GLOBAL(void)
    361 jinit_inverse_dct (j_decompress_ptr cinfo)
    362 {
    363   my_idct_ptr idct;
    364   int ci;
    365   jpeg_component_info *compptr;
    366 
    367   idct = (my_idct_ptr)
    368     (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
    369 				SIZEOF(my_idct_controller));
    370   cinfo->idct = (struct jpeg_inverse_dct *) idct;
    371   idct->pub.start_pass = start_pass;
    372 
    373   for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
    374        ci++, compptr++) {
    375     /* Allocate and pre-zero a multiplier table for each component */
    376     compptr->dct_table =
    377       (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE,
    378 				  SIZEOF(multiplier_table));
    379     MEMZERO(compptr->dct_table, SIZEOF(multiplier_table));
    380     /* Mark multiplier table not yet set up for any method */
    381     idct->cur_method[ci] = -1;
    382   }
    383 }
    384