1 /* 2 * jdsample.c 3 * 4 * This file was part of the Independent JPEG Group's software: 5 * Copyright (C) 1991-1996, Thomas G. Lane. 6 * libjpeg-turbo Modifications: 7 * Copyright 2009 Pierre Ossman <ossman (at) cendio.se> for Cendio AB 8 * Copyright (C) 2010, D. R. Commander. 9 * For conditions of distribution and use, see the accompanying README file. 10 * 11 * This file contains upsampling routines. 12 * 13 * Upsampling input data is counted in "row groups". A row group 14 * is defined to be (v_samp_factor * DCT_scaled_size / min_DCT_scaled_size) 15 * sample rows of each component. Upsampling will normally produce 16 * max_v_samp_factor pixel rows from each row group (but this could vary 17 * if the upsampler is applying a scale factor of its own). 18 * 19 * An excellent reference for image resampling is 20 * Digital Image Warping, George Wolberg, 1990. 21 * Pub. by IEEE Computer Society Press, Los Alamitos, CA. ISBN 0-8186-8944-7. 22 */ 23 24 #define JPEG_INTERNALS 25 #include "jinclude.h" 26 #include "jpeglib.h" 27 #include "jsimd.h" 28 #include "jpegcomp.h" 29 30 31 /* Pointer to routine to upsample a single component */ 32 typedef JMETHOD(void, upsample1_ptr, 33 (j_decompress_ptr cinfo, jpeg_component_info * compptr, 34 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr)); 35 36 /* Private subobject */ 37 38 typedef struct { 39 struct jpeg_upsampler pub; /* public fields */ 40 41 /* Color conversion buffer. When using separate upsampling and color 42 * conversion steps, this buffer holds one upsampled row group until it 43 * has been color converted and output. 44 * Note: we do not allocate any storage for component(s) which are full-size, 45 * ie do not need rescaling. The corresponding entry of color_buf[] is 46 * simply set to point to the input data array, thereby avoiding copying. 47 */ 48 JSAMPARRAY color_buf[MAX_COMPONENTS]; 49 50 /* Per-component upsampling method pointers */ 51 upsample1_ptr methods[MAX_COMPONENTS]; 52 53 int next_row_out; /* counts rows emitted from color_buf */ 54 JDIMENSION rows_to_go; /* counts rows remaining in image */ 55 56 /* Height of an input row group for each component. */ 57 int rowgroup_height[MAX_COMPONENTS]; 58 59 /* These arrays save pixel expansion factors so that int_expand need not 60 * recompute them each time. They are unused for other upsampling methods. 61 */ 62 UINT8 h_expand[MAX_COMPONENTS]; 63 UINT8 v_expand[MAX_COMPONENTS]; 64 } my_upsampler; 65 66 typedef my_upsampler * my_upsample_ptr; 67 68 69 /* 70 * Initialize for an upsampling pass. 71 */ 72 73 METHODDEF(void) 74 start_pass_upsample (j_decompress_ptr cinfo) 75 { 76 my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample; 77 78 /* Mark the conversion buffer empty */ 79 upsample->next_row_out = cinfo->max_v_samp_factor; 80 /* Initialize total-height counter for detecting bottom of image */ 81 upsample->rows_to_go = cinfo->output_height; 82 } 83 84 85 /* 86 * Control routine to do upsampling (and color conversion). 87 * 88 * In this version we upsample each component independently. 89 * We upsample one row group into the conversion buffer, then apply 90 * color conversion a row at a time. 91 */ 92 93 METHODDEF(void) 94 sep_upsample (j_decompress_ptr cinfo, 95 JSAMPIMAGE input_buf, JDIMENSION *in_row_group_ctr, 96 JDIMENSION in_row_groups_avail, 97 JSAMPARRAY output_buf, JDIMENSION *out_row_ctr, 98 JDIMENSION out_rows_avail) 99 { 100 my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample; 101 int ci; 102 jpeg_component_info * compptr; 103 JDIMENSION num_rows; 104 105 /* Fill the conversion buffer, if it's empty */ 106 if (upsample->next_row_out >= cinfo->max_v_samp_factor) { 107 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components; 108 ci++, compptr++) { 109 /* Invoke per-component upsample method. Notice we pass a POINTER 110 * to color_buf[ci], so that fullsize_upsample can change it. 111 */ 112 (*upsample->methods[ci]) (cinfo, compptr, 113 input_buf[ci] + (*in_row_group_ctr * upsample->rowgroup_height[ci]), 114 upsample->color_buf + ci); 115 } 116 upsample->next_row_out = 0; 117 } 118 119 /* Color-convert and emit rows */ 120 121 /* How many we have in the buffer: */ 122 num_rows = (JDIMENSION) (cinfo->max_v_samp_factor - upsample->next_row_out); 123 /* Not more than the distance to the end of the image. Need this test 124 * in case the image height is not a multiple of max_v_samp_factor: 125 */ 126 if (num_rows > upsample->rows_to_go) 127 num_rows = upsample->rows_to_go; 128 /* And not more than what the client can accept: */ 129 out_rows_avail -= *out_row_ctr; 130 if (num_rows > out_rows_avail) 131 num_rows = out_rows_avail; 132 133 (*cinfo->cconvert->color_convert) (cinfo, upsample->color_buf, 134 (JDIMENSION) upsample->next_row_out, 135 output_buf + *out_row_ctr, 136 (int) num_rows); 137 138 /* Adjust counts */ 139 *out_row_ctr += num_rows; 140 upsample->rows_to_go -= num_rows; 141 upsample->next_row_out += num_rows; 142 /* When the buffer is emptied, declare this input row group consumed */ 143 if (upsample->next_row_out >= cinfo->max_v_samp_factor) 144 (*in_row_group_ctr)++; 145 } 146 147 148 /* 149 * These are the routines invoked by sep_upsample to upsample pixel values 150 * of a single component. One row group is processed per call. 151 */ 152 153 154 /* 155 * For full-size components, we just make color_buf[ci] point at the 156 * input buffer, and thus avoid copying any data. Note that this is 157 * safe only because sep_upsample doesn't declare the input row group 158 * "consumed" until we are done color converting and emitting it. 159 */ 160 161 METHODDEF(void) 162 fullsize_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 163 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 164 { 165 *output_data_ptr = input_data; 166 } 167 168 169 /* 170 * This is a no-op version used for "uninteresting" components. 171 * These components will not be referenced by color conversion. 172 */ 173 174 METHODDEF(void) 175 noop_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 176 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 177 { 178 *output_data_ptr = NULL; /* safety check */ 179 } 180 181 182 /* 183 * This version handles any integral sampling ratios. 184 * This is not used for typical JPEG files, so it need not be fast. 185 * Nor, for that matter, is it particularly accurate: the algorithm is 186 * simple replication of the input pixel onto the corresponding output 187 * pixels. The hi-falutin sampling literature refers to this as a 188 * "box filter". A box filter tends to introduce visible artifacts, 189 * so if you are actually going to use 3:1 or 4:1 sampling ratios 190 * you would be well advised to improve this code. 191 */ 192 193 METHODDEF(void) 194 int_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 195 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 196 { 197 my_upsample_ptr upsample = (my_upsample_ptr) cinfo->upsample; 198 JSAMPARRAY output_data = *output_data_ptr; 199 register JSAMPROW inptr, outptr; 200 register JSAMPLE invalue; 201 register int h; 202 JSAMPROW outend; 203 int h_expand, v_expand; 204 int inrow, outrow; 205 206 h_expand = upsample->h_expand[compptr->component_index]; 207 v_expand = upsample->v_expand[compptr->component_index]; 208 209 inrow = outrow = 0; 210 while (outrow < cinfo->max_v_samp_factor) { 211 /* Generate one output row with proper horizontal expansion */ 212 inptr = input_data[inrow]; 213 outptr = output_data[outrow]; 214 outend = outptr + cinfo->output_width; 215 while (outptr < outend) { 216 invalue = *inptr++; /* don't need GETJSAMPLE() here */ 217 for (h = h_expand; h > 0; h--) { 218 *outptr++ = invalue; 219 } 220 } 221 /* Generate any additional output rows by duplicating the first one */ 222 if (v_expand > 1) { 223 jcopy_sample_rows(output_data, outrow, output_data, outrow+1, 224 v_expand-1, cinfo->output_width); 225 } 226 inrow++; 227 outrow += v_expand; 228 } 229 } 230 231 232 /* 233 * Fast processing for the common case of 2:1 horizontal and 1:1 vertical. 234 * It's still a box filter. 235 */ 236 237 METHODDEF(void) 238 h2v1_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 239 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 240 { 241 JSAMPARRAY output_data = *output_data_ptr; 242 register JSAMPROW inptr, outptr; 243 register JSAMPLE invalue; 244 JSAMPROW outend; 245 int inrow; 246 247 for (inrow = 0; inrow < cinfo->max_v_samp_factor; inrow++) { 248 inptr = input_data[inrow]; 249 outptr = output_data[inrow]; 250 outend = outptr + cinfo->output_width; 251 while (outptr < outend) { 252 invalue = *inptr++; /* don't need GETJSAMPLE() here */ 253 *outptr++ = invalue; 254 *outptr++ = invalue; 255 } 256 } 257 } 258 259 260 /* 261 * Fast processing for the common case of 2:1 horizontal and 2:1 vertical. 262 * It's still a box filter. 263 */ 264 265 METHODDEF(void) 266 h2v2_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 267 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 268 { 269 JSAMPARRAY output_data = *output_data_ptr; 270 register JSAMPROW inptr, outptr; 271 register JSAMPLE invalue; 272 JSAMPROW outend; 273 int inrow, outrow; 274 275 inrow = outrow = 0; 276 while (outrow < cinfo->max_v_samp_factor) { 277 inptr = input_data[inrow]; 278 outptr = output_data[outrow]; 279 outend = outptr + cinfo->output_width; 280 while (outptr < outend) { 281 invalue = *inptr++; /* don't need GETJSAMPLE() here */ 282 *outptr++ = invalue; 283 *outptr++ = invalue; 284 } 285 jcopy_sample_rows(output_data, outrow, output_data, outrow+1, 286 1, cinfo->output_width); 287 inrow++; 288 outrow += 2; 289 } 290 } 291 292 293 /* 294 * Fancy processing for the common case of 2:1 horizontal and 1:1 vertical. 295 * 296 * The upsampling algorithm is linear interpolation between pixel centers, 297 * also known as a "triangle filter". This is a good compromise between 298 * speed and visual quality. The centers of the output pixels are 1/4 and 3/4 299 * of the way between input pixel centers. 300 * 301 * A note about the "bias" calculations: when rounding fractional values to 302 * integer, we do not want to always round 0.5 up to the next integer. 303 * If we did that, we'd introduce a noticeable bias towards larger values. 304 * Instead, this code is arranged so that 0.5 will be rounded up or down at 305 * alternate pixel locations (a simple ordered dither pattern). 306 */ 307 308 METHODDEF(void) 309 h2v1_fancy_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 310 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 311 { 312 JSAMPARRAY output_data = *output_data_ptr; 313 register JSAMPROW inptr, outptr; 314 register int invalue; 315 register JDIMENSION colctr; 316 int inrow; 317 318 for (inrow = 0; inrow < cinfo->max_v_samp_factor; inrow++) { 319 inptr = input_data[inrow]; 320 outptr = output_data[inrow]; 321 /* Special case for first column */ 322 invalue = GETJSAMPLE(*inptr++); 323 *outptr++ = (JSAMPLE) invalue; 324 *outptr++ = (JSAMPLE) ((invalue * 3 + GETJSAMPLE(*inptr) + 2) >> 2); 325 326 for (colctr = compptr->downsampled_width - 2; colctr > 0; colctr--) { 327 /* General case: 3/4 * nearer pixel + 1/4 * further pixel */ 328 invalue = GETJSAMPLE(*inptr++) * 3; 329 *outptr++ = (JSAMPLE) ((invalue + GETJSAMPLE(inptr[-2]) + 1) >> 2); 330 *outptr++ = (JSAMPLE) ((invalue + GETJSAMPLE(*inptr) + 2) >> 2); 331 } 332 333 /* Special case for last column */ 334 invalue = GETJSAMPLE(*inptr); 335 *outptr++ = (JSAMPLE) ((invalue * 3 + GETJSAMPLE(inptr[-1]) + 1) >> 2); 336 *outptr++ = (JSAMPLE) invalue; 337 } 338 } 339 340 341 /* 342 * Fancy processing for the common case of 2:1 horizontal and 2:1 vertical. 343 * Again a triangle filter; see comments for h2v1 case, above. 344 * 345 * It is OK for us to reference the adjacent input rows because we demanded 346 * context from the main buffer controller (see initialization code). 347 */ 348 349 METHODDEF(void) 350 h2v2_fancy_upsample (j_decompress_ptr cinfo, jpeg_component_info * compptr, 351 JSAMPARRAY input_data, JSAMPARRAY * output_data_ptr) 352 { 353 JSAMPARRAY output_data = *output_data_ptr; 354 register JSAMPROW inptr0, inptr1, outptr; 355 #if BITS_IN_JSAMPLE == 8 356 register int thiscolsum, lastcolsum, nextcolsum; 357 #else 358 register INT32 thiscolsum, lastcolsum, nextcolsum; 359 #endif 360 register JDIMENSION colctr; 361 int inrow, outrow, v; 362 363 inrow = outrow = 0; 364 while (outrow < cinfo->max_v_samp_factor) { 365 for (v = 0; v < 2; v++) { 366 /* inptr0 points to nearest input row, inptr1 points to next nearest */ 367 inptr0 = input_data[inrow]; 368 if (v == 0) /* next nearest is row above */ 369 inptr1 = input_data[inrow-1]; 370 else /* next nearest is row below */ 371 inptr1 = input_data[inrow+1]; 372 outptr = output_data[outrow++]; 373 374 /* Special case for first column */ 375 thiscolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++); 376 nextcolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++); 377 *outptr++ = (JSAMPLE) ((thiscolsum * 4 + 8) >> 4); 378 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + nextcolsum + 7) >> 4); 379 lastcolsum = thiscolsum; thiscolsum = nextcolsum; 380 381 for (colctr = compptr->downsampled_width - 2; colctr > 0; colctr--) { 382 /* General case: 3/4 * nearer pixel + 1/4 * further pixel in each */ 383 /* dimension, thus 9/16, 3/16, 3/16, 1/16 overall */ 384 nextcolsum = GETJSAMPLE(*inptr0++) * 3 + GETJSAMPLE(*inptr1++); 385 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + lastcolsum + 8) >> 4); 386 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + nextcolsum + 7) >> 4); 387 lastcolsum = thiscolsum; thiscolsum = nextcolsum; 388 } 389 390 /* Special case for last column */ 391 *outptr++ = (JSAMPLE) ((thiscolsum * 3 + lastcolsum + 8) >> 4); 392 *outptr++ = (JSAMPLE) ((thiscolsum * 4 + 7) >> 4); 393 } 394 inrow++; 395 } 396 } 397 398 399 /* 400 * Module initialization routine for upsampling. 401 */ 402 403 GLOBAL(void) 404 jinit_upsampler (j_decompress_ptr cinfo) 405 { 406 my_upsample_ptr upsample; 407 int ci; 408 jpeg_component_info * compptr; 409 boolean need_buffer, do_fancy; 410 int h_in_group, v_in_group, h_out_group, v_out_group; 411 412 upsample = (my_upsample_ptr) 413 (*cinfo->mem->alloc_small) ((j_common_ptr) cinfo, JPOOL_IMAGE, 414 SIZEOF(my_upsampler)); 415 cinfo->upsample = (struct jpeg_upsampler *) upsample; 416 upsample->pub.start_pass = start_pass_upsample; 417 upsample->pub.upsample = sep_upsample; 418 upsample->pub.need_context_rows = FALSE; /* until we find out differently */ 419 420 if (cinfo->CCIR601_sampling) /* this isn't supported */ 421 ERREXIT(cinfo, JERR_CCIR601_NOTIMPL); 422 423 /* jdmainct.c doesn't support context rows when min_DCT_scaled_size = 1, 424 * so don't ask for it. 425 */ 426 do_fancy = cinfo->do_fancy_upsampling && cinfo->_min_DCT_scaled_size > 1; 427 428 /* Verify we can handle the sampling factors, select per-component methods, 429 * and create storage as needed. 430 */ 431 for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components; 432 ci++, compptr++) { 433 /* Compute size of an "input group" after IDCT scaling. This many samples 434 * are to be converted to max_h_samp_factor * max_v_samp_factor pixels. 435 */ 436 h_in_group = (compptr->h_samp_factor * compptr->_DCT_scaled_size) / 437 cinfo->_min_DCT_scaled_size; 438 v_in_group = (compptr->v_samp_factor * compptr->_DCT_scaled_size) / 439 cinfo->_min_DCT_scaled_size; 440 h_out_group = cinfo->max_h_samp_factor; 441 v_out_group = cinfo->max_v_samp_factor; 442 upsample->rowgroup_height[ci] = v_in_group; /* save for use later */ 443 need_buffer = TRUE; 444 if (! compptr->component_needed) { 445 /* Don't bother to upsample an uninteresting component. */ 446 upsample->methods[ci] = noop_upsample; 447 need_buffer = FALSE; 448 } else if (h_in_group == h_out_group && v_in_group == v_out_group) { 449 /* Fullsize components can be processed without any work. */ 450 upsample->methods[ci] = fullsize_upsample; 451 need_buffer = FALSE; 452 } else if (h_in_group * 2 == h_out_group && 453 v_in_group == v_out_group) { 454 /* Special cases for 2h1v upsampling */ 455 if (do_fancy && compptr->downsampled_width > 2) { 456 if (jsimd_can_h2v1_fancy_upsample()) 457 upsample->methods[ci] = jsimd_h2v1_fancy_upsample; 458 else 459 upsample->methods[ci] = h2v1_fancy_upsample; 460 } else { 461 if (jsimd_can_h2v1_upsample()) 462 upsample->methods[ci] = jsimd_h2v1_upsample; 463 else 464 upsample->methods[ci] = h2v1_upsample; 465 } 466 } else if (h_in_group * 2 == h_out_group && 467 v_in_group * 2 == v_out_group) { 468 /* Special cases for 2h2v upsampling */ 469 if (do_fancy && compptr->downsampled_width > 2) { 470 if (jsimd_can_h2v2_fancy_upsample()) 471 upsample->methods[ci] = jsimd_h2v2_fancy_upsample; 472 else 473 upsample->methods[ci] = h2v2_fancy_upsample; 474 upsample->pub.need_context_rows = TRUE; 475 } else { 476 if (jsimd_can_h2v2_upsample()) 477 upsample->methods[ci] = jsimd_h2v2_upsample; 478 else 479 upsample->methods[ci] = h2v2_upsample; 480 } 481 } else if ((h_out_group % h_in_group) == 0 && 482 (v_out_group % v_in_group) == 0) { 483 /* Generic integral-factors upsampling method */ 484 upsample->methods[ci] = int_upsample; 485 upsample->h_expand[ci] = (UINT8) (h_out_group / h_in_group); 486 upsample->v_expand[ci] = (UINT8) (v_out_group / v_in_group); 487 } else 488 ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL); 489 if (need_buffer) { 490 upsample->color_buf[ci] = (*cinfo->mem->alloc_sarray) 491 ((j_common_ptr) cinfo, JPOOL_IMAGE, 492 (JDIMENSION) jround_up((long) cinfo->output_width, 493 (long) cinfo->max_h_samp_factor), 494 (JDIMENSION) cinfo->max_v_samp_factor); 495 } 496 } 497 } 498