1 // Copyright 2012 Google Inc. All Rights Reserved. 2 // 3 // Use of this source code is governed by a BSD-style license 4 // that can be found in the COPYING file in the root of the source 5 // tree. An additional intellectual property rights grant can be found 6 // in the file PATENTS. All contributing project authors may 7 // be found in the AUTHORS file in the root of the source tree. 8 // ----------------------------------------------------------------------------- 9 // 10 // main entry for the decoder 11 // 12 // Authors: Vikas Arora (vikaas.arora (at) gmail.com) 13 // Jyrki Alakuijala (jyrki (at) google.com) 14 15 #include <stdlib.h> 16 17 #include "./alphai_dec.h" 18 #include "./vp8li_dec.h" 19 #include "../dsp/dsp.h" 20 #include "../dsp/lossless.h" 21 #include "../dsp/lossless_common.h" 22 #include "../dsp/yuv.h" 23 #include "../utils/endian_inl_utils.h" 24 #include "../utils/huffman_utils.h" 25 #include "../utils/utils.h" 26 27 #define NUM_ARGB_CACHE_ROWS 16 28 29 static const int kCodeLengthLiterals = 16; 30 static const int kCodeLengthRepeatCode = 16; 31 static const int kCodeLengthExtraBits[3] = { 2, 3, 7 }; 32 static const int kCodeLengthRepeatOffsets[3] = { 3, 3, 11 }; 33 34 // ----------------------------------------------------------------------------- 35 // Five Huffman codes are used at each meta code: 36 // 1. green + length prefix codes + color cache codes, 37 // 2. alpha, 38 // 3. red, 39 // 4. blue, and, 40 // 5. distance prefix codes. 41 typedef enum { 42 GREEN = 0, 43 RED = 1, 44 BLUE = 2, 45 ALPHA = 3, 46 DIST = 4 47 } HuffIndex; 48 49 static const uint16_t kAlphabetSize[HUFFMAN_CODES_PER_META_CODE] = { 50 NUM_LITERAL_CODES + NUM_LENGTH_CODES, 51 NUM_LITERAL_CODES, NUM_LITERAL_CODES, NUM_LITERAL_CODES, 52 NUM_DISTANCE_CODES 53 }; 54 55 static const uint8_t kLiteralMap[HUFFMAN_CODES_PER_META_CODE] = { 56 0, 1, 1, 1, 0 57 }; 58 59 #define NUM_CODE_LENGTH_CODES 19 60 static const uint8_t kCodeLengthCodeOrder[NUM_CODE_LENGTH_CODES] = { 61 17, 18, 0, 1, 2, 3, 4, 5, 16, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15 62 }; 63 64 #define CODE_TO_PLANE_CODES 120 65 static const uint8_t kCodeToPlane[CODE_TO_PLANE_CODES] = { 66 0x18, 0x07, 0x17, 0x19, 0x28, 0x06, 0x27, 0x29, 0x16, 0x1a, 67 0x26, 0x2a, 0x38, 0x05, 0x37, 0x39, 0x15, 0x1b, 0x36, 0x3a, 68 0x25, 0x2b, 0x48, 0x04, 0x47, 0x49, 0x14, 0x1c, 0x35, 0x3b, 69 0x46, 0x4a, 0x24, 0x2c, 0x58, 0x45, 0x4b, 0x34, 0x3c, 0x03, 70 0x57, 0x59, 0x13, 0x1d, 0x56, 0x5a, 0x23, 0x2d, 0x44, 0x4c, 71 0x55, 0x5b, 0x33, 0x3d, 0x68, 0x02, 0x67, 0x69, 0x12, 0x1e, 72 0x66, 0x6a, 0x22, 0x2e, 0x54, 0x5c, 0x43, 0x4d, 0x65, 0x6b, 73 0x32, 0x3e, 0x78, 0x01, 0x77, 0x79, 0x53, 0x5d, 0x11, 0x1f, 74 0x64, 0x6c, 0x42, 0x4e, 0x76, 0x7a, 0x21, 0x2f, 0x75, 0x7b, 75 0x31, 0x3f, 0x63, 0x6d, 0x52, 0x5e, 0x00, 0x74, 0x7c, 0x41, 76 0x4f, 0x10, 0x20, 0x62, 0x6e, 0x30, 0x73, 0x7d, 0x51, 0x5f, 77 0x40, 0x72, 0x7e, 0x61, 0x6f, 0x50, 0x71, 0x7f, 0x60, 0x70 78 }; 79 80 // Memory needed for lookup tables of one Huffman tree group. Red, blue, alpha 81 // and distance alphabets are constant (256 for red, blue and alpha, 40 for 82 // distance) and lookup table sizes for them in worst case are 630 and 410 83 // respectively. Size of green alphabet depends on color cache size and is equal 84 // to 256 (green component values) + 24 (length prefix values) 85 // + color_cache_size (between 0 and 2048). 86 // All values computed for 8-bit first level lookup with Mark Adler's tool: 87 // http://www.hdfgroup.org/ftp/lib-external/zlib/zlib-1.2.5/examples/enough.c 88 #define FIXED_TABLE_SIZE (630 * 3 + 410) 89 static const int kTableSize[12] = { 90 FIXED_TABLE_SIZE + 654, 91 FIXED_TABLE_SIZE + 656, 92 FIXED_TABLE_SIZE + 658, 93 FIXED_TABLE_SIZE + 662, 94 FIXED_TABLE_SIZE + 670, 95 FIXED_TABLE_SIZE + 686, 96 FIXED_TABLE_SIZE + 718, 97 FIXED_TABLE_SIZE + 782, 98 FIXED_TABLE_SIZE + 912, 99 FIXED_TABLE_SIZE + 1168, 100 FIXED_TABLE_SIZE + 1680, 101 FIXED_TABLE_SIZE + 2704 102 }; 103 104 static int DecodeImageStream(int xsize, int ysize, 105 int is_level0, 106 VP8LDecoder* const dec, 107 uint32_t** const decoded_data); 108 109 //------------------------------------------------------------------------------ 110 111 int VP8LCheckSignature(const uint8_t* const data, size_t size) { 112 return (size >= VP8L_FRAME_HEADER_SIZE && 113 data[0] == VP8L_MAGIC_BYTE && 114 (data[4] >> 5) == 0); // version 115 } 116 117 static int ReadImageInfo(VP8LBitReader* const br, 118 int* const width, int* const height, 119 int* const has_alpha) { 120 if (VP8LReadBits(br, 8) != VP8L_MAGIC_BYTE) return 0; 121 *width = VP8LReadBits(br, VP8L_IMAGE_SIZE_BITS) + 1; 122 *height = VP8LReadBits(br, VP8L_IMAGE_SIZE_BITS) + 1; 123 *has_alpha = VP8LReadBits(br, 1); 124 if (VP8LReadBits(br, VP8L_VERSION_BITS) != 0) return 0; 125 return !br->eos_; 126 } 127 128 int VP8LGetInfo(const uint8_t* data, size_t data_size, 129 int* const width, int* const height, int* const has_alpha) { 130 if (data == NULL || data_size < VP8L_FRAME_HEADER_SIZE) { 131 return 0; // not enough data 132 } else if (!VP8LCheckSignature(data, data_size)) { 133 return 0; // bad signature 134 } else { 135 int w, h, a; 136 VP8LBitReader br; 137 VP8LInitBitReader(&br, data, data_size); 138 if (!ReadImageInfo(&br, &w, &h, &a)) { 139 return 0; 140 } 141 if (width != NULL) *width = w; 142 if (height != NULL) *height = h; 143 if (has_alpha != NULL) *has_alpha = a; 144 return 1; 145 } 146 } 147 148 //------------------------------------------------------------------------------ 149 150 static WEBP_INLINE int GetCopyDistance(int distance_symbol, 151 VP8LBitReader* const br) { 152 int extra_bits, offset; 153 if (distance_symbol < 4) { 154 return distance_symbol + 1; 155 } 156 extra_bits = (distance_symbol - 2) >> 1; 157 offset = (2 + (distance_symbol & 1)) << extra_bits; 158 return offset + VP8LReadBits(br, extra_bits) + 1; 159 } 160 161 static WEBP_INLINE int GetCopyLength(int length_symbol, 162 VP8LBitReader* const br) { 163 // Length and distance prefixes are encoded the same way. 164 return GetCopyDistance(length_symbol, br); 165 } 166 167 static WEBP_INLINE int PlaneCodeToDistance(int xsize, int plane_code) { 168 if (plane_code > CODE_TO_PLANE_CODES) { 169 return plane_code - CODE_TO_PLANE_CODES; 170 } else { 171 const int dist_code = kCodeToPlane[plane_code - 1]; 172 const int yoffset = dist_code >> 4; 173 const int xoffset = 8 - (dist_code & 0xf); 174 const int dist = yoffset * xsize + xoffset; 175 return (dist >= 1) ? dist : 1; // dist<1 can happen if xsize is very small 176 } 177 } 178 179 //------------------------------------------------------------------------------ 180 // Decodes the next Huffman code from bit-stream. 181 // FillBitWindow(br) needs to be called at minimum every second call 182 // to ReadSymbol, in order to pre-fetch enough bits. 183 static WEBP_INLINE int ReadSymbol(const HuffmanCode* table, 184 VP8LBitReader* const br) { 185 int nbits; 186 uint32_t val = VP8LPrefetchBits(br); 187 table += val & HUFFMAN_TABLE_MASK; 188 nbits = table->bits - HUFFMAN_TABLE_BITS; 189 if (nbits > 0) { 190 VP8LSetBitPos(br, br->bit_pos_ + HUFFMAN_TABLE_BITS); 191 val = VP8LPrefetchBits(br); 192 table += table->value; 193 table += val & ((1 << nbits) - 1); 194 } 195 VP8LSetBitPos(br, br->bit_pos_ + table->bits); 196 return table->value; 197 } 198 199 // Reads packed symbol depending on GREEN channel 200 #define BITS_SPECIAL_MARKER 0x100 // something large enough (and a bit-mask) 201 #define PACKED_NON_LITERAL_CODE 0 // must be < NUM_LITERAL_CODES 202 static WEBP_INLINE int ReadPackedSymbols(const HTreeGroup* group, 203 VP8LBitReader* const br, 204 uint32_t* const dst) { 205 const uint32_t val = VP8LPrefetchBits(br) & (HUFFMAN_PACKED_TABLE_SIZE - 1); 206 const HuffmanCode32 code = group->packed_table[val]; 207 assert(group->use_packed_table); 208 if (code.bits < BITS_SPECIAL_MARKER) { 209 VP8LSetBitPos(br, br->bit_pos_ + code.bits); 210 *dst = code.value; 211 return PACKED_NON_LITERAL_CODE; 212 } else { 213 VP8LSetBitPos(br, br->bit_pos_ + code.bits - BITS_SPECIAL_MARKER); 214 assert(code.value >= NUM_LITERAL_CODES); 215 return code.value; 216 } 217 } 218 219 static int AccumulateHCode(HuffmanCode hcode, int shift, 220 HuffmanCode32* const huff) { 221 huff->bits += hcode.bits; 222 huff->value |= (uint32_t)hcode.value << shift; 223 assert(huff->bits <= HUFFMAN_TABLE_BITS); 224 return hcode.bits; 225 } 226 227 static void BuildPackedTable(HTreeGroup* const htree_group) { 228 uint32_t code; 229 for (code = 0; code < HUFFMAN_PACKED_TABLE_SIZE; ++code) { 230 uint32_t bits = code; 231 HuffmanCode32* const huff = &htree_group->packed_table[bits]; 232 HuffmanCode hcode = htree_group->htrees[GREEN][bits]; 233 if (hcode.value >= NUM_LITERAL_CODES) { 234 huff->bits = hcode.bits + BITS_SPECIAL_MARKER; 235 huff->value = hcode.value; 236 } else { 237 huff->bits = 0; 238 huff->value = 0; 239 bits >>= AccumulateHCode(hcode, 8, huff); 240 bits >>= AccumulateHCode(htree_group->htrees[RED][bits], 16, huff); 241 bits >>= AccumulateHCode(htree_group->htrees[BLUE][bits], 0, huff); 242 bits >>= AccumulateHCode(htree_group->htrees[ALPHA][bits], 24, huff); 243 (void)bits; 244 } 245 } 246 } 247 248 static int ReadHuffmanCodeLengths( 249 VP8LDecoder* const dec, const int* const code_length_code_lengths, 250 int num_symbols, int* const code_lengths) { 251 int ok = 0; 252 VP8LBitReader* const br = &dec->br_; 253 int symbol; 254 int max_symbol; 255 int prev_code_len = DEFAULT_CODE_LENGTH; 256 HuffmanCode table[1 << LENGTHS_TABLE_BITS]; 257 258 if (!VP8LBuildHuffmanTable(table, LENGTHS_TABLE_BITS, 259 code_length_code_lengths, 260 NUM_CODE_LENGTH_CODES)) { 261 goto End; 262 } 263 264 if (VP8LReadBits(br, 1)) { // use length 265 const int length_nbits = 2 + 2 * VP8LReadBits(br, 3); 266 max_symbol = 2 + VP8LReadBits(br, length_nbits); 267 if (max_symbol > num_symbols) { 268 goto End; 269 } 270 } else { 271 max_symbol = num_symbols; 272 } 273 274 symbol = 0; 275 while (symbol < num_symbols) { 276 const HuffmanCode* p; 277 int code_len; 278 if (max_symbol-- == 0) break; 279 VP8LFillBitWindow(br); 280 p = &table[VP8LPrefetchBits(br) & LENGTHS_TABLE_MASK]; 281 VP8LSetBitPos(br, br->bit_pos_ + p->bits); 282 code_len = p->value; 283 if (code_len < kCodeLengthLiterals) { 284 code_lengths[symbol++] = code_len; 285 if (code_len != 0) prev_code_len = code_len; 286 } else { 287 const int use_prev = (code_len == kCodeLengthRepeatCode); 288 const int slot = code_len - kCodeLengthLiterals; 289 const int extra_bits = kCodeLengthExtraBits[slot]; 290 const int repeat_offset = kCodeLengthRepeatOffsets[slot]; 291 int repeat = VP8LReadBits(br, extra_bits) + repeat_offset; 292 if (symbol + repeat > num_symbols) { 293 goto End; 294 } else { 295 const int length = use_prev ? prev_code_len : 0; 296 while (repeat-- > 0) code_lengths[symbol++] = length; 297 } 298 } 299 } 300 ok = 1; 301 302 End: 303 if (!ok) dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 304 return ok; 305 } 306 307 // 'code_lengths' is pre-allocated temporary buffer, used for creating Huffman 308 // tree. 309 static int ReadHuffmanCode(int alphabet_size, VP8LDecoder* const dec, 310 int* const code_lengths, HuffmanCode* const table) { 311 int ok = 0; 312 int size = 0; 313 VP8LBitReader* const br = &dec->br_; 314 const int simple_code = VP8LReadBits(br, 1); 315 316 memset(code_lengths, 0, alphabet_size * sizeof(*code_lengths)); 317 318 if (simple_code) { // Read symbols, codes & code lengths directly. 319 const int num_symbols = VP8LReadBits(br, 1) + 1; 320 const int first_symbol_len_code = VP8LReadBits(br, 1); 321 // The first code is either 1 bit or 8 bit code. 322 int symbol = VP8LReadBits(br, (first_symbol_len_code == 0) ? 1 : 8); 323 code_lengths[symbol] = 1; 324 // The second code (if present), is always 8 bit long. 325 if (num_symbols == 2) { 326 symbol = VP8LReadBits(br, 8); 327 code_lengths[symbol] = 1; 328 } 329 ok = 1; 330 } else { // Decode Huffman-coded code lengths. 331 int i; 332 int code_length_code_lengths[NUM_CODE_LENGTH_CODES] = { 0 }; 333 const int num_codes = VP8LReadBits(br, 4) + 4; 334 if (num_codes > NUM_CODE_LENGTH_CODES) { 335 dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 336 return 0; 337 } 338 339 for (i = 0; i < num_codes; ++i) { 340 code_length_code_lengths[kCodeLengthCodeOrder[i]] = VP8LReadBits(br, 3); 341 } 342 ok = ReadHuffmanCodeLengths(dec, code_length_code_lengths, alphabet_size, 343 code_lengths); 344 } 345 346 ok = ok && !br->eos_; 347 if (ok) { 348 size = VP8LBuildHuffmanTable(table, HUFFMAN_TABLE_BITS, 349 code_lengths, alphabet_size); 350 } 351 if (!ok || size == 0) { 352 dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 353 return 0; 354 } 355 return size; 356 } 357 358 static int ReadHuffmanCodes(VP8LDecoder* const dec, int xsize, int ysize, 359 int color_cache_bits, int allow_recursion) { 360 int i, j; 361 VP8LBitReader* const br = &dec->br_; 362 VP8LMetadata* const hdr = &dec->hdr_; 363 uint32_t* huffman_image = NULL; 364 HTreeGroup* htree_groups = NULL; 365 HuffmanCode* huffman_tables = NULL; 366 HuffmanCode* next = NULL; 367 int num_htree_groups = 1; 368 int max_alphabet_size = 0; 369 int* code_lengths = NULL; 370 const int table_size = kTableSize[color_cache_bits]; 371 372 if (allow_recursion && VP8LReadBits(br, 1)) { 373 // use meta Huffman codes. 374 const int huffman_precision = VP8LReadBits(br, 3) + 2; 375 const int huffman_xsize = VP8LSubSampleSize(xsize, huffman_precision); 376 const int huffman_ysize = VP8LSubSampleSize(ysize, huffman_precision); 377 const int huffman_pixs = huffman_xsize * huffman_ysize; 378 if (!DecodeImageStream(huffman_xsize, huffman_ysize, 0, dec, 379 &huffman_image)) { 380 goto Error; 381 } 382 hdr->huffman_subsample_bits_ = huffman_precision; 383 for (i = 0; i < huffman_pixs; ++i) { 384 // The huffman data is stored in red and green bytes. 385 const int group = (huffman_image[i] >> 8) & 0xffff; 386 huffman_image[i] = group; 387 if (group >= num_htree_groups) { 388 num_htree_groups = group + 1; 389 } 390 } 391 } 392 393 if (br->eos_) goto Error; 394 395 // Find maximum alphabet size for the htree group. 396 for (j = 0; j < HUFFMAN_CODES_PER_META_CODE; ++j) { 397 int alphabet_size = kAlphabetSize[j]; 398 if (j == 0 && color_cache_bits > 0) { 399 alphabet_size += 1 << color_cache_bits; 400 } 401 if (max_alphabet_size < alphabet_size) { 402 max_alphabet_size = alphabet_size; 403 } 404 } 405 406 huffman_tables = (HuffmanCode*)WebPSafeMalloc(num_htree_groups * table_size, 407 sizeof(*huffman_tables)); 408 htree_groups = VP8LHtreeGroupsNew(num_htree_groups); 409 code_lengths = (int*)WebPSafeCalloc((uint64_t)max_alphabet_size, 410 sizeof(*code_lengths)); 411 412 if (htree_groups == NULL || code_lengths == NULL || huffman_tables == NULL) { 413 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 414 goto Error; 415 } 416 417 next = huffman_tables; 418 for (i = 0; i < num_htree_groups; ++i) { 419 HTreeGroup* const htree_group = &htree_groups[i]; 420 HuffmanCode** const htrees = htree_group->htrees; 421 int size; 422 int total_size = 0; 423 int is_trivial_literal = 1; 424 int max_bits = 0; 425 for (j = 0; j < HUFFMAN_CODES_PER_META_CODE; ++j) { 426 int alphabet_size = kAlphabetSize[j]; 427 htrees[j] = next; 428 if (j == 0 && color_cache_bits > 0) { 429 alphabet_size += 1 << color_cache_bits; 430 } 431 size = ReadHuffmanCode(alphabet_size, dec, code_lengths, next); 432 if (size == 0) { 433 goto Error; 434 } 435 if (is_trivial_literal && kLiteralMap[j] == 1) { 436 is_trivial_literal = (next->bits == 0); 437 } 438 total_size += next->bits; 439 next += size; 440 if (j <= ALPHA) { 441 int local_max_bits = code_lengths[0]; 442 int k; 443 for (k = 1; k < alphabet_size; ++k) { 444 if (code_lengths[k] > local_max_bits) { 445 local_max_bits = code_lengths[k]; 446 } 447 } 448 max_bits += local_max_bits; 449 } 450 } 451 htree_group->is_trivial_literal = is_trivial_literal; 452 htree_group->is_trivial_code = 0; 453 if (is_trivial_literal) { 454 const int red = htrees[RED][0].value; 455 const int blue = htrees[BLUE][0].value; 456 const int alpha = htrees[ALPHA][0].value; 457 htree_group->literal_arb = 458 ((uint32_t)alpha << 24) | (red << 16) | blue; 459 if (total_size == 0 && htrees[GREEN][0].value < NUM_LITERAL_CODES) { 460 htree_group->is_trivial_code = 1; 461 htree_group->literal_arb |= htrees[GREEN][0].value << 8; 462 } 463 } 464 htree_group->use_packed_table = !htree_group->is_trivial_code && 465 (max_bits < HUFFMAN_PACKED_BITS); 466 if (htree_group->use_packed_table) BuildPackedTable(htree_group); 467 } 468 WebPSafeFree(code_lengths); 469 470 // All OK. Finalize pointers and return. 471 hdr->huffman_image_ = huffman_image; 472 hdr->num_htree_groups_ = num_htree_groups; 473 hdr->htree_groups_ = htree_groups; 474 hdr->huffman_tables_ = huffman_tables; 475 return 1; 476 477 Error: 478 WebPSafeFree(code_lengths); 479 WebPSafeFree(huffman_image); 480 WebPSafeFree(huffman_tables); 481 VP8LHtreeGroupsFree(htree_groups); 482 return 0; 483 } 484 485 //------------------------------------------------------------------------------ 486 // Scaling. 487 488 static int AllocateAndInitRescaler(VP8LDecoder* const dec, VP8Io* const io) { 489 const int num_channels = 4; 490 const int in_width = io->mb_w; 491 const int out_width = io->scaled_width; 492 const int in_height = io->mb_h; 493 const int out_height = io->scaled_height; 494 const uint64_t work_size = 2 * num_channels * (uint64_t)out_width; 495 rescaler_t* work; // Rescaler work area. 496 const uint64_t scaled_data_size = (uint64_t)out_width; 497 uint32_t* scaled_data; // Temporary storage for scaled BGRA data. 498 const uint64_t memory_size = sizeof(*dec->rescaler) + 499 work_size * sizeof(*work) + 500 scaled_data_size * sizeof(*scaled_data); 501 uint8_t* memory = (uint8_t*)WebPSafeMalloc(memory_size, sizeof(*memory)); 502 if (memory == NULL) { 503 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 504 return 0; 505 } 506 assert(dec->rescaler_memory == NULL); 507 dec->rescaler_memory = memory; 508 509 dec->rescaler = (WebPRescaler*)memory; 510 memory += sizeof(*dec->rescaler); 511 work = (rescaler_t*)memory; 512 memory += work_size * sizeof(*work); 513 scaled_data = (uint32_t*)memory; 514 515 WebPRescalerInit(dec->rescaler, in_width, in_height, (uint8_t*)scaled_data, 516 out_width, out_height, 0, num_channels, work); 517 return 1; 518 } 519 520 //------------------------------------------------------------------------------ 521 // Export to ARGB 522 523 // We have special "export" function since we need to convert from BGRA 524 static int Export(WebPRescaler* const rescaler, WEBP_CSP_MODE colorspace, 525 int rgba_stride, uint8_t* const rgba) { 526 uint32_t* const src = (uint32_t*)rescaler->dst; 527 const int dst_width = rescaler->dst_width; 528 int num_lines_out = 0; 529 while (WebPRescalerHasPendingOutput(rescaler)) { 530 uint8_t* const dst = rgba + num_lines_out * rgba_stride; 531 WebPRescalerExportRow(rescaler); 532 WebPMultARGBRow(src, dst_width, 1); 533 VP8LConvertFromBGRA(src, dst_width, colorspace, dst); 534 ++num_lines_out; 535 } 536 return num_lines_out; 537 } 538 539 // Emit scaled rows. 540 static int EmitRescaledRowsRGBA(const VP8LDecoder* const dec, 541 uint8_t* in, int in_stride, int mb_h, 542 uint8_t* const out, int out_stride) { 543 const WEBP_CSP_MODE colorspace = dec->output_->colorspace; 544 int num_lines_in = 0; 545 int num_lines_out = 0; 546 while (num_lines_in < mb_h) { 547 uint8_t* const row_in = in + num_lines_in * in_stride; 548 uint8_t* const row_out = out + num_lines_out * out_stride; 549 const int lines_left = mb_h - num_lines_in; 550 const int needed_lines = WebPRescaleNeededLines(dec->rescaler, lines_left); 551 int lines_imported; 552 assert(needed_lines > 0 && needed_lines <= lines_left); 553 WebPMultARGBRows(row_in, in_stride, 554 dec->rescaler->src_width, needed_lines, 0); 555 lines_imported = 556 WebPRescalerImport(dec->rescaler, lines_left, row_in, in_stride); 557 assert(lines_imported == needed_lines); 558 num_lines_in += lines_imported; 559 num_lines_out += Export(dec->rescaler, colorspace, out_stride, row_out); 560 } 561 return num_lines_out; 562 } 563 564 // Emit rows without any scaling. 565 static int EmitRows(WEBP_CSP_MODE colorspace, 566 const uint8_t* row_in, int in_stride, 567 int mb_w, int mb_h, 568 uint8_t* const out, int out_stride) { 569 int lines = mb_h; 570 uint8_t* row_out = out; 571 while (lines-- > 0) { 572 VP8LConvertFromBGRA((const uint32_t*)row_in, mb_w, colorspace, row_out); 573 row_in += in_stride; 574 row_out += out_stride; 575 } 576 return mb_h; // Num rows out == num rows in. 577 } 578 579 //------------------------------------------------------------------------------ 580 // Export to YUVA 581 582 static void ConvertToYUVA(const uint32_t* const src, int width, int y_pos, 583 const WebPDecBuffer* const output) { 584 const WebPYUVABuffer* const buf = &output->u.YUVA; 585 586 // first, the luma plane 587 WebPConvertARGBToY(src, buf->y + y_pos * buf->y_stride, width); 588 589 // then U/V planes 590 { 591 uint8_t* const u = buf->u + (y_pos >> 1) * buf->u_stride; 592 uint8_t* const v = buf->v + (y_pos >> 1) * buf->v_stride; 593 // even lines: store values 594 // odd lines: average with previous values 595 WebPConvertARGBToUV(src, u, v, width, !(y_pos & 1)); 596 } 597 // Lastly, store alpha if needed. 598 if (buf->a != NULL) { 599 uint8_t* const a = buf->a + y_pos * buf->a_stride; 600 #if defined(WORDS_BIGENDIAN) 601 WebPExtractAlpha((uint8_t*)src + 0, 0, width, 1, a, 0); 602 #else 603 WebPExtractAlpha((uint8_t*)src + 3, 0, width, 1, a, 0); 604 #endif 605 } 606 } 607 608 static int ExportYUVA(const VP8LDecoder* const dec, int y_pos) { 609 WebPRescaler* const rescaler = dec->rescaler; 610 uint32_t* const src = (uint32_t*)rescaler->dst; 611 const int dst_width = rescaler->dst_width; 612 int num_lines_out = 0; 613 while (WebPRescalerHasPendingOutput(rescaler)) { 614 WebPRescalerExportRow(rescaler); 615 WebPMultARGBRow(src, dst_width, 1); 616 ConvertToYUVA(src, dst_width, y_pos, dec->output_); 617 ++y_pos; 618 ++num_lines_out; 619 } 620 return num_lines_out; 621 } 622 623 static int EmitRescaledRowsYUVA(const VP8LDecoder* const dec, 624 uint8_t* in, int in_stride, int mb_h) { 625 int num_lines_in = 0; 626 int y_pos = dec->last_out_row_; 627 while (num_lines_in < mb_h) { 628 const int lines_left = mb_h - num_lines_in; 629 const int needed_lines = WebPRescaleNeededLines(dec->rescaler, lines_left); 630 int lines_imported; 631 WebPMultARGBRows(in, in_stride, dec->rescaler->src_width, needed_lines, 0); 632 lines_imported = 633 WebPRescalerImport(dec->rescaler, lines_left, in, in_stride); 634 assert(lines_imported == needed_lines); 635 num_lines_in += lines_imported; 636 in += needed_lines * in_stride; 637 y_pos += ExportYUVA(dec, y_pos); 638 } 639 return y_pos; 640 } 641 642 static int EmitRowsYUVA(const VP8LDecoder* const dec, 643 const uint8_t* in, int in_stride, 644 int mb_w, int num_rows) { 645 int y_pos = dec->last_out_row_; 646 while (num_rows-- > 0) { 647 ConvertToYUVA((const uint32_t*)in, mb_w, y_pos, dec->output_); 648 in += in_stride; 649 ++y_pos; 650 } 651 return y_pos; 652 } 653 654 //------------------------------------------------------------------------------ 655 // Cropping. 656 657 // Sets io->mb_y, io->mb_h & io->mb_w according to start row, end row and 658 // crop options. Also updates the input data pointer, so that it points to the 659 // start of the cropped window. Note that pixels are in ARGB format even if 660 // 'in_data' is uint8_t*. 661 // Returns true if the crop window is not empty. 662 static int SetCropWindow(VP8Io* const io, int y_start, int y_end, 663 uint8_t** const in_data, int pixel_stride) { 664 assert(y_start < y_end); 665 assert(io->crop_left < io->crop_right); 666 if (y_end > io->crop_bottom) { 667 y_end = io->crop_bottom; // make sure we don't overflow on last row. 668 } 669 if (y_start < io->crop_top) { 670 const int delta = io->crop_top - y_start; 671 y_start = io->crop_top; 672 *in_data += delta * pixel_stride; 673 } 674 if (y_start >= y_end) return 0; // Crop window is empty. 675 676 *in_data += io->crop_left * sizeof(uint32_t); 677 678 io->mb_y = y_start - io->crop_top; 679 io->mb_w = io->crop_right - io->crop_left; 680 io->mb_h = y_end - y_start; 681 return 1; // Non-empty crop window. 682 } 683 684 //------------------------------------------------------------------------------ 685 686 static WEBP_INLINE int GetMetaIndex( 687 const uint32_t* const image, int xsize, int bits, int x, int y) { 688 if (bits == 0) return 0; 689 return image[xsize * (y >> bits) + (x >> bits)]; 690 } 691 692 static WEBP_INLINE HTreeGroup* GetHtreeGroupForPos(VP8LMetadata* const hdr, 693 int x, int y) { 694 const int meta_index = GetMetaIndex(hdr->huffman_image_, hdr->huffman_xsize_, 695 hdr->huffman_subsample_bits_, x, y); 696 assert(meta_index < hdr->num_htree_groups_); 697 return hdr->htree_groups_ + meta_index; 698 } 699 700 //------------------------------------------------------------------------------ 701 // Main loop, with custom row-processing function 702 703 typedef void (*ProcessRowsFunc)(VP8LDecoder* const dec, int row); 704 705 static void ApplyInverseTransforms(VP8LDecoder* const dec, int num_rows, 706 const uint32_t* const rows) { 707 int n = dec->next_transform_; 708 const int cache_pixs = dec->width_ * num_rows; 709 const int start_row = dec->last_row_; 710 const int end_row = start_row + num_rows; 711 const uint32_t* rows_in = rows; 712 uint32_t* const rows_out = dec->argb_cache_; 713 714 // Inverse transforms. 715 while (n-- > 0) { 716 VP8LTransform* const transform = &dec->transforms_[n]; 717 VP8LInverseTransform(transform, start_row, end_row, rows_in, rows_out); 718 rows_in = rows_out; 719 } 720 if (rows_in != rows_out) { 721 // No transform called, hence just copy. 722 memcpy(rows_out, rows_in, cache_pixs * sizeof(*rows_out)); 723 } 724 } 725 726 // Processes (transforms, scales & color-converts) the rows decoded after the 727 // last call. 728 static void ProcessRows(VP8LDecoder* const dec, int row) { 729 const uint32_t* const rows = dec->pixels_ + dec->width_ * dec->last_row_; 730 const int num_rows = row - dec->last_row_; 731 732 assert(row <= dec->io_->crop_bottom); 733 // We can't process more than NUM_ARGB_CACHE_ROWS at a time (that's the size 734 // of argb_cache_), but we currently don't need more than that. 735 assert(num_rows <= NUM_ARGB_CACHE_ROWS); 736 if (num_rows > 0) { // Emit output. 737 VP8Io* const io = dec->io_; 738 uint8_t* rows_data = (uint8_t*)dec->argb_cache_; 739 const int in_stride = io->width * sizeof(uint32_t); // in unit of RGBA 740 741 ApplyInverseTransforms(dec, num_rows, rows); 742 if (!SetCropWindow(io, dec->last_row_, row, &rows_data, in_stride)) { 743 // Nothing to output (this time). 744 } else { 745 const WebPDecBuffer* const output = dec->output_; 746 if (WebPIsRGBMode(output->colorspace)) { // convert to RGBA 747 const WebPRGBABuffer* const buf = &output->u.RGBA; 748 uint8_t* const rgba = buf->rgba + dec->last_out_row_ * buf->stride; 749 const int num_rows_out = io->use_scaling ? 750 EmitRescaledRowsRGBA(dec, rows_data, in_stride, io->mb_h, 751 rgba, buf->stride) : 752 EmitRows(output->colorspace, rows_data, in_stride, 753 io->mb_w, io->mb_h, rgba, buf->stride); 754 // Update 'last_out_row_'. 755 dec->last_out_row_ += num_rows_out; 756 } else { // convert to YUVA 757 dec->last_out_row_ = io->use_scaling ? 758 EmitRescaledRowsYUVA(dec, rows_data, in_stride, io->mb_h) : 759 EmitRowsYUVA(dec, rows_data, in_stride, io->mb_w, io->mb_h); 760 } 761 assert(dec->last_out_row_ <= output->height); 762 } 763 } 764 765 // Update 'last_row_'. 766 dec->last_row_ = row; 767 assert(dec->last_row_ <= dec->height_); 768 } 769 770 // Row-processing for the special case when alpha data contains only one 771 // transform (color indexing), and trivial non-green literals. 772 static int Is8bOptimizable(const VP8LMetadata* const hdr) { 773 int i; 774 if (hdr->color_cache_size_ > 0) return 0; 775 // When the Huffman tree contains only one symbol, we can skip the 776 // call to ReadSymbol() for red/blue/alpha channels. 777 for (i = 0; i < hdr->num_htree_groups_; ++i) { 778 HuffmanCode** const htrees = hdr->htree_groups_[i].htrees; 779 if (htrees[RED][0].bits > 0) return 0; 780 if (htrees[BLUE][0].bits > 0) return 0; 781 if (htrees[ALPHA][0].bits > 0) return 0; 782 } 783 return 1; 784 } 785 786 static void AlphaApplyFilter(ALPHDecoder* const alph_dec, 787 int first_row, int last_row, 788 uint8_t* out, int stride) { 789 if (alph_dec->filter_ != WEBP_FILTER_NONE) { 790 int y; 791 const uint8_t* prev_line = alph_dec->prev_line_; 792 assert(WebPUnfilters[alph_dec->filter_] != NULL); 793 for (y = first_row; y < last_row; ++y) { 794 WebPUnfilters[alph_dec->filter_](prev_line, out, out, stride); 795 prev_line = out; 796 out += stride; 797 } 798 alph_dec->prev_line_ = prev_line; 799 } 800 } 801 802 static void ExtractPalettedAlphaRows(VP8LDecoder* const dec, int last_row) { 803 // For vertical and gradient filtering, we need to decode the part above the 804 // crop_top row, in order to have the correct spatial predictors. 805 ALPHDecoder* const alph_dec = (ALPHDecoder*)dec->io_->opaque; 806 const int top_row = 807 (alph_dec->filter_ == WEBP_FILTER_NONE || 808 alph_dec->filter_ == WEBP_FILTER_HORIZONTAL) ? dec->io_->crop_top 809 : dec->last_row_; 810 const int first_row = (dec->last_row_ < top_row) ? top_row : dec->last_row_; 811 assert(last_row <= dec->io_->crop_bottom); 812 if (last_row > first_row) { 813 // Special method for paletted alpha data. We only process the cropped area. 814 const int width = dec->io_->width; 815 uint8_t* out = alph_dec->output_ + width * first_row; 816 const uint8_t* const in = 817 (uint8_t*)dec->pixels_ + dec->width_ * first_row; 818 VP8LTransform* const transform = &dec->transforms_[0]; 819 assert(dec->next_transform_ == 1); 820 assert(transform->type_ == COLOR_INDEXING_TRANSFORM); 821 VP8LColorIndexInverseTransformAlpha(transform, first_row, last_row, 822 in, out); 823 AlphaApplyFilter(alph_dec, first_row, last_row, out, width); 824 } 825 dec->last_row_ = dec->last_out_row_ = last_row; 826 } 827 828 //------------------------------------------------------------------------------ 829 // Helper functions for fast pattern copy (8b and 32b) 830 831 // cyclic rotation of pattern word 832 static WEBP_INLINE uint32_t Rotate8b(uint32_t V) { 833 #if defined(WORDS_BIGENDIAN) 834 return ((V & 0xff000000u) >> 24) | (V << 8); 835 #else 836 return ((V & 0xffu) << 24) | (V >> 8); 837 #endif 838 } 839 840 // copy 1, 2 or 4-bytes pattern 841 static WEBP_INLINE void CopySmallPattern8b(const uint8_t* src, uint8_t* dst, 842 int length, uint32_t pattern) { 843 int i; 844 // align 'dst' to 4-bytes boundary. Adjust the pattern along the way. 845 while ((uintptr_t)dst & 3) { 846 *dst++ = *src++; 847 pattern = Rotate8b(pattern); 848 --length; 849 } 850 // Copy the pattern 4 bytes at a time. 851 for (i = 0; i < (length >> 2); ++i) { 852 ((uint32_t*)dst)[i] = pattern; 853 } 854 // Finish with left-overs. 'pattern' is still correctly positioned, 855 // so no Rotate8b() call is needed. 856 for (i <<= 2; i < length; ++i) { 857 dst[i] = src[i]; 858 } 859 } 860 861 static WEBP_INLINE void CopyBlock8b(uint8_t* const dst, int dist, int length) { 862 const uint8_t* src = dst - dist; 863 if (length >= 8) { 864 uint32_t pattern = 0; 865 switch (dist) { 866 case 1: 867 pattern = src[0]; 868 #if defined(__arm__) || defined(_M_ARM) // arm doesn't like multiply that much 869 pattern |= pattern << 8; 870 pattern |= pattern << 16; 871 #elif defined(WEBP_USE_MIPS_DSP_R2) 872 __asm__ volatile ("replv.qb %0, %0" : "+r"(pattern)); 873 #else 874 pattern = 0x01010101u * pattern; 875 #endif 876 break; 877 case 2: 878 memcpy(&pattern, src, sizeof(uint16_t)); 879 #if defined(__arm__) || defined(_M_ARM) 880 pattern |= pattern << 16; 881 #elif defined(WEBP_USE_MIPS_DSP_R2) 882 __asm__ volatile ("replv.ph %0, %0" : "+r"(pattern)); 883 #else 884 pattern = 0x00010001u * pattern; 885 #endif 886 break; 887 case 4: 888 memcpy(&pattern, src, sizeof(uint32_t)); 889 break; 890 default: 891 goto Copy; 892 break; 893 } 894 CopySmallPattern8b(src, dst, length, pattern); 895 return; 896 } 897 Copy: 898 if (dist >= length) { // no overlap -> use memcpy() 899 memcpy(dst, src, length * sizeof(*dst)); 900 } else { 901 int i; 902 for (i = 0; i < length; ++i) dst[i] = src[i]; 903 } 904 } 905 906 // copy pattern of 1 or 2 uint32_t's 907 static WEBP_INLINE void CopySmallPattern32b(const uint32_t* src, 908 uint32_t* dst, 909 int length, uint64_t pattern) { 910 int i; 911 if ((uintptr_t)dst & 4) { // Align 'dst' to 8-bytes boundary. 912 *dst++ = *src++; 913 pattern = (pattern >> 32) | (pattern << 32); 914 --length; 915 } 916 assert(0 == ((uintptr_t)dst & 7)); 917 for (i = 0; i < (length >> 1); ++i) { 918 ((uint64_t*)dst)[i] = pattern; // Copy the pattern 8 bytes at a time. 919 } 920 if (length & 1) { // Finish with left-over. 921 dst[i << 1] = src[i << 1]; 922 } 923 } 924 925 static WEBP_INLINE void CopyBlock32b(uint32_t* const dst, 926 int dist, int length) { 927 const uint32_t* const src = dst - dist; 928 if (dist <= 2 && length >= 4 && ((uintptr_t)dst & 3) == 0) { 929 uint64_t pattern; 930 if (dist == 1) { 931 pattern = (uint64_t)src[0]; 932 pattern |= pattern << 32; 933 } else { 934 memcpy(&pattern, src, sizeof(pattern)); 935 } 936 CopySmallPattern32b(src, dst, length, pattern); 937 } else if (dist >= length) { // no overlap 938 memcpy(dst, src, length * sizeof(*dst)); 939 } else { 940 int i; 941 for (i = 0; i < length; ++i) dst[i] = src[i]; 942 } 943 } 944 945 //------------------------------------------------------------------------------ 946 947 static int DecodeAlphaData(VP8LDecoder* const dec, uint8_t* const data, 948 int width, int height, int last_row) { 949 int ok = 1; 950 int row = dec->last_pixel_ / width; 951 int col = dec->last_pixel_ % width; 952 VP8LBitReader* const br = &dec->br_; 953 VP8LMetadata* const hdr = &dec->hdr_; 954 int pos = dec->last_pixel_; // current position 955 const int end = width * height; // End of data 956 const int last = width * last_row; // Last pixel to decode 957 const int len_code_limit = NUM_LITERAL_CODES + NUM_LENGTH_CODES; 958 const int mask = hdr->huffman_mask_; 959 const HTreeGroup* htree_group = 960 (pos < last) ? GetHtreeGroupForPos(hdr, col, row) : NULL; 961 assert(pos <= end); 962 assert(last_row <= height); 963 assert(Is8bOptimizable(hdr)); 964 965 while (!br->eos_ && pos < last) { 966 int code; 967 // Only update when changing tile. 968 if ((col & mask) == 0) { 969 htree_group = GetHtreeGroupForPos(hdr, col, row); 970 } 971 assert(htree_group != NULL); 972 VP8LFillBitWindow(br); 973 code = ReadSymbol(htree_group->htrees[GREEN], br); 974 if (code < NUM_LITERAL_CODES) { // Literal 975 data[pos] = code; 976 ++pos; 977 ++col; 978 if (col >= width) { 979 col = 0; 980 ++row; 981 if (row <= last_row && (row % NUM_ARGB_CACHE_ROWS == 0)) { 982 ExtractPalettedAlphaRows(dec, row); 983 } 984 } 985 } else if (code < len_code_limit) { // Backward reference 986 int dist_code, dist; 987 const int length_sym = code - NUM_LITERAL_CODES; 988 const int length = GetCopyLength(length_sym, br); 989 const int dist_symbol = ReadSymbol(htree_group->htrees[DIST], br); 990 VP8LFillBitWindow(br); 991 dist_code = GetCopyDistance(dist_symbol, br); 992 dist = PlaneCodeToDistance(width, dist_code); 993 if (pos >= dist && end - pos >= length) { 994 CopyBlock8b(data + pos, dist, length); 995 } else { 996 ok = 0; 997 goto End; 998 } 999 pos += length; 1000 col += length; 1001 while (col >= width) { 1002 col -= width; 1003 ++row; 1004 if (row <= last_row && (row % NUM_ARGB_CACHE_ROWS == 0)) { 1005 ExtractPalettedAlphaRows(dec, row); 1006 } 1007 } 1008 if (pos < last && (col & mask)) { 1009 htree_group = GetHtreeGroupForPos(hdr, col, row); 1010 } 1011 } else { // Not reached 1012 ok = 0; 1013 goto End; 1014 } 1015 assert(br->eos_ == VP8LIsEndOfStream(br)); 1016 } 1017 // Process the remaining rows corresponding to last row-block. 1018 ExtractPalettedAlphaRows(dec, row > last_row ? last_row : row); 1019 1020 End: 1021 if (!ok || (br->eos_ && pos < end)) { 1022 ok = 0; 1023 dec->status_ = br->eos_ ? VP8_STATUS_SUSPENDED 1024 : VP8_STATUS_BITSTREAM_ERROR; 1025 } else { 1026 dec->last_pixel_ = pos; 1027 } 1028 return ok; 1029 } 1030 1031 static void SaveState(VP8LDecoder* const dec, int last_pixel) { 1032 assert(dec->incremental_); 1033 dec->saved_br_ = dec->br_; 1034 dec->saved_last_pixel_ = last_pixel; 1035 if (dec->hdr_.color_cache_size_ > 0) { 1036 VP8LColorCacheCopy(&dec->hdr_.color_cache_, &dec->hdr_.saved_color_cache_); 1037 } 1038 } 1039 1040 static void RestoreState(VP8LDecoder* const dec) { 1041 assert(dec->br_.eos_); 1042 dec->status_ = VP8_STATUS_SUSPENDED; 1043 dec->br_ = dec->saved_br_; 1044 dec->last_pixel_ = dec->saved_last_pixel_; 1045 if (dec->hdr_.color_cache_size_ > 0) { 1046 VP8LColorCacheCopy(&dec->hdr_.saved_color_cache_, &dec->hdr_.color_cache_); 1047 } 1048 } 1049 1050 #define SYNC_EVERY_N_ROWS 8 // minimum number of rows between check-points 1051 static int DecodeImageData(VP8LDecoder* const dec, uint32_t* const data, 1052 int width, int height, int last_row, 1053 ProcessRowsFunc process_func) { 1054 int row = dec->last_pixel_ / width; 1055 int col = dec->last_pixel_ % width; 1056 VP8LBitReader* const br = &dec->br_; 1057 VP8LMetadata* const hdr = &dec->hdr_; 1058 uint32_t* src = data + dec->last_pixel_; 1059 uint32_t* last_cached = src; 1060 uint32_t* const src_end = data + width * height; // End of data 1061 uint32_t* const src_last = data + width * last_row; // Last pixel to decode 1062 const int len_code_limit = NUM_LITERAL_CODES + NUM_LENGTH_CODES; 1063 const int color_cache_limit = len_code_limit + hdr->color_cache_size_; 1064 int next_sync_row = dec->incremental_ ? row : 1 << 24; 1065 VP8LColorCache* const color_cache = 1066 (hdr->color_cache_size_ > 0) ? &hdr->color_cache_ : NULL; 1067 const int mask = hdr->huffman_mask_; 1068 const HTreeGroup* htree_group = 1069 (src < src_last) ? GetHtreeGroupForPos(hdr, col, row) : NULL; 1070 assert(dec->last_row_ < last_row); 1071 assert(src_last <= src_end); 1072 1073 while (src < src_last) { 1074 int code; 1075 if (row >= next_sync_row) { 1076 SaveState(dec, (int)(src - data)); 1077 next_sync_row = row + SYNC_EVERY_N_ROWS; 1078 } 1079 // Only update when changing tile. Note we could use this test: 1080 // if "((((prev_col ^ col) | prev_row ^ row)) > mask)" -> tile changed 1081 // but that's actually slower and needs storing the previous col/row. 1082 if ((col & mask) == 0) { 1083 htree_group = GetHtreeGroupForPos(hdr, col, row); 1084 } 1085 assert(htree_group != NULL); 1086 if (htree_group->is_trivial_code) { 1087 *src = htree_group->literal_arb; 1088 goto AdvanceByOne; 1089 } 1090 VP8LFillBitWindow(br); 1091 if (htree_group->use_packed_table) { 1092 code = ReadPackedSymbols(htree_group, br, src); 1093 if (code == PACKED_NON_LITERAL_CODE) goto AdvanceByOne; 1094 } else { 1095 code = ReadSymbol(htree_group->htrees[GREEN], br); 1096 } 1097 if (br->eos_) break; // early out 1098 if (code < NUM_LITERAL_CODES) { // Literal 1099 if (htree_group->is_trivial_literal) { 1100 *src = htree_group->literal_arb | (code << 8); 1101 } else { 1102 int red, blue, alpha; 1103 red = ReadSymbol(htree_group->htrees[RED], br); 1104 VP8LFillBitWindow(br); 1105 blue = ReadSymbol(htree_group->htrees[BLUE], br); 1106 alpha = ReadSymbol(htree_group->htrees[ALPHA], br); 1107 if (br->eos_) break; 1108 *src = ((uint32_t)alpha << 24) | (red << 16) | (code << 8) | blue; 1109 } 1110 AdvanceByOne: 1111 ++src; 1112 ++col; 1113 if (col >= width) { 1114 col = 0; 1115 ++row; 1116 if (process_func != NULL) { 1117 if (row <= last_row && (row % NUM_ARGB_CACHE_ROWS == 0)) { 1118 process_func(dec, row); 1119 } 1120 } 1121 if (color_cache != NULL) { 1122 while (last_cached < src) { 1123 VP8LColorCacheInsert(color_cache, *last_cached++); 1124 } 1125 } 1126 } 1127 } else if (code < len_code_limit) { // Backward reference 1128 int dist_code, dist; 1129 const int length_sym = code - NUM_LITERAL_CODES; 1130 const int length = GetCopyLength(length_sym, br); 1131 const int dist_symbol = ReadSymbol(htree_group->htrees[DIST], br); 1132 VP8LFillBitWindow(br); 1133 dist_code = GetCopyDistance(dist_symbol, br); 1134 dist = PlaneCodeToDistance(width, dist_code); 1135 if (br->eos_) break; 1136 if (src - data < (ptrdiff_t)dist || src_end - src < (ptrdiff_t)length) { 1137 goto Error; 1138 } else { 1139 CopyBlock32b(src, dist, length); 1140 } 1141 src += length; 1142 col += length; 1143 while (col >= width) { 1144 col -= width; 1145 ++row; 1146 if (process_func != NULL) { 1147 if (row <= last_row && (row % NUM_ARGB_CACHE_ROWS == 0)) { 1148 process_func(dec, row); 1149 } 1150 } 1151 } 1152 // Because of the check done above (before 'src' was incremented by 1153 // 'length'), the following holds true. 1154 assert(src <= src_end); 1155 if (col & mask) htree_group = GetHtreeGroupForPos(hdr, col, row); 1156 if (color_cache != NULL) { 1157 while (last_cached < src) { 1158 VP8LColorCacheInsert(color_cache, *last_cached++); 1159 } 1160 } 1161 } else if (code < color_cache_limit) { // Color cache 1162 const int key = code - len_code_limit; 1163 assert(color_cache != NULL); 1164 while (last_cached < src) { 1165 VP8LColorCacheInsert(color_cache, *last_cached++); 1166 } 1167 *src = VP8LColorCacheLookup(color_cache, key); 1168 goto AdvanceByOne; 1169 } else { // Not reached 1170 goto Error; 1171 } 1172 assert(br->eos_ == VP8LIsEndOfStream(br)); 1173 } 1174 1175 if (dec->incremental_ && br->eos_ && src < src_end) { 1176 RestoreState(dec); 1177 } else if (!br->eos_) { 1178 // Process the remaining rows corresponding to last row-block. 1179 if (process_func != NULL) { 1180 process_func(dec, row > last_row ? last_row : row); 1181 } 1182 dec->status_ = VP8_STATUS_OK; 1183 dec->last_pixel_ = (int)(src - data); // end-of-scan marker 1184 } else { 1185 // if not incremental, and we are past the end of buffer (eos_=1), then this 1186 // is a real bitstream error. 1187 goto Error; 1188 } 1189 return 1; 1190 1191 Error: 1192 dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 1193 return 0; 1194 } 1195 1196 // ----------------------------------------------------------------------------- 1197 // VP8LTransform 1198 1199 static void ClearTransform(VP8LTransform* const transform) { 1200 WebPSafeFree(transform->data_); 1201 transform->data_ = NULL; 1202 } 1203 1204 // For security reason, we need to remap the color map to span 1205 // the total possible bundled values, and not just the num_colors. 1206 static int ExpandColorMap(int num_colors, VP8LTransform* const transform) { 1207 int i; 1208 const int final_num_colors = 1 << (8 >> transform->bits_); 1209 uint32_t* const new_color_map = 1210 (uint32_t*)WebPSafeMalloc((uint64_t)final_num_colors, 1211 sizeof(*new_color_map)); 1212 if (new_color_map == NULL) { 1213 return 0; 1214 } else { 1215 uint8_t* const data = (uint8_t*)transform->data_; 1216 uint8_t* const new_data = (uint8_t*)new_color_map; 1217 new_color_map[0] = transform->data_[0]; 1218 for (i = 4; i < 4 * num_colors; ++i) { 1219 // Equivalent to AddPixelEq(), on a byte-basis. 1220 new_data[i] = (data[i] + new_data[i - 4]) & 0xff; 1221 } 1222 for (; i < 4 * final_num_colors; ++i) { 1223 new_data[i] = 0; // black tail. 1224 } 1225 WebPSafeFree(transform->data_); 1226 transform->data_ = new_color_map; 1227 } 1228 return 1; 1229 } 1230 1231 static int ReadTransform(int* const xsize, int const* ysize, 1232 VP8LDecoder* const dec) { 1233 int ok = 1; 1234 VP8LBitReader* const br = &dec->br_; 1235 VP8LTransform* transform = &dec->transforms_[dec->next_transform_]; 1236 const VP8LImageTransformType type = 1237 (VP8LImageTransformType)VP8LReadBits(br, 2); 1238 1239 // Each transform type can only be present once in the stream. 1240 if (dec->transforms_seen_ & (1U << type)) { 1241 return 0; // Already there, let's not accept the second same transform. 1242 } 1243 dec->transforms_seen_ |= (1U << type); 1244 1245 transform->type_ = type; 1246 transform->xsize_ = *xsize; 1247 transform->ysize_ = *ysize; 1248 transform->data_ = NULL; 1249 ++dec->next_transform_; 1250 assert(dec->next_transform_ <= NUM_TRANSFORMS); 1251 1252 switch (type) { 1253 case PREDICTOR_TRANSFORM: 1254 case CROSS_COLOR_TRANSFORM: 1255 transform->bits_ = VP8LReadBits(br, 3) + 2; 1256 ok = DecodeImageStream(VP8LSubSampleSize(transform->xsize_, 1257 transform->bits_), 1258 VP8LSubSampleSize(transform->ysize_, 1259 transform->bits_), 1260 0, dec, &transform->data_); 1261 break; 1262 case COLOR_INDEXING_TRANSFORM: { 1263 const int num_colors = VP8LReadBits(br, 8) + 1; 1264 const int bits = (num_colors > 16) ? 0 1265 : (num_colors > 4) ? 1 1266 : (num_colors > 2) ? 2 1267 : 3; 1268 *xsize = VP8LSubSampleSize(transform->xsize_, bits); 1269 transform->bits_ = bits; 1270 ok = DecodeImageStream(num_colors, 1, 0, dec, &transform->data_); 1271 ok = ok && ExpandColorMap(num_colors, transform); 1272 break; 1273 } 1274 case SUBTRACT_GREEN: 1275 break; 1276 default: 1277 assert(0); // can't happen 1278 break; 1279 } 1280 1281 return ok; 1282 } 1283 1284 // ----------------------------------------------------------------------------- 1285 // VP8LMetadata 1286 1287 static void InitMetadata(VP8LMetadata* const hdr) { 1288 assert(hdr != NULL); 1289 memset(hdr, 0, sizeof(*hdr)); 1290 } 1291 1292 static void ClearMetadata(VP8LMetadata* const hdr) { 1293 assert(hdr != NULL); 1294 1295 WebPSafeFree(hdr->huffman_image_); 1296 WebPSafeFree(hdr->huffman_tables_); 1297 VP8LHtreeGroupsFree(hdr->htree_groups_); 1298 VP8LColorCacheClear(&hdr->color_cache_); 1299 VP8LColorCacheClear(&hdr->saved_color_cache_); 1300 InitMetadata(hdr); 1301 } 1302 1303 // ----------------------------------------------------------------------------- 1304 // VP8LDecoder 1305 1306 VP8LDecoder* VP8LNew(void) { 1307 VP8LDecoder* const dec = (VP8LDecoder*)WebPSafeCalloc(1ULL, sizeof(*dec)); 1308 if (dec == NULL) return NULL; 1309 dec->status_ = VP8_STATUS_OK; 1310 dec->state_ = READ_DIM; 1311 1312 VP8LDspInit(); // Init critical function pointers. 1313 1314 return dec; 1315 } 1316 1317 void VP8LClear(VP8LDecoder* const dec) { 1318 int i; 1319 if (dec == NULL) return; 1320 ClearMetadata(&dec->hdr_); 1321 1322 WebPSafeFree(dec->pixels_); 1323 dec->pixels_ = NULL; 1324 for (i = 0; i < dec->next_transform_; ++i) { 1325 ClearTransform(&dec->transforms_[i]); 1326 } 1327 dec->next_transform_ = 0; 1328 dec->transforms_seen_ = 0; 1329 1330 WebPSafeFree(dec->rescaler_memory); 1331 dec->rescaler_memory = NULL; 1332 1333 dec->output_ = NULL; // leave no trace behind 1334 } 1335 1336 void VP8LDelete(VP8LDecoder* const dec) { 1337 if (dec != NULL) { 1338 VP8LClear(dec); 1339 WebPSafeFree(dec); 1340 } 1341 } 1342 1343 static void UpdateDecoder(VP8LDecoder* const dec, int width, int height) { 1344 VP8LMetadata* const hdr = &dec->hdr_; 1345 const int num_bits = hdr->huffman_subsample_bits_; 1346 dec->width_ = width; 1347 dec->height_ = height; 1348 1349 hdr->huffman_xsize_ = VP8LSubSampleSize(width, num_bits); 1350 hdr->huffman_mask_ = (num_bits == 0) ? ~0 : (1 << num_bits) - 1; 1351 } 1352 1353 static int DecodeImageStream(int xsize, int ysize, 1354 int is_level0, 1355 VP8LDecoder* const dec, 1356 uint32_t** const decoded_data) { 1357 int ok = 1; 1358 int transform_xsize = xsize; 1359 int transform_ysize = ysize; 1360 VP8LBitReader* const br = &dec->br_; 1361 VP8LMetadata* const hdr = &dec->hdr_; 1362 uint32_t* data = NULL; 1363 int color_cache_bits = 0; 1364 1365 // Read the transforms (may recurse). 1366 if (is_level0) { 1367 while (ok && VP8LReadBits(br, 1)) { 1368 ok = ReadTransform(&transform_xsize, &transform_ysize, dec); 1369 } 1370 } 1371 1372 // Color cache 1373 if (ok && VP8LReadBits(br, 1)) { 1374 color_cache_bits = VP8LReadBits(br, 4); 1375 ok = (color_cache_bits >= 1 && color_cache_bits <= MAX_CACHE_BITS); 1376 if (!ok) { 1377 dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 1378 goto End; 1379 } 1380 } 1381 1382 // Read the Huffman codes (may recurse). 1383 ok = ok && ReadHuffmanCodes(dec, transform_xsize, transform_ysize, 1384 color_cache_bits, is_level0); 1385 if (!ok) { 1386 dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 1387 goto End; 1388 } 1389 1390 // Finish setting up the color-cache 1391 if (color_cache_bits > 0) { 1392 hdr->color_cache_size_ = 1 << color_cache_bits; 1393 if (!VP8LColorCacheInit(&hdr->color_cache_, color_cache_bits)) { 1394 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 1395 ok = 0; 1396 goto End; 1397 } 1398 } else { 1399 hdr->color_cache_size_ = 0; 1400 } 1401 UpdateDecoder(dec, transform_xsize, transform_ysize); 1402 1403 if (is_level0) { // level 0 complete 1404 dec->state_ = READ_HDR; 1405 goto End; 1406 } 1407 1408 { 1409 const uint64_t total_size = (uint64_t)transform_xsize * transform_ysize; 1410 data = (uint32_t*)WebPSafeMalloc(total_size, sizeof(*data)); 1411 if (data == NULL) { 1412 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 1413 ok = 0; 1414 goto End; 1415 } 1416 } 1417 1418 // Use the Huffman trees to decode the LZ77 encoded data. 1419 ok = DecodeImageData(dec, data, transform_xsize, transform_ysize, 1420 transform_ysize, NULL); 1421 ok = ok && !br->eos_; 1422 1423 End: 1424 if (!ok) { 1425 WebPSafeFree(data); 1426 ClearMetadata(hdr); 1427 } else { 1428 if (decoded_data != NULL) { 1429 *decoded_data = data; 1430 } else { 1431 // We allocate image data in this function only for transforms. At level 0 1432 // (that is: not the transforms), we shouldn't have allocated anything. 1433 assert(data == NULL); 1434 assert(is_level0); 1435 } 1436 dec->last_pixel_ = 0; // Reset for future DECODE_DATA_FUNC() calls. 1437 if (!is_level0) ClearMetadata(hdr); // Clean up temporary data behind. 1438 } 1439 return ok; 1440 } 1441 1442 //------------------------------------------------------------------------------ 1443 // Allocate internal buffers dec->pixels_ and dec->argb_cache_. 1444 static int AllocateInternalBuffers32b(VP8LDecoder* const dec, int final_width) { 1445 const uint64_t num_pixels = (uint64_t)dec->width_ * dec->height_; 1446 // Scratch buffer corresponding to top-prediction row for transforming the 1447 // first row in the row-blocks. Not needed for paletted alpha. 1448 const uint64_t cache_top_pixels = (uint16_t)final_width; 1449 // Scratch buffer for temporary BGRA storage. Not needed for paletted alpha. 1450 const uint64_t cache_pixels = (uint64_t)final_width * NUM_ARGB_CACHE_ROWS; 1451 const uint64_t total_num_pixels = 1452 num_pixels + cache_top_pixels + cache_pixels; 1453 1454 assert(dec->width_ <= final_width); 1455 dec->pixels_ = (uint32_t*)WebPSafeMalloc(total_num_pixels, sizeof(uint32_t)); 1456 if (dec->pixels_ == NULL) { 1457 dec->argb_cache_ = NULL; // for sanity check 1458 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 1459 return 0; 1460 } 1461 dec->argb_cache_ = dec->pixels_ + num_pixels + cache_top_pixels; 1462 return 1; 1463 } 1464 1465 static int AllocateInternalBuffers8b(VP8LDecoder* const dec) { 1466 const uint64_t total_num_pixels = (uint64_t)dec->width_ * dec->height_; 1467 dec->argb_cache_ = NULL; // for sanity check 1468 dec->pixels_ = (uint32_t*)WebPSafeMalloc(total_num_pixels, sizeof(uint8_t)); 1469 if (dec->pixels_ == NULL) { 1470 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 1471 return 0; 1472 } 1473 return 1; 1474 } 1475 1476 //------------------------------------------------------------------------------ 1477 1478 // Special row-processing that only stores the alpha data. 1479 static void ExtractAlphaRows(VP8LDecoder* const dec, int last_row) { 1480 int cur_row = dec->last_row_; 1481 int num_rows = last_row - cur_row; 1482 const uint32_t* in = dec->pixels_ + dec->width_ * cur_row; 1483 1484 assert(last_row <= dec->io_->crop_bottom); 1485 while (num_rows > 0) { 1486 const int num_rows_to_process = 1487 (num_rows > NUM_ARGB_CACHE_ROWS) ? NUM_ARGB_CACHE_ROWS : num_rows; 1488 // Extract alpha (which is stored in the green plane). 1489 ALPHDecoder* const alph_dec = (ALPHDecoder*)dec->io_->opaque; 1490 uint8_t* const output = alph_dec->output_; 1491 const int width = dec->io_->width; // the final width (!= dec->width_) 1492 const int cache_pixs = width * num_rows_to_process; 1493 uint8_t* const dst = output + width * cur_row; 1494 const uint32_t* const src = dec->argb_cache_; 1495 ApplyInverseTransforms(dec, num_rows_to_process, in); 1496 WebPExtractGreen(src, dst, cache_pixs); 1497 AlphaApplyFilter(alph_dec, 1498 cur_row, cur_row + num_rows_to_process, dst, width); 1499 num_rows -= num_rows_to_process; 1500 in += num_rows_to_process * dec->width_; 1501 cur_row += num_rows_to_process; 1502 } 1503 assert(cur_row == last_row); 1504 dec->last_row_ = dec->last_out_row_ = last_row; 1505 } 1506 1507 int VP8LDecodeAlphaHeader(ALPHDecoder* const alph_dec, 1508 const uint8_t* const data, size_t data_size) { 1509 int ok = 0; 1510 VP8LDecoder* dec = VP8LNew(); 1511 1512 if (dec == NULL) return 0; 1513 1514 assert(alph_dec != NULL); 1515 alph_dec->vp8l_dec_ = dec; 1516 1517 dec->width_ = alph_dec->width_; 1518 dec->height_ = alph_dec->height_; 1519 dec->io_ = &alph_dec->io_; 1520 dec->io_->opaque = alph_dec; 1521 dec->io_->width = alph_dec->width_; 1522 dec->io_->height = alph_dec->height_; 1523 1524 dec->status_ = VP8_STATUS_OK; 1525 VP8LInitBitReader(&dec->br_, data, data_size); 1526 1527 if (!DecodeImageStream(alph_dec->width_, alph_dec->height_, 1, dec, NULL)) { 1528 goto Err; 1529 } 1530 1531 // Special case: if alpha data uses only the color indexing transform and 1532 // doesn't use color cache (a frequent case), we will use DecodeAlphaData() 1533 // method that only needs allocation of 1 byte per pixel (alpha channel). 1534 if (dec->next_transform_ == 1 && 1535 dec->transforms_[0].type_ == COLOR_INDEXING_TRANSFORM && 1536 Is8bOptimizable(&dec->hdr_)) { 1537 alph_dec->use_8b_decode_ = 1; 1538 ok = AllocateInternalBuffers8b(dec); 1539 } else { 1540 // Allocate internal buffers (note that dec->width_ may have changed here). 1541 alph_dec->use_8b_decode_ = 0; 1542 ok = AllocateInternalBuffers32b(dec, alph_dec->width_); 1543 } 1544 1545 if (!ok) goto Err; 1546 1547 return 1; 1548 1549 Err: 1550 VP8LDelete(alph_dec->vp8l_dec_); 1551 alph_dec->vp8l_dec_ = NULL; 1552 return 0; 1553 } 1554 1555 int VP8LDecodeAlphaImageStream(ALPHDecoder* const alph_dec, int last_row) { 1556 VP8LDecoder* const dec = alph_dec->vp8l_dec_; 1557 assert(dec != NULL); 1558 assert(last_row <= dec->height_); 1559 1560 if (dec->last_row_ >= last_row) { 1561 return 1; // done 1562 } 1563 1564 if (!alph_dec->use_8b_decode_) WebPInitAlphaProcessing(); 1565 1566 // Decode (with special row processing). 1567 return alph_dec->use_8b_decode_ ? 1568 DecodeAlphaData(dec, (uint8_t*)dec->pixels_, dec->width_, dec->height_, 1569 last_row) : 1570 DecodeImageData(dec, dec->pixels_, dec->width_, dec->height_, 1571 last_row, ExtractAlphaRows); 1572 } 1573 1574 //------------------------------------------------------------------------------ 1575 1576 int VP8LDecodeHeader(VP8LDecoder* const dec, VP8Io* const io) { 1577 int width, height, has_alpha; 1578 1579 if (dec == NULL) return 0; 1580 if (io == NULL) { 1581 dec->status_ = VP8_STATUS_INVALID_PARAM; 1582 return 0; 1583 } 1584 1585 dec->io_ = io; 1586 dec->status_ = VP8_STATUS_OK; 1587 VP8LInitBitReader(&dec->br_, io->data, io->data_size); 1588 if (!ReadImageInfo(&dec->br_, &width, &height, &has_alpha)) { 1589 dec->status_ = VP8_STATUS_BITSTREAM_ERROR; 1590 goto Error; 1591 } 1592 dec->state_ = READ_DIM; 1593 io->width = width; 1594 io->height = height; 1595 1596 if (!DecodeImageStream(width, height, 1, dec, NULL)) goto Error; 1597 return 1; 1598 1599 Error: 1600 VP8LClear(dec); 1601 assert(dec->status_ != VP8_STATUS_OK); 1602 return 0; 1603 } 1604 1605 int VP8LDecodeImage(VP8LDecoder* const dec) { 1606 VP8Io* io = NULL; 1607 WebPDecParams* params = NULL; 1608 1609 // Sanity checks. 1610 if (dec == NULL) return 0; 1611 1612 assert(dec->hdr_.huffman_tables_ != NULL); 1613 assert(dec->hdr_.htree_groups_ != NULL); 1614 assert(dec->hdr_.num_htree_groups_ > 0); 1615 1616 io = dec->io_; 1617 assert(io != NULL); 1618 params = (WebPDecParams*)io->opaque; 1619 assert(params != NULL); 1620 1621 // Initialization. 1622 if (dec->state_ != READ_DATA) { 1623 dec->output_ = params->output; 1624 assert(dec->output_ != NULL); 1625 1626 if (!WebPIoInitFromOptions(params->options, io, MODE_BGRA)) { 1627 dec->status_ = VP8_STATUS_INVALID_PARAM; 1628 goto Err; 1629 } 1630 1631 if (!AllocateInternalBuffers32b(dec, io->width)) goto Err; 1632 1633 if (io->use_scaling && !AllocateAndInitRescaler(dec, io)) goto Err; 1634 1635 if (io->use_scaling || WebPIsPremultipliedMode(dec->output_->colorspace)) { 1636 // need the alpha-multiply functions for premultiplied output or rescaling 1637 WebPInitAlphaProcessing(); 1638 } 1639 if (!WebPIsRGBMode(dec->output_->colorspace)) { 1640 WebPInitConvertARGBToYUV(); 1641 if (dec->output_->u.YUVA.a != NULL) WebPInitAlphaProcessing(); 1642 } 1643 if (dec->incremental_) { 1644 if (dec->hdr_.color_cache_size_ > 0 && 1645 dec->hdr_.saved_color_cache_.colors_ == NULL) { 1646 if (!VP8LColorCacheInit(&dec->hdr_.saved_color_cache_, 1647 dec->hdr_.color_cache_.hash_bits_)) { 1648 dec->status_ = VP8_STATUS_OUT_OF_MEMORY; 1649 goto Err; 1650 } 1651 } 1652 } 1653 dec->state_ = READ_DATA; 1654 } 1655 1656 // Decode. 1657 if (!DecodeImageData(dec, dec->pixels_, dec->width_, dec->height_, 1658 io->crop_bottom, ProcessRows)) { 1659 goto Err; 1660 } 1661 1662 params->last_y = dec->last_out_row_; 1663 return 1; 1664 1665 Err: 1666 VP8LClear(dec); 1667 assert(dec->status_ != VP8_STATUS_OK); 1668 return 0; 1669 } 1670 1671 //------------------------------------------------------------------------------ 1672