Home | History | Annotate | Download | only in zopfli
      1 /*
      2 Copyright 2011 Google Inc. All Rights Reserved.
      3 
      4 Licensed under the Apache License, Version 2.0 (the "License");
      5 you may not use this file except in compliance with the License.
      6 You may obtain a copy of the License at
      7 
      8     http://www.apache.org/licenses/LICENSE-2.0
      9 
     10 Unless required by applicable law or agreed to in writing, software
     11 distributed under the License is distributed on an "AS IS" BASIS,
     12 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     13 See the License for the specific language governing permissions and
     14 limitations under the License.
     15 
     16 Author: lode.vandevenne (at) gmail.com (Lode Vandevenne)
     17 Author: jyrki.alakuijala (at) gmail.com (Jyrki Alakuijala)
     18 */
     19 
     20 /*
     21 Several utilities, including: #defines to try different compression results,
     22 basic deflate specification values and generic program options.
     23 */
     24 
     25 #ifndef ZOPFLI_UTIL_H_
     26 #define ZOPFLI_UTIL_H_
     27 
     28 #include <string.h>
     29 #include <stdlib.h>
     30 
     31 /* Maximum and minimum match length that can be encoded in deflate. */
     32 #define ZOPFLI_MAX_MATCH 258
     33 #define ZOPFLI_MIN_MATCH 3
     34 
     35 /*
     36 The window size for deflate. Must be a power of two, because
     37 ZOPFLI_WINDOW_MASK is derived from it. This should be 32768, the maximum
     38 possible by the deflate spec. Anything less hurts compression more than it helps speed.
     39 */
     40 #define ZOPFLI_WINDOW_SIZE 32768
     41 
     42 /*
     43 The bit mask used to wrap indices into the window. ANDing with (size - 1) only
     44 equals "modulo size" for a power of two, which is why the window size must be one.
     45 */
     46 #define ZOPFLI_WINDOW_MASK (ZOPFLI_WINDOW_SIZE - 1)
     47 
     48 /*
     49 Size in bytes of the huge, non-smart "master blocks" the input is divided into,
     50 to allow operating on huge files without exceeding memory, such as the 1GB wiki9
     51 corpus. The whole compression algorithm, including the smarter block splitting,
     52 will be executed independently on each huge block.
     53 Dividing into huge blocks hurts compression, but not much relative to the size.
     54 Set this to, for example, 20MB (20000000). Set it to 0 to disable master blocks.
     55 */
     56 #define ZOPFLI_MASTER_BLOCK_SIZE 20000000
     57 
     58 /*
     59 A very large floating point value (a double constant), used e.g. to initialize costs.
     60 */
     61 #define ZOPFLI_LARGE_FLOAT 1e30
     62 
     63 /*
     64 Setting for the longest match cache. Maximum 256. The cache uses huge amounts of
     65 memory but makes it faster: it uses this many times three bytes per single byte
     66 of the input data. This is so because longest match finding has to find the
     67 exact distance that belongs to each length for the best lz77 strategy.
     68 Good values: e.g. 5, 8.
     69 */
     70 #define ZOPFLI_CACHE_LENGTH 8
     71 
     72 /*
     73 Limits the max hash chain hits for a given hash value. This has an effect only
     74 on files where the hash value is the same very often. On these files, this
     75 gives worse compression (the value should ideally be 32768, which is the
     76 ZOPFLI_WINDOW_SIZE, while zlib uses 4096 even for best level), but makes it
     77 faster on some specific files.
     78 Good value: e.g. 8192.
     79 */
     80 #define ZOPFLI_MAX_CHAIN_HITS 8192
     81 
     82 /*
     83 Define this to use the longest match cache for ZopfliFindLongestMatch. This
     84 cache consumes a lot of memory but speeds it up. No effect on compression size.
     85 */
     86 #define ZOPFLI_LONGEST_MATCH_CACHE
     87 
     88 /*
     89 Enable to remember the amount of successive identical bytes in the hash chain
     90 for finding the longest match.
     91 Required for ZOPFLI_HASH_SAME_HASH and ZOPFLI_SHORTCUT_LONG_REPETITIONS.
     92 This has no effect on the compression result, and enabling it increases speed.
     93 */
     94 #define ZOPFLI_HASH_SAME
     95 
     96 /*
     97 Switch to a faster hash based on the info from ZOPFLI_HASH_SAME (which must
     98 also be enabled) once the best length so far is long enough. This is much
     99 faster for files with lots of identical bytes, on which the compressor is
    100 otherwise too slow. Regular files are unaffected or maybe a tiny bit slower.
    101 This has no effect on the compression result, only on speed.
    102 */
    103 #define ZOPFLI_HASH_SAME_HASH
    104 
    105 /*
    106 Enable this to avoid slowness for files in which the same character is
    107 repeated more than a multiple of ZOPFLI_MAX_MATCH times. Requires
    108 ZOPFLI_HASH_SAME. This should not affect the compression result.
    109 */
    110 #define ZOPFLI_SHORTCUT_LONG_REPETITIONS
    111 
    112 /*
    113 Whether to use lazy matching in the greedy LZ77 implementation. This gives a
    114 better result from ZopfliLZ77Greedy, but the effect this has on the optimal
    115 LZ77 varies from file to file.
    116 */
    117 #define ZOPFLI_LAZY_MATCHING
    118 
    119 /*
    120 Gets the length symbol for the given length l, cfr. the DEFLATE spec.
    121 Returns the symbol in the range [257-285] (inclusive).
    122 */
    123 int ZopfliGetLengthSymbol(int l);
    124 
    125 /* Gets the number of extra bits for the given length l, cfr. the DEFLATE spec. */
    126 int ZopfliGetLengthExtraBits(int l);
    127 
    128 /* Gets the value of the extra bits for the given length l, cfr. the DEFLATE spec. */
    129 int ZopfliGetLengthExtraBitsValue(int l);
    130 
    131 /* Gets the distance symbol for the given dist, cfr. the DEFLATE spec. */
    132 int ZopfliGetDistSymbol(int dist);
    133 
    134 /* Gets the number of extra bits for the given dist, cfr. the DEFLATE spec. */
    135 int ZopfliGetDistExtraBits(int dist);
    136 
    137 /* Gets the value of the extra bits for the given dist, cfr. the DEFLATE spec. */
    138 int ZopfliGetDistExtraBitsValue(int dist);
    139 
    140 /*
    141 Appends value to dynamically allocated memory, doubling its allocation size
    142 whenever needed.
    143 
    144 value: the value to append, type T
    145 data: pointer to the dynamic array to append to, type T**
    146 size: pointer to the size of the array to append to, type size_t*. This is the
    147 size that you consider the array to be, not the internal allocation size.
    148 Precondition: allocated size of data is at least a power of two greater than or
    149 equal than *size.
    150 */
    151 #ifdef __cplusplus /* C++ cannot assign void* from malloc to *data */
    152 #define ZOPFLI_APPEND_DATA(/* T */ value, /* T** */ data, /* size_t* */ size) {\
    153   if (!((*size) & ((*size) - 1))) {\
    154     /*double alloc size if it's a power of two*/\
    155     void** data_void = reinterpret_cast<void**>(data);\
    156     *data_void = (*size) == 0 ? malloc(sizeof(**data))\
    157                               : realloc((*data), (*size) * 2 * sizeof(**data));\
    158   }\
    159   (*data)[(*size)] = (value);\
    160   (*size)++;\
    161 }
    162 #else /* C gives problems with strict-aliasing rules for (void**) cast */
    163 #define ZOPFLI_APPEND_DATA(/* T */ value, /* T** */ data, /* size_t* */ size) {\
    164   if (!((*size) & ((*size) - 1))) {\
    165     /*double alloc size if it's a power of two*/\
    166     (*data) = (*size) == 0 ? malloc(sizeof(**data))\
    167                            : realloc((*data), (*size) * 2 * sizeof(**data));\
    168   }\
    169   (*data)[(*size)] = (value);\
    170   (*size)++;\
    171 }
    172 #endif
    173 
    174 
    175 #endif  /* ZOPFLI_UTIL_H_ */
    176