Home | History | Annotate | Download | only in google
      1 // Copyright 2008 Google Inc.
      2 // Author: Lincoln Smith
      3 //
      4 // Licensed under the Apache License, Version 2.0 (the "License");
      5 // you may not use this file except in compliance with the License.
      6 // You may obtain a copy of the License at
      7 //
      8 //      http://www.apache.org/licenses/LICENSE-2.0
      9 //
     10 // Unless required by applicable law or agreed to in writing, software
     11 // distributed under the License is distributed on an "AS IS" BASIS,
     12 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
     13 // See the License for the specific language governing permissions and
     14 // limitations under the License.
     15 
     16 #ifndef OPEN_VCDIFF_VCDECODER_H_
     17 #define OPEN_VCDIFF_VCDECODER_H_
     18 
     19 #include <stddef.h>  // size_t
     20 #include <string>
     21 #include "google/output_string.h"
     22 
     23 namespace open_vcdiff {
     24 
     25 class VCDiffStreamingDecoderImpl;
     26 
     27 // A streaming decoder class.  Takes a dictionary (source) file and a delta
     28 // file, and produces the original target file.  It is intended to process
     29 // the partial contents of the delta file as they arrive, in "chunks".
     30 // As soon as a chunk of bytes is received from a file read or from a network
     31 // transmission, it can be passed to DecodeChunk(), which will then output
     32 // as much of the target file as it can.
     33 //
     34 // The client should use this class as follows:
     35 //    VCDiffStreamingDecoder v;
     36 //    v.StartDecoding(dictionary_ptr, dictionary_size);
     37 //    while (any data left) {
     38 //      if (!v.DecodeChunk(data, len, &output_string)) {
     39 //        handle error;
     40 //        break;
     41 //      }
     42 //      process(output_string);  // might have no new data, though
     43 //    }
     44 //    if (!v.FinishDecoding()) { ... handle error ... }
     45 //
     46 // I.e., the allowed pattern of calls is
     47 //    StartDecoding DecodeChunk* FinishDecoding
     48 //
     49 // NOTE: It is not necessary to call FinishDecoding if DecodeChunk
     50 //       returns false.  When DecodeChunk returns false to signal an
     51 //       error, it resets its state and is ready for a new StartDecoding.
     52 //       If FinishDecoding is called, it will also return false.
     53 //
     54 class VCDiffStreamingDecoder {
     55  public:
     56   VCDiffStreamingDecoder();
     57   ~VCDiffStreamingDecoder();
     58 
     59   // Resets the dictionary contents to "dictionary_ptr[0,dictionary_size-1]"
     60   // and sets up the data structures for decoding.  Note that the dictionary
     61   // contents are not copied, and the client is responsible for ensuring that
     62   // dictionary_ptr is valid until FinishDecoding is called.
     63   //
     64   void StartDecoding(const char* dictionary_ptr, size_t dictionary_size);
     65 
     66   // Accepts "data[0,len-1]" as additional data received in the
     67   // compressed stream.  If any chunks of data can be fully decoded,
     68   // they are appended to output_string.
     69   //
     70   // Returns true on success, and false if the data was malformed
     71   // or if there was an error in decoding it (e.g. out of memory, etc.).
     72   //
     73   // Note: we *append*, so the old contents of output_string stick around.
     74   // This convention differs from the non-streaming Encode/Decode
     75   // interfaces in VCDiffDecoder.
     76   //
     77   // output_string is guaranteed to be resized no more than once for each
     78   // window in the VCDIFF delta file.  This rule is irrespective
     79   // of the number of calls to DecodeChunk().
     80   //
     81   template<class OutputType>
     82   bool DecodeChunk(const char* data, size_t len, OutputType* output) {
     83     OutputString<OutputType> output_string(output);
     84     return DecodeChunkToInterface(data, len, &output_string);
     85   }
     86 
     87   bool DecodeChunkToInterface(const char* data, size_t len,
     88                               OutputStringInterface* output_string);
     89 
     90   // Finishes decoding after all data has been received.  Returns true
     91   // if decoding of the entire stream was successful.  FinishDecoding()
     92   // must be called for the current target before StartDecoding() can be
     93   // called for a different target.
     94   //
     95   bool FinishDecoding();
     96 
     97   // *** Adjustable parameters ***
     98 
     99   // Specifies the maximum allowable target file size.  If the decoder
    100   // encounters a delta file that would cause it to create a target file larger
    101   // than this limit, it will log an error and stop decoding.  If the decoder is
    102   // applied to delta files whose sizes vary greatly and whose contents can be
    103   // trusted, then a value larger than the the default value (64 MB) can be
    104   // specified to allow for maximum flexibility.  On the other hand, if the
    105   // input data is known never to exceed a particular size, and/or the input
    106   // data may be maliciously constructed, a lower value can be supplied in order
    107   // to guard against running out of memory or swapping to disk while decoding
    108   // an extremely large target file.  The argument must be between 0 and
    109   // INT32_MAX (2G); if it is within these bounds, the function will set the
    110   // limit and return true.  Otherwise, the function will return false and will
    111   // not change the limit.  Setting the limit to 0 will cause all decode
    112   // operations of non-empty target files to fail.
    113   bool SetMaximumTargetFileSize(size_t new_maximum_target_file_size);
    114 
    115   // Specifies the maximum allowable target *window* size.  (A target file is
    116   // composed of zero or more target windows.)  If the decoder encounters a
    117   // delta window that would cause it to create a target window larger
    118   // than this limit, it will log an error and stop decoding.
    119   bool SetMaximumTargetWindowSize(size_t new_maximum_target_window_size);
    120 
    121   // This interface must be called before StartDecoding().  If its argument
    122   // is true, then the VCD_TARGET flag can be specified to allow the source
    123   // segment to be chosen from the previously-decoded target data.  (This is the
    124   // default behavior.)  If it is false, then specifying the VCD_TARGET flag is
    125   // considered an error, and the decoder does not need to keep in memory any
    126   // decoded target data prior to the current window.
    127   void SetAllowVcdTarget(bool allow_vcd_target);
    128 
    129  private:
    130   VCDiffStreamingDecoderImpl* const impl_;
    131 
    132   // Make the copy constructor and assignment operator private
    133   // so that they don't inadvertently get used.
    134   explicit VCDiffStreamingDecoder(const VCDiffStreamingDecoder&);
    135   void operator=(const VCDiffStreamingDecoder&);
    136 };
    137 
    138 // A simpler (non-streaming) interface to the VCDIFF decoder that can be used
    139 // if the entire delta file is available.
    140 //
    141 class VCDiffDecoder {
    142  public:
    143   typedef std::string string;
    144 
    145   VCDiffDecoder() { }
    146   ~VCDiffDecoder() { }
    147 
    148   /***** Simple interface *****/
    149 
    150   // Replaces old contents of "*target" with the result of decoding
    151   // the bytes found in "encoding."
    152   //
    153   // Returns true if "encoding" was a well-formed sequence of
    154   // instructions, and returns false if not.
    155   //
    156   template<class OutputType>
    157   bool Decode(const char* dictionary_ptr,
    158               size_t dictionary_size,
    159               const string& encoding,
    160               OutputType* target) {
    161     OutputString<OutputType> output_string(target);
    162     return DecodeToInterface(dictionary_ptr,
    163                              dictionary_size,
    164                              encoding,
    165                              &output_string);
    166   }
    167 
    168  private:
    169   bool DecodeToInterface(const char* dictionary_ptr,
    170                          size_t dictionary_size,
    171                          const string& encoding,
    172                          OutputStringInterface* target);
    173 
    174   VCDiffStreamingDecoder decoder_;
    175 
    176   // Make the copy constructor and assignment operator private
    177   // so that they don't inadvertently get used.
    178   explicit VCDiffDecoder(const VCDiffDecoder&);
    179   void operator=(const VCDiffDecoder&);
    180 };
    181 
    182 };  // namespace open_vcdiff
    183 
    184 #endif  // OPEN_VCDIFF_VCDECODER_H_
    185