// Copyright 2008 Google Inc.
// Author: Lincoln Smith
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//      http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
15 
16 #ifndef OPEN_VCDIFF_VCDECODER_H_
17 #define OPEN_VCDIFF_VCDECODER_H_
18 
19 #include <stddef.h>  // size_t
20 #include <string>
21 #include "google/output_string.h"
22 
23 namespace open_vcdiff {
24 
// Forward declaration of the decoder implementation class.  Its definition
// is not visible in this header; VCDiffStreamingDecoder only stores a
// pointer to it, so an incomplete type is sufficient here.
class VCDiffStreamingDecoderImpl;
26 
27 // A streaming decoder class.  Takes a dictionary (source) file and a delta
28 // file, and produces the original target file.  It is intended to process
29 // the partial contents of the delta file as they arrive, in "chunks".
30 // As soon as a chunk of bytes is received from a file read or from a network
31 // transmission, it can be passed to DecodeChunk(), which will then output
32 // as much of the target file as it can.
33 //
34 // The client should use this class as follows:
35 //    VCDiffStreamingDecoder v;
36 //    v.StartDecoding(dictionary_ptr, dictionary_size);
37 //    while (any data left) {
38 //      if (!v.DecodeChunk(data, len, &output_string)) {
39 //        handle error;
40 //        break;
41 //      }
42 //      process(output_string);  // might have no new data, though
43 //    }
44 //    if (!v.FinishDecoding()) { ... handle error ... }
45 //
46 // I.e., the allowed pattern of calls is
47 //    StartDecoding DecodeChunk* FinishDecoding
48 //
49 // NOTE: It is not necessary to call FinishDecoding if DecodeChunk
50 //       returns false.  When DecodeChunk returns false to signal an
51 //       error, it resets its state and is ready for a new StartDecoding.
52 //       If FinishDecoding is called, it will also return false.
53 //
54 class VCDiffStreamingDecoder {
55  public:
56   VCDiffStreamingDecoder();
57   ~VCDiffStreamingDecoder();
58 
59   // Resets the dictionary contents to "dictionary_ptr[0,dictionary_size-1]"
60   // and sets up the data structures for decoding.  Note that the dictionary
61   // contents are not copied, and the client is responsible for ensuring that
62   // dictionary_ptr is valid until FinishDecoding is called.
63   //
64   void StartDecoding(const char* dictionary_ptr, size_t dictionary_size);
65 
66   // Accepts "data[0,len-1]" as additional data received in the
67   // compressed stream.  If any chunks of data can be fully decoded,
68   // they are appended to output_string.
69   //
70   // Returns true on success, and false if the data was malformed
71   // or if there was an error in decoding it (e.g. out of memory, etc.).
72   //
73   // Note: we *append*, so the old contents of output_string stick around.
74   // This convention differs from the non-streaming Encode/Decode
75   // interfaces in VCDiffDecoder.
76   //
77   // output_string is guaranteed to be resized no more than once for each
78   // window in the VCDIFF delta file.  This rule is irrespective
79   // of the number of calls to DecodeChunk().
80   //
81   template<class OutputType>
DecodeChunk(const char * data,size_t len,OutputType * output)82   bool DecodeChunk(const char* data, size_t len, OutputType* output) {
83     OutputString<OutputType> output_string(output);
84     return DecodeChunkToInterface(data, len, &output_string);
85   }
86 
87   bool DecodeChunkToInterface(const char* data, size_t len,
88                               OutputStringInterface* output_string);
89 
90   // Finishes decoding after all data has been received.  Returns true
91   // if decoding of the entire stream was successful.  FinishDecoding()
92   // must be called for the current target before StartDecoding() can be
93   // called for a different target.
94   //
95   bool FinishDecoding();
96 
97   // *** Adjustable parameters ***
98 
99   // Specifies the maximum allowable target file size.  If the decoder
100   // encounters a delta file that would cause it to create a target file larger
101   // than this limit, it will log an error and stop decoding.  If the decoder is
102   // applied to delta files whose sizes vary greatly and whose contents can be
103   // trusted, then a value larger than the the default value (64 MB) can be
104   // specified to allow for maximum flexibility.  On the other hand, if the
105   // input data is known never to exceed a particular size, and/or the input
106   // data may be maliciously constructed, a lower value can be supplied in order
107   // to guard against running out of memory or swapping to disk while decoding
108   // an extremely large target file.  The argument must be between 0 and
109   // INT32_MAX (2G); if it is within these bounds, the function will set the
110   // limit and return true.  Otherwise, the function will return false and will
111   // not change the limit.  Setting the limit to 0 will cause all decode
112   // operations of non-empty target files to fail.
113   bool SetMaximumTargetFileSize(size_t new_maximum_target_file_size);
114 
115   // Specifies the maximum allowable target *window* size.  (A target file is
116   // composed of zero or more target windows.)  If the decoder encounters a
117   // delta window that would cause it to create a target window larger
118   // than this limit, it will log an error and stop decoding.
119   bool SetMaximumTargetWindowSize(size_t new_maximum_target_window_size);
120 
121   // This interface must be called before StartDecoding().  If its argument
122   // is true, then the VCD_TARGET flag can be specified to allow the source
123   // segment to be chosen from the previously-decoded target data.  (This is the
124   // default behavior.)  If it is false, then specifying the VCD_TARGET flag is
125   // considered an error, and the decoder does not need to keep in memory any
126   // decoded target data prior to the current window.
127   void SetAllowVcdTarget(bool allow_vcd_target);
128 
129  private:
130   VCDiffStreamingDecoderImpl* const impl_;
131 
132   // Make the copy constructor and assignment operator private
133   // so that they don't inadvertently get used.
134   explicit VCDiffStreamingDecoder(const VCDiffStreamingDecoder&);
135   void operator=(const VCDiffStreamingDecoder&);
136 };
137 
138 // A simpler (non-streaming) interface to the VCDIFF decoder that can be used
139 // if the entire delta file is available.
140 //
141 class VCDiffDecoder {
142  public:
143   typedef std::string string;
144 
VCDiffDecoder()145   VCDiffDecoder() { }
~VCDiffDecoder()146   ~VCDiffDecoder() { }
147 
148   /***** Simple interface *****/
149 
150   // Replaces old contents of "*target" with the result of decoding
151   // the bytes found in "encoding."
152   //
153   // Returns true if "encoding" was a well-formed sequence of
154   // instructions, and returns false if not.
155   //
156   template<class OutputType>
Decode(const char * dictionary_ptr,size_t dictionary_size,const string & encoding,OutputType * target)157   bool Decode(const char* dictionary_ptr,
158               size_t dictionary_size,
159               const string& encoding,
160               OutputType* target) {
161     OutputString<OutputType> output_string(target);
162     return DecodeToInterface(dictionary_ptr,
163                              dictionary_size,
164                              encoding,
165                              &output_string);
166   }
167 
168  private:
169   bool DecodeToInterface(const char* dictionary_ptr,
170                          size_t dictionary_size,
171                          const string& encoding,
172                          OutputStringInterface* target);
173 
174   VCDiffStreamingDecoder decoder_;
175 
176   // Make the copy constructor and assignment operator private
177   // so that they don't inadvertently get used.
178   explicit VCDiffDecoder(const VCDiffDecoder&);
179   void operator=(const VCDiffDecoder&);
180 };
181 
182 };  // namespace open_vcdiff
183 
184 #endif  // OPEN_VCDIFF_VCDECODER_H_
185