| // Copyright 2008 Google Inc. |
| // Author: Lincoln Smith |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #ifndef OPEN_VCDIFF_VCDECODER_H_ |
| #define OPEN_VCDIFF_VCDECODER_H_ |
| |
| #include <stddef.h> // size_t |
| #include <string> |
| #include "google/output_string.h" |
| |
| namespace open_vcdiff { |
| |
| class VCDiffStreamingDecoderImpl; |
| |
| // A streaming decoder class. Takes a dictionary (source) file and a delta |
| // file, and produces the original target file. It is intended to process |
| // the partial contents of the delta file as they arrive, in "chunks". |
| // As soon as a chunk of bytes is received from a file read or from a network |
| // transmission, it can be passed to DecodeChunk(), which will then output |
| // as much of the target file as it can. |
| // |
| // The client should use this class as follows: |
| // VCDiffStreamingDecoder v; |
| // v.StartDecoding(dictionary_ptr, dictionary_size); |
| // while (any data left) { |
| // if (!v.DecodeChunk(data, len, &output_string)) { |
| // handle error; |
| // break; |
| // } |
| // process(output_string); // might have no new data, though |
| // } |
| // if (!v.FinishDecoding()) { ... handle error ... } |
| // |
| // I.e., the allowed pattern of calls is |
| // StartDecoding DecodeChunk* FinishDecoding |
| // |
| // NOTE: It is not necessary to call FinishDecoding if DecodeChunk |
| // returns false. When DecodeChunk returns false to signal an |
| // error, it resets its state and is ready for a new StartDecoding. |
| // If FinishDecoding is called, it will also return false. |
| // |
| class VCDiffStreamingDecoder { |
| public: |
| VCDiffStreamingDecoder(); |
| ~VCDiffStreamingDecoder(); |
| |
| // Resets the dictionary contents to "dictionary_ptr[0,dictionary_size-1]" |
| // and sets up the data structures for decoding. Note that the dictionary |
| // contents are not copied, and the client is responsible for ensuring that |
| // dictionary_ptr is valid until FinishDecoding is called. |
| // |
| void StartDecoding(const char* dictionary_ptr, size_t dictionary_size); |
| |
| // Accepts "data[0,len-1]" as additional data received in the |
| // compressed stream. If any chunks of data can be fully decoded, |
| // they are appended to output_string. |
| // |
| // Returns true on success, and false if the data was malformed |
| // or if there was an error in decoding it (e.g. out of memory, etc.). |
| // |
| // Note: we *append*, so the old contents of output_string stick around. |
| // This convention differs from the non-streaming Encode/Decode |
| // interfaces in VCDiffDecoder. |
| // |
| // output_string is guaranteed to be resized no more than once for each |
| // window in the VCDIFF delta file. This rule is irrespective |
| // of the number of calls to DecodeChunk(). |
| // |
| template<class OutputType> |
| bool DecodeChunk(const char* data, size_t len, OutputType* output) { |
| OutputString<OutputType> output_string(output); |
| return DecodeChunkToInterface(data, len, &output_string); |
| } |
| |
| bool DecodeChunkToInterface(const char* data, size_t len, |
| OutputStringInterface* output_string); |
| |
| // Finishes decoding after all data has been received. Returns true |
| // if decoding of the entire stream was successful. FinishDecoding() |
| // must be called for the current target before StartDecoding() can be |
| // called for a different target. |
| // |
| bool FinishDecoding(); |
| |
| // *** Adjustable parameters *** |
| |
| // Specifies the maximum allowable target file size. If the decoder |
| // encounters a delta file that would cause it to create a target file larger |
| // than this limit, it will log an error and stop decoding. If the decoder is |
| // applied to delta files whose sizes vary greatly and whose contents can be |
| // trusted, then a value larger than the the default value (64 MB) can be |
| // specified to allow for maximum flexibility. On the other hand, if the |
| // input data is known never to exceed a particular size, and/or the input |
| // data may be maliciously constructed, a lower value can be supplied in order |
| // to guard against running out of memory or swapping to disk while decoding |
| // an extremely large target file. The argument must be between 0 and |
| // INT32_MAX (2G); if it is within these bounds, the function will set the |
| // limit and return true. Otherwise, the function will return false and will |
| // not change the limit. Setting the limit to 0 will cause all decode |
| // operations of non-empty target files to fail. |
| bool SetMaximumTargetFileSize(size_t new_maximum_target_file_size); |
| |
| // Specifies the maximum allowable target *window* size. (A target file is |
| // composed of zero or more target windows.) If the decoder encounters a |
| // delta window that would cause it to create a target window larger |
| // than this limit, it will log an error and stop decoding. |
| bool SetMaximumTargetWindowSize(size_t new_maximum_target_window_size); |
| |
| // This interface must be called before StartDecoding(). If its argument |
| // is true, then the VCD_TARGET flag can be specified to allow the source |
| // segment to be chosen from the previously-decoded target data. (This is the |
| // default behavior.) If it is false, then specifying the VCD_TARGET flag is |
| // considered an error, and the decoder does not need to keep in memory any |
| // decoded target data prior to the current window. |
| void SetAllowVcdTarget(bool allow_vcd_target); |
| |
| private: |
| VCDiffStreamingDecoderImpl* const impl_; |
| |
| // Make the copy constructor and assignment operator private |
| // so that they don't inadvertently get used. |
| explicit VCDiffStreamingDecoder(const VCDiffStreamingDecoder&); |
| void operator=(const VCDiffStreamingDecoder&); |
| }; |
| |
| // A simpler (non-streaming) interface to the VCDIFF decoder that can be used |
| // if the entire delta file is available. |
| // |
| class VCDiffDecoder { |
| public: |
| typedef std::string string; |
| |
| VCDiffDecoder() { } |
| ~VCDiffDecoder() { } |
| |
| /***** Simple interface *****/ |
| |
| // Replaces old contents of "*target" with the result of decoding |
| // the bytes found in "encoding." |
| // |
| // Returns true if "encoding" was a well-formed sequence of |
| // instructions, and returns false if not. |
| // |
| template<class OutputType> |
| bool Decode(const char* dictionary_ptr, |
| size_t dictionary_size, |
| const string& encoding, |
| OutputType* target) { |
| OutputString<OutputType> output_string(target); |
| return DecodeToInterface(dictionary_ptr, |
| dictionary_size, |
| encoding, |
| &output_string); |
| } |
| |
| private: |
| bool DecodeToInterface(const char* dictionary_ptr, |
| size_t dictionary_size, |
| const string& encoding, |
| OutputStringInterface* target); |
| |
| VCDiffStreamingDecoder decoder_; |
| |
| // Make the copy constructor and assignment operator private |
| // so that they don't inadvertently get used. |
| explicit VCDiffDecoder(const VCDiffDecoder&); |
| void operator=(const VCDiffDecoder&); |
| }; |
| |
| }; // namespace open_vcdiff |
| |
| #endif // OPEN_VCDIFF_VCDECODER_H_ |