diff options
Diffstat (limited to 'src/google/vcdecoder.h')
-rw-r--r-- | src/google/vcdecoder.h | 184 |
1 files changed, 184 insertions, 0 deletions
diff --git a/src/google/vcdecoder.h b/src/google/vcdecoder.h new file mode 100644 index 0000000..3b3b9ec --- /dev/null +++ b/src/google/vcdecoder.h @@ -0,0 +1,184 @@ +// Copyright 2008 Google Inc. +// Author: Lincoln Smith +// +// Licensed under the Apache License, Version 2.0 (the "License"); +// you may not use this file except in compliance with the License. +// You may obtain a copy of the License at +// +// http://www.apache.org/licenses/LICENSE-2.0 +// +// Unless required by applicable law or agreed to in writing, software +// distributed under the License is distributed on an "AS IS" BASIS, +// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +// See the License for the specific language governing permissions and +// limitations under the License. + +#ifndef OPEN_VCDIFF_VCDECODER_H_ +#define OPEN_VCDIFF_VCDECODER_H_ + +#include <stddef.h> // size_t +#include <string> +#include "google/output_string.h" + +namespace open_vcdiff { + +class VCDiffStreamingDecoderImpl; + +// A streaming decoder class. Takes a dictionary (source) file and a delta +// file, and produces the original target file. It is intended to process +// the partial contents of the delta file as they arrive, in "chunks". +// As soon as a chunk of bytes is received from a file read or from a network +// transmission, it can be passed to DecodeChunk(), which will then output +// as much of the target file as it can. +// +// The client should use this class as follows: +// VCDiffStreamingDecoder v; +// v.StartDecoding(dictionary_ptr, dictionary_size); +// while (any data left) { +// if (!v.DecodeChunk(data, len, &output_string)) { +// handle error; +// break; +// } +// process(output_string); // might have no new data, though +// } +// if (!v.FinishDecoding()) { ... handle error ... } +// +// I.e., the allowed pattern of calls is +// StartDecoding DecodeChunk* FinishDecoding +// +// NOTE: It is not necessary to call FinishDecoding if DecodeChunk +// returns false. When DecodeChunk returns false to signal an +// error, it resets its state and is ready for a new StartDecoding. +// If FinishDecoding is called, it will also return false. +// +class VCDiffStreamingDecoder { + public: + VCDiffStreamingDecoder(); + ~VCDiffStreamingDecoder(); + + // Resets the dictionary contents to "dictionary_ptr[0,dictionary_size-1]" + // and sets up the data structures for decoding. Note that the dictionary + // contents are not copied, and the client is responsible for ensuring that + // dictionary_ptr is valid until FinishDecoding is called. + // + void StartDecoding(const char* dictionary_ptr, size_t dictionary_size); + + // Accepts "data[0,len-1]" as additional data received in the + // compressed stream. If any chunks of data can be fully decoded, + // they are appended to output_string. + // + // Returns true on success, and false if the data was malformed + // or if there was an error in decoding it (e.g. out of memory, etc.). + // + // Note: we *append*, so the old contents of output_string stick around. + // This convention differs from the non-streaming Encode/Decode + // interfaces in VCDiffDecoder. + // + // output_string is guaranteed to be resized no more than once for each + // window in the VCDIFF delta file. This rule is irrespective + // of the number of calls to DecodeChunk(). + // + template<class OutputType> + bool DecodeChunk(const char* data, size_t len, OutputType* output) { + OutputString<OutputType> output_string(output); + return DecodeChunkToInterface(data, len, &output_string); + } + + bool DecodeChunkToInterface(const char* data, size_t len, + OutputStringInterface* output_string); + + // Finishes decoding after all data has been received. Returns true + // if decoding of the entire stream was successful. FinishDecoding() + // must be called for the current target before StartDecoding() can be + // called for a different target. + // + bool FinishDecoding(); + + // *** Adjustable parameters *** + + // Specifies the maximum allowable target file size. If the decoder + // encounters a delta file that would cause it to create a target file larger + // than this limit, it will log an error and stop decoding. If the decoder is + // applied to delta files whose sizes vary greatly and whose contents can be + // trusted, then a value larger than the the default value (64 MB) can be + // specified to allow for maximum flexibility. On the other hand, if the + // input data is known never to exceed a particular size, and/or the input + // data may be maliciously constructed, a lower value can be supplied in order + // to guard against running out of memory or swapping to disk while decoding + // an extremely large target file. The argument must be between 0 and + // INT32_MAX (2G); if it is within these bounds, the function will set the + // limit and return true. Otherwise, the function will return false and will + // not change the limit. Setting the limit to 0 will cause all decode + // operations of non-empty target files to fail. + bool SetMaximumTargetFileSize(size_t new_maximum_target_file_size); + + // Specifies the maximum allowable target *window* size. (A target file is + // composed of zero or more target windows.) If the decoder encounters a + // delta window that would cause it to create a target window larger + // than this limit, it will log an error and stop decoding. + bool SetMaximumTargetWindowSize(size_t new_maximum_target_window_size); + + // This interface must be called before StartDecoding(). If its argument + // is true, then the VCD_TARGET flag can be specified to allow the source + // segment to be chosen from the previously-decoded target data. (This is the + // default behavior.) If it is false, then specifying the VCD_TARGET flag is + // considered an error, and the decoder does not need to keep in memory any + // decoded target data prior to the current window. + void SetAllowVcdTarget(bool allow_vcd_target); + + private: + VCDiffStreamingDecoderImpl* const impl_; + + // Make the copy constructor and assignment operator private + // so that they don't inadvertently get used. + explicit VCDiffStreamingDecoder(const VCDiffStreamingDecoder&); + void operator=(const VCDiffStreamingDecoder&); +}; + +// A simpler (non-streaming) interface to the VCDIFF decoder that can be used +// if the entire delta file is available. +// +class VCDiffDecoder { + public: + typedef std::string string; + + VCDiffDecoder() { } + ~VCDiffDecoder() { } + + /***** Simple interface *****/ + + // Replaces old contents of "*target" with the result of decoding + // the bytes found in "encoding." + // + // Returns true if "encoding" was a well-formed sequence of + // instructions, and returns false if not. + // + template<class OutputType> + bool Decode(const char* dictionary_ptr, + size_t dictionary_size, + const string& encoding, + OutputType* target) { + OutputString<OutputType> output_string(target); + return DecodeToInterface(dictionary_ptr, + dictionary_size, + encoding, + &output_string); + } + + private: + bool DecodeToInterface(const char* dictionary_ptr, + size_t dictionary_size, + const string& encoding, + OutputStringInterface* target); + + VCDiffStreamingDecoder decoder_; + + // Make the copy constructor and assignment operator private + // so that they don't inadvertently get used. + explicit VCDiffDecoder(const VCDiffDecoder&); + void operator=(const VCDiffDecoder&); +}; + +}; // namespace open_vcdiff + +#endif // OPEN_VCDIFF_VCDECODER_H_ |