snappy 0.0.10 → 0.0.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (47) hide show
  1. checksums.yaml +4 -4
  2. data/.gitmodules +3 -0
  3. data/Rakefile +12 -13
  4. data/ext/extconf.rb +22 -31
  5. data/lib/snappy/reader.rb +10 -7
  6. data/lib/snappy/version.rb +1 -1
  7. data/snappy.gemspec +24 -0
  8. data/test/test-snappy-reader.rb +16 -0
  9. data/vendor/snappy/AUTHORS +1 -0
  10. data/vendor/snappy/COPYING +54 -0
  11. data/vendor/snappy/ChangeLog +1916 -0
  12. data/vendor/snappy/Makefile.am +23 -0
  13. data/vendor/snappy/NEWS +128 -0
  14. data/vendor/snappy/README +135 -0
  15. data/vendor/snappy/autogen.sh +7 -0
  16. data/vendor/snappy/configure.ac +133 -0
  17. data/vendor/snappy/format_description.txt +110 -0
  18. data/vendor/snappy/framing_format.txt +135 -0
  19. data/vendor/snappy/m4/gtest.m4 +74 -0
  20. data/vendor/snappy/snappy-c.cc +90 -0
  21. data/vendor/snappy/snappy-c.h +138 -0
  22. data/vendor/snappy/snappy-internal.h +150 -0
  23. data/vendor/snappy/snappy-sinksource.cc +71 -0
  24. data/vendor/snappy/snappy-sinksource.h +137 -0
  25. data/vendor/snappy/snappy-stubs-internal.cc +42 -0
  26. data/vendor/snappy/snappy-stubs-internal.h +491 -0
  27. data/vendor/snappy/snappy-stubs-public.h.in +98 -0
  28. data/vendor/snappy/snappy-test.cc +606 -0
  29. data/vendor/snappy/snappy-test.h +582 -0
  30. data/vendor/snappy/snappy.cc +1306 -0
  31. data/vendor/snappy/snappy.h +184 -0
  32. data/vendor/snappy/snappy_unittest.cc +1355 -0
  33. data/vendor/snappy/testdata/alice29.txt +3609 -0
  34. data/vendor/snappy/testdata/asyoulik.txt +4122 -0
  35. data/vendor/snappy/testdata/baddata1.snappy +0 -0
  36. data/vendor/snappy/testdata/baddata2.snappy +0 -0
  37. data/vendor/snappy/testdata/baddata3.snappy +0 -0
  38. data/vendor/snappy/testdata/fireworks.jpeg +0 -0
  39. data/vendor/snappy/testdata/geo.protodata +0 -0
  40. data/vendor/snappy/testdata/html +1 -0
  41. data/vendor/snappy/testdata/html_x_4 +1 -0
  42. data/vendor/snappy/testdata/kppkn.gtb +0 -0
  43. data/vendor/snappy/testdata/lcet10.txt +7519 -0
  44. data/vendor/snappy/testdata/paper-100k.pdf +600 -2
  45. data/vendor/snappy/testdata/plrabn12.txt +10699 -0
  46. data/vendor/snappy/testdata/urls.10K +10000 -0
  47. metadata +51 -12
@@ -0,0 +1,184 @@
1
+ // Copyright 2005 and onwards Google Inc.
2
+ //
3
+ // Redistribution and use in source and binary forms, with or without
4
+ // modification, are permitted provided that the following conditions are
5
+ // met:
6
+ //
7
+ // * Redistributions of source code must retain the above copyright
8
+ // notice, this list of conditions and the following disclaimer.
9
+ // * Redistributions in binary form must reproduce the above
10
+ // copyright notice, this list of conditions and the following disclaimer
11
+ // in the documentation and/or other materials provided with the
12
+ // distribution.
13
+ // * Neither the name of Google Inc. nor the names of its
14
+ // contributors may be used to endorse or promote products derived from
15
+ // this software without specific prior written permission.
16
+ //
17
+ // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18
+ // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19
+ // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20
+ // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21
+ // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22
+ // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23
+ // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24
+ // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25
+ // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26
+ // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27
+ // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28
+ //
29
+ // A light-weight compression algorithm. It is designed for speed of
30
+ // compression and decompression, rather than for the utmost in space
31
+ // savings.
32
+ //
33
+ // For getting better compression ratios when you are compressing data
34
+ // with long repeated sequences or compressing data that is similar to
35
+ // other data, while still compressing fast, you might look at first
36
+ // using BMDiff and then compressing the output of BMDiff with
37
+ // Snappy.
38
+
39
+ #ifndef UTIL_SNAPPY_SNAPPY_H__
40
+ #define UTIL_SNAPPY_SNAPPY_H__
41
+
42
+ #include <stddef.h>
43
+ #include <string>
44
+
45
+ #include "snappy-stubs-public.h"
46
+
47
+ namespace snappy {
48
+ class Source;
49
+ class Sink;
50
+
51
+ // ------------------------------------------------------------------------
52
+ // Generic compression/decompression routines.
53
+ // ------------------------------------------------------------------------
54
+
55
+ // Compress the bytes read from "*source" and append to "*sink". Return the
56
+ // number of bytes written.
57
+ size_t Compress(Source* source, Sink* sink);
58
+
59
+ // Find the uncompressed length of the given stream, as given by the header.
60
+ // Note that the true length could deviate from this; the stream could e.g.
61
+ // be truncated.
62
+ //
63
+ // Also note that this leaves "*source" in a state that is unsuitable for
64
+ // further operations, such as RawUncompress(). You will need to rewind
65
+ // or recreate the source yourself before attempting any further calls.
66
+ bool GetUncompressedLength(Source* source, uint32* result);
67
+
68
+ // ------------------------------------------------------------------------
69
+ // Higher-level string based routines (should be sufficient for most users)
70
+ // ------------------------------------------------------------------------
71
+
72
+ // Sets "*output" to the compressed version of "input[0,input_length-1]".
73
+ // Original contents of *output are lost.
74
+ //
75
+ // REQUIRES: "input[]" is not an alias of "*output".
76
+ size_t Compress(const char* input, size_t input_length, string* output);
77
+
78
+ // Decompresses "compressed[0,compressed_length-1]" to "*uncompressed".
79
+ // Original contents of "*uncompressed" are lost.
80
+ //
81
+ // REQUIRES: "compressed[]" is not an alias of "*uncompressed".
82
+ //
83
+ // returns false if the message is corrupted and could not be decompressed
84
+ bool Uncompress(const char* compressed, size_t compressed_length,
85
+ string* uncompressed);
86
+
87
+
88
+ // ------------------------------------------------------------------------
89
+ // Lower-level character array based routines. May be useful for
90
+ // efficiency reasons in certain circumstances.
91
+ // ------------------------------------------------------------------------
92
+
93
+ // REQUIRES: "compressed" must point to an area of memory that is at
94
+ // least "MaxCompressedLength(input_length)" bytes in length.
95
+ //
96
+ // Takes the data stored in "input[0..input_length-1]" and stores
97
+ // it in the array pointed to by "compressed".
98
+ //
99
+ // "*compressed_length" is set to the length of the compressed output.
100
+ //
101
+ // Example:
102
+ // char* output = new char[snappy::MaxCompressedLength(input_length)];
103
+ // size_t output_length;
104
+ // RawCompress(input, input_length, output, &output_length);
105
+ // ... Process(output, output_length) ...
106
+ // delete [] output;
107
+ void RawCompress(const char* input,
108
+ size_t input_length,
109
+ char* compressed,
110
+ size_t* compressed_length);
111
+
112
+ // Given data in "compressed[0..compressed_length-1]" generated by
113
+ // calling the Snappy::Compress routine, this routine
114
+ // stores the uncompressed data to
115
+ // uncompressed[0..GetUncompressedLength(compressed)-1]
116
+ // returns false if the message is corrupted and could not be decompressed
117
+ bool RawUncompress(const char* compressed, size_t compressed_length,
118
+ char* uncompressed);
119
+
120
+ // Given data from the byte source 'compressed' generated by calling
121
+ // the Snappy::Compress routine, this routine stores the uncompressed
122
+ // data to
123
+ // uncompressed[0..GetUncompressedLength(compressed)-1]
124
+ // returns false if the message is corrupted and could not be decompressed
125
+ bool RawUncompress(Source* compressed, char* uncompressed);
126
+
127
+ // Given data in "compressed[0..compressed_length-1]" generated by
128
+ // calling the Snappy::Compress routine, this routine
129
+ // stores the uncompressed data to the iovec "iov". The number of physical
130
+ // buffers in "iov" is given by iov_cnt and their cumulative size
131
+ // must be at least GetUncompressedLength(compressed). The individual buffers
132
+ // in "iov" must not overlap with each other.
133
+ //
134
+ // returns false if the message is corrupted and could not be decompressed
135
+ bool RawUncompressToIOVec(const char* compressed, size_t compressed_length,
136
+ const struct iovec* iov, size_t iov_cnt);
137
+
138
+ // Given data from the byte source 'compressed' generated by calling
139
+ // the Snappy::Compress routine, this routine stores the uncompressed
140
+ // data to the iovec "iov". The number of physical
141
+ // buffers in "iov" is given by iov_cnt and their cumulative size
142
+ // must be at least GetUncompressedLength(compressed). The individual buffers
143
+ // in "iov" must not overlap with each other.
144
+ //
145
+ // returns false if the message is corrupted and could not be decompressed
146
+ bool RawUncompressToIOVec(Source* compressed, const struct iovec* iov,
147
+ size_t iov_cnt);
148
+
149
+ // Returns the maximal size of the compressed representation of
150
+ // input data that is "source_bytes" bytes in length.
151
+ size_t MaxCompressedLength(size_t source_bytes);
152
+
153
+ // REQUIRES: "compressed[]" was produced by RawCompress() or Compress()
154
+ // Returns true and stores the length of the uncompressed data in
155
+ // *result normally. Returns false on parsing error.
156
+ // This operation takes O(1) time.
157
+ bool GetUncompressedLength(const char* compressed, size_t compressed_length,
158
+ size_t* result);
159
+
160
+ // Returns true iff the contents of "compressed[]" can be uncompressed
161
+ // successfully. Does not return the uncompressed data. Takes
162
+ // time proportional to compressed_length, but is usually at least
163
+ // a factor of four faster than actual decompression.
164
+ bool IsValidCompressedBuffer(const char* compressed,
165
+ size_t compressed_length);
166
+
167
+ // The size of a compression block. Note that many parts of the compression
168
+ // code assume that kBlockSize <= 65536; in particular, the hash table
169
+ // can only store 16-bit offsets, and EmitCopy() also assumes the offset
170
+ // is 65535 bytes or less. Note also that if you change this, it will
171
+ // affect the framing format (see framing_format.txt).
172
+ //
173
+ // Note that there might be older data around that is compressed with larger
174
+ // block sizes, so the decompression code should not rely on the
175
+ // non-existence of long backreferences.
176
+ static const int kBlockLog = 16;
177
+ static const size_t kBlockSize = 1 << kBlockLog;
178
+
179
+ static const int kMaxHashTableBits = 14;
180
+ static const size_t kMaxHashTableSize = 1 << kMaxHashTableBits;
181
+ } // end namespace snappy
182
+
183
+
184
+ #endif // UTIL_SNAPPY_SNAPPY_H__