lz4-ruby 0.2.0-java

Sign up to get free protection for your applications and to get access to all the features.
data/ext/lz4ruby/lz4.h ADDED
@@ -0,0 +1,117 @@
1
+ /*
2
+ LZ4 - Fast LZ compression algorithm
3
+ Header File
4
+ Copyright (C) 2011-2012, Yann Collet.
5
+ BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
6
+
7
+ Redistribution and use in source and binary forms, with or without
8
+ modification, are permitted provided that the following conditions are
9
+ met:
10
+
11
+ * Redistributions of source code must retain the above copyright
12
+ notice, this list of conditions and the following disclaimer.
13
+ * Redistributions in binary form must reproduce the above
14
+ copyright notice, this list of conditions and the following disclaimer
15
+ in the documentation and/or other materials provided with the
16
+ distribution.
17
+
18
+ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
19
+ "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
20
+ LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
21
+ A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
22
+ OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
23
+ SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
24
+ LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
25
+ DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
26
+ THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
27
+ (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
28
+ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
29
+
30
+ You can contact the author at :
31
+ - LZ4 homepage : http://fastcompression.blogspot.com/p/lz4.html
32
+ - LZ4 source repository : http://code.google.com/p/lz4/
33
+ */
34
+ #pragma once
35
+
36
+ #if defined (__cplusplus)
37
+ extern "C" {
38
+ #endif
39
+
40
+
41
+ //****************************
42
+ // Simple Functions
43
+ //****************************
44
+
45
+ int LZ4_compress (const char* source, char* dest, int isize);
46
+ int LZ4_uncompress (const char* source, char* dest, int osize);
47
+
48
+ /*
49
+ LZ4_compress() :
50
+ Compresses 'isize' bytes from 'source' into 'dest'.
51
+ Destination buffer must be already allocated,
52
+ and must be sized to handle worst cases situations (input data not compressible)
53
+ Worst case size evaluation is provided by macro LZ4_compressBound()
54
+
55
+ isize : is the input size. Max supported value is ~1.9GB
56
+ return : the number of bytes written in buffer dest
57
+
58
+
59
+ LZ4_uncompress() :
60
+ osize : is the output size, therefore the original size
61
+ return : the number of bytes read in the source buffer
62
+ If the source stream is malformed, the function will stop decoding and return a negative result, indicating the byte position of the faulty instruction
63
+ This function never writes beyond dest + osize, and is therefore protected against malicious data packets
64
+ note : destination buffer must be already allocated.
65
+ its size must be a minimum of 'osize' bytes.
66
+ */
67
+
68
+
69
+ //****************************
70
+ // Advanced Functions
71
+ //****************************
72
+
73
+ #define LZ4_compressBound(isize) (isize + (isize/255) + 16)
74
+
75
+ /*
76
+ LZ4_compressBound() :
77
+ Provides the maximum size that LZ4 may output in a "worst case" scenario (input data not compressible)
78
+ primarily useful for memory allocation of output buffer.
79
+
80
+ isize : is the input size. Max supported value is ~1.9GB
81
+ return : maximum output size in a "worst case" scenario
82
+ note : this function is limited by "int" range (2^31-1)
83
+ */
84
+
85
+
86
+ int LZ4_compress_limitedOutput (const char* source, char* dest, int isize, int maxOutputSize);
87
+
88
+ /*
89
+ LZ4_compress_limitedOutput() :
90
+ Compress 'isize' bytes from 'source' into an output buffer 'dest' of maximum size 'maxOutputSize'.
91
+ If it cannot achieve it, compression will stop, and result of the function will be zero.
92
+ This function never writes outside of provided output buffer.
93
+
94
+ isize : is the input size. Max supported value is ~1.9GB
95
+ maxOutputSize : is the size of the destination buffer (which must be already allocated)
96
+ return : the number of bytes written in buffer 'dest'
97
+ or 0 if the compression fails
98
+ */
99
+
100
+
101
+ int LZ4_uncompress_unknownOutputSize (const char* source, char* dest, int isize, int maxOutputSize);
102
+
103
+ /*
104
+ LZ4_uncompress_unknownOutputSize() :
105
+ isize : is the input size, therefore the compressed size
106
+ maxOutputSize : is the size of the destination buffer (which must be already allocated)
107
+ return : the number of bytes decoded in the destination buffer (necessarily <= maxOutputSize)
108
+ If the source stream is malformed, the function will stop decoding and return a negative result, indicating the byte position of the faulty instruction
109
+ This function never writes beyond dest + maxOutputSize, and is therefore protected against malicious data packets
110
+ note : Destination buffer must be already allocated.
111
+ This version is slightly slower than LZ4_uncompress()
112
+ */
113
+
114
+
115
+ #if defined (__cplusplus)
116
+ }
117
+ #endif
@@ -0,0 +1,671 @@
1
+ /*
2
+ LZ4 HC - High Compression Mode of LZ4
3
+ Copyright (C) 2011-2012, Yann Collet.
4
+ BSD 2-Clause License (http://www.opensource.org/licenses/bsd-license.php)
5
+
6
+ Redistribution and use in source and binary forms, with or without
7
+ modification, are permitted provided that the following conditions are
8
+ met:
9
+
10
+ * Redistributions of source code must retain the above copyright
11
+ notice, this list of conditions and the following disclaimer.
12
+ * Redistributions in binary form must reproduce the above
13
+ copyright notice, this list of conditions and the following disclaimer
14
+ in the documentation and/or other materials provided with the
15
+ distribution.
16
+
17
+ THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18
+ "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19
+ LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20
+ A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
21
+ OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
22
+ SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
23
+ LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
24
+ DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
25
+ THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
26
+ (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
27
+ OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28
+
29
+ You can contact the author at :
30
+ - LZ4 homepage : http://fastcompression.blogspot.com/p/lz4.html
31
+ - LZ4 source repository : http://code.google.com/p/lz4/
32
+ */
33
+
34
+
35
+ //**************************************
36
+ // CPU Feature Detection
37
+ //**************************************
38
+ // 32 or 64 bits ?
39
+ #if (defined(__x86_64__) || defined(__x86_64) || defined(__amd64__) || defined(__amd64) || defined(__ppc64__) || defined(_WIN64) || defined(__LP64__) || defined(_LP64) ) // Detects 64 bits mode
40
+ #define LZ4_ARCH64 1
41
+ #else
42
+ #define LZ4_ARCH64 0
43
+ #endif
44
+
45
+ // Little Endian or Big Endian ?
46
+ #if (defined(__BIG_ENDIAN__) || defined(__BIG_ENDIAN) || defined(_BIG_ENDIAN) || defined(_ARCH_PPC) || defined(__PPC__) || defined(__PPC) || defined(PPC) || defined(__powerpc__) || defined(__powerpc) || defined(powerpc) || ((defined(__BYTE_ORDER__)&&(__BYTE_ORDER__ == __ORDER_BIG_ENDIAN__))) )
47
+ #define LZ4_BIG_ENDIAN 1
48
+ #else
49
+ // Little Endian assumed. PDP Endian and other very rare endian format are unsupported.
50
+ #endif
51
+
52
+ // Unaligned memory access is automatically enabled for "common" CPU, such as x86.
53
+ // For others CPU, the compiler will be more cautious, and insert extra code to ensure aligned access is respected
54
+ // If you know your target CPU supports unaligned memory access, you may want to force this option manually to improve performance
55
+ #if defined(__ARM_FEATURE_UNALIGNED)
56
+ #define LZ4_FORCE_UNALIGNED_ACCESS 1
57
+ #endif
58
+
59
+
60
+ //**************************************
61
+ // Compiler Options
62
+ //**************************************
63
+ #if __STDC_VERSION__ >= 199901L // C99
64
+ /* "restrict" is a known keyword */
65
+ #else
66
+ #define restrict // Disable restrict
67
+ #endif
68
+
69
+ #ifdef _MSC_VER
70
+ #define inline __forceinline // Visual is not C99, but supports some kind of inline
71
+ #include <intrin.h> // For Visual 2005
72
+ # if LZ4_ARCH64 // 64-bit
73
+ # pragma intrinsic(_BitScanForward64) // For Visual 2005
74
+ # pragma intrinsic(_BitScanReverse64) // For Visual 2005
75
+ # else
76
+ # pragma intrinsic(_BitScanForward) // For Visual 2005
77
+ # pragma intrinsic(_BitScanReverse) // For Visual 2005
78
+ # endif
79
+ #endif
80
+
81
+ #ifdef _MSC_VER // Visual Studio
82
+ #define lz4_bswap16(x) _byteswap_ushort(x)
83
+ #else
84
+ #define lz4_bswap16(x) ((unsigned short int) ((((x) >> 8) & 0xffu) | (((x) & 0xffu) << 8)))
85
+ #endif
86
+
87
+
88
+ //**************************************
89
+ // Includes
90
+ //**************************************
91
+ #include <stdlib.h> // calloc, free
92
+ #include <string.h> // memset, memcpy
93
+ #include "lz4hc.h"
94
+
95
+ #define ALLOCATOR(s) calloc(1,s)
96
+ #define FREEMEM free
97
+ #define MEM_INIT memset
98
+
99
+
100
+ //**************************************
101
+ // Basic Types
102
+ //**************************************
103
+ #if defined(_MSC_VER) // Visual Studio does not support 'stdint' natively
104
+ #define BYTE unsigned __int8
105
+ #define U16 unsigned __int16
106
+ #define U32 unsigned __int32
107
+ #define S32 __int32
108
+ #define U64 unsigned __int64
109
+ #else
110
+ #include <stdint.h>
111
+ #define BYTE uint8_t
112
+ #define U16 uint16_t
113
+ #define U32 uint32_t
114
+ #define S32 int32_t
115
+ #define U64 uint64_t
116
+ #endif
117
+
118
+ #ifndef LZ4_FORCE_UNALIGNED_ACCESS
119
+ #pragma pack(push, 1)
120
+ #endif
121
+
122
+ typedef struct _U16_S { U16 v; } U16_S;
123
+ typedef struct _U32_S { U32 v; } U32_S;
124
+ typedef struct _U64_S { U64 v; } U64_S;
125
+
126
+ #ifndef LZ4_FORCE_UNALIGNED_ACCESS
127
+ #pragma pack(pop)
128
+ #endif
129
+
130
+ #define A64(x) (((U64_S *)(x))->v)
131
+ #define A32(x) (((U32_S *)(x))->v)
132
+ #define A16(x) (((U16_S *)(x))->v)
133
+
134
+
135
+ //**************************************
136
+ // Constants
137
+ //**************************************
138
+ #define MINMATCH 4
139
+
140
+ #define DICTIONARY_LOGSIZE 16
141
+ #define MAXD (1<<DICTIONARY_LOGSIZE)
142
+ #define MAXD_MASK ((U32)(MAXD - 1))
143
+ #define MAX_DISTANCE (MAXD - 1)
144
+
145
+ #define HASH_LOG (DICTIONARY_LOGSIZE-1)
146
+ #define HASHTABLESIZE (1 << HASH_LOG)
147
+ #define HASH_MASK (HASHTABLESIZE - 1)
148
+
149
+ #define MAX_NB_ATTEMPTS 256
150
+
151
+ #define ML_BITS 4
152
+ #define ML_MASK (size_t)((1U<<ML_BITS)-1)
153
+ #define RUN_BITS (8-ML_BITS)
154
+ #define RUN_MASK ((1U<<RUN_BITS)-1)
155
+
156
+ #define COPYLENGTH 8
157
+ #define LASTLITERALS 5
158
+ #define MFLIMIT (COPYLENGTH+MINMATCH)
159
+ #define MINLENGTH (MFLIMIT+1)
160
+ #define OPTIMAL_ML (int)((ML_MASK-1)+MINMATCH)
161
+
162
+
163
+ //**************************************
164
+ // Architecture-specific macros
165
+ //**************************************
166
+ #if LZ4_ARCH64 // 64-bit
167
+ #define STEPSIZE 8
168
+ #define LZ4_COPYSTEP(s,d) A64(d) = A64(s); d+=8; s+=8;
169
+ #define LZ4_COPYPACKET(s,d) LZ4_COPYSTEP(s,d)
170
+ #define UARCH U64
171
+ #define AARCH A64
172
+ #define HTYPE U32
173
+ #define INITBASE(b,s) const BYTE* const b = s
174
+ #else // 32-bit
175
+ #define STEPSIZE 4
176
+ #define LZ4_COPYSTEP(s,d) A32(d) = A32(s); d+=4; s+=4;
177
+ #define LZ4_COPYPACKET(s,d) LZ4_COPYSTEP(s,d); LZ4_COPYSTEP(s,d);
178
+ #define UARCH U32
179
+ #define AARCH A32
180
+ #define HTYPE const BYTE*
181
+ #define INITBASE(b,s) const int b = 0
182
+ #endif
183
+
184
+ #if defined(LZ4_BIG_ENDIAN)
185
+ #define LZ4_READ_LITTLEENDIAN_16(d,s,p) { U16 v = A16(p); v = lz4_bswap16(v); d = (s) - v; }
186
+ #define LZ4_WRITE_LITTLEENDIAN_16(p,i) { U16 v = (U16)(i); v = lz4_bswap16(v); A16(p) = v; p+=2; }
187
+ #else // Little Endian
188
+ #define LZ4_READ_LITTLEENDIAN_16(d,s,p) { d = (s) - A16(p); }
189
+ #define LZ4_WRITE_LITTLEENDIAN_16(p,v) { A16(p) = v; p+=2; }
190
+ #endif
191
+
192
+
193
+ //************************************************************
194
+ // Local Types
195
+ //************************************************************
196
+ typedef struct
197
+ {
198
+ const BYTE* base;
199
+ HTYPE hashTable[HASHTABLESIZE];
200
+ U16 chainTable[MAXD];
201
+ const BYTE* nextToUpdate;
202
+ } LZ4HC_Data_Structure;
203
+
204
+
205
+ //**************************************
206
+ // Macros
207
+ //**************************************
208
+ #define LZ4_WILDCOPY(s,d,e) do { LZ4_COPYPACKET(s,d) } while (d<e);
209
+ #define LZ4_BLINDCOPY(s,d,l) { BYTE* e=d+l; LZ4_WILDCOPY(s,d,e); d=e; }
210
+ #define HASH_FUNCTION(i) (((i) * 2654435761U) >> ((MINMATCH*8)-HASH_LOG))
211
+ #define HASH_VALUE(p) HASH_FUNCTION(*(U32*)(p))
212
+ #define HASH_POINTER(p) (HashTable[HASH_VALUE(p)] + base)
213
+ #define DELTANEXT(p) chainTable[(size_t)(p) & MAXD_MASK]
214
+ #define GETNEXT(p) ((p) - (size_t)DELTANEXT(p))
215
+ #define ADD_HASH(p) { size_t delta = (p) - HASH_POINTER(p); if (delta>MAX_DISTANCE) delta = MAX_DISTANCE; DELTANEXT(p) = (U16)delta; HashTable[HASH_VALUE(p)] = (p) - base; }
216
+
217
+
218
+ //**************************************
219
+ // Private functions
220
+ //**************************************
221
+ #if LZ4_ARCH64
222
+
223
+ inline static int LZ4_NbCommonBytes (register U64 val)
224
+ {
225
+ #if defined(LZ4_BIG_ENDIAN)
226
+ #if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT)
227
+ unsigned long r = 0;
228
+ _BitScanReverse64( &r, val );
229
+ return (int)(r>>3);
230
+ #elif defined(__GNUC__) && ((__GNUC__ * 100 + __GNUC_MINOR__) >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT)
231
+ return (__builtin_clzll(val) >> 3);
232
+ #else
233
+ int r;
234
+ if (!(val>>32)) { r=4; } else { r=0; val>>=32; }
235
+ if (!(val>>16)) { r+=2; val>>=8; } else { val>>=24; }
236
+ r += (!val);
237
+ return r;
238
+ #endif
239
+ #else
240
+ #if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT)
241
+ unsigned long r = 0;
242
+ _BitScanForward64( &r, val );
243
+ return (int)(r>>3);
244
+ #elif defined(__GNUC__) && ((__GNUC__ * 100 + __GNUC_MINOR__) >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT)
245
+ return (__builtin_ctzll(val) >> 3);
246
+ #else
247
+ static const int DeBruijnBytePos[64] = { 0, 0, 0, 0, 0, 1, 1, 2, 0, 3, 1, 3, 1, 4, 2, 7, 0, 2, 3, 6, 1, 5, 3, 5, 1, 3, 4, 4, 2, 5, 6, 7, 7, 0, 1, 2, 3, 3, 4, 6, 2, 6, 5, 5, 3, 4, 5, 6, 7, 1, 2, 4, 6, 4, 4, 5, 7, 2, 6, 5, 7, 6, 7, 7 };
248
+ return DeBruijnBytePos[((U64)((val & -val) * 0x0218A392CDABBD3F)) >> 58];
249
+ #endif
250
+ #endif
251
+ }
252
+
253
+ #else
254
+
255
+ inline static int LZ4_NbCommonBytes (register U32 val)
256
+ {
257
+ #if defined(LZ4_BIG_ENDIAN)
258
+ #if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT)
259
+ unsigned long r = 0;
260
+ _BitScanReverse( &r, val );
261
+ return (int)(r>>3);
262
+ #elif defined(__GNUC__) && ((__GNUC__ * 100 + __GNUC_MINOR__) >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT)
263
+ return (__builtin_clz(val) >> 3);
264
+ #else
265
+ int r;
266
+ if (!(val>>16)) { r=2; val>>=8; } else { r=0; val>>=24; }
267
+ r += (!val);
268
+ return r;
269
+ #endif
270
+ #else
271
+ #if defined(_MSC_VER) && !defined(LZ4_FORCE_SW_BITCOUNT)
272
+ unsigned long r = 0;
273
+ _BitScanForward( &r, val );
274
+ return (int)(r>>3);
275
+ #elif defined(__GNUC__) && ((__GNUC__ * 100 + __GNUC_MINOR__) >= 304) && !defined(LZ4_FORCE_SW_BITCOUNT)
276
+ return (__builtin_ctz(val) >> 3);
277
+ #else
278
+ static const int DeBruijnBytePos[32] = { 0, 0, 3, 0, 3, 1, 3, 0, 3, 2, 2, 1, 3, 2, 0, 1, 3, 3, 1, 2, 2, 2, 2, 0, 3, 1, 2, 0, 1, 0, 1, 1 };
279
+ return DeBruijnBytePos[((U32)((val & -(S32)val) * 0x077CB531U)) >> 27];
280
+ #endif
281
+ #endif
282
+ }
283
+
284
+ #endif
285
+
286
+
287
+ inline static int LZ4HC_Init (LZ4HC_Data_Structure* hc4, const BYTE* base)
288
+ {
289
+ MEM_INIT((void*)hc4->hashTable, 0, sizeof(hc4->hashTable));
290
+ MEM_INIT(hc4->chainTable, 0xFF, sizeof(hc4->chainTable));
291
+ hc4->nextToUpdate = base + LZ4_ARCH64;
292
+ hc4->base = base;
293
+ return 1;
294
+ }
295
+
296
+
297
+ inline static void* LZ4HC_Create (const BYTE* base)
298
+ {
299
+ void* hc4 = ALLOCATOR(sizeof(LZ4HC_Data_Structure));
300
+
301
+ LZ4HC_Init (hc4, base);
302
+ return hc4;
303
+ }
304
+
305
+
306
+ inline static int LZ4HC_Free (void** LZ4HC_Data)
307
+ {
308
+ FREEMEM(*LZ4HC_Data);
309
+ *LZ4HC_Data = NULL;
310
+ return (1);
311
+ }
312
+
313
+
314
+ inline static void LZ4HC_Insert (LZ4HC_Data_Structure* hc4, const BYTE* ip)
315
+ {
316
+ U16* chainTable = hc4->chainTable;
317
+ HTYPE* HashTable = hc4->hashTable;
318
+ INITBASE(base,hc4->base);
319
+
320
+ while(hc4->nextToUpdate < ip)
321
+ {
322
+ ADD_HASH(hc4->nextToUpdate);
323
+ hc4->nextToUpdate++;
324
+ }
325
+ }
326
+
327
+
328
+ inline static int LZ4HC_InsertAndFindBestMatch (LZ4HC_Data_Structure* hc4, const BYTE* ip, const BYTE* const matchlimit, const BYTE** matchpos)
329
+ {
330
+ U16* const chainTable = hc4->chainTable;
331
+ HTYPE* const HashTable = hc4->hashTable;
332
+ const BYTE* ref;
333
+ INITBASE(base,hc4->base);
334
+ int nbAttempts=MAX_NB_ATTEMPTS;
335
+ int ml=0;
336
+
337
+ // HC4 match finder
338
+ LZ4HC_Insert(hc4, ip);
339
+ ref = HASH_POINTER(ip);
340
+ while ((ref > (ip-MAX_DISTANCE)) && (nbAttempts))
341
+ {
342
+ nbAttempts--;
343
+ if (*(ref+ml) == *(ip+ml))
344
+ if (*(U32*)ref == *(U32*)ip)
345
+ {
346
+ const BYTE* reft = ref+MINMATCH;
347
+ const BYTE* ipt = ip+MINMATCH;
348
+
349
+ while (ipt<matchlimit-(STEPSIZE-1))
350
+ {
351
+ UARCH diff = AARCH(reft) ^ AARCH(ipt);
352
+ if (!diff) { ipt+=STEPSIZE; reft+=STEPSIZE; continue; }
353
+ ipt += LZ4_NbCommonBytes(diff);
354
+ goto _endCount;
355
+ }
356
+ if (LZ4_ARCH64) if ((ipt<(matchlimit-3)) && (A32(reft) == A32(ipt))) { ipt+=4; reft+=4; }
357
+ if ((ipt<(matchlimit-1)) && (A16(reft) == A16(ipt))) { ipt+=2; reft+=2; }
358
+ if ((ipt<matchlimit) && (*reft == *ipt)) ipt++;
359
+ _endCount:
360
+
361
+ if (ipt-ip > ml) { ml = (int)(ipt-ip); *matchpos = ref; }
362
+ }
363
+ ref = GETNEXT(ref);
364
+ }
365
+
366
+ return ml;
367
+ }
368
+
369
+
370
+ inline static int LZ4HC_InsertAndGetWiderMatch (LZ4HC_Data_Structure* hc4, const BYTE* ip, const BYTE* startLimit, const BYTE* matchlimit, int longest, const BYTE** matchpos, const BYTE** startpos)
371
+ {
372
+ U16* const chainTable = hc4->chainTable;
373
+ HTYPE* const HashTable = hc4->hashTable;
374
+ INITBASE(base,hc4->base);
375
+ const BYTE* ref;
376
+ int nbAttempts = MAX_NB_ATTEMPTS;
377
+ int delta = (int)(ip-startLimit);
378
+
379
+ // First Match
380
+ LZ4HC_Insert(hc4, ip);
381
+ ref = HASH_POINTER(ip);
382
+
383
+ while ((ref > ip-MAX_DISTANCE) && (ref >= hc4->base) && (nbAttempts))
384
+ {
385
+ nbAttempts--;
386
+ if (*(startLimit + longest) == *(ref - delta + longest))
387
+ if (*(U32*)ref == *(U32*)ip)
388
+ {
389
+ const BYTE* reft = ref+MINMATCH;
390
+ const BYTE* ipt = ip+MINMATCH;
391
+ const BYTE* startt = ip;
392
+
393
+ while (ipt<matchlimit-(STEPSIZE-1))
394
+ {
395
+ UARCH diff = AARCH(reft) ^ AARCH(ipt);
396
+ if (!diff) { ipt+=STEPSIZE; reft+=STEPSIZE; continue; }
397
+ ipt += LZ4_NbCommonBytes(diff);
398
+ goto _endCount;
399
+ }
400
+ if (LZ4_ARCH64) if ((ipt<(matchlimit-3)) && (A32(reft) == A32(ipt))) { ipt+=4; reft+=4; }
401
+ if ((ipt<(matchlimit-1)) && (A16(reft) == A16(ipt))) { ipt+=2; reft+=2; }
402
+ if ((ipt<matchlimit) && (*reft == *ipt)) ipt++;
403
+ _endCount:
404
+
405
+ reft = ref;
406
+ while ((startt>startLimit) && (reft > hc4->base) && (startt[-1] == reft[-1])) {startt--; reft--;}
407
+
408
+ if ((ipt-startt) > longest)
409
+ {
410
+ longest = (int)(ipt-startt);
411
+ *matchpos = reft;
412
+ *startpos = startt;
413
+ }
414
+ }
415
+ ref = GETNEXT(ref);
416
+ }
417
+
418
+ return longest;
419
+ }
420
+
421
+
422
+ inline static int LZ4_encodeSequence(const BYTE** ip, BYTE** op, const BYTE** anchor, int ml, const BYTE* ref)
423
+ {
424
+ int length, len;
425
+ BYTE* token;
426
+
427
+ // Encode Literal length
428
+ length = (int)(*ip - *anchor);
429
+ token = (*op)++;
430
+ if (length>=(int)RUN_MASK) { *token=(RUN_MASK<<ML_BITS); len = length-RUN_MASK; for(; len > 254 ; len-=255) *(*op)++ = 255; *(*op)++ = (BYTE)len; }
431
+ else *token = (length<<ML_BITS);
432
+
433
+ // Copy Literals
434
+ LZ4_BLINDCOPY(*anchor, *op, length);
435
+
436
+ // Encode Offset
437
+ LZ4_WRITE_LITTLEENDIAN_16(*op,(U16)(*ip-ref));
438
+
439
+ // Encode MatchLength
440
+ len = (int)(ml-MINMATCH);
441
+ if (len>=(int)ML_MASK) { *token+=ML_MASK; len-=ML_MASK; for(; len > 509 ; len-=510) { *(*op)++ = 255; *(*op)++ = 255; } if (len > 254) { len-=255; *(*op)++ = 255; } *(*op)++ = (BYTE)len; }
442
+ else *token += len;
443
+
444
+ // Prepare next loop
445
+ *ip += ml;
446
+ *anchor = *ip;
447
+
448
+ return 0;
449
+ }
450
+
451
+
452
+ //****************************
453
+ // Compression CODE
454
+ //****************************
455
+
456
+ int LZ4_compressHCCtx(LZ4HC_Data_Structure* ctx,
457
+ const char* source,
458
+ char* dest,
459
+ int isize)
460
+ {
461
+ const BYTE* ip = (const BYTE*) source;
462
+ const BYTE* anchor = ip;
463
+ const BYTE* const iend = ip + isize;
464
+ const BYTE* const mflimit = iend - MFLIMIT;
465
+ const BYTE* const matchlimit = (iend - LASTLITERALS);
466
+
467
+ BYTE* op = (BYTE*) dest;
468
+
469
+ int ml, ml2, ml3, ml0;
470
+ const BYTE* ref=NULL;
471
+ const BYTE* start2=NULL;
472
+ const BYTE* ref2=NULL;
473
+ const BYTE* start3=NULL;
474
+ const BYTE* ref3=NULL;
475
+ const BYTE* start0;
476
+ const BYTE* ref0;
477
+
478
+ ip++;
479
+
480
+ // Main Loop
481
+ while (ip < mflimit)
482
+ {
483
+ ml = LZ4HC_InsertAndFindBestMatch (ctx, ip, matchlimit, (&ref));
484
+ if (!ml) { ip++; continue; }
485
+
486
+ // saved, in case we would skip too much
487
+ start0 = ip;
488
+ ref0 = ref;
489
+ ml0 = ml;
490
+
491
+ _Search2:
492
+ if (ip+ml < mflimit)
493
+ ml2 = LZ4HC_InsertAndGetWiderMatch(ctx, ip + ml - 2, ip + 1, matchlimit, ml, &ref2, &start2);
494
+ else ml2=ml;
495
+
496
+ if (ml2 == ml) // No better match
497
+ {
498
+ LZ4_encodeSequence(&ip, &op, &anchor, ml, ref);
499
+ continue;
500
+ }
501
+
502
+ if (start0 < ip)
503
+ {
504
+ if (start2 < ip + ml0) // empirical
505
+ {
506
+ ip = start0;
507
+ ref = ref0;
508
+ ml = ml0;
509
+ }
510
+ }
511
+
512
+ // Here, start0==ip
513
+ if ((start2 - ip) < 3) // First Match too small : removed
514
+ {
515
+ ml = ml2;
516
+ ip = start2;
517
+ ref =ref2;
518
+ goto _Search2;
519
+ }
520
+
521
+ _Search3:
522
+ // Currently we have :
523
+ // ml2 > ml1, and
524
+ // ip1+3 <= ip2 (usually < ip1+ml1)
525
+ if ((start2 - ip) < OPTIMAL_ML)
526
+ {
527
+ int correction;
528
+ int new_ml = ml;
529
+ if (new_ml > OPTIMAL_ML) new_ml = OPTIMAL_ML;
530
+ if (ip+new_ml > start2 + ml2 - MINMATCH) new_ml = (int)(start2 - ip) + ml2 - MINMATCH;
531
+ correction = new_ml - (int)(start2 - ip);
532
+ if (correction > 0)
533
+ {
534
+ start2 += correction;
535
+ ref2 += correction;
536
+ ml2 -= correction;
537
+ }
538
+ }
539
+ // Now, we have start2 = ip+new_ml, with new_ml=min(ml, OPTIMAL_ML=18)
540
+
541
+ if (start2 + ml2 < mflimit)
542
+ ml3 = LZ4HC_InsertAndGetWiderMatch(ctx, start2 + ml2 - 3, start2, matchlimit, ml2, &ref3, &start3);
543
+ else ml3=ml2;
544
+
545
+ if (ml3 == ml2) // No better match : 2 sequences to encode
546
+ {
547
+ // ip & ref are known; Now for ml
548
+ if (start2 < ip+ml)
549
+ {
550
+ if ((start2 - ip) < OPTIMAL_ML)
551
+ {
552
+ int correction;
553
+ if (ml > OPTIMAL_ML) ml = OPTIMAL_ML;
554
+ if (ip+ml > start2 + ml2 - MINMATCH) ml = (int)(start2 - ip) + ml2 - MINMATCH;
555
+ correction = ml - (int)(start2 - ip);
556
+ if (correction > 0)
557
+ {
558
+ start2 += correction;
559
+ ref2 += correction;
560
+ ml2 -= correction;
561
+ }
562
+ }
563
+ else
564
+ {
565
+ ml = (int)(start2 - ip);
566
+ }
567
+ }
568
+ // Now, encode 2 sequences
569
+ LZ4_encodeSequence(&ip, &op, &anchor, ml, ref);
570
+ ip = start2;
571
+ LZ4_encodeSequence(&ip, &op, &anchor, ml2, ref2);
572
+ continue;
573
+ }
574
+
575
+ if (start3 < ip+ml+3) // Not enough space for match 2 : remove it
576
+ {
577
+ if (start3 >= (ip+ml)) // can write Seq1 immediately ==> Seq2 is removed, so Seq3 becomes Seq1
578
+ {
579
+ if (start2 < ip+ml)
580
+ {
581
+ int correction = (int)(ip+ml - start2);
582
+ start2 += correction;
583
+ ref2 += correction;
584
+ ml2 -= correction;
585
+ if (ml2 < MINMATCH)
586
+ {
587
+ start2 = start3;
588
+ ref2 = ref3;
589
+ ml2 = ml3;
590
+ }
591
+ }
592
+
593
+ LZ4_encodeSequence(&ip, &op, &anchor, ml, ref);
594
+ ip = start3;
595
+ ref = ref3;
596
+ ml = ml3;
597
+
598
+ start0 = start2;
599
+ ref0 = ref2;
600
+ ml0 = ml2;
601
+ goto _Search2;
602
+ }
603
+
604
+ start2 = start3;
605
+ ref2 = ref3;
606
+ ml2 = ml3;
607
+ goto _Search3;
608
+ }
609
+
610
+ // OK, now we have 3 ascending matches; let's write at least the first one
611
+ // ip & ref are known; Now for ml
612
+ if (start2 < ip+ml)
613
+ {
614
+ if ((start2 - ip) < (int)ML_MASK)
615
+ {
616
+ int correction;
617
+ if (ml > OPTIMAL_ML) ml = OPTIMAL_ML;
618
+ if (ip + ml > start2 + ml2 - MINMATCH) ml = (int)(start2 - ip) + ml2 - MINMATCH;
619
+ correction = ml - (int)(start2 - ip);
620
+ if (correction > 0)
621
+ {
622
+ start2 += correction;
623
+ ref2 += correction;
624
+ ml2 -= correction;
625
+ }
626
+ }
627
+ else
628
+ {
629
+ ml = (int)(start2 - ip);
630
+ }
631
+ }
632
+ LZ4_encodeSequence(&ip, &op, &anchor, ml, ref);
633
+
634
+ ip = start2;
635
+ ref = ref2;
636
+ ml = ml2;
637
+
638
+ start2 = start3;
639
+ ref2 = ref3;
640
+ ml2 = ml3;
641
+
642
+ goto _Search3;
643
+
644
+ }
645
+
646
+ // Encode Last Literals
647
+ {
648
+ int lastRun = (int)(iend - anchor);
649
+ if (lastRun>=(int)RUN_MASK) { *op++=(RUN_MASK<<ML_BITS); lastRun-=RUN_MASK; for(; lastRun > 254 ; lastRun-=255) *op++ = 255; *op++ = (BYTE) lastRun; }
650
+ else *op++ = (lastRun<<ML_BITS);
651
+ memcpy(op, anchor, iend - anchor);
652
+ op += iend-anchor;
653
+ }
654
+
655
+ // End
656
+ return (int) (((char*)op)-dest);
657
+ }
658
+
659
+
660
+ int LZ4_compressHC(const char* source,
661
+ char* dest,
662
+ int isize)
663
+ {
664
+ void* ctx = LZ4HC_Create((const BYTE*)source);
665
+ int result = LZ4_compressHCCtx(ctx, source, dest, isize);
666
+ LZ4HC_Free (&ctx);
667
+
668
+ return result;
669
+ }
670
+
671
+