zstd-ruby 1.4.0.0 → 1.4.9.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/.github/workflows/ruby.yml +35 -0
- data/README.md +2 -2
- data/ext/zstdruby/libzstd/Makefile +274 -107
- data/ext/zstdruby/libzstd/README.md +75 -16
- data/ext/zstdruby/libzstd/common/bitstream.h +59 -51
- data/ext/zstdruby/libzstd/common/compiler.h +154 -5
- data/ext/zstdruby/libzstd/common/cpu.h +1 -3
- data/ext/zstdruby/libzstd/common/debug.c +11 -31
- data/ext/zstdruby/libzstd/common/debug.h +22 -49
- data/ext/zstdruby/libzstd/common/entropy_common.c +201 -75
- data/ext/zstdruby/libzstd/common/error_private.c +3 -1
- data/ext/zstdruby/libzstd/common/error_private.h +7 -3
- data/ext/zstdruby/libzstd/common/fse.h +50 -42
- data/ext/zstdruby/libzstd/common/fse_decompress.c +134 -50
- data/ext/zstdruby/libzstd/common/huf.h +41 -38
- data/ext/zstdruby/libzstd/common/mem.h +68 -22
- data/ext/zstdruby/libzstd/common/pool.c +30 -20
- data/ext/zstdruby/libzstd/common/pool.h +3 -3
- data/ext/zstdruby/libzstd/common/threading.c +51 -4
- data/ext/zstdruby/libzstd/common/threading.h +36 -4
- data/ext/zstdruby/libzstd/common/xxhash.c +39 -89
- data/ext/zstdruby/libzstd/common/xxhash.h +12 -32
- data/ext/zstdruby/libzstd/common/zstd_common.c +10 -10
- data/ext/zstdruby/libzstd/common/zstd_deps.h +111 -0
- data/ext/zstdruby/libzstd/common/zstd_errors.h +3 -1
- data/ext/zstdruby/libzstd/common/zstd_internal.h +231 -72
- data/ext/zstdruby/libzstd/common/zstd_trace.c +42 -0
- data/ext/zstdruby/libzstd/common/zstd_trace.h +152 -0
- data/ext/zstdruby/libzstd/compress/fse_compress.c +47 -63
- data/ext/zstdruby/libzstd/compress/hist.c +41 -63
- data/ext/zstdruby/libzstd/compress/hist.h +13 -33
- data/ext/zstdruby/libzstd/compress/huf_compress.c +288 -172
- data/ext/zstdruby/libzstd/compress/zstd_compress.c +2504 -1626
- data/ext/zstdruby/libzstd/compress/zstd_compress_internal.h +446 -85
- data/ext/zstdruby/libzstd/compress/zstd_compress_literals.c +158 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_literals.h +29 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_sequences.c +433 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_sequences.h +54 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_superblock.c +849 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_superblock.h +32 -0
- data/ext/zstdruby/libzstd/compress/zstd_cwksp.h +561 -0
- data/ext/zstdruby/libzstd/compress/zstd_double_fast.c +82 -60
- data/ext/zstdruby/libzstd/compress/zstd_double_fast.h +2 -2
- data/ext/zstdruby/libzstd/compress/zstd_fast.c +106 -80
- data/ext/zstdruby/libzstd/compress/zstd_fast.h +2 -2
- data/ext/zstdruby/libzstd/compress/zstd_lazy.c +411 -105
- data/ext/zstdruby/libzstd/compress/zstd_lazy.h +21 -1
- data/ext/zstdruby/libzstd/compress/zstd_ldm.c +296 -207
- data/ext/zstdruby/libzstd/compress/zstd_ldm.h +14 -3
- data/ext/zstdruby/libzstd/compress/zstd_ldm_geartab.h +103 -0
- data/ext/zstdruby/libzstd/compress/zstd_opt.c +260 -148
- data/ext/zstdruby/libzstd/compress/zstd_opt.h +1 -1
- data/ext/zstdruby/libzstd/compress/zstdmt_compress.c +153 -440
- data/ext/zstdruby/libzstd/compress/zstdmt_compress.h +29 -110
- data/ext/zstdruby/libzstd/decompress/huf_decompress.c +356 -238
- data/ext/zstdruby/libzstd/decompress/zstd_ddict.c +20 -16
- data/ext/zstdruby/libzstd/decompress/zstd_ddict.h +3 -3
- data/ext/zstdruby/libzstd/decompress/zstd_decompress.c +641 -238
- data/ext/zstdruby/libzstd/decompress/zstd_decompress_block.c +600 -371
- data/ext/zstdruby/libzstd/decompress/zstd_decompress_block.h +8 -5
- data/ext/zstdruby/libzstd/decompress/zstd_decompress_internal.h +40 -9
- data/ext/zstdruby/libzstd/deprecated/zbuff.h +9 -8
- data/ext/zstdruby/libzstd/deprecated/zbuff_common.c +2 -2
- data/ext/zstdruby/libzstd/deprecated/zbuff_compress.c +1 -1
- data/ext/zstdruby/libzstd/deprecated/zbuff_decompress.c +1 -1
- data/ext/zstdruby/libzstd/dictBuilder/cover.c +197 -78
- data/ext/zstdruby/libzstd/dictBuilder/cover.h +52 -7
- data/ext/zstdruby/libzstd/dictBuilder/divsufsort.c +1 -1
- data/ext/zstdruby/libzstd/dictBuilder/fastcover.c +84 -66
- data/ext/zstdruby/libzstd/dictBuilder/zdict.c +58 -36
- data/ext/zstdruby/libzstd/dictBuilder/zdict.h +60 -31
- data/ext/zstdruby/libzstd/dll/example/Makefile +2 -1
- data/ext/zstdruby/libzstd/dll/example/README.md +16 -22
- data/ext/zstdruby/libzstd/legacy/zstd_legacy.h +8 -4
- data/ext/zstdruby/libzstd/legacy/zstd_v01.c +115 -111
- data/ext/zstdruby/libzstd/legacy/zstd_v01.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v02.c +28 -14
- data/ext/zstdruby/libzstd/legacy/zstd_v02.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v03.c +28 -14
- data/ext/zstdruby/libzstd/legacy/zstd_v03.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v04.c +36 -19
- data/ext/zstdruby/libzstd/legacy/zstd_v04.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v05.c +122 -107
- data/ext/zstdruby/libzstd/legacy/zstd_v05.h +2 -2
- data/ext/zstdruby/libzstd/legacy/zstd_v06.c +29 -23
- data/ext/zstdruby/libzstd/legacy/zstd_v06.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v07.c +34 -24
- data/ext/zstdruby/libzstd/legacy/zstd_v07.h +1 -1
- data/ext/zstdruby/libzstd/libzstd.pc.in +2 -1
- data/ext/zstdruby/libzstd/zstd.h +655 -118
- data/lib/zstd-ruby/version.rb +1 -1
- data/zstd-ruby.gemspec +1 -1
- metadata +20 -10
- data/.travis.yml +0 -14
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
/*
|
|
2
|
-
* Copyright (c) 2018-
|
|
2
|
+
* Copyright (c) 2018-2021, Facebook, Inc.
|
|
3
3
|
* All rights reserved.
|
|
4
4
|
*
|
|
5
5
|
* This source code is licensed under both the BSD-style license (found in the
|
|
@@ -16,8 +16,6 @@
|
|
|
16
16
|
* https://github.com/facebook/folly/blob/master/folly/CpuId.h
|
|
17
17
|
*/
|
|
18
18
|
|
|
19
|
-
#include <string.h>
|
|
20
|
-
|
|
21
19
|
#include "mem.h"
|
|
22
20
|
|
|
23
21
|
#ifdef _MSC_VER
|
|
@@ -1,35 +1,15 @@
|
|
|
1
1
|
/* ******************************************************************
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
notice, this list of conditions and the following disclaimer.
|
|
14
|
-
* Redistributions in binary form must reproduce the above
|
|
15
|
-
copyright notice, this list of conditions and the following disclaimer
|
|
16
|
-
in the documentation and/or other materials provided with the
|
|
17
|
-
distribution.
|
|
18
|
-
|
|
19
|
-
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
20
|
-
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
21
|
-
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
22
|
-
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
23
|
-
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
24
|
-
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
25
|
-
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
26
|
-
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
27
|
-
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
28
|
-
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
29
|
-
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
30
|
-
|
|
31
|
-
You can contact the author at :
|
|
32
|
-
- Source repository : https://github.com/Cyan4973/FiniteStateEntropy
|
|
2
|
+
* debug
|
|
3
|
+
* Part of FSE library
|
|
4
|
+
* Copyright (c) 2013-2021, Yann Collet, Facebook, Inc.
|
|
5
|
+
*
|
|
6
|
+
* You can contact the author at :
|
|
7
|
+
* - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
|
|
8
|
+
*
|
|
9
|
+
* This source code is licensed under both the BSD-style license (found in the
|
|
10
|
+
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
|
11
|
+
* in the COPYING file in the root directory of this source tree).
|
|
12
|
+
* You may select, at your option, one of the above-listed licenses.
|
|
33
13
|
****************************************************************** */
|
|
34
14
|
|
|
35
15
|
|
|
@@ -1,35 +1,15 @@
|
|
|
1
1
|
/* ******************************************************************
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
notice, this list of conditions and the following disclaimer.
|
|
14
|
-
* Redistributions in binary form must reproduce the above
|
|
15
|
-
copyright notice, this list of conditions and the following disclaimer
|
|
16
|
-
in the documentation and/or other materials provided with the
|
|
17
|
-
distribution.
|
|
18
|
-
|
|
19
|
-
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
20
|
-
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
21
|
-
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
22
|
-
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
23
|
-
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
24
|
-
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
25
|
-
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
26
|
-
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
27
|
-
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
28
|
-
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
29
|
-
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
30
|
-
|
|
31
|
-
You can contact the author at :
|
|
32
|
-
- Source repository : https://github.com/Cyan4973/FiniteStateEntropy
|
|
2
|
+
* debug
|
|
3
|
+
* Part of FSE library
|
|
4
|
+
* Copyright (c) 2013-2021, Yann Collet, Facebook, Inc.
|
|
5
|
+
*
|
|
6
|
+
* You can contact the author at :
|
|
7
|
+
* - Source repository : https://github.com/Cyan4973/FiniteStateEntropy
|
|
8
|
+
*
|
|
9
|
+
* This source code is licensed under both the BSD-style license (found in the
|
|
10
|
+
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
|
11
|
+
* in the COPYING file in the root directory of this source tree).
|
|
12
|
+
* You may select, at your option, one of the above-listed licenses.
|
|
33
13
|
****************************************************************** */
|
|
34
14
|
|
|
35
15
|
|
|
@@ -71,15 +51,6 @@ extern "C" {
|
|
|
71
51
|
#endif
|
|
72
52
|
|
|
73
53
|
|
|
74
|
-
/* DEBUGFILE can be defined externally,
|
|
75
|
-
* typically through compiler command line.
|
|
76
|
-
* note : currently useless.
|
|
77
|
-
* Value must be stderr or stdout */
|
|
78
|
-
#ifndef DEBUGFILE
|
|
79
|
-
# define DEBUGFILE stderr
|
|
80
|
-
#endif
|
|
81
|
-
|
|
82
|
-
|
|
83
54
|
/* recommended values for DEBUGLEVEL :
|
|
84
55
|
* 0 : release mode, no debug, all run-time checks disabled
|
|
85
56
|
* 1 : enables assert() only, no display
|
|
@@ -96,7 +67,8 @@ extern "C" {
|
|
|
96
67
|
*/
|
|
97
68
|
|
|
98
69
|
#if (DEBUGLEVEL>=1)
|
|
99
|
-
#
|
|
70
|
+
# define ZSTD_DEPS_NEED_ASSERT
|
|
71
|
+
# include "zstd_deps.h"
|
|
100
72
|
#else
|
|
101
73
|
# ifndef assert /* assert may be already defined, due to prior #include <assert.h> */
|
|
102
74
|
# define assert(condition) ((void)0) /* disable assert (default) */
|
|
@@ -104,7 +76,8 @@ extern "C" {
|
|
|
104
76
|
#endif
|
|
105
77
|
|
|
106
78
|
#if (DEBUGLEVEL>=2)
|
|
107
|
-
#
|
|
79
|
+
# define ZSTD_DEPS_NEED_IO
|
|
80
|
+
# include "zstd_deps.h"
|
|
108
81
|
extern int g_debuglevel; /* the variable is only declared,
|
|
109
82
|
it actually lives in debug.c,
|
|
110
83
|
and is shared by the whole process.
|
|
@@ -112,14 +85,14 @@ extern int g_debuglevel; /* the variable is only declared,
|
|
|
112
85
|
It's useful when enabling very verbose levels
|
|
113
86
|
on selective conditions (such as position in src) */
|
|
114
87
|
|
|
115
|
-
# define RAWLOG(l, ...) {
|
|
116
|
-
if (l<=g_debuglevel) {
|
|
117
|
-
|
|
88
|
+
# define RAWLOG(l, ...) { \
|
|
89
|
+
if (l<=g_debuglevel) { \
|
|
90
|
+
ZSTD_DEBUG_PRINT(__VA_ARGS__); \
|
|
118
91
|
} }
|
|
119
|
-
# define DEBUGLOG(l, ...) {
|
|
120
|
-
if (l<=g_debuglevel) {
|
|
121
|
-
|
|
122
|
-
|
|
92
|
+
# define DEBUGLOG(l, ...) { \
|
|
93
|
+
if (l<=g_debuglevel) { \
|
|
94
|
+
ZSTD_DEBUG_PRINT(__FILE__ ": " __VA_ARGS__); \
|
|
95
|
+
ZSTD_DEBUG_PRINT(" \n"); \
|
|
123
96
|
} }
|
|
124
97
|
#else
|
|
125
98
|
# define RAWLOG(l, ...) {} /* disabled */
|
|
@@ -1,36 +1,16 @@
|
|
|
1
|
-
/*
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
copyright notice, this list of conditions and the following disclaimer
|
|
15
|
-
in the documentation and/or other materials provided with the
|
|
16
|
-
distribution.
|
|
17
|
-
|
|
18
|
-
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
|
|
19
|
-
"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
|
|
20
|
-
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
|
|
21
|
-
A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
|
|
22
|
-
OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
|
23
|
-
SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
|
24
|
-
LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
|
|
25
|
-
DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
|
|
26
|
-
THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
27
|
-
(INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
28
|
-
OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
29
|
-
|
|
30
|
-
You can contact the author at :
|
|
31
|
-
- FSE+HUF source repository : https://github.com/Cyan4973/FiniteStateEntropy
|
|
32
|
-
- Public forum : https://groups.google.com/forum/#!forum/lz4c
|
|
33
|
-
*************************************************************************** */
|
|
1
|
+
/* ******************************************************************
|
|
2
|
+
* Common functions of New Generation Entropy library
|
|
3
|
+
* Copyright (c) 2016-2021, Yann Collet, Facebook, Inc.
|
|
4
|
+
*
|
|
5
|
+
* You can contact the author at :
|
|
6
|
+
* - FSE+HUF source repository : https://github.com/Cyan4973/FiniteStateEntropy
|
|
7
|
+
* - Public forum : https://groups.google.com/forum/#!forum/lz4c
|
|
8
|
+
*
|
|
9
|
+
* This source code is licensed under both the BSD-style license (found in the
|
|
10
|
+
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
|
11
|
+
* in the COPYING file in the root directory of this source tree).
|
|
12
|
+
* You may select, at your option, one of the above-listed licenses.
|
|
13
|
+
****************************************************************** */
|
|
34
14
|
|
|
35
15
|
/* *************************************
|
|
36
16
|
* Dependencies
|
|
@@ -58,8 +38,31 @@ const char* HUF_getErrorName(size_t code) { return ERR_getErrorName(code); }
|
|
|
58
38
|
/*-**************************************************************
|
|
59
39
|
* FSE NCount encoding-decoding
|
|
60
40
|
****************************************************************/
|
|
61
|
-
|
|
62
|
-
|
|
41
|
+
static U32 FSE_ctz(U32 val)
|
|
42
|
+
{
|
|
43
|
+
assert(val != 0);
|
|
44
|
+
{
|
|
45
|
+
# if defined(_MSC_VER) /* Visual */
|
|
46
|
+
unsigned long r=0;
|
|
47
|
+
return _BitScanForward(&r, val) ? (unsigned)r : 0;
|
|
48
|
+
# elif defined(__GNUC__) && (__GNUC__ >= 3) /* GCC Intrinsic */
|
|
49
|
+
return __builtin_ctz(val);
|
|
50
|
+
# elif defined(__ICCARM__) /* IAR Intrinsic */
|
|
51
|
+
return __CTZ(val);
|
|
52
|
+
# else /* Software version */
|
|
53
|
+
U32 count = 0;
|
|
54
|
+
while ((val & 1) == 0) {
|
|
55
|
+
val >>= 1;
|
|
56
|
+
++count;
|
|
57
|
+
}
|
|
58
|
+
return count;
|
|
59
|
+
# endif
|
|
60
|
+
}
|
|
61
|
+
}
|
|
62
|
+
|
|
63
|
+
FORCE_INLINE_TEMPLATE
|
|
64
|
+
size_t FSE_readNCount_body(short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
|
|
65
|
+
const void* headerBuffer, size_t hbSize)
|
|
63
66
|
{
|
|
64
67
|
const BYTE* const istart = (const BYTE*) headerBuffer;
|
|
65
68
|
const BYTE* const iend = istart + hbSize;
|
|
@@ -70,23 +73,23 @@ size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* t
|
|
|
70
73
|
U32 bitStream;
|
|
71
74
|
int bitCount;
|
|
72
75
|
unsigned charnum = 0;
|
|
76
|
+
unsigned const maxSV1 = *maxSVPtr + 1;
|
|
73
77
|
int previous0 = 0;
|
|
74
78
|
|
|
75
|
-
if (hbSize <
|
|
76
|
-
/* This function only works when hbSize >=
|
|
77
|
-
char buffer[
|
|
78
|
-
|
|
79
|
-
memcpy(buffer, headerBuffer, hbSize);
|
|
79
|
+
if (hbSize < 8) {
|
|
80
|
+
/* This function only works when hbSize >= 8 */
|
|
81
|
+
char buffer[8] = {0};
|
|
82
|
+
ZSTD_memcpy(buffer, headerBuffer, hbSize);
|
|
80
83
|
{ size_t const countSize = FSE_readNCount(normalizedCounter, maxSVPtr, tableLogPtr,
|
|
81
84
|
buffer, sizeof(buffer));
|
|
82
85
|
if (FSE_isError(countSize)) return countSize;
|
|
83
86
|
if (countSize > hbSize) return ERROR(corruption_detected);
|
|
84
87
|
return countSize;
|
|
85
88
|
} }
|
|
86
|
-
assert(hbSize >=
|
|
89
|
+
assert(hbSize >= 8);
|
|
87
90
|
|
|
88
91
|
/* init */
|
|
89
|
-
|
|
92
|
+
ZSTD_memset(normalizedCounter, 0, (*maxSVPtr+1) * sizeof(normalizedCounter[0])); /* all symbols not present in NCount have a frequency of 0 */
|
|
90
93
|
bitStream = MEM_readLE32(ip);
|
|
91
94
|
nbBits = (bitStream & 0xF) + FSE_MIN_TABLELOG; /* extract tableLog */
|
|
92
95
|
if (nbBits > FSE_TABLELOG_ABSOLUTE_MAX) return ERROR(tableLog_tooLarge);
|
|
@@ -97,36 +100,58 @@ size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* t
|
|
|
97
100
|
threshold = 1<<nbBits;
|
|
98
101
|
nbBits++;
|
|
99
102
|
|
|
100
|
-
|
|
103
|
+
for (;;) {
|
|
101
104
|
if (previous0) {
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
105
|
+
/* Count the number of repeats. Each time the
|
|
106
|
+
* 2-bit repeat code is 0b11 there is another
|
|
107
|
+
* repeat.
|
|
108
|
+
* Avoid UB by setting the high bit to 1.
|
|
109
|
+
*/
|
|
110
|
+
int repeats = FSE_ctz(~bitStream | 0x80000000) >> 1;
|
|
111
|
+
while (repeats >= 12) {
|
|
112
|
+
charnum += 3 * 12;
|
|
113
|
+
if (LIKELY(ip <= iend-7)) {
|
|
114
|
+
ip += 3;
|
|
108
115
|
} else {
|
|
109
|
-
|
|
110
|
-
bitCount
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
bitStream
|
|
115
|
-
bitCount += 2;
|
|
116
|
+
bitCount -= (int)(8 * (iend - 7 - ip));
|
|
117
|
+
bitCount &= 31;
|
|
118
|
+
ip = iend - 4;
|
|
119
|
+
}
|
|
120
|
+
bitStream = MEM_readLE32(ip) >> bitCount;
|
|
121
|
+
repeats = FSE_ctz(~bitStream | 0x80000000) >> 1;
|
|
116
122
|
}
|
|
117
|
-
|
|
123
|
+
charnum += 3 * repeats;
|
|
124
|
+
bitStream >>= 2 * repeats;
|
|
125
|
+
bitCount += 2 * repeats;
|
|
126
|
+
|
|
127
|
+
/* Add the final repeat which isn't 0b11. */
|
|
128
|
+
assert((bitStream & 3) < 3);
|
|
129
|
+
charnum += bitStream & 3;
|
|
118
130
|
bitCount += 2;
|
|
119
|
-
|
|
120
|
-
|
|
121
|
-
|
|
131
|
+
|
|
132
|
+
/* This is an error, but break and return an error
|
|
133
|
+
* at the end, because returning out of a loop makes
|
|
134
|
+
* it harder for the compiler to optimize.
|
|
135
|
+
*/
|
|
136
|
+
if (charnum >= maxSV1) break;
|
|
137
|
+
|
|
138
|
+
/* We don't need to set the normalized count to 0
|
|
139
|
+
* because we already memset the whole buffer to 0.
|
|
140
|
+
*/
|
|
141
|
+
|
|
142
|
+
if (LIKELY(ip <= iend-7) || (ip + (bitCount>>3) <= iend-4)) {
|
|
122
143
|
assert((bitCount >> 3) <= 3); /* For first condition to work */
|
|
123
144
|
ip += bitCount>>3;
|
|
124
145
|
bitCount &= 7;
|
|
125
|
-
bitStream = MEM_readLE32(ip) >> bitCount;
|
|
126
146
|
} else {
|
|
127
|
-
|
|
128
|
-
|
|
129
|
-
|
|
147
|
+
bitCount -= (int)(8 * (iend - 4 - ip));
|
|
148
|
+
bitCount &= 31;
|
|
149
|
+
ip = iend - 4;
|
|
150
|
+
}
|
|
151
|
+
bitStream = MEM_readLE32(ip) >> bitCount;
|
|
152
|
+
}
|
|
153
|
+
{
|
|
154
|
+
int const max = (2*threshold-1) - remaining;
|
|
130
155
|
int count;
|
|
131
156
|
|
|
132
157
|
if ((bitStream & (threshold-1)) < (U32)max) {
|
|
@@ -139,24 +164,43 @@ size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* t
|
|
|
139
164
|
}
|
|
140
165
|
|
|
141
166
|
count--; /* extra accuracy */
|
|
142
|
-
|
|
167
|
+
/* When it matters (small blocks), this is a
|
|
168
|
+
* predictable branch, because we don't use -1.
|
|
169
|
+
*/
|
|
170
|
+
if (count >= 0) {
|
|
171
|
+
remaining -= count;
|
|
172
|
+
} else {
|
|
173
|
+
assert(count == -1);
|
|
174
|
+
remaining += count;
|
|
175
|
+
}
|
|
143
176
|
normalizedCounter[charnum++] = (short)count;
|
|
144
177
|
previous0 = !count;
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
178
|
+
|
|
179
|
+
assert(threshold > 1);
|
|
180
|
+
if (remaining < threshold) {
|
|
181
|
+
/* This branch can be folded into the
|
|
182
|
+
* threshold update condition because we
|
|
183
|
+
* know that threshold > 1.
|
|
184
|
+
*/
|
|
185
|
+
if (remaining <= 1) break;
|
|
186
|
+
nbBits = BIT_highbit32(remaining) + 1;
|
|
187
|
+
threshold = 1 << (nbBits - 1);
|
|
148
188
|
}
|
|
189
|
+
if (charnum >= maxSV1) break;
|
|
149
190
|
|
|
150
|
-
if ((ip <= iend-7) || (ip + (bitCount>>3) <= iend-4)) {
|
|
191
|
+
if (LIKELY(ip <= iend-7) || (ip + (bitCount>>3) <= iend-4)) {
|
|
151
192
|
ip += bitCount>>3;
|
|
152
193
|
bitCount &= 7;
|
|
153
194
|
} else {
|
|
154
195
|
bitCount -= (int)(8 * (iend - 4 - ip));
|
|
196
|
+
bitCount &= 31;
|
|
155
197
|
ip = iend - 4;
|
|
156
198
|
}
|
|
157
|
-
bitStream = MEM_readLE32(ip) >>
|
|
158
|
-
} }
|
|
199
|
+
bitStream = MEM_readLE32(ip) >> bitCount;
|
|
200
|
+
} }
|
|
159
201
|
if (remaining != 1) return ERROR(corruption_detected);
|
|
202
|
+
/* Only possible when there are too many zeros. */
|
|
203
|
+
if (charnum > maxSV1) return ERROR(maxSymbolValue_tooSmall);
|
|
160
204
|
if (bitCount > 32) return ERROR(corruption_detected);
|
|
161
205
|
*maxSVPtr = charnum-1;
|
|
162
206
|
|
|
@@ -164,6 +208,43 @@ size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* t
|
|
|
164
208
|
return ip-istart;
|
|
165
209
|
}
|
|
166
210
|
|
|
211
|
+
/* Avoids the FORCE_INLINE of the _body() function. */
|
|
212
|
+
static size_t FSE_readNCount_body_default(
|
|
213
|
+
short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
|
|
214
|
+
const void* headerBuffer, size_t hbSize)
|
|
215
|
+
{
|
|
216
|
+
return FSE_readNCount_body(normalizedCounter, maxSVPtr, tableLogPtr, headerBuffer, hbSize);
|
|
217
|
+
}
|
|
218
|
+
|
|
219
|
+
#if DYNAMIC_BMI2
|
|
220
|
+
TARGET_ATTRIBUTE("bmi2") static size_t FSE_readNCount_body_bmi2(
|
|
221
|
+
short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
|
|
222
|
+
const void* headerBuffer, size_t hbSize)
|
|
223
|
+
{
|
|
224
|
+
return FSE_readNCount_body(normalizedCounter, maxSVPtr, tableLogPtr, headerBuffer, hbSize);
|
|
225
|
+
}
|
|
226
|
+
#endif
|
|
227
|
+
|
|
228
|
+
size_t FSE_readNCount_bmi2(
|
|
229
|
+
short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
|
|
230
|
+
const void* headerBuffer, size_t hbSize, int bmi2)
|
|
231
|
+
{
|
|
232
|
+
#if DYNAMIC_BMI2
|
|
233
|
+
if (bmi2) {
|
|
234
|
+
return FSE_readNCount_body_bmi2(normalizedCounter, maxSVPtr, tableLogPtr, headerBuffer, hbSize);
|
|
235
|
+
}
|
|
236
|
+
#endif
|
|
237
|
+
(void)bmi2;
|
|
238
|
+
return FSE_readNCount_body_default(normalizedCounter, maxSVPtr, tableLogPtr, headerBuffer, hbSize);
|
|
239
|
+
}
|
|
240
|
+
|
|
241
|
+
size_t FSE_readNCount(
|
|
242
|
+
short* normalizedCounter, unsigned* maxSVPtr, unsigned* tableLogPtr,
|
|
243
|
+
const void* headerBuffer, size_t hbSize)
|
|
244
|
+
{
|
|
245
|
+
return FSE_readNCount_bmi2(normalizedCounter, maxSVPtr, tableLogPtr, headerBuffer, hbSize, /* bmi2 */ 0);
|
|
246
|
+
}
|
|
247
|
+
|
|
167
248
|
|
|
168
249
|
/*! HUF_readStats() :
|
|
169
250
|
Read compact Huffman tree, saved by HUF_writeCTable().
|
|
@@ -175,6 +256,17 @@ size_t FSE_readNCount (short* normalizedCounter, unsigned* maxSVPtr, unsigned* t
|
|
|
175
256
|
size_t HUF_readStats(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
176
257
|
U32* nbSymbolsPtr, U32* tableLogPtr,
|
|
177
258
|
const void* src, size_t srcSize)
|
|
259
|
+
{
|
|
260
|
+
U32 wksp[HUF_READ_STATS_WORKSPACE_SIZE_U32];
|
|
261
|
+
return HUF_readStats_wksp(huffWeight, hwSize, rankStats, nbSymbolsPtr, tableLogPtr, src, srcSize, wksp, sizeof(wksp), /* bmi2 */ 0);
|
|
262
|
+
}
|
|
263
|
+
|
|
264
|
+
FORCE_INLINE_TEMPLATE size_t
|
|
265
|
+
HUF_readStats_body(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
266
|
+
U32* nbSymbolsPtr, U32* tableLogPtr,
|
|
267
|
+
const void* src, size_t srcSize,
|
|
268
|
+
void* workSpace, size_t wkspSize,
|
|
269
|
+
int bmi2)
|
|
178
270
|
{
|
|
179
271
|
U32 weightTotal;
|
|
180
272
|
const BYTE* ip = (const BYTE*) src;
|
|
@@ -183,7 +275,7 @@ size_t HUF_readStats(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
|
183
275
|
|
|
184
276
|
if (!srcSize) return ERROR(srcSize_wrong);
|
|
185
277
|
iSize = ip[0];
|
|
186
|
-
/*
|
|
278
|
+
/* ZSTD_memset(huffWeight, 0, hwSize); *//* is not necessary, even though some analyzer complain ... */
|
|
187
279
|
|
|
188
280
|
if (iSize >= 128) { /* special header */
|
|
189
281
|
oSize = iSize - 127;
|
|
@@ -197,14 +289,14 @@ size_t HUF_readStats(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
|
197
289
|
huffWeight[n+1] = ip[n/2] & 15;
|
|
198
290
|
} } }
|
|
199
291
|
else { /* header compressed with FSE (normal case) */
|
|
200
|
-
FSE_DTable fseWorkspace[FSE_DTABLE_SIZE_U32(6)]; /* 6 is max possible tableLog for HUF header (maybe even 5, to be tested) */
|
|
201
292
|
if (iSize+1 > srcSize) return ERROR(srcSize_wrong);
|
|
202
|
-
|
|
293
|
+
/* max (hwSize-1) values decoded, as last one is implied */
|
|
294
|
+
oSize = FSE_decompress_wksp_bmi2(huffWeight, hwSize-1, ip+1, iSize, 6, workSpace, wkspSize, bmi2);
|
|
203
295
|
if (FSE_isError(oSize)) return oSize;
|
|
204
296
|
}
|
|
205
297
|
|
|
206
298
|
/* collect weight stats */
|
|
207
|
-
|
|
299
|
+
ZSTD_memset(rankStats, 0, (HUF_TABLELOG_MAX + 1) * sizeof(U32));
|
|
208
300
|
weightTotal = 0;
|
|
209
301
|
{ U32 n; for (n=0; n<oSize; n++) {
|
|
210
302
|
if (huffWeight[n] >= HUF_TABLELOG_MAX) return ERROR(corruption_detected);
|
|
@@ -234,3 +326,37 @@ size_t HUF_readStats(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
|
234
326
|
*nbSymbolsPtr = (U32)(oSize+1);
|
|
235
327
|
return iSize+1;
|
|
236
328
|
}
|
|
329
|
+
|
|
330
|
+
/* Avoids the FORCE_INLINE of the _body() function. */
|
|
331
|
+
static size_t HUF_readStats_body_default(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
332
|
+
U32* nbSymbolsPtr, U32* tableLogPtr,
|
|
333
|
+
const void* src, size_t srcSize,
|
|
334
|
+
void* workSpace, size_t wkspSize)
|
|
335
|
+
{
|
|
336
|
+
return HUF_readStats_body(huffWeight, hwSize, rankStats, nbSymbolsPtr, tableLogPtr, src, srcSize, workSpace, wkspSize, 0);
|
|
337
|
+
}
|
|
338
|
+
|
|
339
|
+
#if DYNAMIC_BMI2
|
|
340
|
+
static TARGET_ATTRIBUTE("bmi2") size_t HUF_readStats_body_bmi2(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
341
|
+
U32* nbSymbolsPtr, U32* tableLogPtr,
|
|
342
|
+
const void* src, size_t srcSize,
|
|
343
|
+
void* workSpace, size_t wkspSize)
|
|
344
|
+
{
|
|
345
|
+
return HUF_readStats_body(huffWeight, hwSize, rankStats, nbSymbolsPtr, tableLogPtr, src, srcSize, workSpace, wkspSize, 1);
|
|
346
|
+
}
|
|
347
|
+
#endif
|
|
348
|
+
|
|
349
|
+
size_t HUF_readStats_wksp(BYTE* huffWeight, size_t hwSize, U32* rankStats,
|
|
350
|
+
U32* nbSymbolsPtr, U32* tableLogPtr,
|
|
351
|
+
const void* src, size_t srcSize,
|
|
352
|
+
void* workSpace, size_t wkspSize,
|
|
353
|
+
int bmi2)
|
|
354
|
+
{
|
|
355
|
+
#if DYNAMIC_BMI2
|
|
356
|
+
if (bmi2) {
|
|
357
|
+
return HUF_readStats_body_bmi2(huffWeight, hwSize, rankStats, nbSymbolsPtr, tableLogPtr, src, srcSize, workSpace, wkspSize);
|
|
358
|
+
}
|
|
359
|
+
#endif
|
|
360
|
+
(void)bmi2;
|
|
361
|
+
return HUF_readStats_body_default(huffWeight, hwSize, rankStats, nbSymbolsPtr, tableLogPtr, src, srcSize, workSpace, wkspSize);
|
|
362
|
+
}
|