zstd-ruby 1.4.1.0 → 1.5.0.0
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/.github/dependabot.yml +8 -0
- data/.github/workflows/ruby.yml +35 -0
- data/README.md +2 -2
- data/ext/zstdruby/libzstd/BUCK +5 -7
- data/ext/zstdruby/libzstd/Makefile +304 -113
- data/ext/zstdruby/libzstd/README.md +83 -20
- data/ext/zstdruby/libzstd/common/bitstream.h +59 -51
- data/ext/zstdruby/libzstd/common/compiler.h +150 -8
- data/ext/zstdruby/libzstd/common/cpu.h +1 -3
- data/ext/zstdruby/libzstd/common/debug.c +11 -31
- data/ext/zstdruby/libzstd/common/debug.h +22 -49
- data/ext/zstdruby/libzstd/common/entropy_common.c +201 -75
- data/ext/zstdruby/libzstd/common/error_private.c +3 -1
- data/ext/zstdruby/libzstd/common/error_private.h +8 -4
- data/ext/zstdruby/libzstd/common/fse.h +50 -42
- data/ext/zstdruby/libzstd/common/fse_decompress.c +149 -55
- data/ext/zstdruby/libzstd/common/huf.h +43 -39
- data/ext/zstdruby/libzstd/common/mem.h +69 -25
- data/ext/zstdruby/libzstd/common/pool.c +30 -20
- data/ext/zstdruby/libzstd/common/pool.h +3 -3
- data/ext/zstdruby/libzstd/common/threading.c +51 -4
- data/ext/zstdruby/libzstd/common/threading.h +36 -4
- data/ext/zstdruby/libzstd/common/xxhash.c +40 -92
- data/ext/zstdruby/libzstd/common/xxhash.h +12 -32
- data/ext/zstdruby/libzstd/common/zstd_common.c +10 -10
- data/ext/zstdruby/libzstd/common/zstd_deps.h +111 -0
- data/ext/zstdruby/libzstd/common/zstd_internal.h +230 -111
- data/ext/zstdruby/libzstd/common/zstd_trace.h +154 -0
- data/ext/zstdruby/libzstd/compress/fse_compress.c +47 -63
- data/ext/zstdruby/libzstd/compress/hist.c +41 -63
- data/ext/zstdruby/libzstd/compress/hist.h +13 -33
- data/ext/zstdruby/libzstd/compress/huf_compress.c +332 -193
- data/ext/zstdruby/libzstd/compress/zstd_compress.c +3614 -1696
- data/ext/zstdruby/libzstd/compress/zstd_compress_internal.h +546 -86
- data/ext/zstdruby/libzstd/compress/zstd_compress_literals.c +158 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_literals.h +29 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_sequences.c +441 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_sequences.h +54 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_superblock.c +572 -0
- data/ext/zstdruby/libzstd/compress/zstd_compress_superblock.h +32 -0
- data/ext/zstdruby/libzstd/compress/zstd_cwksp.h +662 -0
- data/ext/zstdruby/libzstd/compress/zstd_double_fast.c +43 -41
- data/ext/zstdruby/libzstd/compress/zstd_double_fast.h +2 -2
- data/ext/zstdruby/libzstd/compress/zstd_fast.c +85 -80
- data/ext/zstdruby/libzstd/compress/zstd_fast.h +2 -2
- data/ext/zstdruby/libzstd/compress/zstd_lazy.c +1184 -111
- data/ext/zstdruby/libzstd/compress/zstd_lazy.h +59 -1
- data/ext/zstdruby/libzstd/compress/zstd_ldm.c +333 -208
- data/ext/zstdruby/libzstd/compress/zstd_ldm.h +15 -3
- data/ext/zstdruby/libzstd/compress/zstd_ldm_geartab.h +103 -0
- data/ext/zstdruby/libzstd/compress/zstd_opt.c +228 -129
- data/ext/zstdruby/libzstd/compress/zstd_opt.h +1 -1
- data/ext/zstdruby/libzstd/compress/zstdmt_compress.c +151 -440
- data/ext/zstdruby/libzstd/compress/zstdmt_compress.h +32 -114
- data/ext/zstdruby/libzstd/decompress/huf_decompress.c +395 -276
- data/ext/zstdruby/libzstd/decompress/zstd_ddict.c +20 -16
- data/ext/zstdruby/libzstd/decompress/zstd_ddict.h +3 -3
- data/ext/zstdruby/libzstd/decompress/zstd_decompress.c +630 -231
- data/ext/zstdruby/libzstd/decompress/zstd_decompress_block.c +606 -380
- data/ext/zstdruby/libzstd/decompress/zstd_decompress_block.h +8 -5
- data/ext/zstdruby/libzstd/decompress/zstd_decompress_internal.h +39 -9
- data/ext/zstdruby/libzstd/deprecated/zbuff.h +9 -8
- data/ext/zstdruby/libzstd/deprecated/zbuff_common.c +2 -2
- data/ext/zstdruby/libzstd/deprecated/zbuff_compress.c +1 -1
- data/ext/zstdruby/libzstd/deprecated/zbuff_decompress.c +1 -1
- data/ext/zstdruby/libzstd/dictBuilder/cover.c +55 -46
- data/ext/zstdruby/libzstd/dictBuilder/cover.h +20 -9
- data/ext/zstdruby/libzstd/dictBuilder/divsufsort.c +1 -1
- data/ext/zstdruby/libzstd/dictBuilder/fastcover.c +43 -31
- data/ext/zstdruby/libzstd/dictBuilder/zdict.c +53 -30
- data/ext/zstdruby/libzstd/dll/example/Makefile +2 -1
- data/ext/zstdruby/libzstd/dll/example/README.md +16 -22
- data/ext/zstdruby/libzstd/legacy/zstd_legacy.h +4 -4
- data/ext/zstdruby/libzstd/legacy/zstd_v01.c +24 -14
- data/ext/zstdruby/libzstd/legacy/zstd_v01.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v02.c +17 -8
- data/ext/zstdruby/libzstd/legacy/zstd_v02.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v03.c +17 -8
- data/ext/zstdruby/libzstd/legacy/zstd_v03.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v04.c +25 -11
- data/ext/zstdruby/libzstd/legacy/zstd_v04.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v05.c +43 -32
- data/ext/zstdruby/libzstd/legacy/zstd_v05.h +2 -2
- data/ext/zstdruby/libzstd/legacy/zstd_v06.c +27 -19
- data/ext/zstdruby/libzstd/legacy/zstd_v06.h +1 -1
- data/ext/zstdruby/libzstd/legacy/zstd_v07.c +32 -20
- data/ext/zstdruby/libzstd/legacy/zstd_v07.h +1 -1
- data/ext/zstdruby/libzstd/libzstd.pc.in +2 -1
- data/ext/zstdruby/libzstd/{dictBuilder/zdict.h → zdict.h} +201 -31
- data/ext/zstdruby/libzstd/zstd.h +740 -153
- data/ext/zstdruby/libzstd/{common/zstd_errors.h → zstd_errors.h} +3 -1
- data/lib/zstd-ruby/version.rb +1 -1
- data/zstd-ruby.gemspec +1 -1
- metadata +21 -10
- data/.travis.yml +0 -14
@@ -1,10 +1,11 @@
|
|
1
1
|
/*
|
2
|
-
* Copyright (c)
|
2
|
+
* Copyright (c) Yann Collet, Facebook, Inc.
|
3
3
|
* All rights reserved.
|
4
4
|
*
|
5
5
|
* This source code is licensed under both the BSD-style license (found in the
|
6
6
|
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
7
7
|
* in the COPYING file in the root directory of this source tree).
|
8
|
+
* You may select, at your option, one of the above-listed licenses.
|
8
9
|
*/
|
9
10
|
|
10
11
|
#ifndef ZSTD_LDM_H
|
@@ -15,7 +16,7 @@ extern "C" {
|
|
15
16
|
#endif
|
16
17
|
|
17
18
|
#include "zstd_compress_internal.h" /* ldmParams_t, U32 */
|
18
|
-
#include "zstd.h" /* ZSTD_CCtx, size_t */
|
19
|
+
#include "../zstd.h" /* ZSTD_CCtx, size_t */
|
19
20
|
|
20
21
|
/*-*************************************
|
21
22
|
* Long distance matching
|
@@ -23,6 +24,10 @@ extern "C" {
|
|
23
24
|
|
24
25
|
#define ZSTD_LDM_DEFAULT_WINDOW_LOG ZSTD_WINDOWLOG_LIMIT_DEFAULT
|
25
26
|
|
27
|
+
void ZSTD_ldm_fillHashTable(
|
28
|
+
ldmState_t* state, const BYTE* ip,
|
29
|
+
const BYTE* iend, ldmParams_t const* params);
|
30
|
+
|
26
31
|
/**
|
27
32
|
* ZSTD_ldm_generateSequences():
|
28
33
|
*
|
@@ -61,6 +66,7 @@ size_t ZSTD_ldm_generateSequences(
|
|
61
66
|
*/
|
62
67
|
size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore,
|
63
68
|
ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM],
|
69
|
+
ZSTD_useRowMatchFinderMode_e useRowMatchFinder,
|
64
70
|
void const* src, size_t srcSize);
|
65
71
|
|
66
72
|
/**
|
@@ -68,11 +74,17 @@ size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore,
|
|
68
74
|
*
|
69
75
|
* Skip past `srcSize` bytes worth of sequences in `rawSeqStore`.
|
70
76
|
* Avoids emitting matches less than `minMatch` bytes.
|
71
|
-
* Must be called for data
|
77
|
+
* Must be called for data that is not passed to ZSTD_ldm_blockCompress().
|
72
78
|
*/
|
73
79
|
void ZSTD_ldm_skipSequences(rawSeqStore_t* rawSeqStore, size_t srcSize,
|
74
80
|
U32 const minMatch);
|
75
81
|
|
82
|
+
/* ZSTD_ldm_skipRawSeqStoreBytes():
|
83
|
+
* Moves forward in rawSeqStore by nbBytes, updating fields 'pos' and 'posInSequence'.
|
84
|
+
* Not to be used in conjunction with ZSTD_ldm_skipSequences().
|
85
|
+
* Must be called for data with is not passed to ZSTD_ldm_blockCompress().
|
86
|
+
*/
|
87
|
+
void ZSTD_ldm_skipRawSeqStoreBytes(rawSeqStore_t* rawSeqStore, size_t nbBytes);
|
76
88
|
|
77
89
|
/** ZSTD_ldm_getTableSize() :
|
78
90
|
* Estimate the space needed for long distance matching tables or 0 if LDM is
|
@@ -0,0 +1,103 @@
|
|
1
|
+
/*
|
2
|
+
* Copyright (c) Yann Collet, Facebook, Inc.
|
3
|
+
* All rights reserved.
|
4
|
+
*
|
5
|
+
* This source code is licensed under both the BSD-style license (found in the
|
6
|
+
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
7
|
+
* in the COPYING file in the root directory of this source tree).
|
8
|
+
* You may select, at your option, one of the above-listed licenses.
|
9
|
+
*/
|
10
|
+
|
11
|
+
#ifndef ZSTD_LDM_GEARTAB_H
|
12
|
+
#define ZSTD_LDM_GEARTAB_H
|
13
|
+
|
14
|
+
static U64 ZSTD_ldm_gearTab[256] = {
|
15
|
+
0xf5b8f72c5f77775c, 0x84935f266b7ac412, 0xb647ada9ca730ccc,
|
16
|
+
0xb065bb4b114fb1de, 0x34584e7e8c3a9fd0, 0x4e97e17c6ae26b05,
|
17
|
+
0x3a03d743bc99a604, 0xcecd042422c4044f, 0x76de76c58524259e,
|
18
|
+
0x9c8528f65badeaca, 0x86563706e2097529, 0x2902475fa375d889,
|
19
|
+
0xafb32a9739a5ebe6, 0xce2714da3883e639, 0x21eaf821722e69e,
|
20
|
+
0x37b628620b628, 0x49a8d455d88caf5, 0x8556d711e6958140,
|
21
|
+
0x4f7ae74fc605c1f, 0x829f0c3468bd3a20, 0x4ffdc885c625179e,
|
22
|
+
0x8473de048a3daf1b, 0x51008822b05646b2, 0x69d75d12b2d1cc5f,
|
23
|
+
0x8c9d4a19159154bc, 0xc3cc10f4abbd4003, 0xd06ddc1cecb97391,
|
24
|
+
0xbe48e6e7ed80302e, 0x3481db31cee03547, 0xacc3f67cdaa1d210,
|
25
|
+
0x65cb771d8c7f96cc, 0x8eb27177055723dd, 0xc789950d44cd94be,
|
26
|
+
0x934feadc3700b12b, 0x5e485f11edbdf182, 0x1e2e2a46fd64767a,
|
27
|
+
0x2969ca71d82efa7c, 0x9d46e9935ebbba2e, 0xe056b67e05e6822b,
|
28
|
+
0x94d73f55739d03a0, 0xcd7010bdb69b5a03, 0x455ef9fcd79b82f4,
|
29
|
+
0x869cb54a8749c161, 0x38d1a4fa6185d225, 0xb475166f94bbe9bb,
|
30
|
+
0xa4143548720959f1, 0x7aed4780ba6b26ba, 0xd0ce264439e02312,
|
31
|
+
0x84366d746078d508, 0xa8ce973c72ed17be, 0x21c323a29a430b01,
|
32
|
+
0x9962d617e3af80ee, 0xab0ce91d9c8cf75b, 0x530e8ee6d19a4dbc,
|
33
|
+
0x2ef68c0cf53f5d72, 0xc03a681640a85506, 0x496e4e9f9c310967,
|
34
|
+
0x78580472b59b14a0, 0x273824c23b388577, 0x66bf923ad45cb553,
|
35
|
+
0x47ae1a5a2492ba86, 0x35e304569e229659, 0x4765182a46870b6f,
|
36
|
+
0x6cbab625e9099412, 0xddac9a2e598522c1, 0x7172086e666624f2,
|
37
|
+
0xdf5003ca503b7837, 0x88c0c1db78563d09, 0x58d51865acfc289d,
|
38
|
+
0x177671aec65224f1, 0xfb79d8a241e967d7, 0x2be1e101cad9a49a,
|
39
|
+
0x6625682f6e29186b, 0x399553457ac06e50, 0x35dffb4c23abb74,
|
40
|
+
0x429db2591f54aade, 0xc52802a8037d1009, 0x6acb27381f0b25f3,
|
41
|
+
0xf45e2551ee4f823b, 0x8b0ea2d99580c2f7, 0x3bed519cbcb4e1e1,
|
42
|
+
0xff452823dbb010a, 0x9d42ed614f3dd267, 0x5b9313c06257c57b,
|
43
|
+
0xa114b8008b5e1442, 0xc1fe311c11c13d4b, 0x66e8763ea34c5568,
|
44
|
+
0x8b982af1c262f05d, 0xee8876faaa75fbb7, 0x8a62a4d0d172bb2a,
|
45
|
+
0xc13d94a3b7449a97, 0x6dbbba9dc15d037c, 0xc786101f1d92e0f1,
|
46
|
+
0xd78681a907a0b79b, 0xf61aaf2962c9abb9, 0x2cfd16fcd3cb7ad9,
|
47
|
+
0x868c5b6744624d21, 0x25e650899c74ddd7, 0xba042af4a7c37463,
|
48
|
+
0x4eb1a539465a3eca, 0xbe09dbf03b05d5ca, 0x774e5a362b5472ba,
|
49
|
+
0x47a1221229d183cd, 0x504b0ca18ef5a2df, 0xdffbdfbde2456eb9,
|
50
|
+
0x46cd2b2fbee34634, 0xf2aef8fe819d98c3, 0x357f5276d4599d61,
|
51
|
+
0x24a5483879c453e3, 0x88026889192b4b9, 0x28da96671782dbec,
|
52
|
+
0x4ef37c40588e9aaa, 0x8837b90651bc9fb3, 0xc164f741d3f0e5d6,
|
53
|
+
0xbc135a0a704b70ba, 0x69cd868f7622ada, 0xbc37ba89e0b9c0ab,
|
54
|
+
0x47c14a01323552f6, 0x4f00794bacee98bb, 0x7107de7d637a69d5,
|
55
|
+
0x88af793bb6f2255e, 0xf3c6466b8799b598, 0xc288c616aa7f3b59,
|
56
|
+
0x81ca63cf42fca3fd, 0x88d85ace36a2674b, 0xd056bd3792389e7,
|
57
|
+
0xe55c396c4e9dd32d, 0xbefb504571e6c0a6, 0x96ab32115e91e8cc,
|
58
|
+
0xbf8acb18de8f38d1, 0x66dae58801672606, 0x833b6017872317fb,
|
59
|
+
0xb87c16f2d1c92864, 0xdb766a74e58b669c, 0x89659f85c61417be,
|
60
|
+
0xc8daad856011ea0c, 0x76a4b565b6fe7eae, 0xa469d085f6237312,
|
61
|
+
0xaaf0365683a3e96c, 0x4dbb746f8424f7b8, 0x638755af4e4acc1,
|
62
|
+
0x3d7807f5bde64486, 0x17be6d8f5bbb7639, 0x903f0cd44dc35dc,
|
63
|
+
0x67b672eafdf1196c, 0xa676ff93ed4c82f1, 0x521d1004c5053d9d,
|
64
|
+
0x37ba9ad09ccc9202, 0x84e54d297aacfb51, 0xa0b4b776a143445,
|
65
|
+
0x820d471e20b348e, 0x1874383cb83d46dc, 0x97edeec7a1efe11c,
|
66
|
+
0xb330e50b1bdc42aa, 0x1dd91955ce70e032, 0xa514cdb88f2939d5,
|
67
|
+
0x2791233fd90db9d3, 0x7b670a4cc50f7a9b, 0x77c07d2a05c6dfa5,
|
68
|
+
0xe3778b6646d0a6fa, 0xb39c8eda47b56749, 0x933ed448addbef28,
|
69
|
+
0xaf846af6ab7d0bf4, 0xe5af208eb666e49, 0x5e6622f73534cd6a,
|
70
|
+
0x297daeca42ef5b6e, 0x862daef3d35539a6, 0xe68722498f8e1ea9,
|
71
|
+
0x981c53093dc0d572, 0xfa09b0bfbf86fbf5, 0x30b1e96166219f15,
|
72
|
+
0x70e7d466bdc4fb83, 0x5a66736e35f2a8e9, 0xcddb59d2b7c1baef,
|
73
|
+
0xd6c7d247d26d8996, 0xea4e39eac8de1ba3, 0x539c8bb19fa3aff2,
|
74
|
+
0x9f90e4c5fd508d8, 0xa34e5956fbaf3385, 0x2e2f8e151d3ef375,
|
75
|
+
0x173691e9b83faec1, 0xb85a8d56bf016379, 0x8382381267408ae3,
|
76
|
+
0xb90f901bbdc0096d, 0x7c6ad32933bcec65, 0x76bb5e2f2c8ad595,
|
77
|
+
0x390f851a6cf46d28, 0xc3e6064da1c2da72, 0xc52a0c101cfa5389,
|
78
|
+
0xd78eaf84a3fbc530, 0x3781b9e2288b997e, 0x73c2f6dea83d05c4,
|
79
|
+
0x4228e364c5b5ed7, 0x9d7a3edf0da43911, 0x8edcfeda24686756,
|
80
|
+
0x5e7667a7b7a9b3a1, 0x4c4f389fa143791d, 0xb08bc1023da7cddc,
|
81
|
+
0x7ab4be3ae529b1cc, 0x754e6132dbe74ff9, 0x71635442a839df45,
|
82
|
+
0x2f6fb1643fbe52de, 0x961e0a42cf7a8177, 0xf3b45d83d89ef2ea,
|
83
|
+
0xee3de4cf4a6e3e9b, 0xcd6848542c3295e7, 0xe4cee1664c78662f,
|
84
|
+
0x9947548b474c68c4, 0x25d73777a5ed8b0b, 0xc915b1d636b7fc,
|
85
|
+
0x21c2ba75d9b0d2da, 0x5f6b5dcf608a64a1, 0xdcf333255ff9570c,
|
86
|
+
0x633b922418ced4ee, 0xc136dde0b004b34a, 0x58cc83b05d4b2f5a,
|
87
|
+
0x5eb424dda28e42d2, 0x62df47369739cd98, 0xb4e0b42485e4ce17,
|
88
|
+
0x16e1f0c1f9a8d1e7, 0x8ec3916707560ebf, 0x62ba6e2df2cc9db3,
|
89
|
+
0xcbf9f4ff77d83a16, 0x78d9d7d07d2bbcc4, 0xef554ce1e02c41f4,
|
90
|
+
0x8d7581127eccf94d, 0xa9b53336cb3c8a05, 0x38c42c0bf45c4f91,
|
91
|
+
0x640893cdf4488863, 0x80ec34bc575ea568, 0x39f324f5b48eaa40,
|
92
|
+
0xe9d9ed1f8eff527f, 0x9224fc058cc5a214, 0xbaba00b04cfe7741,
|
93
|
+
0x309a9f120fcf52af, 0xa558f3ec65626212, 0x424bec8b7adabe2f,
|
94
|
+
0x41622513a6aea433, 0xb88da2d5324ca798, 0xd287733b245528a4,
|
95
|
+
0x9a44697e6d68aec3, 0x7b1093be2f49bb28, 0x50bbec632e3d8aad,
|
96
|
+
0x6cd90723e1ea8283, 0x897b9e7431b02bf3, 0x219efdcb338a7047,
|
97
|
+
0x3b0311f0a27c0656, 0xdb17bf91c0db96e7, 0x8cd4fd6b4e85a5b2,
|
98
|
+
0xfab071054ba6409d, 0x40d6fe831fa9dfd9, 0xaf358debad7d791e,
|
99
|
+
0xeb8d0e25a65e3e58, 0xbbcbd3df14e08580, 0xcf751f27ecdab2b,
|
100
|
+
0x2b4da14f2613d8f4
|
101
|
+
};
|
102
|
+
|
103
|
+
#endif /* ZSTD_LDM_GEARTAB_H */
|
@@ -1,5 +1,5 @@
|
|
1
1
|
/*
|
2
|
-
* Copyright (c)
|
2
|
+
* Copyright (c) Przemyslaw Skibinski, Yann Collet, Facebook, Inc.
|
3
3
|
* All rights reserved.
|
4
4
|
*
|
5
5
|
* This source code is licensed under both the BSD-style license (found in the
|
@@ -249,40 +249,6 @@ static U32 ZSTD_litLengthPrice(U32 const litLength, const optState_t* const optP
|
|
249
249
|
}
|
250
250
|
}
|
251
251
|
|
252
|
-
/* ZSTD_litLengthContribution() :
|
253
|
-
* @return ( cost(litlength) - cost(0) )
|
254
|
-
* this value can then be added to rawLiteralsCost()
|
255
|
-
* to provide a cost which is directly comparable to a match ending at same position */
|
256
|
-
static int ZSTD_litLengthContribution(U32 const litLength, const optState_t* const optPtr, int optLevel)
|
257
|
-
{
|
258
|
-
if (optPtr->priceType >= zop_predef) return (int)WEIGHT(litLength, optLevel);
|
259
|
-
|
260
|
-
/* dynamic statistics */
|
261
|
-
{ U32 const llCode = ZSTD_LLcode(litLength);
|
262
|
-
int const contribution = (int)(LL_bits[llCode] * BITCOST_MULTIPLIER)
|
263
|
-
+ (int)WEIGHT(optPtr->litLengthFreq[0], optLevel) /* note: log2litLengthSum cancel out */
|
264
|
-
- (int)WEIGHT(optPtr->litLengthFreq[llCode], optLevel);
|
265
|
-
#if 1
|
266
|
-
return contribution;
|
267
|
-
#else
|
268
|
-
return MAX(0, contribution); /* sometimes better, sometimes not ... */
|
269
|
-
#endif
|
270
|
-
}
|
271
|
-
}
|
272
|
-
|
273
|
-
/* ZSTD_literalsContribution() :
|
274
|
-
* creates a fake cost for the literals part of a sequence
|
275
|
-
* which can be compared to the ending cost of a match
|
276
|
-
* should a new match start at this position */
|
277
|
-
static int ZSTD_literalsContribution(const BYTE* const literals, U32 const litLength,
|
278
|
-
const optState_t* const optPtr,
|
279
|
-
int optLevel)
|
280
|
-
{
|
281
|
-
int const contribution = (int)ZSTD_rawLiteralsCost(literals, litLength, optPtr, optLevel)
|
282
|
-
+ ZSTD_litLengthContribution(litLength, optPtr, optLevel);
|
283
|
-
return contribution;
|
284
|
-
}
|
285
|
-
|
286
252
|
/* ZSTD_getMatchPrice() :
|
287
253
|
* Provides the cost of the match part (offset + matchLength) of a sequence
|
288
254
|
* Must be combined with ZSTD_fullLiteralsCost() to get the full cost of a sequence.
|
@@ -420,32 +386,32 @@ static U32 ZSTD_insertBt1(
|
|
420
386
|
const BYTE* const dictEnd = dictBase + dictLimit;
|
421
387
|
const BYTE* const prefixStart = base + dictLimit;
|
422
388
|
const BYTE* match;
|
423
|
-
const U32
|
424
|
-
const U32 btLow = btMask >=
|
425
|
-
U32* smallerPtr = bt + 2*(
|
389
|
+
const U32 curr = (U32)(ip-base);
|
390
|
+
const U32 btLow = btMask >= curr ? 0 : curr - btMask;
|
391
|
+
U32* smallerPtr = bt + 2*(curr&btMask);
|
426
392
|
U32* largerPtr = smallerPtr + 1;
|
427
393
|
U32 dummy32; /* to be nullified at the end */
|
428
394
|
U32 const windowLow = ms->window.lowLimit;
|
429
|
-
U32 matchEndIdx =
|
395
|
+
U32 matchEndIdx = curr+8+1;
|
430
396
|
size_t bestLength = 8;
|
431
397
|
U32 nbCompares = 1U << cParams->searchLog;
|
432
398
|
#ifdef ZSTD_C_PREDICT
|
433
|
-
U32 predictedSmall = *(bt + 2*((
|
434
|
-
U32 predictedLarge = *(bt + 2*((
|
399
|
+
U32 predictedSmall = *(bt + 2*((curr-1)&btMask) + 0);
|
400
|
+
U32 predictedLarge = *(bt + 2*((curr-1)&btMask) + 1);
|
435
401
|
predictedSmall += (predictedSmall>0);
|
436
402
|
predictedLarge += (predictedLarge>0);
|
437
403
|
#endif /* ZSTD_C_PREDICT */
|
438
404
|
|
439
|
-
DEBUGLOG(8, "ZSTD_insertBt1 (%u)",
|
405
|
+
DEBUGLOG(8, "ZSTD_insertBt1 (%u)", curr);
|
440
406
|
|
441
407
|
assert(ip <= iend-8); /* required for h calculation */
|
442
|
-
hashTable[h] =
|
408
|
+
hashTable[h] = curr; /* Update Hash Table */
|
443
409
|
|
444
410
|
assert(windowLow > 0);
|
445
411
|
while (nbCompares-- && (matchIndex >= windowLow)) {
|
446
412
|
U32* const nextPtr = bt + 2*(matchIndex & btMask);
|
447
413
|
size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */
|
448
|
-
assert(matchIndex <
|
414
|
+
assert(matchIndex < curr);
|
449
415
|
|
450
416
|
#ifdef ZSTD_C_PREDICT /* note : can create issues when hlog small <= 11 */
|
451
417
|
const U32* predictPtr = bt + 2*((matchIndex-1) & btMask); /* written this way, as bt is a roll buffer */
|
@@ -508,8 +474,8 @@ static U32 ZSTD_insertBt1(
|
|
508
474
|
*smallerPtr = *largerPtr = 0;
|
509
475
|
{ U32 positions = 0;
|
510
476
|
if (bestLength > 384) positions = MIN(192, (U32)(bestLength - 384)); /* speed optimization */
|
511
|
-
assert(matchEndIdx >
|
512
|
-
return MAX(positions, matchEndIdx - (
|
477
|
+
assert(matchEndIdx > curr + 8);
|
478
|
+
return MAX(positions, matchEndIdx - (curr + 8));
|
513
479
|
}
|
514
480
|
}
|
515
481
|
|
@@ -552,9 +518,8 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
552
518
|
{
|
553
519
|
const ZSTD_compressionParameters* const cParams = &ms->cParams;
|
554
520
|
U32 const sufficient_len = MIN(cParams->targetLength, ZSTD_OPT_NUM -1);
|
555
|
-
U32 const maxDistance = 1U << cParams->windowLog;
|
556
521
|
const BYTE* const base = ms->window.base;
|
557
|
-
U32 const
|
522
|
+
U32 const curr = (U32)(ip-base);
|
558
523
|
U32 const hashLog = cParams->hashLog;
|
559
524
|
U32 const minMatch = (mls==3) ? 3 : 4;
|
560
525
|
U32* const hashTable = ms->hashTable;
|
@@ -568,13 +533,12 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
568
533
|
U32 const dictLimit = ms->window.dictLimit;
|
569
534
|
const BYTE* const dictEnd = dictBase + dictLimit;
|
570
535
|
const BYTE* const prefixStart = base + dictLimit;
|
571
|
-
U32 const btLow = (btMask >=
|
572
|
-
U32 const
|
573
|
-
U32 const windowLow = ((current - windowValid) > maxDistance) ? current - maxDistance : windowValid;
|
536
|
+
U32 const btLow = (btMask >= curr) ? 0 : curr - btMask;
|
537
|
+
U32 const windowLow = ZSTD_getLowestMatchIndex(ms, curr, cParams->windowLog);
|
574
538
|
U32 const matchLow = windowLow ? windowLow : 1;
|
575
|
-
U32* smallerPtr = bt + 2*(
|
576
|
-
U32* largerPtr = bt + 2*(
|
577
|
-
U32 matchEndIdx =
|
539
|
+
U32* smallerPtr = bt + 2*(curr&btMask);
|
540
|
+
U32* largerPtr = bt + 2*(curr&btMask) + 1;
|
541
|
+
U32 matchEndIdx = curr+8+1; /* farthest referenced position of any match => detects repetitive patterns */
|
578
542
|
U32 dummy32; /* to be nullified at the end */
|
579
543
|
U32 mnum = 0;
|
580
544
|
U32 nbCompares = 1U << cParams->searchLog;
|
@@ -593,7 +557,7 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
593
557
|
U32 const dmsBtLow = dictMode == ZSTD_dictMatchState && dmsBtMask < dmsHighLimit - dmsLowLimit ? dmsHighLimit - dmsBtMask : dmsLowLimit;
|
594
558
|
|
595
559
|
size_t bestLength = lengthToBeat-1;
|
596
|
-
DEBUGLOG(8, "ZSTD_insertBtAndGetAllMatches: current=%u",
|
560
|
+
DEBUGLOG(8, "ZSTD_insertBtAndGetAllMatches: current=%u", curr);
|
597
561
|
|
598
562
|
/* check repCode */
|
599
563
|
assert(ll0 <= 1); /* necessarily 1 or 0 */
|
@@ -601,26 +565,29 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
601
565
|
U32 repCode;
|
602
566
|
for (repCode = ll0; repCode < lastR; repCode++) {
|
603
567
|
U32 const repOffset = (repCode==ZSTD_REP_NUM) ? (rep[0] - 1) : rep[repCode];
|
604
|
-
U32 const repIndex =
|
568
|
+
U32 const repIndex = curr - repOffset;
|
605
569
|
U32 repLen = 0;
|
606
|
-
assert(
|
607
|
-
if (repOffset-1 /* intentional overflow, discards 0 and -1 */ <
|
608
|
-
|
570
|
+
assert(curr >= dictLimit);
|
571
|
+
if (repOffset-1 /* intentional overflow, discards 0 and -1 */ < curr-dictLimit) { /* equivalent to `curr > repIndex >= dictLimit` */
|
572
|
+
/* We must validate the repcode offset because when we're using a dictionary the
|
573
|
+
* valid offset range shrinks when the dictionary goes out of bounds.
|
574
|
+
*/
|
575
|
+
if ((repIndex >= windowLow) & (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(ip - repOffset, minMatch))) {
|
609
576
|
repLen = (U32)ZSTD_count(ip+minMatch, ip+minMatch-repOffset, iLimit) + minMatch;
|
610
577
|
}
|
611
|
-
} else { /* repIndex < dictLimit || repIndex >=
|
578
|
+
} else { /* repIndex < dictLimit || repIndex >= curr */
|
612
579
|
const BYTE* const repMatch = dictMode == ZSTD_dictMatchState ?
|
613
580
|
dmsBase + repIndex - dmsIndexDelta :
|
614
581
|
dictBase + repIndex;
|
615
|
-
assert(
|
582
|
+
assert(curr >= windowLow);
|
616
583
|
if ( dictMode == ZSTD_extDict
|
617
|
-
&& ( ((repOffset-1) /*intentional overflow*/ <
|
584
|
+
&& ( ((repOffset-1) /*intentional overflow*/ < curr - windowLow) /* equivalent to `curr > repIndex >= windowLow` */
|
618
585
|
& (((U32)((dictLimit-1) - repIndex) >= 3) ) /* intentional overflow : do not test positions overlapping 2 memory segments */)
|
619
586
|
&& (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(repMatch, minMatch)) ) {
|
620
587
|
repLen = (U32)ZSTD_count_2segments(ip+minMatch, repMatch+minMatch, iLimit, dictEnd, prefixStart) + minMatch;
|
621
588
|
}
|
622
589
|
if (dictMode == ZSTD_dictMatchState
|
623
|
-
&& ( ((repOffset-1) /*intentional overflow*/ <
|
590
|
+
&& ( ((repOffset-1) /*intentional overflow*/ < curr - (dmsLowLimit + dmsIndexDelta)) /* equivalent to `curr > repIndex >= dmsLowLimit` */
|
624
591
|
& ((U32)((dictLimit-1) - repIndex) >= 3) ) /* intentional overflow : do not test positions overlapping 2 memory segments */
|
625
592
|
&& (ZSTD_readMINMATCH(ip, minMatch) == ZSTD_readMINMATCH(repMatch, minMatch)) ) {
|
626
593
|
repLen = (U32)ZSTD_count_2segments(ip+minMatch, repMatch+minMatch, iLimit, dmsEnd, prefixStart) + minMatch;
|
@@ -642,7 +609,7 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
642
609
|
if ((mls == 3) /*static*/ && (bestLength < mls)) {
|
643
610
|
U32 const matchIndex3 = ZSTD_insertAndFindFirstIndexHash3(ms, nextToUpdate3, ip);
|
644
611
|
if ((matchIndex3 >= matchLow)
|
645
|
-
& (
|
612
|
+
& (curr - matchIndex3 < (1<<18)) /*heuristic : longer distance likely too expensive*/ ) {
|
646
613
|
size_t mlen;
|
647
614
|
if ((dictMode == ZSTD_noDict) /*static*/ || (dictMode == ZSTD_dictMatchState) /*static*/ || (matchIndex3 >= dictLimit)) {
|
648
615
|
const BYTE* const match = base + matchIndex3;
|
@@ -657,46 +624,48 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
657
624
|
DEBUGLOG(8, "found small match with hlog3, of length %u",
|
658
625
|
(U32)mlen);
|
659
626
|
bestLength = mlen;
|
660
|
-
assert(
|
627
|
+
assert(curr > matchIndex3);
|
661
628
|
assert(mnum==0); /* no prior solution */
|
662
|
-
matches[0].off = (
|
629
|
+
matches[0].off = (curr - matchIndex3) + ZSTD_REP_MOVE;
|
663
630
|
matches[0].len = (U32)mlen;
|
664
631
|
mnum = 1;
|
665
632
|
if ( (mlen > sufficient_len) |
|
666
633
|
(ip+mlen == iLimit) ) { /* best possible length */
|
667
|
-
ms->nextToUpdate =
|
634
|
+
ms->nextToUpdate = curr+1; /* skip insertion */
|
668
635
|
return 1;
|
669
636
|
} } }
|
670
637
|
/* no dictMatchState lookup: dicts don't have a populated HC3 table */
|
671
638
|
}
|
672
639
|
|
673
|
-
hashTable[h] =
|
640
|
+
hashTable[h] = curr; /* Update Hash Table */
|
674
641
|
|
675
642
|
while (nbCompares-- && (matchIndex >= matchLow)) {
|
676
643
|
U32* const nextPtr = bt + 2*(matchIndex & btMask);
|
677
|
-
size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */
|
678
644
|
const BYTE* match;
|
679
|
-
|
645
|
+
size_t matchLength = MIN(commonLengthSmaller, commonLengthLarger); /* guaranteed minimum nb of common bytes */
|
646
|
+
assert(curr > matchIndex);
|
680
647
|
|
681
648
|
if ((dictMode == ZSTD_noDict) || (dictMode == ZSTD_dictMatchState) || (matchIndex+matchLength >= dictLimit)) {
|
682
649
|
assert(matchIndex+matchLength >= dictLimit); /* ensure the condition is correct when !extDict */
|
683
650
|
match = base + matchIndex;
|
651
|
+
if (matchIndex >= dictLimit) assert(memcmp(match, ip, matchLength) == 0); /* ensure early section of match is equal as expected */
|
684
652
|
matchLength += ZSTD_count(ip+matchLength, match+matchLength, iLimit);
|
685
653
|
} else {
|
686
654
|
match = dictBase + matchIndex;
|
655
|
+
assert(memcmp(match, ip, matchLength) == 0); /* ensure early section of match is equal as expected */
|
687
656
|
matchLength += ZSTD_count_2segments(ip+matchLength, match+matchLength, iLimit, dictEnd, prefixStart);
|
688
657
|
if (matchIndex+matchLength >= dictLimit)
|
689
|
-
match = base + matchIndex; /* prepare for match[matchLength] */
|
658
|
+
match = base + matchIndex; /* prepare for match[matchLength] read */
|
690
659
|
}
|
691
660
|
|
692
661
|
if (matchLength > bestLength) {
|
693
662
|
DEBUGLOG(8, "found match of length %u at distance %u (offCode=%u)",
|
694
|
-
(U32)matchLength,
|
663
|
+
(U32)matchLength, curr - matchIndex, curr - matchIndex + ZSTD_REP_MOVE);
|
695
664
|
assert(matchEndIdx > matchIndex);
|
696
665
|
if (matchLength > matchEndIdx - matchIndex)
|
697
666
|
matchEndIdx = matchIndex + (U32)matchLength;
|
698
667
|
bestLength = matchLength;
|
699
|
-
matches[mnum].off = (
|
668
|
+
matches[mnum].off = (curr - matchIndex) + ZSTD_REP_MOVE;
|
700
669
|
matches[mnum].len = (U32)matchLength;
|
701
670
|
mnum++;
|
702
671
|
if ( (matchLength > ZSTD_OPT_NUM)
|
@@ -739,11 +708,11 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
739
708
|
if (matchLength > bestLength) {
|
740
709
|
matchIndex = dictMatchIndex + dmsIndexDelta;
|
741
710
|
DEBUGLOG(8, "found dms match of length %u at distance %u (offCode=%u)",
|
742
|
-
(U32)matchLength,
|
711
|
+
(U32)matchLength, curr - matchIndex, curr - matchIndex + ZSTD_REP_MOVE);
|
743
712
|
if (matchLength > matchEndIdx - matchIndex)
|
744
713
|
matchEndIdx = matchIndex + (U32)matchLength;
|
745
714
|
bestLength = matchLength;
|
746
|
-
matches[mnum].off = (
|
715
|
+
matches[mnum].off = (curr - matchIndex) + ZSTD_REP_MOVE;
|
747
716
|
matches[mnum].len = (U32)matchLength;
|
748
717
|
mnum++;
|
749
718
|
if ( (matchLength > ZSTD_OPT_NUM)
|
@@ -764,7 +733,7 @@ U32 ZSTD_insertBtAndGetAllMatches (
|
|
764
733
|
}
|
765
734
|
}
|
766
735
|
|
767
|
-
assert(matchEndIdx >
|
736
|
+
assert(matchEndIdx > curr+8);
|
768
737
|
ms->nextToUpdate = matchEndIdx - 8; /* skip repetitive patterns */
|
769
738
|
return mnum;
|
770
739
|
}
|
@@ -795,35 +764,145 @@ FORCE_INLINE_TEMPLATE U32 ZSTD_BtGetAllMatches (
|
|
795
764
|
}
|
796
765
|
}
|
797
766
|
|
767
|
+
/*************************
|
768
|
+
* LDM helper functions *
|
769
|
+
*************************/
|
798
770
|
|
799
|
-
|
800
|
-
|
801
|
-
|
802
|
-
|
803
|
-
U32
|
804
|
-
|
771
|
+
/* Struct containing info needed to make decision about ldm inclusion */
|
772
|
+
typedef struct {
|
773
|
+
rawSeqStore_t seqStore; /* External match candidates store for this block */
|
774
|
+
U32 startPosInBlock; /* Start position of the current match candidate */
|
775
|
+
U32 endPosInBlock; /* End position of the current match candidate */
|
776
|
+
U32 offset; /* Offset of the match candidate */
|
777
|
+
} ZSTD_optLdm_t;
|
805
778
|
|
806
|
-
|
807
|
-
|
808
|
-
|
809
|
-
|
810
|
-
|
811
|
-
|
812
|
-
|
813
|
-
|
814
|
-
|
815
|
-
|
816
|
-
|
817
|
-
|
818
|
-
|
819
|
-
newReps.rep[0] = currentOffset;
|
820
|
-
} else { /* repCode == 0 */
|
821
|
-
memcpy(&newReps, rep, sizeof(newReps));
|
779
|
+
/* ZSTD_optLdm_skipRawSeqStoreBytes():
|
780
|
+
* Moves forward in rawSeqStore by nbBytes, which will update the fields 'pos' and 'posInSequence'.
|
781
|
+
*/
|
782
|
+
static void ZSTD_optLdm_skipRawSeqStoreBytes(rawSeqStore_t* rawSeqStore, size_t nbBytes) {
|
783
|
+
U32 currPos = (U32)(rawSeqStore->posInSequence + nbBytes);
|
784
|
+
while (currPos && rawSeqStore->pos < rawSeqStore->size) {
|
785
|
+
rawSeq currSeq = rawSeqStore->seq[rawSeqStore->pos];
|
786
|
+
if (currPos >= currSeq.litLength + currSeq.matchLength) {
|
787
|
+
currPos -= currSeq.litLength + currSeq.matchLength;
|
788
|
+
rawSeqStore->pos++;
|
789
|
+
} else {
|
790
|
+
rawSeqStore->posInSequence = currPos;
|
791
|
+
break;
|
822
792
|
}
|
823
793
|
}
|
824
|
-
|
794
|
+
if (currPos == 0 || rawSeqStore->pos == rawSeqStore->size) {
|
795
|
+
rawSeqStore->posInSequence = 0;
|
796
|
+
}
|
797
|
+
}
|
798
|
+
|
799
|
+
/* ZSTD_opt_getNextMatchAndUpdateSeqStore():
|
800
|
+
* Calculates the beginning and end of the next match in the current block.
|
801
|
+
* Updates 'pos' and 'posInSequence' of the ldmSeqStore.
|
802
|
+
*/
|
803
|
+
static void ZSTD_opt_getNextMatchAndUpdateSeqStore(ZSTD_optLdm_t* optLdm, U32 currPosInBlock,
|
804
|
+
U32 blockBytesRemaining) {
|
805
|
+
rawSeq currSeq;
|
806
|
+
U32 currBlockEndPos;
|
807
|
+
U32 literalsBytesRemaining;
|
808
|
+
U32 matchBytesRemaining;
|
809
|
+
|
810
|
+
/* Setting match end position to MAX to ensure we never use an LDM during this block */
|
811
|
+
if (optLdm->seqStore.size == 0 || optLdm->seqStore.pos >= optLdm->seqStore.size) {
|
812
|
+
optLdm->startPosInBlock = UINT_MAX;
|
813
|
+
optLdm->endPosInBlock = UINT_MAX;
|
814
|
+
return;
|
815
|
+
}
|
816
|
+
/* Calculate appropriate bytes left in matchLength and litLength after adjusting
|
817
|
+
based on ldmSeqStore->posInSequence */
|
818
|
+
currSeq = optLdm->seqStore.seq[optLdm->seqStore.pos];
|
819
|
+
assert(optLdm->seqStore.posInSequence <= currSeq.litLength + currSeq.matchLength);
|
820
|
+
currBlockEndPos = currPosInBlock + blockBytesRemaining;
|
821
|
+
literalsBytesRemaining = (optLdm->seqStore.posInSequence < currSeq.litLength) ?
|
822
|
+
currSeq.litLength - (U32)optLdm->seqStore.posInSequence :
|
823
|
+
0;
|
824
|
+
matchBytesRemaining = (literalsBytesRemaining == 0) ?
|
825
|
+
currSeq.matchLength - ((U32)optLdm->seqStore.posInSequence - currSeq.litLength) :
|
826
|
+
currSeq.matchLength;
|
827
|
+
|
828
|
+
/* If there are more literal bytes than bytes remaining in block, no ldm is possible */
|
829
|
+
if (literalsBytesRemaining >= blockBytesRemaining) {
|
830
|
+
optLdm->startPosInBlock = UINT_MAX;
|
831
|
+
optLdm->endPosInBlock = UINT_MAX;
|
832
|
+
ZSTD_optLdm_skipRawSeqStoreBytes(&optLdm->seqStore, blockBytesRemaining);
|
833
|
+
return;
|
834
|
+
}
|
835
|
+
|
836
|
+
/* Matches may be < MINMATCH by this process. In that case, we will reject them
|
837
|
+
when we are deciding whether or not to add the ldm */
|
838
|
+
optLdm->startPosInBlock = currPosInBlock + literalsBytesRemaining;
|
839
|
+
optLdm->endPosInBlock = optLdm->startPosInBlock + matchBytesRemaining;
|
840
|
+
optLdm->offset = currSeq.offset;
|
841
|
+
|
842
|
+
if (optLdm->endPosInBlock > currBlockEndPos) {
|
843
|
+
/* Match ends after the block ends, we can't use the whole match */
|
844
|
+
optLdm->endPosInBlock = currBlockEndPos;
|
845
|
+
ZSTD_optLdm_skipRawSeqStoreBytes(&optLdm->seqStore, currBlockEndPos - currPosInBlock);
|
846
|
+
} else {
|
847
|
+
/* Consume nb of bytes equal to size of sequence left */
|
848
|
+
ZSTD_optLdm_skipRawSeqStoreBytes(&optLdm->seqStore, literalsBytesRemaining + matchBytesRemaining);
|
849
|
+
}
|
825
850
|
}
|
826
851
|
|
852
|
+
/* ZSTD_optLdm_maybeAddMatch():
|
853
|
+
* Adds a match if it's long enough, based on it's 'matchStartPosInBlock'
|
854
|
+
* and 'matchEndPosInBlock', into 'matches'. Maintains the correct ordering of 'matches'
|
855
|
+
*/
|
856
|
+
static void ZSTD_optLdm_maybeAddMatch(ZSTD_match_t* matches, U32* nbMatches,
|
857
|
+
ZSTD_optLdm_t* optLdm, U32 currPosInBlock) {
|
858
|
+
U32 posDiff = currPosInBlock - optLdm->startPosInBlock;
|
859
|
+
/* Note: ZSTD_match_t actually contains offCode and matchLength (before subtracting MINMATCH) */
|
860
|
+
U32 candidateMatchLength = optLdm->endPosInBlock - optLdm->startPosInBlock - posDiff;
|
861
|
+
U32 candidateOffCode = optLdm->offset + ZSTD_REP_MOVE;
|
862
|
+
|
863
|
+
/* Ensure that current block position is not outside of the match */
|
864
|
+
if (currPosInBlock < optLdm->startPosInBlock
|
865
|
+
|| currPosInBlock >= optLdm->endPosInBlock
|
866
|
+
|| candidateMatchLength < MINMATCH) {
|
867
|
+
return;
|
868
|
+
}
|
869
|
+
|
870
|
+
if (*nbMatches == 0 || ((candidateMatchLength > matches[*nbMatches-1].len) && *nbMatches < ZSTD_OPT_NUM)) {
|
871
|
+
DEBUGLOG(6, "ZSTD_optLdm_maybeAddMatch(): Adding ldm candidate match (offCode: %u matchLength %u) at block position=%u",
|
872
|
+
candidateOffCode, candidateMatchLength, currPosInBlock);
|
873
|
+
matches[*nbMatches].len = candidateMatchLength;
|
874
|
+
matches[*nbMatches].off = candidateOffCode;
|
875
|
+
(*nbMatches)++;
|
876
|
+
}
|
877
|
+
}
|
878
|
+
|
879
|
+
/* ZSTD_optLdm_processMatchCandidate():
|
880
|
+
* Wrapper function to update ldm seq store and call ldm functions as necessary.
|
881
|
+
*/
|
882
|
+
static void ZSTD_optLdm_processMatchCandidate(ZSTD_optLdm_t* optLdm, ZSTD_match_t* matches, U32* nbMatches,
|
883
|
+
U32 currPosInBlock, U32 remainingBytes) {
|
884
|
+
if (optLdm->seqStore.size == 0 || optLdm->seqStore.pos >= optLdm->seqStore.size) {
|
885
|
+
return;
|
886
|
+
}
|
887
|
+
|
888
|
+
if (currPosInBlock >= optLdm->endPosInBlock) {
|
889
|
+
if (currPosInBlock > optLdm->endPosInBlock) {
|
890
|
+
/* The position at which ZSTD_optLdm_processMatchCandidate() is called is not necessarily
|
891
|
+
* at the end of a match from the ldm seq store, and will often be some bytes
|
892
|
+
* over beyond matchEndPosInBlock. As such, we need to correct for these "overshoots"
|
893
|
+
*/
|
894
|
+
U32 posOvershoot = currPosInBlock - optLdm->endPosInBlock;
|
895
|
+
ZSTD_optLdm_skipRawSeqStoreBytes(&optLdm->seqStore, posOvershoot);
|
896
|
+
}
|
897
|
+
ZSTD_opt_getNextMatchAndUpdateSeqStore(optLdm, currPosInBlock, remainingBytes);
|
898
|
+
}
|
899
|
+
ZSTD_optLdm_maybeAddMatch(matches, nbMatches, optLdm, currPosInBlock);
|
900
|
+
}
|
901
|
+
|
902
|
+
/*-*******************************
|
903
|
+
* Optimal parser
|
904
|
+
*********************************/
|
905
|
+
|
827
906
|
|
828
907
|
static U32 ZSTD_totalLen(ZSTD_optimal_t sol)
|
829
908
|
{
|
@@ -839,7 +918,7 @@ listStats(const U32* table, int lastEltID)
|
|
839
918
|
int enb;
|
840
919
|
for (enb=0; enb < nbElts; enb++) {
|
841
920
|
(void)table;
|
842
|
-
|
921
|
+
/* RAWLOG(2, "%3i:%3i, ", enb, table[enb]); */
|
843
922
|
RAWLOG(2, "%4i,", table[enb]);
|
844
923
|
}
|
845
924
|
RAWLOG(2, " \n");
|
@@ -872,6 +951,11 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
872
951
|
ZSTD_optimal_t* const opt = optStatePtr->priceTable;
|
873
952
|
ZSTD_match_t* const matches = optStatePtr->matchTable;
|
874
953
|
ZSTD_optimal_t lastSequence;
|
954
|
+
ZSTD_optLdm_t optLdm;
|
955
|
+
|
956
|
+
optLdm.seqStore = ms->ldmSeqStore ? *ms->ldmSeqStore : kNullRawSeqStore;
|
957
|
+
optLdm.endPosInBlock = optLdm.startPosInBlock = optLdm.offset = 0;
|
958
|
+
ZSTD_opt_getNextMatchAndUpdateSeqStore(&optLdm, (U32)(ip-istart), (U32)(iend-ip));
|
875
959
|
|
876
960
|
/* init */
|
877
961
|
DEBUGLOG(5, "ZSTD_compressBlock_opt_generic: current=%u, prefix=%u, nextToUpdate=%u",
|
@@ -887,14 +971,21 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
887
971
|
/* find first match */
|
888
972
|
{ U32 const litlen = (U32)(ip - anchor);
|
889
973
|
U32 const ll0 = !litlen;
|
890
|
-
U32
|
974
|
+
U32 nbMatches = ZSTD_BtGetAllMatches(matches, ms, &nextToUpdate3, ip, iend, dictMode, rep, ll0, minMatch);
|
975
|
+
ZSTD_optLdm_processMatchCandidate(&optLdm, matches, &nbMatches,
|
976
|
+
(U32)(ip-istart), (U32)(iend - ip));
|
891
977
|
if (!nbMatches) { ip++; continue; }
|
892
978
|
|
893
979
|
/* initialize opt[0] */
|
894
980
|
{ U32 i ; for (i=0; i<ZSTD_REP_NUM; i++) opt[0].rep[i] = rep[i]; }
|
895
981
|
opt[0].mlen = 0; /* means is_a_literal */
|
896
982
|
opt[0].litlen = litlen;
|
897
|
-
|
983
|
+
/* We don't need to include the actual price of the literals because
|
984
|
+
* it is static for the duration of the forward pass, and is included
|
985
|
+
* in every price. We include the literal length to avoid negative
|
986
|
+
* prices when we subtract the previous literal length.
|
987
|
+
*/
|
988
|
+
opt[0].price = ZSTD_litLengthPrice(litlen, optStatePtr, optLevel);
|
898
989
|
|
899
990
|
/* large match -> immediate encoding */
|
900
991
|
{ U32 const maxML = matches[nbMatches-1].len;
|
@@ -923,7 +1014,6 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
923
1014
|
for (matchNb = 0; matchNb < nbMatches; matchNb++) {
|
924
1015
|
U32 const offset = matches[matchNb].off;
|
925
1016
|
U32 const end = matches[matchNb].len;
|
926
|
-
repcodes_t const repHistory = ZSTD_updateRep(rep, offset, ll0);
|
927
1017
|
for ( ; pos <= end ; pos++ ) {
|
928
1018
|
U32 const matchPrice = ZSTD_getMatchPrice(offset, pos, optStatePtr, optLevel);
|
929
1019
|
U32 const sequencePrice = literalsPrice + matchPrice;
|
@@ -933,8 +1023,6 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
933
1023
|
opt[pos].off = offset;
|
934
1024
|
opt[pos].litlen = litlen;
|
935
1025
|
opt[pos].price = sequencePrice;
|
936
|
-
ZSTD_STATIC_ASSERT(sizeof(opt[pos].rep) == sizeof(repHistory));
|
937
|
-
memcpy(opt[pos].rep, &repHistory, sizeof(repHistory));
|
938
1026
|
} }
|
939
1027
|
last_pos = pos-1;
|
940
1028
|
}
|
@@ -961,7 +1049,6 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
961
1049
|
opt[cur].off = 0;
|
962
1050
|
opt[cur].litlen = litlen;
|
963
1051
|
opt[cur].price = price;
|
964
|
-
memcpy(opt[cur].rep, opt[cur-1].rep, sizeof(opt[cur].rep));
|
965
1052
|
} else {
|
966
1053
|
DEBUGLOG(7, "cPos:%zi==rPos:%u : literal would cost more (%.2f>%.2f) (hist:%u,%u,%u)",
|
967
1054
|
inr-istart, cur, ZSTD_fCost(price), ZSTD_fCost(opt[cur].price),
|
@@ -969,6 +1056,21 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
969
1056
|
}
|
970
1057
|
}
|
971
1058
|
|
1059
|
+
/* Set the repcodes of the current position. We must do it here
|
1060
|
+
* because we rely on the repcodes of the 2nd to last sequence being
|
1061
|
+
* correct to set the next chunks repcodes during the backward
|
1062
|
+
* traversal.
|
1063
|
+
*/
|
1064
|
+
ZSTD_STATIC_ASSERT(sizeof(opt[cur].rep) == sizeof(repcodes_t));
|
1065
|
+
assert(cur >= opt[cur].mlen);
|
1066
|
+
if (opt[cur].mlen != 0) {
|
1067
|
+
U32 const prev = cur - opt[cur].mlen;
|
1068
|
+
repcodes_t newReps = ZSTD_updateRep(opt[prev].rep, opt[cur].off, opt[cur].litlen==0);
|
1069
|
+
ZSTD_memcpy(opt[cur].rep, &newReps, sizeof(repcodes_t));
|
1070
|
+
} else {
|
1071
|
+
ZSTD_memcpy(opt[cur].rep, opt[cur - 1].rep, sizeof(repcodes_t));
|
1072
|
+
}
|
1073
|
+
|
972
1074
|
/* last match must start at a minimum distance of 8 from oend */
|
973
1075
|
if (inr > ilimit) continue;
|
974
1076
|
|
@@ -984,8 +1086,12 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
984
1086
|
U32 const litlen = (opt[cur].mlen == 0) ? opt[cur].litlen : 0;
|
985
1087
|
U32 const previousPrice = opt[cur].price;
|
986
1088
|
U32 const basePrice = previousPrice + ZSTD_litLengthPrice(0, optStatePtr, optLevel);
|
987
|
-
U32
|
1089
|
+
U32 nbMatches = ZSTD_BtGetAllMatches(matches, ms, &nextToUpdate3, inr, iend, dictMode, opt[cur].rep, ll0, minMatch);
|
988
1090
|
U32 matchNb;
|
1091
|
+
|
1092
|
+
ZSTD_optLdm_processMatchCandidate(&optLdm, matches, &nbMatches,
|
1093
|
+
(U32)(inr-istart), (U32)(iend-inr));
|
1094
|
+
|
989
1095
|
if (!nbMatches) {
|
990
1096
|
DEBUGLOG(7, "rPos:%u : no match found", cur);
|
991
1097
|
continue;
|
@@ -1009,7 +1115,6 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
1009
1115
|
/* set prices using matches found at position == cur */
|
1010
1116
|
for (matchNb = 0; matchNb < nbMatches; matchNb++) {
|
1011
1117
|
U32 const offset = matches[matchNb].off;
|
1012
|
-
repcodes_t const repHistory = ZSTD_updateRep(opt[cur].rep, offset, ll0);
|
1013
1118
|
U32 const lastML = matches[matchNb].len;
|
1014
1119
|
U32 const startML = (matchNb>0) ? matches[matchNb-1].len+1 : minMatch;
|
1015
1120
|
U32 mlen;
|
@@ -1029,8 +1134,6 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
1029
1134
|
opt[pos].off = offset;
|
1030
1135
|
opt[pos].litlen = litlen;
|
1031
1136
|
opt[pos].price = price;
|
1032
|
-
ZSTD_STATIC_ASSERT(sizeof(opt[pos].rep) == sizeof(repHistory));
|
1033
|
-
memcpy(opt[pos].rep, &repHistory, sizeof(repHistory));
|
1034
1137
|
} else {
|
1035
1138
|
DEBUGLOG(7, "rPos:%u (ml=%2u) => new price is worse (%.2f>=%.2f)",
|
1036
1139
|
pos, mlen, ZSTD_fCost(price), ZSTD_fCost(opt[pos].price));
|
@@ -1046,6 +1149,17 @@ ZSTD_compressBlock_opt_generic(ZSTD_matchState_t* ms,
|
|
1046
1149
|
_shortestPath: /* cur, last_pos, best_mlen, best_off have to be set */
|
1047
1150
|
assert(opt[0].mlen == 0);
|
1048
1151
|
|
1152
|
+
/* Set the next chunk's repcodes based on the repcodes of the beginning
|
1153
|
+
* of the last match, and the last sequence. This avoids us having to
|
1154
|
+
* update them while traversing the sequences.
|
1155
|
+
*/
|
1156
|
+
if (lastSequence.mlen != 0) {
|
1157
|
+
repcodes_t reps = ZSTD_updateRep(opt[cur].rep, lastSequence.off, lastSequence.litlen==0);
|
1158
|
+
ZSTD_memcpy(rep, &reps, sizeof(reps));
|
1159
|
+
} else {
|
1160
|
+
ZSTD_memcpy(rep, opt[cur].rep, sizeof(repcodes_t));
|
1161
|
+
}
|
1162
|
+
|
1049
1163
|
{ U32 const storeEnd = cur + 1;
|
1050
1164
|
U32 storeStart = storeEnd;
|
1051
1165
|
U32 seqPos = cur;
|
@@ -1082,29 +1196,14 @@ _shortestPath: /* cur, last_pos, best_mlen, best_off have to be set */
|
|
1082
1196
|
continue; /* will finish */
|
1083
1197
|
}
|
1084
1198
|
|
1085
|
-
/* repcodes update : like ZSTD_updateRep(), but update in place */
|
1086
|
-
if (offCode >= ZSTD_REP_NUM) { /* full offset */
|
1087
|
-
rep[2] = rep[1];
|
1088
|
-
rep[1] = rep[0];
|
1089
|
-
rep[0] = offCode - ZSTD_REP_MOVE;
|
1090
|
-
} else { /* repcode */
|
1091
|
-
U32 const repCode = offCode + (llen==0);
|
1092
|
-
if (repCode) { /* note : if repCode==0, no change */
|
1093
|
-
U32 const currentOffset = (repCode==ZSTD_REP_NUM) ? (rep[0] - 1) : rep[repCode];
|
1094
|
-
if (repCode >= 2) rep[2] = rep[1];
|
1095
|
-
rep[1] = rep[0];
|
1096
|
-
rep[0] = currentOffset;
|
1097
|
-
} }
|
1098
|
-
|
1099
1199
|
assert(anchor + llen <= iend);
|
1100
1200
|
ZSTD_updateStats(optStatePtr, llen, anchor, offCode, mlen);
|
1101
|
-
ZSTD_storeSeq(seqStore, llen, anchor, offCode, mlen-MINMATCH);
|
1201
|
+
ZSTD_storeSeq(seqStore, llen, anchor, iend, offCode, mlen-MINMATCH);
|
1102
1202
|
anchor += advance;
|
1103
1203
|
ip = anchor;
|
1104
1204
|
} }
|
1105
1205
|
ZSTD_setBasePrices(optStatePtr, optLevel);
|
1106
1206
|
}
|
1107
|
-
|
1108
1207
|
} /* while (ip < ilimit) */
|
1109
1208
|
|
1110
1209
|
/* Return the last literals size */
|
@@ -1156,7 +1255,7 @@ ZSTD_initStats_ultra(ZSTD_matchState_t* ms,
|
|
1156
1255
|
const void* src, size_t srcSize)
|
1157
1256
|
{
|
1158
1257
|
U32 tmpRep[ZSTD_REP_NUM]; /* updated rep codes will sink here */
|
1159
|
-
|
1258
|
+
ZSTD_memcpy(tmpRep, rep, sizeof(tmpRep));
|
1160
1259
|
|
1161
1260
|
DEBUGLOG(4, "ZSTD_initStats_ultra (srcSize=%zu)", srcSize);
|
1162
1261
|
assert(ms->opt.litLengthSum == 0); /* first block */
|
@@ -1189,7 +1288,7 @@ size_t ZSTD_compressBlock_btultra2(
|
|
1189
1288
|
ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM],
|
1190
1289
|
const void* src, size_t srcSize)
|
1191
1290
|
{
|
1192
|
-
U32 const
|
1291
|
+
U32 const curr = (U32)((const BYTE*)src - ms->window.base);
|
1193
1292
|
DEBUGLOG(5, "ZSTD_compressBlock_btultra2 (srcSize=%zu)", srcSize);
|
1194
1293
|
|
1195
1294
|
/* 2-pass strategy:
|
@@ -1204,7 +1303,7 @@ size_t ZSTD_compressBlock_btultra2(
|
|
1204
1303
|
if ( (ms->opt.litLengthSum==0) /* first block */
|
1205
1304
|
&& (seqStore->sequences == seqStore->sequencesStart) /* no ldm */
|
1206
1305
|
&& (ms->window.dictLimit == ms->window.lowLimit) /* no dictionary */
|
1207
|
-
&& (
|
1306
|
+
&& (curr == ms->window.dictLimit) /* start of frame, nothing already loaded nor skipped */
|
1208
1307
|
&& (srcSize > ZSTD_PREDEF_THRESHOLD)
|
1209
1308
|
) {
|
1210
1309
|
ZSTD_initStats_ultra(ms, seqStore, rep, src, srcSize);
|