zstdlib 0.7.0-x64-mingw32 → 0.8.0-x64-mingw32
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/CHANGES.md +5 -0
- data/ext/zstdlib/extconf.rb +1 -1
- data/ext/zstdlib/ruby/zlib-3.0/zstdlib.c +4994 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/bitstream.h +25 -16
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/compiler.h +118 -4
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/cpu.h +1 -3
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/debug.c +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/debug.h +12 -19
- data/ext/zstdlib/zstd-1.5.0/lib/common/entropy_common.c +362 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/error_private.c +2 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/error_private.h +3 -3
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/fse.h +40 -12
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/fse_decompress.c +139 -22
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/huf.h +29 -7
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/mem.h +69 -98
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/pool.c +23 -17
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/pool.h +2 -2
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/threading.c +6 -5
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/threading.h +0 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/xxhash.c +20 -60
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/xxhash.h +2 -2
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/zstd_common.c +10 -10
- data/ext/zstdlib/zstd-1.5.0/lib/common/zstd_deps.h +111 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/common/zstd_internal.h +105 -62
- data/ext/zstdlib/zstd-1.5.0/lib/common/zstd_trace.h +154 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/fse_compress.c +31 -24
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/hist.c +27 -29
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/hist.h +2 -2
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/huf_compress.c +265 -126
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress.c +2843 -728
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_internal.h +305 -63
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_literals.c +8 -8
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_literals.h +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_sequences.c +29 -7
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_sequences.h +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_superblock.c +22 -295
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_compress_superblock.h +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_cwksp.h +204 -67
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_double_fast.c +25 -25
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_double_fast.h +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_fast.c +23 -23
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_fast.h +1 -1
- data/ext/zstdlib/zstd-1.5.0/lib/compress/zstd_lazy.c +2184 -0
- data/ext/zstdlib/zstd-1.5.0/lib/compress/zstd_lazy.h +125 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_ldm.c +314 -211
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_ldm.h +9 -2
- data/ext/zstdlib/zstd-1.5.0/lib/compress/zstd_ldm_geartab.h +103 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_opt.c +191 -46
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstd_opt.h +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/compress/zstdmt_compress.c +93 -415
- data/ext/zstdlib/zstd-1.5.0/lib/compress/zstdmt_compress.h +110 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/huf_decompress.c +342 -239
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/zstd_ddict.c +9 -9
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/zstd_ddict.h +2 -2
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/zstd_decompress.c +369 -87
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/zstd_decompress_block.c +191 -75
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/zstd_decompress_block.h +6 -3
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/decompress/zstd_decompress_internal.h +27 -11
- data/ext/zstdlib/zstd-1.5.0/lib/zdict.h +452 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/lib/zstd.h +568 -126
- data/ext/zstdlib/{zstd-1.4.5/lib/common → zstd-1.5.0/lib}/zstd_errors.h +2 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/gzclose.c +0 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/gzcompatibility.h +1 -1
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/gzguts.h +0 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/gzlib.c +0 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/gzread.c +0 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/gzwrite.c +0 -0
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/zstd_zlibwrapper.c +126 -44
- data/ext/zstdlib/{zstd-1.4.5 → zstd-1.5.0}/zlibWrapper/zstd_zlibwrapper.h +1 -1
- data/lib/2.2/zstdlib.so +0 -0
- data/lib/2.3/zstdlib.so +0 -0
- data/lib/2.4/zstdlib.so +0 -0
- data/lib/2.5/zstdlib.so +0 -0
- data/lib/2.6/zstdlib.so +0 -0
- data/lib/2.7/zstdlib.so +0 -0
- metadata +69 -64
- data/ext/zstdlib/zstd-1.4.5/lib/common/entropy_common.c +0 -216
- data/ext/zstdlib/zstd-1.4.5/lib/compress/zstd_lazy.c +0 -1138
- data/ext/zstdlib/zstd-1.4.5/lib/compress/zstd_lazy.h +0 -67
- data/ext/zstdlib/zstd-1.4.5/lib/compress/zstdmt_compress.h +0 -192
@@ -1,5 +1,5 @@
|
|
1
1
|
/*
|
2
|
-
* Copyright (c)
|
2
|
+
* Copyright (c) Yann Collet, Facebook, Inc.
|
3
3
|
* All rights reserved.
|
4
4
|
*
|
5
5
|
* This source code is licensed under both the BSD-style license (found in the
|
@@ -20,8 +20,7 @@
|
|
20
20
|
|
21
21
|
|
22
22
|
/* ====== Dependencies ====== */
|
23
|
-
#include
|
24
|
-
#include <limits.h> /* INT_MAX, UINT_MAX */
|
23
|
+
#include "../common/zstd_deps.h" /* ZSTD_memcpy, ZSTD_memset, INT_MAX, UINT_MAX */
|
25
24
|
#include "../common/mem.h" /* MEM_STATIC */
|
26
25
|
#include "../common/pool.h" /* threadpool */
|
27
26
|
#include "../common/threading.h" /* mutex */
|
@@ -106,11 +105,11 @@ typedef struct ZSTDMT_bufferPool_s {
|
|
106
105
|
static ZSTDMT_bufferPool* ZSTDMT_createBufferPool(unsigned nbWorkers, ZSTD_customMem cMem)
|
107
106
|
{
|
108
107
|
unsigned const maxNbBuffers = 2*nbWorkers + 3;
|
109
|
-
ZSTDMT_bufferPool* const bufPool = (ZSTDMT_bufferPool*)
|
108
|
+
ZSTDMT_bufferPool* const bufPool = (ZSTDMT_bufferPool*)ZSTD_customCalloc(
|
110
109
|
sizeof(ZSTDMT_bufferPool) + (maxNbBuffers-1) * sizeof(buffer_t), cMem);
|
111
110
|
if (bufPool==NULL) return NULL;
|
112
111
|
if (ZSTD_pthread_mutex_init(&bufPool->poolMutex, NULL)) {
|
113
|
-
|
112
|
+
ZSTD_customFree(bufPool, cMem);
|
114
113
|
return NULL;
|
115
114
|
}
|
116
115
|
bufPool->bufferSize = 64 KB;
|
@@ -127,10 +126,10 @@ static void ZSTDMT_freeBufferPool(ZSTDMT_bufferPool* bufPool)
|
|
127
126
|
if (!bufPool) return; /* compatibility with free on NULL */
|
128
127
|
for (u=0; u<bufPool->totalBuffers; u++) {
|
129
128
|
DEBUGLOG(4, "free buffer %2u (address:%08X)", u, (U32)(size_t)bufPool->bTable[u].start);
|
130
|
-
|
129
|
+
ZSTD_customFree(bufPool->bTable[u].start, bufPool->cMem);
|
131
130
|
}
|
132
131
|
ZSTD_pthread_mutex_destroy(&bufPool->poolMutex);
|
133
|
-
|
132
|
+
ZSTD_customFree(bufPool, bufPool->cMem);
|
134
133
|
}
|
135
134
|
|
136
135
|
/* only works at initialization, not during compression */
|
@@ -201,13 +200,13 @@ static buffer_t ZSTDMT_getBuffer(ZSTDMT_bufferPool* bufPool)
|
|
201
200
|
}
|
202
201
|
/* size conditions not respected : scratch this buffer, create new one */
|
203
202
|
DEBUGLOG(5, "ZSTDMT_getBuffer: existing buffer does not meet size conditions => freeing");
|
204
|
-
|
203
|
+
ZSTD_customFree(buf.start, bufPool->cMem);
|
205
204
|
}
|
206
205
|
ZSTD_pthread_mutex_unlock(&bufPool->poolMutex);
|
207
206
|
/* create new buffer */
|
208
207
|
DEBUGLOG(5, "ZSTDMT_getBuffer: create a new buffer");
|
209
208
|
{ buffer_t buffer;
|
210
|
-
void* const start =
|
209
|
+
void* const start = ZSTD_customMalloc(bSize, bufPool->cMem);
|
211
210
|
buffer.start = start; /* note : start can be NULL if malloc fails ! */
|
212
211
|
buffer.capacity = (start==NULL) ? 0 : bSize;
|
213
212
|
if (start==NULL) {
|
@@ -229,13 +228,13 @@ static buffer_t ZSTDMT_resizeBuffer(ZSTDMT_bufferPool* bufPool, buffer_t buffer)
|
|
229
228
|
{
|
230
229
|
size_t const bSize = bufPool->bufferSize;
|
231
230
|
if (buffer.capacity < bSize) {
|
232
|
-
void* const start =
|
231
|
+
void* const start = ZSTD_customMalloc(bSize, bufPool->cMem);
|
233
232
|
buffer_t newBuffer;
|
234
233
|
newBuffer.start = start;
|
235
234
|
newBuffer.capacity = start == NULL ? 0 : bSize;
|
236
235
|
if (start != NULL) {
|
237
236
|
assert(newBuffer.capacity >= buffer.capacity);
|
238
|
-
|
237
|
+
ZSTD_memcpy(newBuffer.start, buffer.start, buffer.capacity);
|
239
238
|
DEBUGLOG(5, "ZSTDMT_resizeBuffer: created buffer of size %u", (U32)bSize);
|
240
239
|
return newBuffer;
|
241
240
|
}
|
@@ -261,14 +260,12 @@ static void ZSTDMT_releaseBuffer(ZSTDMT_bufferPool* bufPool, buffer_t buf)
|
|
261
260
|
ZSTD_pthread_mutex_unlock(&bufPool->poolMutex);
|
262
261
|
/* Reached bufferPool capacity (should not happen) */
|
263
262
|
DEBUGLOG(5, "ZSTDMT_releaseBuffer: pool capacity reached => freeing ");
|
264
|
-
|
263
|
+
ZSTD_customFree(buf.start, bufPool->cMem);
|
265
264
|
}
|
266
265
|
|
267
266
|
|
268
267
|
/* ===== Seq Pool Wrapper ====== */
|
269
268
|
|
270
|
-
static rawSeqStore_t kNullRawSeqStore = {NULL, 0, 0, 0};
|
271
|
-
|
272
269
|
typedef ZSTDMT_bufferPool ZSTDMT_seqPool;
|
273
270
|
|
274
271
|
static size_t ZSTDMT_sizeof_seqPool(ZSTDMT_seqPool* seqPool)
|
@@ -278,7 +275,7 @@ static size_t ZSTDMT_sizeof_seqPool(ZSTDMT_seqPool* seqPool)
|
|
278
275
|
|
279
276
|
static rawSeqStore_t bufferToSeq(buffer_t buffer)
|
280
277
|
{
|
281
|
-
rawSeqStore_t seq =
|
278
|
+
rawSeqStore_t seq = kNullRawSeqStore;
|
282
279
|
seq.seq = (rawSeq*)buffer.start;
|
283
280
|
seq.capacity = buffer.capacity / sizeof(rawSeq);
|
284
281
|
return seq;
|
@@ -354,7 +351,7 @@ static void ZSTDMT_freeCCtxPool(ZSTDMT_CCtxPool* pool)
|
|
354
351
|
for (cid=0; cid<pool->totalCCtx; cid++)
|
355
352
|
ZSTD_freeCCtx(pool->cctx[cid]); /* note : compatible with free on NULL */
|
356
353
|
ZSTD_pthread_mutex_destroy(&pool->poolMutex);
|
357
|
-
|
354
|
+
ZSTD_customFree(pool, pool->cMem);
|
358
355
|
}
|
359
356
|
|
360
357
|
/* ZSTDMT_createCCtxPool() :
|
@@ -362,12 +359,12 @@ static void ZSTDMT_freeCCtxPool(ZSTDMT_CCtxPool* pool)
|
|
362
359
|
static ZSTDMT_CCtxPool* ZSTDMT_createCCtxPool(int nbWorkers,
|
363
360
|
ZSTD_customMem cMem)
|
364
361
|
{
|
365
|
-
ZSTDMT_CCtxPool* const cctxPool = (ZSTDMT_CCtxPool*)
|
362
|
+
ZSTDMT_CCtxPool* const cctxPool = (ZSTDMT_CCtxPool*) ZSTD_customCalloc(
|
366
363
|
sizeof(ZSTDMT_CCtxPool) + (nbWorkers-1)*sizeof(ZSTD_CCtx*), cMem);
|
367
364
|
assert(nbWorkers > 0);
|
368
365
|
if (!cctxPool) return NULL;
|
369
366
|
if (ZSTD_pthread_mutex_init(&cctxPool->poolMutex, NULL)) {
|
370
|
-
|
367
|
+
ZSTD_customFree(cctxPool, cMem);
|
371
368
|
return NULL;
|
372
369
|
}
|
373
370
|
cctxPool->cMem = cMem;
|
@@ -475,10 +472,8 @@ ZSTDMT_serialState_reset(serialState_t* serialState,
|
|
475
472
|
ZSTD_ldm_adjustParameters(&params.ldmParams, &params.cParams);
|
476
473
|
assert(params.ldmParams.hashLog >= params.ldmParams.bucketSizeLog);
|
477
474
|
assert(params.ldmParams.hashRateLog < 32);
|
478
|
-
serialState->ldmState.hashPower =
|
479
|
-
ZSTD_rollingHash_primePower(params.ldmParams.minMatchLength);
|
480
475
|
} else {
|
481
|
-
|
476
|
+
ZSTD_memset(&params.ldmParams, 0, sizeof(params.ldmParams));
|
482
477
|
}
|
483
478
|
serialState->nextJobID = 0;
|
484
479
|
if (params.fParams.checksumFlag)
|
@@ -489,35 +484,35 @@ ZSTDMT_serialState_reset(serialState_t* serialState,
|
|
489
484
|
size_t const hashSize = ((size_t)1 << hashLog) * sizeof(ldmEntry_t);
|
490
485
|
unsigned const bucketLog =
|
491
486
|
params.ldmParams.hashLog - params.ldmParams.bucketSizeLog;
|
492
|
-
size_t const bucketSize = (size_t)1 << bucketLog;
|
493
487
|
unsigned const prevBucketLog =
|
494
488
|
serialState->params.ldmParams.hashLog -
|
495
489
|
serialState->params.ldmParams.bucketSizeLog;
|
490
|
+
size_t const numBuckets = (size_t)1 << bucketLog;
|
496
491
|
/* Size the seq pool tables */
|
497
492
|
ZSTDMT_setNbSeq(seqPool, ZSTD_ldm_getMaxNbSeq(params.ldmParams, jobSize));
|
498
493
|
/* Reset the window */
|
499
494
|
ZSTD_window_init(&serialState->ldmState.window);
|
500
495
|
/* Resize tables and output space if necessary. */
|
501
496
|
if (serialState->ldmState.hashTable == NULL || serialState->params.ldmParams.hashLog < hashLog) {
|
502
|
-
|
503
|
-
serialState->ldmState.hashTable = (ldmEntry_t*)
|
497
|
+
ZSTD_customFree(serialState->ldmState.hashTable, cMem);
|
498
|
+
serialState->ldmState.hashTable = (ldmEntry_t*)ZSTD_customMalloc(hashSize, cMem);
|
504
499
|
}
|
505
500
|
if (serialState->ldmState.bucketOffsets == NULL || prevBucketLog < bucketLog) {
|
506
|
-
|
507
|
-
serialState->ldmState.bucketOffsets = (BYTE*)
|
501
|
+
ZSTD_customFree(serialState->ldmState.bucketOffsets, cMem);
|
502
|
+
serialState->ldmState.bucketOffsets = (BYTE*)ZSTD_customMalloc(numBuckets, cMem);
|
508
503
|
}
|
509
504
|
if (!serialState->ldmState.hashTable || !serialState->ldmState.bucketOffsets)
|
510
505
|
return 1;
|
511
506
|
/* Zero the tables */
|
512
|
-
|
513
|
-
|
507
|
+
ZSTD_memset(serialState->ldmState.hashTable, 0, hashSize);
|
508
|
+
ZSTD_memset(serialState->ldmState.bucketOffsets, 0, numBuckets);
|
514
509
|
|
515
510
|
/* Update window state and fill hash table with dict */
|
516
511
|
serialState->ldmState.loadedDictEnd = 0;
|
517
512
|
if (dictSize > 0) {
|
518
513
|
if (dictContentType == ZSTD_dct_rawContent) {
|
519
514
|
BYTE const* const dictEnd = (const BYTE*)dict + dictSize;
|
520
|
-
ZSTD_window_update(&serialState->ldmState.window, dict, dictSize);
|
515
|
+
ZSTD_window_update(&serialState->ldmState.window, dict, dictSize, /* forceNonContiguous */ 0);
|
521
516
|
ZSTD_ldm_fillHashTable(&serialState->ldmState, (const BYTE*)dict, dictEnd, &params.ldmParams);
|
522
517
|
serialState->ldmState.loadedDictEnd = params.forceWindow ? 0 : (U32)(dictEnd - serialState->ldmState.window.base);
|
523
518
|
} else {
|
@@ -537,7 +532,7 @@ ZSTDMT_serialState_reset(serialState_t* serialState,
|
|
537
532
|
static int ZSTDMT_serialState_init(serialState_t* serialState)
|
538
533
|
{
|
539
534
|
int initError = 0;
|
540
|
-
|
535
|
+
ZSTD_memset(serialState, 0, sizeof(*serialState));
|
541
536
|
initError |= ZSTD_pthread_mutex_init(&serialState->mutex, NULL);
|
542
537
|
initError |= ZSTD_pthread_cond_init(&serialState->cond, NULL);
|
543
538
|
initError |= ZSTD_pthread_mutex_init(&serialState->ldmWindowMutex, NULL);
|
@@ -552,8 +547,8 @@ static void ZSTDMT_serialState_free(serialState_t* serialState)
|
|
552
547
|
ZSTD_pthread_cond_destroy(&serialState->cond);
|
553
548
|
ZSTD_pthread_mutex_destroy(&serialState->ldmWindowMutex);
|
554
549
|
ZSTD_pthread_cond_destroy(&serialState->ldmWindowCond);
|
555
|
-
|
556
|
-
|
550
|
+
ZSTD_customFree(serialState->ldmState.hashTable, cMem);
|
551
|
+
ZSTD_customFree(serialState->ldmState.bucketOffsets, cMem);
|
557
552
|
}
|
558
553
|
|
559
554
|
static void ZSTDMT_serialState_update(serialState_t* serialState,
|
@@ -574,7 +569,7 @@ static void ZSTDMT_serialState_update(serialState_t* serialState,
|
|
574
569
|
assert(seqStore.seq != NULL && seqStore.pos == 0 &&
|
575
570
|
seqStore.size == 0 && seqStore.capacity > 0);
|
576
571
|
assert(src.size <= serialState->params.jobSize);
|
577
|
-
ZSTD_window_update(&serialState->ldmState.window, src.start, src.size);
|
572
|
+
ZSTD_window_update(&serialState->ldmState.window, src.start, src.size, /* forceNonContiguous */ 0);
|
578
573
|
error = ZSTD_ldm_generateSequences(
|
579
574
|
&serialState->ldmState, &seqStore,
|
580
575
|
&serialState->params.ldmParams, src.start, src.size);
|
@@ -686,6 +681,8 @@ static void ZSTDMT_compressionJob(void* jobDescription)
|
|
686
681
|
if (job->jobID != 0) jobParams.fParams.checksumFlag = 0;
|
687
682
|
/* Don't run LDM for the chunks, since we handle it externally */
|
688
683
|
jobParams.ldmParams.enableLdm = 0;
|
684
|
+
/* Correct nbWorkers to 0. */
|
685
|
+
jobParams.nbWorkers = 0;
|
689
686
|
|
690
687
|
|
691
688
|
/* init */
|
@@ -698,6 +695,10 @@ static void ZSTDMT_compressionJob(void* jobDescription)
|
|
698
695
|
{ size_t const forceWindowError = ZSTD_CCtxParams_setParameter(&jobParams, ZSTD_c_forceMaxWindow, !job->firstJob);
|
699
696
|
if (ZSTD_isError(forceWindowError)) JOB_ERROR(forceWindowError);
|
700
697
|
}
|
698
|
+
if (!job->firstJob) {
|
699
|
+
size_t const err = ZSTD_CCtxParams_setParameter(&jobParams, ZSTD_c_deterministicRefPrefix, 0);
|
700
|
+
if (ZSTD_isError(err)) JOB_ERROR(err);
|
701
|
+
}
|
701
702
|
{ size_t const initError = ZSTD_compressBegin_advanced_internal(cctx,
|
702
703
|
job->prefix.start, job->prefix.size, ZSTD_dct_rawContent, /* load dictionary in "content-only" mode (no header analysis) */
|
703
704
|
ZSTD_dtlm_fast,
|
@@ -753,6 +754,13 @@ static void ZSTDMT_compressionJob(void* jobDescription)
|
|
753
754
|
if (ZSTD_isError(cSize)) JOB_ERROR(cSize);
|
754
755
|
lastCBlockSize = cSize;
|
755
756
|
} }
|
757
|
+
if (!job->firstJob) {
|
758
|
+
/* Double check that we don't have an ext-dict, because then our
|
759
|
+
* repcode invalidation doesn't work.
|
760
|
+
*/
|
761
|
+
assert(!ZSTD_window_hasExtDict(cctx->blockState.matchState.window));
|
762
|
+
}
|
763
|
+
ZSTD_CCtx_trace(cctx, 0);
|
756
764
|
|
757
765
|
_endJob:
|
758
766
|
ZSTDMT_serialState_ensureFinished(job->serial, job->jobID, job->cSize);
|
@@ -820,7 +828,6 @@ struct ZSTDMT_CCtx_s {
|
|
820
828
|
roundBuff_t roundBuff;
|
821
829
|
serialState_t serial;
|
822
830
|
rsyncState_t rsync;
|
823
|
-
unsigned singleBlockingThread;
|
824
831
|
unsigned jobIDMask;
|
825
832
|
unsigned doneJobID;
|
826
833
|
unsigned nextJobID;
|
@@ -832,6 +839,7 @@ struct ZSTDMT_CCtx_s {
|
|
832
839
|
ZSTD_customMem cMem;
|
833
840
|
ZSTD_CDict* cdictLocal;
|
834
841
|
const ZSTD_CDict* cdict;
|
842
|
+
unsigned providedFactory: 1;
|
835
843
|
};
|
836
844
|
|
837
845
|
static void ZSTDMT_freeJobsTable(ZSTDMT_jobDescription* jobTable, U32 nbJobs, ZSTD_customMem cMem)
|
@@ -842,7 +850,7 @@ static void ZSTDMT_freeJobsTable(ZSTDMT_jobDescription* jobTable, U32 nbJobs, ZS
|
|
842
850
|
ZSTD_pthread_mutex_destroy(&jobTable[jobNb].job_mutex);
|
843
851
|
ZSTD_pthread_cond_destroy(&jobTable[jobNb].job_cond);
|
844
852
|
}
|
845
|
-
|
853
|
+
ZSTD_customFree(jobTable, cMem);
|
846
854
|
}
|
847
855
|
|
848
856
|
/* ZSTDMT_allocJobsTable()
|
@@ -854,7 +862,7 @@ static ZSTDMT_jobDescription* ZSTDMT_createJobsTable(U32* nbJobsPtr, ZSTD_custom
|
|
854
862
|
U32 const nbJobs = 1 << nbJobsLog2;
|
855
863
|
U32 jobNb;
|
856
864
|
ZSTDMT_jobDescription* const jobTable = (ZSTDMT_jobDescription*)
|
857
|
-
|
865
|
+
ZSTD_customCalloc(nbJobs * sizeof(ZSTDMT_jobDescription), cMem);
|
858
866
|
int initError = 0;
|
859
867
|
if (jobTable==NULL) return NULL;
|
860
868
|
*nbJobsPtr = nbJobs;
|
@@ -885,12 +893,12 @@ static size_t ZSTDMT_expandJobsTable (ZSTDMT_CCtx* mtctx, U32 nbWorkers) {
|
|
885
893
|
|
886
894
|
/* ZSTDMT_CCtxParam_setNbWorkers():
|
887
895
|
* Internal use only */
|
888
|
-
size_t ZSTDMT_CCtxParam_setNbWorkers(ZSTD_CCtx_params* params, unsigned nbWorkers)
|
896
|
+
static size_t ZSTDMT_CCtxParam_setNbWorkers(ZSTD_CCtx_params* params, unsigned nbWorkers)
|
889
897
|
{
|
890
898
|
return ZSTD_CCtxParams_setParameter(params, ZSTD_c_nbWorkers, (int)nbWorkers);
|
891
899
|
}
|
892
900
|
|
893
|
-
MEM_STATIC ZSTDMT_CCtx* ZSTDMT_createCCtx_advanced_internal(unsigned nbWorkers, ZSTD_customMem cMem)
|
901
|
+
MEM_STATIC ZSTDMT_CCtx* ZSTDMT_createCCtx_advanced_internal(unsigned nbWorkers, ZSTD_customMem cMem, ZSTD_threadPool* pool)
|
894
902
|
{
|
895
903
|
ZSTDMT_CCtx* mtctx;
|
896
904
|
U32 nbJobs = nbWorkers + 2;
|
@@ -903,12 +911,19 @@ MEM_STATIC ZSTDMT_CCtx* ZSTDMT_createCCtx_advanced_internal(unsigned nbWorkers,
|
|
903
911
|
/* invalid custom allocator */
|
904
912
|
return NULL;
|
905
913
|
|
906
|
-
mtctx = (ZSTDMT_CCtx*)
|
914
|
+
mtctx = (ZSTDMT_CCtx*) ZSTD_customCalloc(sizeof(ZSTDMT_CCtx), cMem);
|
907
915
|
if (!mtctx) return NULL;
|
908
916
|
ZSTDMT_CCtxParam_setNbWorkers(&mtctx->params, nbWorkers);
|
909
917
|
mtctx->cMem = cMem;
|
910
918
|
mtctx->allJobsCompleted = 1;
|
911
|
-
|
919
|
+
if (pool != NULL) {
|
920
|
+
mtctx->factory = pool;
|
921
|
+
mtctx->providedFactory = 1;
|
922
|
+
}
|
923
|
+
else {
|
924
|
+
mtctx->factory = POOL_create_advanced(nbWorkers, 0, cMem);
|
925
|
+
mtctx->providedFactory = 0;
|
926
|
+
}
|
912
927
|
mtctx->jobs = ZSTDMT_createJobsTable(&nbJobs, cMem);
|
913
928
|
assert(nbJobs > 0); assert((nbJobs & (nbJobs - 1)) == 0); /* ensure nbJobs is a power of 2 */
|
914
929
|
mtctx->jobIDMask = nbJobs - 1;
|
@@ -925,22 +940,18 @@ MEM_STATIC ZSTDMT_CCtx* ZSTDMT_createCCtx_advanced_internal(unsigned nbWorkers,
|
|
925
940
|
return mtctx;
|
926
941
|
}
|
927
942
|
|
928
|
-
ZSTDMT_CCtx* ZSTDMT_createCCtx_advanced(unsigned nbWorkers, ZSTD_customMem cMem)
|
943
|
+
ZSTDMT_CCtx* ZSTDMT_createCCtx_advanced(unsigned nbWorkers, ZSTD_customMem cMem, ZSTD_threadPool* pool)
|
929
944
|
{
|
930
945
|
#ifdef ZSTD_MULTITHREAD
|
931
|
-
return ZSTDMT_createCCtx_advanced_internal(nbWorkers, cMem);
|
946
|
+
return ZSTDMT_createCCtx_advanced_internal(nbWorkers, cMem, pool);
|
932
947
|
#else
|
933
948
|
(void)nbWorkers;
|
934
949
|
(void)cMem;
|
950
|
+
(void)pool;
|
935
951
|
return NULL;
|
936
952
|
#endif
|
937
953
|
}
|
938
954
|
|
939
|
-
ZSTDMT_CCtx* ZSTDMT_createCCtx(unsigned nbWorkers)
|
940
|
-
{
|
941
|
-
return ZSTDMT_createCCtx_advanced(nbWorkers, ZSTD_defaultCMem);
|
942
|
-
}
|
943
|
-
|
944
955
|
|
945
956
|
/* ZSTDMT_releaseAllJobResources() :
|
946
957
|
* note : ensure all workers are killed first ! */
|
@@ -957,7 +968,7 @@ static void ZSTDMT_releaseAllJobResources(ZSTDMT_CCtx* mtctx)
|
|
957
968
|
ZSTDMT_releaseBuffer(mtctx->bufPool, mtctx->jobs[jobID].dstBuff);
|
958
969
|
|
959
970
|
/* Clear the job description, but keep the mutex/cond */
|
960
|
-
|
971
|
+
ZSTD_memset(&mtctx->jobs[jobID], 0, sizeof(mtctx->jobs[jobID]));
|
961
972
|
mtctx->jobs[jobID].job_mutex = mutex;
|
962
973
|
mtctx->jobs[jobID].job_cond = cond;
|
963
974
|
}
|
@@ -984,7 +995,8 @@ static void ZSTDMT_waitForAllJobsCompleted(ZSTDMT_CCtx* mtctx)
|
|
984
995
|
size_t ZSTDMT_freeCCtx(ZSTDMT_CCtx* mtctx)
|
985
996
|
{
|
986
997
|
if (mtctx==NULL) return 0; /* compatible with free on NULL */
|
987
|
-
|
998
|
+
if (!mtctx->providedFactory)
|
999
|
+
POOL_free(mtctx->factory); /* stop and free worker threads */
|
988
1000
|
ZSTDMT_releaseAllJobResources(mtctx); /* release job resources into pools first */
|
989
1001
|
ZSTDMT_freeJobsTable(mtctx->jobs, mtctx->jobIDMask+1, mtctx->cMem);
|
990
1002
|
ZSTDMT_freeBufferPool(mtctx->bufPool);
|
@@ -993,8 +1005,8 @@ size_t ZSTDMT_freeCCtx(ZSTDMT_CCtx* mtctx)
|
|
993
1005
|
ZSTDMT_serialState_free(&mtctx->serial);
|
994
1006
|
ZSTD_freeCDict(mtctx->cdictLocal);
|
995
1007
|
if (mtctx->roundBuff.buffer)
|
996
|
-
|
997
|
-
|
1008
|
+
ZSTD_customFree(mtctx->roundBuff.buffer, mtctx->cMem);
|
1009
|
+
ZSTD_customFree(mtctx, mtctx->cMem);
|
998
1010
|
return 0;
|
999
1011
|
}
|
1000
1012
|
|
@@ -1011,65 +1023,6 @@ size_t ZSTDMT_sizeof_CCtx(ZSTDMT_CCtx* mtctx)
|
|
1011
1023
|
+ mtctx->roundBuff.capacity;
|
1012
1024
|
}
|
1013
1025
|
|
1014
|
-
/* Internal only */
|
1015
|
-
size_t
|
1016
|
-
ZSTDMT_CCtxParam_setMTCtxParameter(ZSTD_CCtx_params* params,
|
1017
|
-
ZSTDMT_parameter parameter,
|
1018
|
-
int value)
|
1019
|
-
{
|
1020
|
-
DEBUGLOG(4, "ZSTDMT_CCtxParam_setMTCtxParameter");
|
1021
|
-
switch(parameter)
|
1022
|
-
{
|
1023
|
-
case ZSTDMT_p_jobSize :
|
1024
|
-
DEBUGLOG(4, "ZSTDMT_CCtxParam_setMTCtxParameter : set jobSize to %i", value);
|
1025
|
-
return ZSTD_CCtxParams_setParameter(params, ZSTD_c_jobSize, value);
|
1026
|
-
case ZSTDMT_p_overlapLog :
|
1027
|
-
DEBUGLOG(4, "ZSTDMT_p_overlapLog : %i", value);
|
1028
|
-
return ZSTD_CCtxParams_setParameter(params, ZSTD_c_overlapLog, value);
|
1029
|
-
case ZSTDMT_p_rsyncable :
|
1030
|
-
DEBUGLOG(4, "ZSTD_p_rsyncable : %i", value);
|
1031
|
-
return ZSTD_CCtxParams_setParameter(params, ZSTD_c_rsyncable, value);
|
1032
|
-
default :
|
1033
|
-
return ERROR(parameter_unsupported);
|
1034
|
-
}
|
1035
|
-
}
|
1036
|
-
|
1037
|
-
size_t ZSTDMT_setMTCtxParameter(ZSTDMT_CCtx* mtctx, ZSTDMT_parameter parameter, int value)
|
1038
|
-
{
|
1039
|
-
DEBUGLOG(4, "ZSTDMT_setMTCtxParameter");
|
1040
|
-
return ZSTDMT_CCtxParam_setMTCtxParameter(&mtctx->params, parameter, value);
|
1041
|
-
}
|
1042
|
-
|
1043
|
-
size_t ZSTDMT_getMTCtxParameter(ZSTDMT_CCtx* mtctx, ZSTDMT_parameter parameter, int* value)
|
1044
|
-
{
|
1045
|
-
switch (parameter) {
|
1046
|
-
case ZSTDMT_p_jobSize:
|
1047
|
-
return ZSTD_CCtxParams_getParameter(&mtctx->params, ZSTD_c_jobSize, value);
|
1048
|
-
case ZSTDMT_p_overlapLog:
|
1049
|
-
return ZSTD_CCtxParams_getParameter(&mtctx->params, ZSTD_c_overlapLog, value);
|
1050
|
-
case ZSTDMT_p_rsyncable:
|
1051
|
-
return ZSTD_CCtxParams_getParameter(&mtctx->params, ZSTD_c_rsyncable, value);
|
1052
|
-
default:
|
1053
|
-
return ERROR(parameter_unsupported);
|
1054
|
-
}
|
1055
|
-
}
|
1056
|
-
|
1057
|
-
/* Sets parameters relevant to the compression job,
|
1058
|
-
* initializing others to default values. */
|
1059
|
-
static ZSTD_CCtx_params ZSTDMT_initJobCCtxParams(const ZSTD_CCtx_params* params)
|
1060
|
-
{
|
1061
|
-
ZSTD_CCtx_params jobParams = *params;
|
1062
|
-
/* Clear parameters related to multithreading */
|
1063
|
-
jobParams.forceWindow = 0;
|
1064
|
-
jobParams.nbWorkers = 0;
|
1065
|
-
jobParams.jobSize = 0;
|
1066
|
-
jobParams.overlapLog = 0;
|
1067
|
-
jobParams.rsyncable = 0;
|
1068
|
-
memset(&jobParams.ldmParams, 0, sizeof(ldmParams_t));
|
1069
|
-
memset(&jobParams.customMem, 0, sizeof(ZSTD_customMem));
|
1070
|
-
return jobParams;
|
1071
|
-
}
|
1072
|
-
|
1073
1026
|
|
1074
1027
|
/* ZSTDMT_resize() :
|
1075
1028
|
* @return : error code if fails, 0 on success */
|
@@ -1098,7 +1051,7 @@ void ZSTDMT_updateCParams_whileCompressing(ZSTDMT_CCtx* mtctx, const ZSTD_CCtx_p
|
|
1098
1051
|
DEBUGLOG(5, "ZSTDMT_updateCParams_whileCompressing (level:%i)",
|
1099
1052
|
compressionLevel);
|
1100
1053
|
mtctx->params.compressionLevel = compressionLevel;
|
1101
|
-
{ ZSTD_compressionParameters cParams = ZSTD_getCParamsFromCCtxParams(cctxParams, ZSTD_CONTENTSIZE_UNKNOWN, 0);
|
1054
|
+
{ ZSTD_compressionParameters cParams = ZSTD_getCParamsFromCCtxParams(cctxParams, ZSTD_CONTENTSIZE_UNKNOWN, 0, ZSTD_cpm_noAttachDict);
|
1102
1055
|
cParams.windowLog = saved_wlog;
|
1103
1056
|
mtctx->params.cParams = cParams;
|
1104
1057
|
}
|
@@ -1185,8 +1138,8 @@ static unsigned ZSTDMT_computeTargetJobLog(const ZSTD_CCtx_params* params)
|
|
1185
1138
|
if (params->ldmParams.enableLdm) {
|
1186
1139
|
/* In Long Range Mode, the windowLog is typically oversized.
|
1187
1140
|
* In which case, it's preferable to determine the jobSize
|
1188
|
-
* based on
|
1189
|
-
jobLog = MAX(21, params->cParams.chainLog +
|
1141
|
+
* based on cycleLog instead. */
|
1142
|
+
jobLog = MAX(21, ZSTD_cycleLog(params->cParams.chainLog, params->cParams.strategy) + 3);
|
1190
1143
|
} else {
|
1191
1144
|
jobLog = MAX(20, params->cParams.windowLog + 2);
|
1192
1145
|
}
|
@@ -1240,174 +1193,6 @@ static size_t ZSTDMT_computeOverlapSize(const ZSTD_CCtx_params* params)
|
|
1240
1193
|
return (ovLog==0) ? 0 : (size_t)1 << ovLog;
|
1241
1194
|
}
|
1242
1195
|
|
1243
|
-
static unsigned
|
1244
|
-
ZSTDMT_computeNbJobs(const ZSTD_CCtx_params* params, size_t srcSize, unsigned nbWorkers)
|
1245
|
-
{
|
1246
|
-
assert(nbWorkers>0);
|
1247
|
-
{ size_t const jobSizeTarget = (size_t)1 << ZSTDMT_computeTargetJobLog(params);
|
1248
|
-
size_t const jobMaxSize = jobSizeTarget << 2;
|
1249
|
-
size_t const passSizeMax = jobMaxSize * nbWorkers;
|
1250
|
-
unsigned const multiplier = (unsigned)(srcSize / passSizeMax) + 1;
|
1251
|
-
unsigned const nbJobsLarge = multiplier * nbWorkers;
|
1252
|
-
unsigned const nbJobsMax = (unsigned)(srcSize / jobSizeTarget) + 1;
|
1253
|
-
unsigned const nbJobsSmall = MIN(nbJobsMax, nbWorkers);
|
1254
|
-
return (multiplier>1) ? nbJobsLarge : nbJobsSmall;
|
1255
|
-
} }
|
1256
|
-
|
1257
|
-
/* ZSTDMT_compress_advanced_internal() :
|
1258
|
-
* This is a blocking function : it will only give back control to caller after finishing its compression job.
|
1259
|
-
*/
|
1260
|
-
static size_t
|
1261
|
-
ZSTDMT_compress_advanced_internal(
|
1262
|
-
ZSTDMT_CCtx* mtctx,
|
1263
|
-
void* dst, size_t dstCapacity,
|
1264
|
-
const void* src, size_t srcSize,
|
1265
|
-
const ZSTD_CDict* cdict,
|
1266
|
-
ZSTD_CCtx_params params)
|
1267
|
-
{
|
1268
|
-
ZSTD_CCtx_params const jobParams = ZSTDMT_initJobCCtxParams(&params);
|
1269
|
-
size_t const overlapSize = ZSTDMT_computeOverlapSize(&params);
|
1270
|
-
unsigned const nbJobs = ZSTDMT_computeNbJobs(&params, srcSize, params.nbWorkers);
|
1271
|
-
size_t const proposedJobSize = (srcSize + (nbJobs-1)) / nbJobs;
|
1272
|
-
size_t const avgJobSize = (((proposedJobSize-1) & 0x1FFFF) < 0x7FFF) ? proposedJobSize + 0xFFFF : proposedJobSize; /* avoid too small last block */
|
1273
|
-
const char* const srcStart = (const char*)src;
|
1274
|
-
size_t remainingSrcSize = srcSize;
|
1275
|
-
unsigned const compressWithinDst = (dstCapacity >= ZSTD_compressBound(srcSize)) ? nbJobs : (unsigned)(dstCapacity / ZSTD_compressBound(avgJobSize)); /* presumes avgJobSize >= 256 KB, which should be the case */
|
1276
|
-
size_t frameStartPos = 0, dstBufferPos = 0;
|
1277
|
-
assert(jobParams.nbWorkers == 0);
|
1278
|
-
assert(mtctx->cctxPool->totalCCtx == params.nbWorkers);
|
1279
|
-
|
1280
|
-
params.jobSize = (U32)avgJobSize;
|
1281
|
-
DEBUGLOG(4, "ZSTDMT_compress_advanced_internal: nbJobs=%2u (rawSize=%u bytes; fixedSize=%u) ",
|
1282
|
-
nbJobs, (U32)proposedJobSize, (U32)avgJobSize);
|
1283
|
-
|
1284
|
-
if ((nbJobs==1) | (params.nbWorkers<=1)) { /* fallback to single-thread mode : this is a blocking invocation anyway */
|
1285
|
-
ZSTD_CCtx* const cctx = mtctx->cctxPool->cctx[0];
|
1286
|
-
DEBUGLOG(4, "ZSTDMT_compress_advanced_internal: fallback to single-thread mode");
|
1287
|
-
if (cdict) return ZSTD_compress_usingCDict_advanced(cctx, dst, dstCapacity, src, srcSize, cdict, jobParams.fParams);
|
1288
|
-
return ZSTD_compress_advanced_internal(cctx, dst, dstCapacity, src, srcSize, NULL, 0, &jobParams);
|
1289
|
-
}
|
1290
|
-
|
1291
|
-
assert(avgJobSize >= 256 KB); /* condition for ZSTD_compressBound(A) + ZSTD_compressBound(B) <= ZSTD_compressBound(A+B), required to compress directly into Dst (no additional buffer) */
|
1292
|
-
ZSTDMT_setBufferSize(mtctx->bufPool, ZSTD_compressBound(avgJobSize) );
|
1293
|
-
/* LDM doesn't even try to load the dictionary in single-ingestion mode */
|
1294
|
-
if (ZSTDMT_serialState_reset(&mtctx->serial, mtctx->seqPool, params, avgJobSize, NULL, 0, ZSTD_dct_auto))
|
1295
|
-
return ERROR(memory_allocation);
|
1296
|
-
|
1297
|
-
FORWARD_IF_ERROR( ZSTDMT_expandJobsTable(mtctx, nbJobs) , ""); /* only expands if necessary */
|
1298
|
-
|
1299
|
-
{ unsigned u;
|
1300
|
-
for (u=0; u<nbJobs; u++) {
|
1301
|
-
size_t const jobSize = MIN(remainingSrcSize, avgJobSize);
|
1302
|
-
size_t const dstBufferCapacity = ZSTD_compressBound(jobSize);
|
1303
|
-
buffer_t const dstAsBuffer = { (char*)dst + dstBufferPos, dstBufferCapacity };
|
1304
|
-
buffer_t const dstBuffer = u < compressWithinDst ? dstAsBuffer : g_nullBuffer;
|
1305
|
-
size_t dictSize = u ? overlapSize : 0;
|
1306
|
-
|
1307
|
-
mtctx->jobs[u].prefix.start = srcStart + frameStartPos - dictSize;
|
1308
|
-
mtctx->jobs[u].prefix.size = dictSize;
|
1309
|
-
mtctx->jobs[u].src.start = srcStart + frameStartPos;
|
1310
|
-
mtctx->jobs[u].src.size = jobSize; assert(jobSize > 0); /* avoid job.src.size == 0 */
|
1311
|
-
mtctx->jobs[u].consumed = 0;
|
1312
|
-
mtctx->jobs[u].cSize = 0;
|
1313
|
-
mtctx->jobs[u].cdict = (u==0) ? cdict : NULL;
|
1314
|
-
mtctx->jobs[u].fullFrameSize = srcSize;
|
1315
|
-
mtctx->jobs[u].params = jobParams;
|
1316
|
-
/* do not calculate checksum within sections, but write it in header for first section */
|
1317
|
-
mtctx->jobs[u].dstBuff = dstBuffer;
|
1318
|
-
mtctx->jobs[u].cctxPool = mtctx->cctxPool;
|
1319
|
-
mtctx->jobs[u].bufPool = mtctx->bufPool;
|
1320
|
-
mtctx->jobs[u].seqPool = mtctx->seqPool;
|
1321
|
-
mtctx->jobs[u].serial = &mtctx->serial;
|
1322
|
-
mtctx->jobs[u].jobID = u;
|
1323
|
-
mtctx->jobs[u].firstJob = (u==0);
|
1324
|
-
mtctx->jobs[u].lastJob = (u==nbJobs-1);
|
1325
|
-
|
1326
|
-
DEBUGLOG(5, "ZSTDMT_compress_advanced_internal: posting job %u (%u bytes)", u, (U32)jobSize);
|
1327
|
-
DEBUG_PRINTHEX(6, mtctx->jobs[u].prefix.start, 12);
|
1328
|
-
POOL_add(mtctx->factory, ZSTDMT_compressionJob, &mtctx->jobs[u]);
|
1329
|
-
|
1330
|
-
frameStartPos += jobSize;
|
1331
|
-
dstBufferPos += dstBufferCapacity;
|
1332
|
-
remainingSrcSize -= jobSize;
|
1333
|
-
} }
|
1334
|
-
|
1335
|
-
/* collect result */
|
1336
|
-
{ size_t error = 0, dstPos = 0;
|
1337
|
-
unsigned jobID;
|
1338
|
-
for (jobID=0; jobID<nbJobs; jobID++) {
|
1339
|
-
DEBUGLOG(5, "waiting for job %u ", jobID);
|
1340
|
-
ZSTD_PTHREAD_MUTEX_LOCK(&mtctx->jobs[jobID].job_mutex);
|
1341
|
-
while (mtctx->jobs[jobID].consumed < mtctx->jobs[jobID].src.size) {
|
1342
|
-
DEBUGLOG(5, "waiting for jobCompleted signal from job %u", jobID);
|
1343
|
-
ZSTD_pthread_cond_wait(&mtctx->jobs[jobID].job_cond, &mtctx->jobs[jobID].job_mutex);
|
1344
|
-
}
|
1345
|
-
ZSTD_pthread_mutex_unlock(&mtctx->jobs[jobID].job_mutex);
|
1346
|
-
DEBUGLOG(5, "ready to write job %u ", jobID);
|
1347
|
-
|
1348
|
-
{ size_t const cSize = mtctx->jobs[jobID].cSize;
|
1349
|
-
if (ZSTD_isError(cSize)) error = cSize;
|
1350
|
-
if ((!error) && (dstPos + cSize > dstCapacity)) error = ERROR(dstSize_tooSmall);
|
1351
|
-
if (jobID) { /* note : job 0 is written directly at dst, which is correct position */
|
1352
|
-
if (!error)
|
1353
|
-
memmove((char*)dst + dstPos, mtctx->jobs[jobID].dstBuff.start, cSize); /* may overlap when job compressed within dst */
|
1354
|
-
if (jobID >= compressWithinDst) { /* job compressed into its own buffer, which must be released */
|
1355
|
-
DEBUGLOG(5, "releasing buffer %u>=%u", jobID, compressWithinDst);
|
1356
|
-
ZSTDMT_releaseBuffer(mtctx->bufPool, mtctx->jobs[jobID].dstBuff);
|
1357
|
-
} }
|
1358
|
-
mtctx->jobs[jobID].dstBuff = g_nullBuffer;
|
1359
|
-
mtctx->jobs[jobID].cSize = 0;
|
1360
|
-
dstPos += cSize ;
|
1361
|
-
}
|
1362
|
-
} /* for (jobID=0; jobID<nbJobs; jobID++) */
|
1363
|
-
|
1364
|
-
DEBUGLOG(4, "checksumFlag : %u ", params.fParams.checksumFlag);
|
1365
|
-
if (params.fParams.checksumFlag) {
|
1366
|
-
U32 const checksum = (U32)XXH64_digest(&mtctx->serial.xxhState);
|
1367
|
-
if (dstPos + 4 > dstCapacity) {
|
1368
|
-
error = ERROR(dstSize_tooSmall);
|
1369
|
-
} else {
|
1370
|
-
DEBUGLOG(4, "writing checksum : %08X \n", checksum);
|
1371
|
-
MEM_writeLE32((char*)dst + dstPos, checksum);
|
1372
|
-
dstPos += 4;
|
1373
|
-
} }
|
1374
|
-
|
1375
|
-
if (!error) DEBUGLOG(4, "compressed size : %u ", (U32)dstPos);
|
1376
|
-
return error ? error : dstPos;
|
1377
|
-
}
|
1378
|
-
}
|
1379
|
-
|
1380
|
-
size_t ZSTDMT_compress_advanced(ZSTDMT_CCtx* mtctx,
|
1381
|
-
void* dst, size_t dstCapacity,
|
1382
|
-
const void* src, size_t srcSize,
|
1383
|
-
const ZSTD_CDict* cdict,
|
1384
|
-
ZSTD_parameters params,
|
1385
|
-
int overlapLog)
|
1386
|
-
{
|
1387
|
-
ZSTD_CCtx_params cctxParams = mtctx->params;
|
1388
|
-
cctxParams.cParams = params.cParams;
|
1389
|
-
cctxParams.fParams = params.fParams;
|
1390
|
-
assert(ZSTD_OVERLAPLOG_MIN <= overlapLog && overlapLog <= ZSTD_OVERLAPLOG_MAX);
|
1391
|
-
cctxParams.overlapLog = overlapLog;
|
1392
|
-
return ZSTDMT_compress_advanced_internal(mtctx,
|
1393
|
-
dst, dstCapacity,
|
1394
|
-
src, srcSize,
|
1395
|
-
cdict, cctxParams);
|
1396
|
-
}
|
1397
|
-
|
1398
|
-
|
1399
|
-
size_t ZSTDMT_compressCCtx(ZSTDMT_CCtx* mtctx,
|
1400
|
-
void* dst, size_t dstCapacity,
|
1401
|
-
const void* src, size_t srcSize,
|
1402
|
-
int compressionLevel)
|
1403
|
-
{
|
1404
|
-
ZSTD_parameters params = ZSTD_getParams(compressionLevel, srcSize, 0);
|
1405
|
-
int const overlapLog = ZSTDMT_overlapLog_default(params.cParams.strategy);
|
1406
|
-
params.fParams.contentSizeFlag = 1;
|
1407
|
-
return ZSTDMT_compress_advanced(mtctx, dst, dstCapacity, src, srcSize, NULL, params, overlapLog);
|
1408
|
-
}
|
1409
|
-
|
1410
|
-
|
1411
1196
|
/* ====================================== */
|
1412
1197
|
/* ======= Streaming API ======= */
|
1413
1198
|
/* ====================================== */
|
@@ -1432,16 +1217,6 @@ size_t ZSTDMT_initCStream_internal(
|
|
1432
1217
|
if (params.jobSize != 0 && params.jobSize < ZSTDMT_JOBSIZE_MIN) params.jobSize = ZSTDMT_JOBSIZE_MIN;
|
1433
1218
|
if (params.jobSize > (size_t)ZSTDMT_JOBSIZE_MAX) params.jobSize = (size_t)ZSTDMT_JOBSIZE_MAX;
|
1434
1219
|
|
1435
|
-
mtctx->singleBlockingThread = (pledgedSrcSize <= ZSTDMT_JOBSIZE_MIN); /* do not trigger multi-threading when srcSize is too small */
|
1436
|
-
if (mtctx->singleBlockingThread) {
|
1437
|
-
ZSTD_CCtx_params const singleThreadParams = ZSTDMT_initJobCCtxParams(&params);
|
1438
|
-
DEBUGLOG(5, "ZSTDMT_initCStream_internal: switch to single blocking thread mode");
|
1439
|
-
assert(singleThreadParams.nbWorkers == 0);
|
1440
|
-
return ZSTD_initCStream_internal(mtctx->cctxPool->cctx[0],
|
1441
|
-
dict, dictSize, cdict,
|
1442
|
-
&singleThreadParams, pledgedSrcSize);
|
1443
|
-
}
|
1444
|
-
|
1445
1220
|
DEBUGLOG(4, "ZSTDMT_initCStream_internal: %u workers", params.nbWorkers);
|
1446
1221
|
|
1447
1222
|
if (mtctx->allJobsCompleted == 0) { /* previous compression not correctly finished */
|
@@ -1475,9 +1250,8 @@ size_t ZSTDMT_initCStream_internal(
|
|
1475
1250
|
|
1476
1251
|
if (params.rsyncable) {
|
1477
1252
|
/* Aim for the targetsectionSize as the average job size. */
|
1478
|
-
U32 const jobSizeMB = (U32)(mtctx->targetSectionSize >> 20);
|
1479
|
-
U32 const rsyncBits = ZSTD_highbit32(jobSizeMB) + 20;
|
1480
|
-
assert(jobSizeMB >= 1);
|
1253
|
+
U32 const jobSizeKB = (U32)(mtctx->targetSectionSize >> 10);
|
1254
|
+
U32 const rsyncBits = (assert(jobSizeKB >= 1), ZSTD_highbit32(jobSizeKB) + 10);
|
1481
1255
|
DEBUGLOG(4, "rsyncLog = %u", rsyncBits);
|
1482
1256
|
mtctx->rsync.hash = 0;
|
1483
1257
|
mtctx->rsync.hitMask = (1ULL << rsyncBits) - 1;
|
@@ -1504,8 +1278,8 @@ size_t ZSTDMT_initCStream_internal(
|
|
1504
1278
|
size_t const capacity = MAX(windowSize, sectionsSize) + slackSize;
|
1505
1279
|
if (mtctx->roundBuff.capacity < capacity) {
|
1506
1280
|
if (mtctx->roundBuff.buffer)
|
1507
|
-
|
1508
|
-
mtctx->roundBuff.buffer = (BYTE*)ZSTD_malloc(capacity, mtctx->cMem);
|
1281
|
+
ZSTD_customFree(mtctx->roundBuff.buffer, mtctx->cMem);
|
1282
|
+
mtctx->roundBuff.buffer = (BYTE*)ZSTD_customMalloc(capacity, mtctx->cMem);
|
1509
1283
|
if (mtctx->roundBuff.buffer == NULL) {
|
1510
1284
|
mtctx->roundBuff.capacity = 0;
|
1511
1285
|
return ERROR(memory_allocation);
|
@@ -1530,53 +1304,6 @@ size_t ZSTDMT_initCStream_internal(
|
|
1530
1304
|
return 0;
|
1531
1305
|
}
|
1532
1306
|
|
1533
|
-
size_t ZSTDMT_initCStream_advanced(ZSTDMT_CCtx* mtctx,
|
1534
|
-
const void* dict, size_t dictSize,
|
1535
|
-
ZSTD_parameters params,
|
1536
|
-
unsigned long long pledgedSrcSize)
|
1537
|
-
{
|
1538
|
-
ZSTD_CCtx_params cctxParams = mtctx->params; /* retrieve sticky params */
|
1539
|
-
DEBUGLOG(4, "ZSTDMT_initCStream_advanced (pledgedSrcSize=%u)", (U32)pledgedSrcSize);
|
1540
|
-
cctxParams.cParams = params.cParams;
|
1541
|
-
cctxParams.fParams = params.fParams;
|
1542
|
-
return ZSTDMT_initCStream_internal(mtctx, dict, dictSize, ZSTD_dct_auto, NULL,
|
1543
|
-
cctxParams, pledgedSrcSize);
|
1544
|
-
}
|
1545
|
-
|
1546
|
-
size_t ZSTDMT_initCStream_usingCDict(ZSTDMT_CCtx* mtctx,
|
1547
|
-
const ZSTD_CDict* cdict,
|
1548
|
-
ZSTD_frameParameters fParams,
|
1549
|
-
unsigned long long pledgedSrcSize)
|
1550
|
-
{
|
1551
|
-
ZSTD_CCtx_params cctxParams = mtctx->params;
|
1552
|
-
if (cdict==NULL) return ERROR(dictionary_wrong); /* method incompatible with NULL cdict */
|
1553
|
-
cctxParams.cParams = ZSTD_getCParamsFromCDict(cdict);
|
1554
|
-
cctxParams.fParams = fParams;
|
1555
|
-
return ZSTDMT_initCStream_internal(mtctx, NULL, 0 /*dictSize*/, ZSTD_dct_auto, cdict,
|
1556
|
-
cctxParams, pledgedSrcSize);
|
1557
|
-
}
|
1558
|
-
|
1559
|
-
|
1560
|
-
/* ZSTDMT_resetCStream() :
|
1561
|
-
* pledgedSrcSize can be zero == unknown (for the time being)
|
1562
|
-
* prefer using ZSTD_CONTENTSIZE_UNKNOWN,
|
1563
|
-
* as `0` might mean "empty" in the future */
|
1564
|
-
size_t ZSTDMT_resetCStream(ZSTDMT_CCtx* mtctx, unsigned long long pledgedSrcSize)
|
1565
|
-
{
|
1566
|
-
if (!pledgedSrcSize) pledgedSrcSize = ZSTD_CONTENTSIZE_UNKNOWN;
|
1567
|
-
return ZSTDMT_initCStream_internal(mtctx, NULL, 0, ZSTD_dct_auto, 0, mtctx->params,
|
1568
|
-
pledgedSrcSize);
|
1569
|
-
}
|
1570
|
-
|
1571
|
-
size_t ZSTDMT_initCStream(ZSTDMT_CCtx* mtctx, int compressionLevel) {
|
1572
|
-
ZSTD_parameters const params = ZSTD_getParams(compressionLevel, ZSTD_CONTENTSIZE_UNKNOWN, 0);
|
1573
|
-
ZSTD_CCtx_params cctxParams = mtctx->params; /* retrieve sticky params */
|
1574
|
-
DEBUGLOG(4, "ZSTDMT_initCStream (cLevel=%i)", compressionLevel);
|
1575
|
-
cctxParams.cParams = params.cParams;
|
1576
|
-
cctxParams.fParams = params.fParams;
|
1577
|
-
return ZSTDMT_initCStream_internal(mtctx, NULL, 0, ZSTD_dct_auto, NULL, cctxParams, ZSTD_CONTENTSIZE_UNKNOWN);
|
1578
|
-
}
|
1579
|
-
|
1580
1307
|
|
1581
1308
|
/* ZSTDMT_writeLastEmptyBlock()
|
1582
1309
|
* Write a single empty block with an end-of-frame to finish a frame.
|
@@ -1740,7 +1467,7 @@ static size_t ZSTDMT_flushProduced(ZSTDMT_CCtx* mtctx, ZSTD_outBuffer* output, u
|
|
1740
1467
|
assert(cSize >= mtctx->jobs[wJobID].dstFlushed);
|
1741
1468
|
assert(mtctx->jobs[wJobID].dstBuff.start != NULL);
|
1742
1469
|
if (toFlush > 0) {
|
1743
|
-
|
1470
|
+
ZSTD_memcpy((char*)output->dst + output->pos,
|
1744
1471
|
(const char*)mtctx->jobs[wJobID].dstBuff.start + mtctx->jobs[wJobID].dstFlushed,
|
1745
1472
|
toFlush);
|
1746
1473
|
}
|
@@ -1894,7 +1621,7 @@ static int ZSTDMT_tryGetInputRange(ZSTDMT_CCtx* mtctx)
|
|
1894
1621
|
return 0;
|
1895
1622
|
}
|
1896
1623
|
ZSTDMT_waitForLdmComplete(mtctx, buffer);
|
1897
|
-
|
1624
|
+
ZSTD_memmove(start, mtctx->inBuff.prefix.start, prefixSize);
|
1898
1625
|
mtctx->inBuff.prefix.start = start;
|
1899
1626
|
mtctx->roundBuff.pos = prefixSize;
|
1900
1627
|
}
|
@@ -1968,6 +1695,16 @@ findSynchronizationPoint(ZSTDMT_CCtx const* mtctx, ZSTD_inBuffer const input)
|
|
1968
1695
|
pos = 0;
|
1969
1696
|
prev = (BYTE const*)mtctx->inBuff.buffer.start + mtctx->inBuff.filled - RSYNC_LENGTH;
|
1970
1697
|
hash = ZSTD_rollingHash_compute(prev, RSYNC_LENGTH);
|
1698
|
+
if ((hash & hitMask) == hitMask) {
|
1699
|
+
/* We're already at a sync point so don't load any more until
|
1700
|
+
* we're able to flush this sync point.
|
1701
|
+
* This likely happened because the job table was full so we
|
1702
|
+
* couldn't add our job.
|
1703
|
+
*/
|
1704
|
+
syncPoint.toLoad = 0;
|
1705
|
+
syncPoint.flush = 1;
|
1706
|
+
return syncPoint;
|
1707
|
+
}
|
1971
1708
|
} else {
|
1972
1709
|
/* We don't have enough bytes buffered to initialize the hash, but
|
1973
1710
|
* we know we have at least RSYNC_LENGTH bytes total.
|
@@ -2022,34 +1759,11 @@ size_t ZSTDMT_compressStream_generic(ZSTDMT_CCtx* mtctx,
|
|
2022
1759
|
assert(output->pos <= output->size);
|
2023
1760
|
assert(input->pos <= input->size);
|
2024
1761
|
|
2025
|
-
if (mtctx->singleBlockingThread) { /* delegate to single-thread (synchronous) */
|
2026
|
-
return ZSTD_compressStream2(mtctx->cctxPool->cctx[0], output, input, endOp);
|
2027
|
-
}
|
2028
|
-
|
2029
1762
|
if ((mtctx->frameEnded) && (endOp==ZSTD_e_continue)) {
|
2030
1763
|
/* current frame being ended. Only flush/end are allowed */
|
2031
1764
|
return ERROR(stage_wrong);
|
2032
1765
|
}
|
2033
1766
|
|
2034
|
-
/* single-pass shortcut (note : synchronous-mode) */
|
2035
|
-
if ( (!mtctx->params.rsyncable) /* rsyncable mode is disabled */
|
2036
|
-
&& (mtctx->nextJobID == 0) /* just started */
|
2037
|
-
&& (mtctx->inBuff.filled == 0) /* nothing buffered */
|
2038
|
-
&& (!mtctx->jobReady) /* no job already created */
|
2039
|
-
&& (endOp == ZSTD_e_end) /* end order */
|
2040
|
-
&& (output->size - output->pos >= ZSTD_compressBound(input->size - input->pos)) ) { /* enough space in dst */
|
2041
|
-
size_t const cSize = ZSTDMT_compress_advanced_internal(mtctx,
|
2042
|
-
(char*)output->dst + output->pos, output->size - output->pos,
|
2043
|
-
(const char*)input->src + input->pos, input->size - input->pos,
|
2044
|
-
mtctx->cdict, mtctx->params);
|
2045
|
-
if (ZSTD_isError(cSize)) return cSize;
|
2046
|
-
input->pos = input->size;
|
2047
|
-
output->pos += cSize;
|
2048
|
-
mtctx->allJobsCompleted = 1;
|
2049
|
-
mtctx->frameEnded = 1;
|
2050
|
-
return 0;
|
2051
|
-
}
|
2052
|
-
|
2053
1767
|
/* fill input buffer */
|
2054
1768
|
if ( (!mtctx->jobReady)
|
2055
1769
|
&& (input->size > input->pos) ) { /* support NULL input */
|
@@ -2072,13 +1786,21 @@ size_t ZSTDMT_compressStream_generic(ZSTDMT_CCtx* mtctx,
|
|
2072
1786
|
assert(mtctx->inBuff.buffer.capacity >= mtctx->targetSectionSize);
|
2073
1787
|
DEBUGLOG(5, "ZSTDMT_compressStream_generic: adding %u bytes on top of %u to buffer of size %u",
|
2074
1788
|
(U32)syncPoint.toLoad, (U32)mtctx->inBuff.filled, (U32)mtctx->targetSectionSize);
|
2075
|
-
|
1789
|
+
ZSTD_memcpy((char*)mtctx->inBuff.buffer.start + mtctx->inBuff.filled, (const char*)input->src + input->pos, syncPoint.toLoad);
|
2076
1790
|
input->pos += syncPoint.toLoad;
|
2077
1791
|
mtctx->inBuff.filled += syncPoint.toLoad;
|
2078
1792
|
forwardInputProgress = syncPoint.toLoad>0;
|
2079
1793
|
}
|
2080
|
-
|
2081
|
-
|
1794
|
+
}
|
1795
|
+
if ((input->pos < input->size) && (endOp == ZSTD_e_end)) {
|
1796
|
+
/* Can't end yet because the input is not fully consumed.
|
1797
|
+
* We are in one of these cases:
|
1798
|
+
* - mtctx->inBuff is NULL & empty: we couldn't get an input buffer so don't create a new job.
|
1799
|
+
* - We filled the input buffer: flush this job but don't end the frame.
|
1800
|
+
* - We hit a synchronization point: flush this job but don't end the frame.
|
1801
|
+
*/
|
1802
|
+
assert(mtctx->inBuff.filled == 0 || mtctx->inBuff.filled == mtctx->targetSectionSize || mtctx->params.rsyncable);
|
1803
|
+
endOp = ZSTD_e_flush;
|
2082
1804
|
}
|
2083
1805
|
|
2084
1806
|
if ( (mtctx->jobReady)
|
@@ -2097,47 +1819,3 @@ size_t ZSTDMT_compressStream_generic(ZSTDMT_CCtx* mtctx,
|
|
2097
1819
|
return remainingToFlush;
|
2098
1820
|
}
|
2099
1821
|
}
|
2100
|
-
|
2101
|
-
|
2102
|
-
size_t ZSTDMT_compressStream(ZSTDMT_CCtx* mtctx, ZSTD_outBuffer* output, ZSTD_inBuffer* input)
|
2103
|
-
{
|
2104
|
-
FORWARD_IF_ERROR( ZSTDMT_compressStream_generic(mtctx, output, input, ZSTD_e_continue) , "");
|
2105
|
-
|
2106
|
-
/* recommended next input size : fill current input buffer */
|
2107
|
-
return mtctx->targetSectionSize - mtctx->inBuff.filled; /* note : could be zero when input buffer is fully filled and no more availability to create new job */
|
2108
|
-
}
|
2109
|
-
|
2110
|
-
|
2111
|
-
static size_t ZSTDMT_flushStream_internal(ZSTDMT_CCtx* mtctx, ZSTD_outBuffer* output, ZSTD_EndDirective endFrame)
|
2112
|
-
{
|
2113
|
-
size_t const srcSize = mtctx->inBuff.filled;
|
2114
|
-
DEBUGLOG(5, "ZSTDMT_flushStream_internal");
|
2115
|
-
|
2116
|
-
if ( mtctx->jobReady /* one job ready for a worker to pick up */
|
2117
|
-
|| (srcSize > 0) /* still some data within input buffer */
|
2118
|
-
|| ((endFrame==ZSTD_e_end) && !mtctx->frameEnded)) { /* need a last 0-size block to end frame */
|
2119
|
-
DEBUGLOG(5, "ZSTDMT_flushStream_internal : create a new job (%u bytes, end:%u)",
|
2120
|
-
(U32)srcSize, (U32)endFrame);
|
2121
|
-
FORWARD_IF_ERROR( ZSTDMT_createCompressionJob(mtctx, srcSize, endFrame) , "");
|
2122
|
-
}
|
2123
|
-
|
2124
|
-
/* check if there is any data available to flush */
|
2125
|
-
return ZSTDMT_flushProduced(mtctx, output, 1 /* blockToFlush */, endFrame);
|
2126
|
-
}
|
2127
|
-
|
2128
|
-
|
2129
|
-
size_t ZSTDMT_flushStream(ZSTDMT_CCtx* mtctx, ZSTD_outBuffer* output)
|
2130
|
-
{
|
2131
|
-
DEBUGLOG(5, "ZSTDMT_flushStream");
|
2132
|
-
if (mtctx->singleBlockingThread)
|
2133
|
-
return ZSTD_flushStream(mtctx->cctxPool->cctx[0], output);
|
2134
|
-
return ZSTDMT_flushStream_internal(mtctx, output, ZSTD_e_flush);
|
2135
|
-
}
|
2136
|
-
|
2137
|
-
size_t ZSTDMT_endStream(ZSTDMT_CCtx* mtctx, ZSTD_outBuffer* output)
|
2138
|
-
{
|
2139
|
-
DEBUGLOG(4, "ZSTDMT_endStream");
|
2140
|
-
if (mtctx->singleBlockingThread)
|
2141
|
-
return ZSTD_endStream(mtctx->cctxPool->cctx[0], output);
|
2142
|
-
return ZSTDMT_flushStream_internal(mtctx, output, ZSTD_e_end);
|
2143
|
-
}
|