extzstd 0.3.2 → 0.4
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +4 -4
- data/README.md +4 -3
- data/contrib/zstd/CHANGELOG +225 -1
- data/contrib/zstd/CONTRIBUTING.md +158 -75
- data/contrib/zstd/LICENSE +4 -4
- data/contrib/zstd/Makefile +106 -69
- data/contrib/zstd/Package.swift +36 -0
- data/contrib/zstd/README.md +64 -36
- data/contrib/zstd/SECURITY.md +15 -0
- data/contrib/zstd/TESTING.md +2 -3
- data/contrib/zstd/lib/BUCK +5 -7
- data/contrib/zstd/lib/Makefile +117 -199
- data/contrib/zstd/lib/README.md +37 -7
- data/contrib/zstd/lib/common/allocations.h +55 -0
- data/contrib/zstd/lib/common/bits.h +200 -0
- data/contrib/zstd/lib/common/bitstream.h +80 -86
- data/contrib/zstd/lib/common/compiler.h +225 -63
- data/contrib/zstd/lib/common/cpu.h +37 -1
- data/contrib/zstd/lib/common/debug.c +7 -1
- data/contrib/zstd/lib/common/debug.h +21 -12
- data/contrib/zstd/lib/common/entropy_common.c +15 -37
- data/contrib/zstd/lib/common/error_private.c +9 -2
- data/contrib/zstd/lib/common/error_private.h +93 -5
- data/contrib/zstd/lib/common/fse.h +12 -87
- data/contrib/zstd/lib/common/fse_decompress.c +37 -117
- data/contrib/zstd/lib/common/huf.h +97 -172
- data/contrib/zstd/lib/common/mem.h +58 -58
- data/contrib/zstd/lib/common/pool.c +38 -17
- data/contrib/zstd/lib/common/pool.h +10 -4
- data/contrib/zstd/lib/common/portability_macros.h +158 -0
- data/contrib/zstd/lib/common/threading.c +74 -14
- data/contrib/zstd/lib/common/threading.h +5 -10
- data/contrib/zstd/lib/common/xxhash.c +6 -814
- data/contrib/zstd/lib/common/xxhash.h +6930 -195
- data/contrib/zstd/lib/common/zstd_common.c +1 -36
- data/contrib/zstd/lib/common/zstd_deps.h +1 -1
- data/contrib/zstd/lib/common/zstd_internal.h +68 -154
- data/contrib/zstd/lib/common/zstd_trace.h +163 -0
- data/contrib/zstd/lib/compress/clevels.h +134 -0
- data/contrib/zstd/lib/compress/fse_compress.c +75 -155
- data/contrib/zstd/lib/compress/hist.c +1 -1
- data/contrib/zstd/lib/compress/hist.h +1 -1
- data/contrib/zstd/lib/compress/huf_compress.c +810 -259
- data/contrib/zstd/lib/compress/zstd_compress.c +2864 -919
- data/contrib/zstd/lib/compress/zstd_compress_internal.h +523 -192
- data/contrib/zstd/lib/compress/zstd_compress_literals.c +117 -40
- data/contrib/zstd/lib/compress/zstd_compress_literals.h +16 -6
- data/contrib/zstd/lib/compress/zstd_compress_sequences.c +28 -19
- data/contrib/zstd/lib/compress/zstd_compress_sequences.h +1 -1
- data/contrib/zstd/lib/compress/zstd_compress_superblock.c +251 -412
- data/contrib/zstd/lib/compress/zstd_compress_superblock.h +1 -1
- data/contrib/zstd/lib/compress/zstd_cwksp.h +284 -97
- data/contrib/zstd/lib/compress/zstd_double_fast.c +382 -133
- data/contrib/zstd/lib/compress/zstd_double_fast.h +14 -2
- data/contrib/zstd/lib/compress/zstd_fast.c +732 -260
- data/contrib/zstd/lib/compress/zstd_fast.h +3 -2
- data/contrib/zstd/lib/compress/zstd_lazy.c +1177 -390
- data/contrib/zstd/lib/compress/zstd_lazy.h +129 -14
- data/contrib/zstd/lib/compress/zstd_ldm.c +280 -210
- data/contrib/zstd/lib/compress/zstd_ldm.h +3 -2
- data/contrib/zstd/lib/compress/zstd_ldm_geartab.h +106 -0
- data/contrib/zstd/lib/compress/zstd_opt.c +516 -285
- data/contrib/zstd/lib/compress/zstd_opt.h +32 -8
- data/contrib/zstd/lib/compress/zstdmt_compress.c +202 -131
- data/contrib/zstd/lib/compress/zstdmt_compress.h +9 -6
- data/contrib/zstd/lib/decompress/huf_decompress.c +1149 -555
- data/contrib/zstd/lib/decompress/huf_decompress_amd64.S +595 -0
- data/contrib/zstd/lib/decompress/zstd_ddict.c +4 -4
- data/contrib/zstd/lib/decompress/zstd_ddict.h +1 -1
- data/contrib/zstd/lib/decompress/zstd_decompress.c +583 -106
- data/contrib/zstd/lib/decompress/zstd_decompress_block.c +1054 -379
- data/contrib/zstd/lib/decompress/zstd_decompress_block.h +14 -3
- data/contrib/zstd/lib/decompress/zstd_decompress_internal.h +56 -6
- data/contrib/zstd/lib/deprecated/zbuff.h +1 -1
- data/contrib/zstd/lib/deprecated/zbuff_common.c +1 -1
- data/contrib/zstd/lib/deprecated/zbuff_compress.c +24 -4
- data/contrib/zstd/lib/deprecated/zbuff_decompress.c +3 -1
- data/contrib/zstd/lib/dictBuilder/cover.c +60 -44
- data/contrib/zstd/lib/dictBuilder/cover.h +6 -11
- data/contrib/zstd/lib/dictBuilder/divsufsort.c +1 -1
- data/contrib/zstd/lib/dictBuilder/fastcover.c +26 -18
- data/contrib/zstd/lib/dictBuilder/zdict.c +100 -101
- data/contrib/zstd/lib/legacy/zstd_legacy.h +38 -1
- data/contrib/zstd/lib/legacy/zstd_v01.c +18 -53
- data/contrib/zstd/lib/legacy/zstd_v01.h +1 -1
- data/contrib/zstd/lib/legacy/zstd_v02.c +28 -85
- data/contrib/zstd/lib/legacy/zstd_v02.h +1 -1
- data/contrib/zstd/lib/legacy/zstd_v03.c +29 -88
- data/contrib/zstd/lib/legacy/zstd_v03.h +1 -1
- data/contrib/zstd/lib/legacy/zstd_v04.c +27 -80
- data/contrib/zstd/lib/legacy/zstd_v04.h +1 -1
- data/contrib/zstd/lib/legacy/zstd_v05.c +36 -85
- data/contrib/zstd/lib/legacy/zstd_v05.h +1 -1
- data/contrib/zstd/lib/legacy/zstd_v06.c +44 -96
- data/contrib/zstd/lib/legacy/zstd_v06.h +1 -1
- data/contrib/zstd/lib/legacy/zstd_v07.c +37 -92
- data/contrib/zstd/lib/legacy/zstd_v07.h +1 -1
- data/contrib/zstd/lib/libzstd.mk +237 -0
- data/contrib/zstd/lib/libzstd.pc.in +4 -3
- data/contrib/zstd/lib/module.modulemap +35 -0
- data/contrib/zstd/lib/{dictBuilder/zdict.h → zdict.h} +202 -33
- data/contrib/zstd/lib/zstd.h +1030 -332
- data/contrib/zstd/lib/{common/zstd_errors.h → zstd_errors.h} +27 -8
- data/ext/extconf.rb +26 -7
- data/ext/extzstd.c +51 -24
- data/ext/extzstd.h +33 -6
- data/ext/extzstd_stream.c +74 -31
- data/ext/libzstd_conf.h +0 -1
- data/ext/zstd_decompress_asm.S +1 -0
- metadata +17 -7
- data/contrib/zstd/appveyor.yml +0 -292
- data/ext/depend +0 -2
@@ -1,5 +1,5 @@
|
|
1
1
|
/*
|
2
|
-
* Copyright (c)
|
2
|
+
* Copyright (c) Meta Platforms, Inc. and affiliates.
|
3
3
|
* All rights reserved.
|
4
4
|
*
|
5
5
|
* This source code is licensed under both the BSD-style license (found in the
|
@@ -10,9 +10,9 @@
|
|
10
10
|
|
11
11
|
|
12
12
|
/* ====== Dependencies ======= */
|
13
|
+
#include "../common/allocations.h" /* ZSTD_customCalloc, ZSTD_customFree */
|
13
14
|
#include "zstd_deps.h" /* size_t */
|
14
15
|
#include "debug.h" /* assert */
|
15
|
-
#include "zstd_internal.h" /* ZSTD_customMalloc, ZSTD_customFree */
|
16
16
|
#include "pool.h"
|
17
17
|
|
18
18
|
/* ====== Compiler specifics ====== */
|
@@ -86,7 +86,7 @@ static void* POOL_thread(void* opaque) {
|
|
86
86
|
{ POOL_job const job = ctx->queue[ctx->queueHead];
|
87
87
|
ctx->queueHead = (ctx->queueHead + 1) % ctx->queueSize;
|
88
88
|
ctx->numThreadsBusy++;
|
89
|
-
ctx->queueEmpty = ctx->queueHead == ctx->queueTail;
|
89
|
+
ctx->queueEmpty = (ctx->queueHead == ctx->queueTail);
|
90
90
|
/* Unlock the mutex, signal a pusher, and run the job */
|
91
91
|
ZSTD_pthread_cond_signal(&ctx->queuePushCond);
|
92
92
|
ZSTD_pthread_mutex_unlock(&ctx->queueMutex);
|
@@ -96,15 +96,14 @@ static void* POOL_thread(void* opaque) {
|
|
96
96
|
/* If the intended queue size was 0, signal after finishing job */
|
97
97
|
ZSTD_pthread_mutex_lock(&ctx->queueMutex);
|
98
98
|
ctx->numThreadsBusy--;
|
99
|
-
|
100
|
-
ZSTD_pthread_cond_signal(&ctx->queuePushCond);
|
101
|
-
}
|
99
|
+
ZSTD_pthread_cond_signal(&ctx->queuePushCond);
|
102
100
|
ZSTD_pthread_mutex_unlock(&ctx->queueMutex);
|
103
101
|
}
|
104
102
|
} /* for (;;) */
|
105
103
|
assert(0); /* Unreachable */
|
106
104
|
}
|
107
105
|
|
106
|
+
/* ZSTD_createThreadPool() : public access point */
|
108
107
|
POOL_ctx* ZSTD_createThreadPool(size_t numThreads) {
|
109
108
|
return POOL_create (numThreads, 0);
|
110
109
|
}
|
@@ -114,7 +113,8 @@ POOL_ctx* POOL_create(size_t numThreads, size_t queueSize) {
|
|
114
113
|
}
|
115
114
|
|
116
115
|
POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize,
|
117
|
-
ZSTD_customMem customMem)
|
116
|
+
ZSTD_customMem customMem)
|
117
|
+
{
|
118
118
|
POOL_ctx* ctx;
|
119
119
|
/* Check parameters */
|
120
120
|
if (!numThreads) { return NULL; }
|
@@ -126,7 +126,7 @@ POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize,
|
|
126
126
|
* empty and full queues.
|
127
127
|
*/
|
128
128
|
ctx->queueSize = queueSize + 1;
|
129
|
-
ctx->queue = (POOL_job*)
|
129
|
+
ctx->queue = (POOL_job*)ZSTD_customCalloc(ctx->queueSize * sizeof(POOL_job), customMem);
|
130
130
|
ctx->queueHead = 0;
|
131
131
|
ctx->queueTail = 0;
|
132
132
|
ctx->numThreadsBusy = 0;
|
@@ -140,7 +140,7 @@ POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize,
|
|
140
140
|
}
|
141
141
|
ctx->shutdown = 0;
|
142
142
|
/* Allocate space for the thread handles */
|
143
|
-
ctx->threads = (ZSTD_pthread_t*)
|
143
|
+
ctx->threads = (ZSTD_pthread_t*)ZSTD_customCalloc(numThreads * sizeof(ZSTD_pthread_t), customMem);
|
144
144
|
ctx->threadCapacity = 0;
|
145
145
|
ctx->customMem = customMem;
|
146
146
|
/* Check for errors */
|
@@ -173,7 +173,7 @@ static void POOL_join(POOL_ctx* ctx) {
|
|
173
173
|
/* Join all of the threads */
|
174
174
|
{ size_t i;
|
175
175
|
for (i = 0; i < ctx->threadCapacity; ++i) {
|
176
|
-
ZSTD_pthread_join(ctx->threads[i]
|
176
|
+
ZSTD_pthread_join(ctx->threads[i]); /* note : could fail */
|
177
177
|
} }
|
178
178
|
}
|
179
179
|
|
@@ -188,11 +188,22 @@ void POOL_free(POOL_ctx *ctx) {
|
|
188
188
|
ZSTD_customFree(ctx, ctx->customMem);
|
189
189
|
}
|
190
190
|
|
191
|
+
/*! POOL_joinJobs() :
|
192
|
+
* Waits for all queued jobs to finish executing.
|
193
|
+
*/
|
194
|
+
void POOL_joinJobs(POOL_ctx* ctx) {
|
195
|
+
ZSTD_pthread_mutex_lock(&ctx->queueMutex);
|
196
|
+
while(!ctx->queueEmpty || ctx->numThreadsBusy > 0) {
|
197
|
+
ZSTD_pthread_cond_wait(&ctx->queuePushCond, &ctx->queueMutex);
|
198
|
+
}
|
199
|
+
ZSTD_pthread_mutex_unlock(&ctx->queueMutex);
|
200
|
+
}
|
201
|
+
|
191
202
|
void ZSTD_freeThreadPool (ZSTD_threadPool* pool) {
|
192
203
|
POOL_free (pool);
|
193
204
|
}
|
194
205
|
|
195
|
-
size_t POOL_sizeof(POOL_ctx
|
206
|
+
size_t POOL_sizeof(const POOL_ctx* ctx) {
|
196
207
|
if (ctx==NULL) return 0; /* supports sizeof NULL */
|
197
208
|
return sizeof(*ctx)
|
198
209
|
+ ctx->queueSize * sizeof(POOL_job)
|
@@ -209,10 +220,10 @@ static int POOL_resize_internal(POOL_ctx* ctx, size_t numThreads)
|
|
209
220
|
return 0;
|
210
221
|
}
|
211
222
|
/* numThreads > threadCapacity */
|
212
|
-
{ ZSTD_pthread_t* const threadPool = (ZSTD_pthread_t*)
|
223
|
+
{ ZSTD_pthread_t* const threadPool = (ZSTD_pthread_t*)ZSTD_customCalloc(numThreads * sizeof(ZSTD_pthread_t), ctx->customMem);
|
213
224
|
if (!threadPool) return 1;
|
214
225
|
/* replace existing thread pool */
|
215
|
-
ZSTD_memcpy(threadPool, ctx->threads, ctx->threadCapacity * sizeof(
|
226
|
+
ZSTD_memcpy(threadPool, ctx->threads, ctx->threadCapacity * sizeof(ZSTD_pthread_t));
|
216
227
|
ZSTD_customFree(ctx->threads, ctx->customMem);
|
217
228
|
ctx->threads = threadPool;
|
218
229
|
/* Initialize additional threads */
|
@@ -257,9 +268,12 @@ static int isQueueFull(POOL_ctx const* ctx) {
|
|
257
268
|
}
|
258
269
|
|
259
270
|
|
260
|
-
static void
|
271
|
+
static void
|
272
|
+
POOL_add_internal(POOL_ctx* ctx, POOL_function function, void *opaque)
|
261
273
|
{
|
262
|
-
POOL_job
|
274
|
+
POOL_job job;
|
275
|
+
job.function = function;
|
276
|
+
job.opaque = opaque;
|
263
277
|
assert(ctx != NULL);
|
264
278
|
if (ctx->shutdown) return;
|
265
279
|
|
@@ -313,7 +327,9 @@ POOL_ctx* POOL_create(size_t numThreads, size_t queueSize) {
|
|
313
327
|
return POOL_create_advanced(numThreads, queueSize, ZSTD_defaultCMem);
|
314
328
|
}
|
315
329
|
|
316
|
-
POOL_ctx*
|
330
|
+
POOL_ctx*
|
331
|
+
POOL_create_advanced(size_t numThreads, size_t queueSize, ZSTD_customMem customMem)
|
332
|
+
{
|
317
333
|
(void)numThreads;
|
318
334
|
(void)queueSize;
|
319
335
|
(void)customMem;
|
@@ -325,6 +341,11 @@ void POOL_free(POOL_ctx* ctx) {
|
|
325
341
|
(void)ctx;
|
326
342
|
}
|
327
343
|
|
344
|
+
void POOL_joinJobs(POOL_ctx* ctx){
|
345
|
+
assert(!ctx || ctx == &g_poolCtx);
|
346
|
+
(void)ctx;
|
347
|
+
}
|
348
|
+
|
328
349
|
int POOL_resize(POOL_ctx* ctx, size_t numThreads) {
|
329
350
|
(void)ctx; (void)numThreads;
|
330
351
|
return 0;
|
@@ -341,7 +362,7 @@ int POOL_tryAdd(POOL_ctx* ctx, POOL_function function, void* opaque) {
|
|
341
362
|
return 1;
|
342
363
|
}
|
343
364
|
|
344
|
-
size_t POOL_sizeof(POOL_ctx* ctx) {
|
365
|
+
size_t POOL_sizeof(const POOL_ctx* ctx) {
|
345
366
|
if (ctx==NULL) return 0; /* supports sizeof NULL */
|
346
367
|
assert(ctx == &g_poolCtx);
|
347
368
|
return sizeof(*ctx);
|
@@ -1,5 +1,5 @@
|
|
1
1
|
/*
|
2
|
-
* Copyright (c)
|
2
|
+
* Copyright (c) Meta Platforms, Inc. and affiliates.
|
3
3
|
* All rights reserved.
|
4
4
|
*
|
5
5
|
* This source code is licensed under both the BSD-style license (found in the
|
@@ -38,10 +38,16 @@ POOL_ctx* POOL_create_advanced(size_t numThreads, size_t queueSize,
|
|
38
38
|
*/
|
39
39
|
void POOL_free(POOL_ctx* ctx);
|
40
40
|
|
41
|
+
|
42
|
+
/*! POOL_joinJobs() :
|
43
|
+
* Waits for all queued jobs to finish executing.
|
44
|
+
*/
|
45
|
+
void POOL_joinJobs(POOL_ctx* ctx);
|
46
|
+
|
41
47
|
/*! POOL_resize() :
|
42
48
|
* Expands or shrinks pool's number of threads.
|
43
49
|
* This is more efficient than releasing + creating a new context,
|
44
|
-
* since it tries to preserve and
|
50
|
+
* since it tries to preserve and reuse existing threads.
|
45
51
|
* `numThreads` must be at least 1.
|
46
52
|
* @return : 0 when resize was successful,
|
47
53
|
* !0 (typically 1) if there is an error.
|
@@ -53,7 +59,7 @@ int POOL_resize(POOL_ctx* ctx, size_t numThreads);
|
|
53
59
|
* @return threadpool memory usage
|
54
60
|
* note : compatible with NULL (returns 0 in this case)
|
55
61
|
*/
|
56
|
-
size_t POOL_sizeof(POOL_ctx* ctx);
|
62
|
+
size_t POOL_sizeof(const POOL_ctx* ctx);
|
57
63
|
|
58
64
|
/*! POOL_function :
|
59
65
|
* The function type that can be added to a thread pool.
|
@@ -70,7 +76,7 @@ void POOL_add(POOL_ctx* ctx, POOL_function function, void* opaque);
|
|
70
76
|
|
71
77
|
|
72
78
|
/*! POOL_tryAdd() :
|
73
|
-
* Add the job `function(opaque)` to thread pool _if_ a
|
79
|
+
* Add the job `function(opaque)` to thread pool _if_ a queue slot is available.
|
74
80
|
* Returns immediately even if not (does not block).
|
75
81
|
* @return : 1 if successful, 0 if not.
|
76
82
|
*/
|
@@ -0,0 +1,158 @@
|
|
1
|
+
/*
|
2
|
+
* Copyright (c) Meta Platforms, Inc. and affiliates.
|
3
|
+
* All rights reserved.
|
4
|
+
*
|
5
|
+
* This source code is licensed under both the BSD-style license (found in the
|
6
|
+
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
7
|
+
* in the COPYING file in the root directory of this source tree).
|
8
|
+
* You may select, at your option, one of the above-listed licenses.
|
9
|
+
*/
|
10
|
+
|
11
|
+
#ifndef ZSTD_PORTABILITY_MACROS_H
|
12
|
+
#define ZSTD_PORTABILITY_MACROS_H
|
13
|
+
|
14
|
+
/**
|
15
|
+
* This header file contains macro definitions to support portability.
|
16
|
+
* This header is shared between C and ASM code, so it MUST only
|
17
|
+
* contain macro definitions. It MUST not contain any C code.
|
18
|
+
*
|
19
|
+
* This header ONLY defines macros to detect platforms/feature support.
|
20
|
+
*
|
21
|
+
*/
|
22
|
+
|
23
|
+
|
24
|
+
/* compat. with non-clang compilers */
|
25
|
+
#ifndef __has_attribute
|
26
|
+
#define __has_attribute(x) 0
|
27
|
+
#endif
|
28
|
+
|
29
|
+
/* compat. with non-clang compilers */
|
30
|
+
#ifndef __has_builtin
|
31
|
+
# define __has_builtin(x) 0
|
32
|
+
#endif
|
33
|
+
|
34
|
+
/* compat. with non-clang compilers */
|
35
|
+
#ifndef __has_feature
|
36
|
+
# define __has_feature(x) 0
|
37
|
+
#endif
|
38
|
+
|
39
|
+
/* detects whether we are being compiled under msan */
|
40
|
+
#ifndef ZSTD_MEMORY_SANITIZER
|
41
|
+
# if __has_feature(memory_sanitizer)
|
42
|
+
# define ZSTD_MEMORY_SANITIZER 1
|
43
|
+
# else
|
44
|
+
# define ZSTD_MEMORY_SANITIZER 0
|
45
|
+
# endif
|
46
|
+
#endif
|
47
|
+
|
48
|
+
/* detects whether we are being compiled under asan */
|
49
|
+
#ifndef ZSTD_ADDRESS_SANITIZER
|
50
|
+
# if __has_feature(address_sanitizer)
|
51
|
+
# define ZSTD_ADDRESS_SANITIZER 1
|
52
|
+
# elif defined(__SANITIZE_ADDRESS__)
|
53
|
+
# define ZSTD_ADDRESS_SANITIZER 1
|
54
|
+
# else
|
55
|
+
# define ZSTD_ADDRESS_SANITIZER 0
|
56
|
+
# endif
|
57
|
+
#endif
|
58
|
+
|
59
|
+
/* detects whether we are being compiled under dfsan */
|
60
|
+
#ifndef ZSTD_DATAFLOW_SANITIZER
|
61
|
+
# if __has_feature(dataflow_sanitizer)
|
62
|
+
# define ZSTD_DATAFLOW_SANITIZER 1
|
63
|
+
# else
|
64
|
+
# define ZSTD_DATAFLOW_SANITIZER 0
|
65
|
+
# endif
|
66
|
+
#endif
|
67
|
+
|
68
|
+
/* Mark the internal assembly functions as hidden */
|
69
|
+
#ifdef __ELF__
|
70
|
+
# define ZSTD_HIDE_ASM_FUNCTION(func) .hidden func
|
71
|
+
#elif defined(__APPLE__)
|
72
|
+
# define ZSTD_HIDE_ASM_FUNCTION(func) .private_extern func
|
73
|
+
#else
|
74
|
+
# define ZSTD_HIDE_ASM_FUNCTION(func)
|
75
|
+
#endif
|
76
|
+
|
77
|
+
/* Enable runtime BMI2 dispatch based on the CPU.
|
78
|
+
* Enabled for clang & gcc >=4.8 on x86 when BMI2 isn't enabled by default.
|
79
|
+
*/
|
80
|
+
#ifndef DYNAMIC_BMI2
|
81
|
+
#if ((defined(__clang__) && __has_attribute(__target__)) \
|
82
|
+
|| (defined(__GNUC__) \
|
83
|
+
&& (__GNUC__ >= 5 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 8)))) \
|
84
|
+
&& (defined(__x86_64__) || defined(_M_X64)) \
|
85
|
+
&& !defined(__BMI2__)
|
86
|
+
# define DYNAMIC_BMI2 1
|
87
|
+
#else
|
88
|
+
# define DYNAMIC_BMI2 0
|
89
|
+
#endif
|
90
|
+
#endif
|
91
|
+
|
92
|
+
/**
|
93
|
+
* Only enable assembly for GNUC compatible compilers,
|
94
|
+
* because other platforms may not support GAS assembly syntax.
|
95
|
+
*
|
96
|
+
* Only enable assembly for Linux / MacOS, other platforms may
|
97
|
+
* work, but they haven't been tested. This could likely be
|
98
|
+
* extended to BSD systems.
|
99
|
+
*
|
100
|
+
* Disable assembly when MSAN is enabled, because MSAN requires
|
101
|
+
* 100% of code to be instrumented to work.
|
102
|
+
*/
|
103
|
+
#if defined(__GNUC__)
|
104
|
+
# if defined(__linux__) || defined(__linux) || defined(__APPLE__)
|
105
|
+
# if ZSTD_MEMORY_SANITIZER
|
106
|
+
# define ZSTD_ASM_SUPPORTED 0
|
107
|
+
# elif ZSTD_DATAFLOW_SANITIZER
|
108
|
+
# define ZSTD_ASM_SUPPORTED 0
|
109
|
+
# else
|
110
|
+
# define ZSTD_ASM_SUPPORTED 1
|
111
|
+
# endif
|
112
|
+
# else
|
113
|
+
# define ZSTD_ASM_SUPPORTED 0
|
114
|
+
# endif
|
115
|
+
#else
|
116
|
+
# define ZSTD_ASM_SUPPORTED 0
|
117
|
+
#endif
|
118
|
+
|
119
|
+
/**
|
120
|
+
* Determines whether we should enable assembly for x86-64
|
121
|
+
* with BMI2.
|
122
|
+
*
|
123
|
+
* Enable if all of the following conditions hold:
|
124
|
+
* - ASM hasn't been explicitly disabled by defining ZSTD_DISABLE_ASM
|
125
|
+
* - Assembly is supported
|
126
|
+
* - We are compiling for x86-64 and either:
|
127
|
+
* - DYNAMIC_BMI2 is enabled
|
128
|
+
* - BMI2 is supported at compile time
|
129
|
+
*/
|
130
|
+
#if !defined(ZSTD_DISABLE_ASM) && \
|
131
|
+
ZSTD_ASM_SUPPORTED && \
|
132
|
+
defined(__x86_64__) && \
|
133
|
+
(DYNAMIC_BMI2 || defined(__BMI2__))
|
134
|
+
# define ZSTD_ENABLE_ASM_X86_64_BMI2 1
|
135
|
+
#else
|
136
|
+
# define ZSTD_ENABLE_ASM_X86_64_BMI2 0
|
137
|
+
#endif
|
138
|
+
|
139
|
+
/*
|
140
|
+
* For x86 ELF targets, add .note.gnu.property section for Intel CET in
|
141
|
+
* assembly sources when CET is enabled.
|
142
|
+
*
|
143
|
+
* Additionally, any function that may be called indirectly must begin
|
144
|
+
* with ZSTD_CET_ENDBRANCH.
|
145
|
+
*/
|
146
|
+
#if defined(__ELF__) && (defined(__x86_64__) || defined(__i386__)) \
|
147
|
+
&& defined(__has_include)
|
148
|
+
# if __has_include(<cet.h>)
|
149
|
+
# include <cet.h>
|
150
|
+
# define ZSTD_CET_ENDBRANCH _CET_ENDBR
|
151
|
+
# endif
|
152
|
+
#endif
|
153
|
+
|
154
|
+
#ifndef ZSTD_CET_ENDBRANCH
|
155
|
+
# define ZSTD_CET_ENDBRANCH
|
156
|
+
#endif
|
157
|
+
|
158
|
+
#endif /* ZSTD_PORTABILITY_MACROS_H */
|
@@ -23,8 +23,7 @@ int g_ZSTD_threading_useless_symbol;
|
|
23
23
|
#if defined(ZSTD_MULTITHREAD) && defined(_WIN32)
|
24
24
|
|
25
25
|
/**
|
26
|
-
* Windows minimalist Pthread Wrapper
|
27
|
-
* http://www.cse.wustl.edu/~schmidt/win32-cv-1.html
|
26
|
+
* Windows minimalist Pthread Wrapper
|
28
27
|
*/
|
29
28
|
|
30
29
|
|
@@ -35,37 +34,94 @@ int g_ZSTD_threading_useless_symbol;
|
|
35
34
|
|
36
35
|
/* === Implementation === */
|
37
36
|
|
37
|
+
typedef struct {
|
38
|
+
void* (*start_routine)(void*);
|
39
|
+
void* arg;
|
40
|
+
int initialized;
|
41
|
+
ZSTD_pthread_cond_t initialized_cond;
|
42
|
+
ZSTD_pthread_mutex_t initialized_mutex;
|
43
|
+
} ZSTD_thread_params_t;
|
44
|
+
|
38
45
|
static unsigned __stdcall worker(void *arg)
|
39
46
|
{
|
40
|
-
|
41
|
-
|
47
|
+
void* (*start_routine)(void*);
|
48
|
+
void* thread_arg;
|
49
|
+
|
50
|
+
/* Initialized thread_arg and start_routine and signal main thread that we don't need it
|
51
|
+
* to wait any longer.
|
52
|
+
*/
|
53
|
+
{
|
54
|
+
ZSTD_thread_params_t* thread_param = (ZSTD_thread_params_t*)arg;
|
55
|
+
thread_arg = thread_param->arg;
|
56
|
+
start_routine = thread_param->start_routine;
|
57
|
+
|
58
|
+
/* Signal main thread that we are running and do not depend on its memory anymore */
|
59
|
+
ZSTD_pthread_mutex_lock(&thread_param->initialized_mutex);
|
60
|
+
thread_param->initialized = 1;
|
61
|
+
ZSTD_pthread_cond_signal(&thread_param->initialized_cond);
|
62
|
+
ZSTD_pthread_mutex_unlock(&thread_param->initialized_mutex);
|
63
|
+
}
|
64
|
+
|
65
|
+
start_routine(thread_arg);
|
66
|
+
|
42
67
|
return 0;
|
43
68
|
}
|
44
69
|
|
45
70
|
int ZSTD_pthread_create(ZSTD_pthread_t* thread, const void* unused,
|
46
71
|
void* (*start_routine) (void*), void* arg)
|
47
72
|
{
|
73
|
+
ZSTD_thread_params_t thread_param;
|
48
74
|
(void)unused;
|
49
|
-
thread->arg = arg;
|
50
|
-
thread->start_routine = start_routine;
|
51
|
-
thread->handle = (HANDLE) _beginthreadex(NULL, 0, worker, thread, 0, NULL);
|
52
75
|
|
53
|
-
if (
|
76
|
+
if (thread==NULL) return -1;
|
77
|
+
*thread = NULL;
|
78
|
+
|
79
|
+
thread_param.start_routine = start_routine;
|
80
|
+
thread_param.arg = arg;
|
81
|
+
thread_param.initialized = 0;
|
82
|
+
|
83
|
+
/* Setup thread initialization synchronization */
|
84
|
+
if(ZSTD_pthread_cond_init(&thread_param.initialized_cond, NULL)) {
|
85
|
+
/* Should never happen on Windows */
|
86
|
+
return -1;
|
87
|
+
}
|
88
|
+
if(ZSTD_pthread_mutex_init(&thread_param.initialized_mutex, NULL)) {
|
89
|
+
/* Should never happen on Windows */
|
90
|
+
ZSTD_pthread_cond_destroy(&thread_param.initialized_cond);
|
91
|
+
return -1;
|
92
|
+
}
|
93
|
+
|
94
|
+
/* Spawn thread */
|
95
|
+
*thread = (HANDLE)_beginthreadex(NULL, 0, worker, &thread_param, 0, NULL);
|
96
|
+
if (*thread==NULL) {
|
97
|
+
ZSTD_pthread_mutex_destroy(&thread_param.initialized_mutex);
|
98
|
+
ZSTD_pthread_cond_destroy(&thread_param.initialized_cond);
|
54
99
|
return errno;
|
55
|
-
|
56
|
-
|
100
|
+
}
|
101
|
+
|
102
|
+
/* Wait for thread to be initialized */
|
103
|
+
ZSTD_pthread_mutex_lock(&thread_param.initialized_mutex);
|
104
|
+
while(!thread_param.initialized) {
|
105
|
+
ZSTD_pthread_cond_wait(&thread_param.initialized_cond, &thread_param.initialized_mutex);
|
106
|
+
}
|
107
|
+
ZSTD_pthread_mutex_unlock(&thread_param.initialized_mutex);
|
108
|
+
ZSTD_pthread_mutex_destroy(&thread_param.initialized_mutex);
|
109
|
+
ZSTD_pthread_cond_destroy(&thread_param.initialized_cond);
|
110
|
+
|
111
|
+
return 0;
|
57
112
|
}
|
58
113
|
|
59
|
-
int ZSTD_pthread_join(ZSTD_pthread_t thread
|
114
|
+
int ZSTD_pthread_join(ZSTD_pthread_t thread)
|
60
115
|
{
|
61
116
|
DWORD result;
|
62
117
|
|
63
|
-
if (!thread
|
118
|
+
if (!thread) return 0;
|
119
|
+
|
120
|
+
result = WaitForSingleObject(thread, INFINITE);
|
121
|
+
CloseHandle(thread);
|
64
122
|
|
65
|
-
result = WaitForSingleObject(thread.handle, INFINITE);
|
66
123
|
switch (result) {
|
67
124
|
case WAIT_OBJECT_0:
|
68
|
-
if (value_ptr) *value_ptr = thread.arg;
|
69
125
|
return 0;
|
70
126
|
case WAIT_ABANDONED:
|
71
127
|
return EINVAL;
|
@@ -83,6 +139,7 @@ int ZSTD_pthread_join(ZSTD_pthread_t thread, void **value_ptr)
|
|
83
139
|
|
84
140
|
int ZSTD_pthread_mutex_init(ZSTD_pthread_mutex_t* mutex, pthread_mutexattr_t const* attr)
|
85
141
|
{
|
142
|
+
assert(mutex != NULL);
|
86
143
|
*mutex = (pthread_mutex_t*)ZSTD_malloc(sizeof(pthread_mutex_t));
|
87
144
|
if (!*mutex)
|
88
145
|
return 1;
|
@@ -91,6 +148,7 @@ int ZSTD_pthread_mutex_init(ZSTD_pthread_mutex_t* mutex, pthread_mutexattr_t con
|
|
91
148
|
|
92
149
|
int ZSTD_pthread_mutex_destroy(ZSTD_pthread_mutex_t* mutex)
|
93
150
|
{
|
151
|
+
assert(mutex != NULL);
|
94
152
|
if (!*mutex)
|
95
153
|
return 0;
|
96
154
|
{
|
@@ -102,6 +160,7 @@ int ZSTD_pthread_mutex_destroy(ZSTD_pthread_mutex_t* mutex)
|
|
102
160
|
|
103
161
|
int ZSTD_pthread_cond_init(ZSTD_pthread_cond_t* cond, pthread_condattr_t const* attr)
|
104
162
|
{
|
163
|
+
assert(cond != NULL);
|
105
164
|
*cond = (pthread_cond_t*)ZSTD_malloc(sizeof(pthread_cond_t));
|
106
165
|
if (!*cond)
|
107
166
|
return 1;
|
@@ -110,6 +169,7 @@ int ZSTD_pthread_cond_init(ZSTD_pthread_cond_t* cond, pthread_condattr_t const*
|
|
110
169
|
|
111
170
|
int ZSTD_pthread_cond_destroy(ZSTD_pthread_cond_t* cond)
|
112
171
|
{
|
172
|
+
assert(cond != NULL);
|
113
173
|
if (!*cond)
|
114
174
|
return 0;
|
115
175
|
{
|
@@ -23,8 +23,7 @@ extern "C" {
|
|
23
23
|
#if defined(ZSTD_MULTITHREAD) && defined(_WIN32)
|
24
24
|
|
25
25
|
/**
|
26
|
-
* Windows minimalist Pthread Wrapper
|
27
|
-
* http://www.cse.wustl.edu/~schmidt/win32-cv-1.html
|
26
|
+
* Windows minimalist Pthread Wrapper
|
28
27
|
*/
|
29
28
|
#ifdef WINVER
|
30
29
|
# undef WINVER
|
@@ -62,16 +61,12 @@ extern "C" {
|
|
62
61
|
#define ZSTD_pthread_cond_broadcast(a) WakeAllConditionVariable((a))
|
63
62
|
|
64
63
|
/* ZSTD_pthread_create() and ZSTD_pthread_join() */
|
65
|
-
typedef
|
66
|
-
HANDLE handle;
|
67
|
-
void* (*start_routine)(void*);
|
68
|
-
void* arg;
|
69
|
-
} ZSTD_pthread_t;
|
64
|
+
typedef HANDLE ZSTD_pthread_t;
|
70
65
|
|
71
66
|
int ZSTD_pthread_create(ZSTD_pthread_t* thread, const void* unused,
|
72
67
|
void* (*start_routine) (void*), void* arg);
|
73
68
|
|
74
|
-
int ZSTD_pthread_join(ZSTD_pthread_t thread
|
69
|
+
int ZSTD_pthread_join(ZSTD_pthread_t thread);
|
75
70
|
|
76
71
|
/**
|
77
72
|
* add here more wrappers as required
|
@@ -99,7 +94,7 @@ int ZSTD_pthread_join(ZSTD_pthread_t thread, void** value_ptr);
|
|
99
94
|
|
100
95
|
#define ZSTD_pthread_t pthread_t
|
101
96
|
#define ZSTD_pthread_create(a, b, c, d) pthread_create((a), (b), (c), (d))
|
102
|
-
#define ZSTD_pthread_join(a
|
97
|
+
#define ZSTD_pthread_join(a) pthread_join((a),NULL)
|
103
98
|
|
104
99
|
#else /* DEBUGLEVEL >= 1 */
|
105
100
|
|
@@ -124,7 +119,7 @@ int ZSTD_pthread_cond_destroy(ZSTD_pthread_cond_t* cond);
|
|
124
119
|
|
125
120
|
#define ZSTD_pthread_t pthread_t
|
126
121
|
#define ZSTD_pthread_create(a, b, c, d) pthread_create((a), (b), (c), (d))
|
127
|
-
#define ZSTD_pthread_join(a
|
122
|
+
#define ZSTD_pthread_join(a) pthread_join((a),NULL)
|
128
123
|
|
129
124
|
#endif
|
130
125
|
|