extbzip3 0.0.1
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/LICENSE +24 -0
- data/README.md +159 -0
- data/Rakefile +247 -0
- data/ext/compat.h +32 -0
- data/ext/extbzip3.c +220 -0
- data/ext/extbzip3.h +279 -0
- data/ext/extbzip3_decoder.c +484 -0
- data/ext/extbzip3_encoder.c +344 -0
- data/ext/extconf.rb +43 -0
- data/gemstub.rb +17 -0
- data/lib/extbzip3/decoder.rb +90 -0
- data/lib/extbzip3/fordoc.rb +38 -0
- data/lib/extbzip3/version.rb +8 -0
- data/lib/extbzip3.rb +65 -0
- data/test/test_bzip3.rb +77 -0
- metadata +91 -0
@@ -0,0 +1,344 @@
|
|
1
|
+
#include "extbzip3.h"
|
2
|
+
|
3
|
+
static inline int
|
4
|
+
aux_oneshot_encode(int format, uint32_t blocksize, const void *in, void *out, size_t insize, size_t *outsize)
|
5
|
+
{
|
6
|
+
if (blocksize < AUX_BZIP3_BLOCKSIZE_MIN) {
|
7
|
+
blocksize = AUX_BZIP3_BLOCKSIZE_MIN;
|
8
|
+
} else if (blocksize > AUX_BZIP3_BLOCKSIZE_MAX) {
|
9
|
+
return BZ3_ERR_INIT;
|
10
|
+
}
|
11
|
+
|
12
|
+
if (!outsize) {
|
13
|
+
return BZ3_ERR_INIT;
|
14
|
+
}
|
15
|
+
|
16
|
+
int headersize;
|
17
|
+
size_t blockcount;
|
18
|
+
if (format == AUX_BZIP3_V1_FILE_FORMAT) {
|
19
|
+
headersize = 9;
|
20
|
+
blockcount = 0;
|
21
|
+
} else {
|
22
|
+
headersize = 13;
|
23
|
+
blockcount = (insize / blocksize) + ((insize % blocksize != 0) ? 1 : 0);
|
24
|
+
|
25
|
+
if (blockcount > (UINT32_MAX - 1)) {
|
26
|
+
return BZ3_ERR_DATA_TOO_BIG;
|
27
|
+
}
|
28
|
+
}
|
29
|
+
|
30
|
+
if (*outsize < (size_t)headersize) {
|
31
|
+
return BZ3_ERR_INIT;
|
32
|
+
}
|
33
|
+
|
34
|
+
struct bz3_state *bz3 = bz3_new(blocksize);
|
35
|
+
if (bz3 == NULL) {
|
36
|
+
return BZ3_ERR_INIT;
|
37
|
+
}
|
38
|
+
|
39
|
+
const uint8_t *inp = (const uint8_t *)in;
|
40
|
+
const uint8_t *const inend = inp + insize;
|
41
|
+
uint8_t *outp = (uint8_t *)out + headersize;
|
42
|
+
uint8_t *const outend = outp + *outsize;
|
43
|
+
|
44
|
+
while (inend - inp > 0) {
|
45
|
+
uint32_t origsize = ((inend - inp) > blocksize) ? blocksize : (uint32_t)(inend - inp);
|
46
|
+
uint32_t packedsize = (uint32_t)bz3_bound(origsize); // TODO???: 過剰な値かも?
|
47
|
+
|
48
|
+
if (outend - outp < packedsize) {
|
49
|
+
bz3_free(bz3);
|
50
|
+
return BZ3_ERR_DATA_TOO_BIG;
|
51
|
+
}
|
52
|
+
|
53
|
+
outp += 8;
|
54
|
+
|
55
|
+
memmove(outp, inp, origsize);
|
56
|
+
int32_t ret = aux_bz3_encode_block_nogvl(bz3, outp, origsize);
|
57
|
+
if (ret < 0) {
|
58
|
+
bz3_free(bz3);
|
59
|
+
return ret;
|
60
|
+
}
|
61
|
+
|
62
|
+
storeu32le(outp - 8, ret);
|
63
|
+
storeu32le(outp - 4, origsize);
|
64
|
+
|
65
|
+
inp += origsize;
|
66
|
+
outp += ret;
|
67
|
+
}
|
68
|
+
|
69
|
+
bz3_free(bz3);
|
70
|
+
|
71
|
+
*outsize = (size_t)(outp - (const uint8_t *)out);
|
72
|
+
|
73
|
+
memmove(out, aux_bzip3_signature, sizeof(aux_bzip3_signature));
|
74
|
+
storeu32le((char *)out + 5, blocksize);
|
75
|
+
|
76
|
+
if (format == AUX_BZIP3_V1_FRAME_FORMAT) {
|
77
|
+
storeu32le((char *)out + 9, (uint32_t)blockcount);
|
78
|
+
}
|
79
|
+
|
80
|
+
return BZ3_OK;
|
81
|
+
}
|
82
|
+
|
83
|
+
struct encoder
|
84
|
+
{
|
85
|
+
struct bz3_state *bzip3;
|
86
|
+
uint32_t blocksize;
|
87
|
+
int firstwrite:1;
|
88
|
+
int closed:1;
|
89
|
+
VALUE outport;
|
90
|
+
VALUE srcbuf;
|
91
|
+
VALUE destbuf;
|
92
|
+
};
|
93
|
+
|
94
|
+
#define ENCODER_FREE_BLOCK(P) \
|
95
|
+
if ((P)->bzip3) { \
|
96
|
+
bz3_free((P)->bzip3); \
|
97
|
+
} \
|
98
|
+
|
99
|
+
#define ENCODER_VALUE_FOREACH(DEF) \
|
100
|
+
DEF(outport) \
|
101
|
+
DEF(srcbuf) \
|
102
|
+
DEF(destbuf) \
|
103
|
+
|
104
|
+
AUX_DEFINE_TYPED_DATA(encoder, encoder_allocate, ENCODER_FREE_BLOCK, ENCODER_VALUE_FOREACH)
|
105
|
+
|
106
|
+
/*
|
107
|
+
* @overload initialize(blocksize: (16 << 20))
|
108
|
+
*/
|
109
|
+
static VALUE
|
110
|
+
encoder_initialize(int argc, VALUE argv[], VALUE self)
|
111
|
+
{
|
112
|
+
struct { VALUE outport, opts; } args;
|
113
|
+
rb_scan_args(argc, argv, "1:", &args.outport, &args.opts);
|
114
|
+
|
115
|
+
enum { numkw = 1 };
|
116
|
+
ID idtab[numkw] = { rb_intern("blocksize") };
|
117
|
+
union { struct { VALUE blocksize; }; VALUE vect[numkw]; } opts;
|
118
|
+
rb_get_kwargs(args.opts, idtab, 0, numkw, opts.vect);
|
119
|
+
|
120
|
+
struct encoder *p = (struct encoder *)rb_check_typeddata(self, &encoder_type);
|
121
|
+
if (p == NULL || p->bzip3) {
|
122
|
+
rb_raise(rb_eTypeError, "wrong initialized or re-initializing - %" PRIsVALUE, self);
|
123
|
+
}
|
124
|
+
|
125
|
+
p->blocksize = aux_conv_to_blocksize(opts.blocksize);
|
126
|
+
p->outport = args.outport;
|
127
|
+
p->srcbuf = Qnil;
|
128
|
+
p->destbuf = Qnil;
|
129
|
+
p->bzip3 = aux_bz3_new(p->blocksize);
|
130
|
+
p->firstwrite = 1;
|
131
|
+
|
132
|
+
return self;
|
133
|
+
}
|
134
|
+
|
135
|
+
static VALUE
|
136
|
+
encoder_outport(VALUE self)
|
137
|
+
{
|
138
|
+
return get_encoder(self)->outport;
|
139
|
+
}
|
140
|
+
|
141
|
+
static void
|
142
|
+
encoder_write_encode(VALUE self, struct encoder *p, const void *buf, size_t len)
|
143
|
+
{
|
144
|
+
size_t bufoff = 8 + (p->firstwrite ? 9 : 0);
|
145
|
+
|
146
|
+
p->destbuf = aux_str_new_recycle(p->destbuf, bufoff + bz3_bound(len));
|
147
|
+
rb_str_set_len(p->destbuf, bufoff);
|
148
|
+
rb_str_cat(p->destbuf, buf, len);
|
149
|
+
|
150
|
+
int32_t res = aux_bz3_encode_block_nogvl(p->bzip3, RSTRING_PTR(p->destbuf) + bufoff, RSTRING_LEN(p->destbuf) - bufoff);
|
151
|
+
|
152
|
+
if (res < 0) {
|
153
|
+
extbzip3_check_error(res);
|
154
|
+
}
|
155
|
+
|
156
|
+
rb_str_set_len(p->destbuf, bufoff + res);
|
157
|
+
storeu32le(RSTRING_PTR(p->destbuf) + bufoff - 8, res);
|
158
|
+
storeu32le(RSTRING_PTR(p->destbuf) + bufoff - 4, (uint32_t)len);
|
159
|
+
|
160
|
+
if (p->firstwrite) {
|
161
|
+
memcpy(RSTRING_PTR(p->destbuf), "BZ3v1", 5);
|
162
|
+
storeu32le(RSTRING_PTR(p->destbuf) + 5, p->blocksize);
|
163
|
+
p->firstwrite = 0;
|
164
|
+
}
|
165
|
+
|
166
|
+
rb_funcallv(p->outport, rb_intern("<<"), 1, &p->destbuf);
|
167
|
+
}
|
168
|
+
|
169
|
+
static VALUE
|
170
|
+
encoder_write(VALUE self, VALUE src)
|
171
|
+
{
|
172
|
+
struct encoder *p = get_encoder(self);
|
173
|
+
|
174
|
+
rb_check_type(src, RUBY_T_STRING);
|
175
|
+
|
176
|
+
size_t srclen = RSTRING_LEN(src);
|
177
|
+
|
178
|
+
if (srclen <= p->blocksize) {
|
179
|
+
if (rb_type_p(p->srcbuf, RUBY_T_STRING)) {
|
180
|
+
size_t srcbuflen = RSTRING_LEN(p->srcbuf);
|
181
|
+
size_t catlen = srclen + srcbuflen;
|
182
|
+
|
183
|
+
if (catlen >= p->blocksize) {
|
184
|
+
rb_str_cat(p->srcbuf, RSTRING_PTR(src), p->blocksize - srcbuflen);
|
185
|
+
encoder_write_encode(self, p, RSTRING_PTR(p->srcbuf), RSTRING_LEN(p->srcbuf));
|
186
|
+
rb_str_set_len(p->srcbuf, 0);
|
187
|
+
rb_str_cat(p->srcbuf, RSTRING_PTR(src) + p->blocksize - srcbuflen, srclen - (p->blocksize - srcbuflen));
|
188
|
+
|
189
|
+
return self;
|
190
|
+
}
|
191
|
+
} else {
|
192
|
+
p->srcbuf = rb_str_new(0, 0);
|
193
|
+
}
|
194
|
+
|
195
|
+
rb_str_cat(p->srcbuf, RSTRING_PTR(src), srclen);
|
196
|
+
|
197
|
+
return self;
|
198
|
+
} else {
|
199
|
+
size_t srcoff = 0;
|
200
|
+
|
201
|
+
if (rb_type_p(p->srcbuf, RUBY_T_STRING) && RSTRING_LEN(p->srcbuf) > 0) {
|
202
|
+
srcoff = p->blocksize - RSTRING_LEN(p->srcbuf);
|
203
|
+
rb_str_cat(p->srcbuf, RSTRING_PTR(src), srcoff);
|
204
|
+
encoder_write_encode(self, p, RSTRING_PTR(p->srcbuf), RSTRING_LEN(p->srcbuf));
|
205
|
+
rb_str_set_len(p->srcbuf, 0);
|
206
|
+
srclen = RSTRING_LEN(src); // maybe changed src with `outport << destbuf`
|
207
|
+
if (srclen < srcoff) {
|
208
|
+
return self;
|
209
|
+
}
|
210
|
+
}
|
211
|
+
|
212
|
+
while (srclen - srcoff > p->blocksize) {
|
213
|
+
encoder_write_encode(self, p, RSTRING_PTR(src) + srcoff, p->blocksize);
|
214
|
+
srcoff += p->blocksize;
|
215
|
+
srclen = RSTRING_LEN(src); // maybe changed src with `outport << destbuf`
|
216
|
+
if (srclen < srcoff) {
|
217
|
+
return self;
|
218
|
+
}
|
219
|
+
}
|
220
|
+
|
221
|
+
if (srcoff < srclen) {
|
222
|
+
if (!rb_type_p(p->srcbuf, RUBY_T_STRING)) {
|
223
|
+
p->srcbuf = rb_str_new(0, 0);
|
224
|
+
}
|
225
|
+
|
226
|
+
rb_str_cat(p->srcbuf, RSTRING_PTR(src), srclen - srcoff);
|
227
|
+
}
|
228
|
+
|
229
|
+
return self;
|
230
|
+
}
|
231
|
+
}
|
232
|
+
|
233
|
+
static VALUE
|
234
|
+
encoder_flush(VALUE self)
|
235
|
+
{
|
236
|
+
struct encoder *p = get_encoder(self);
|
237
|
+
|
238
|
+
if (rb_type_p(p->srcbuf, RUBY_T_STRING) && RSTRING_LEN(p->srcbuf) > 0) {
|
239
|
+
encoder_write_encode(self, p, RSTRING_PTR(p->srcbuf), RSTRING_LEN(p->srcbuf));
|
240
|
+
rb_str_set_len(p->srcbuf, 0);
|
241
|
+
}
|
242
|
+
|
243
|
+
return Qnil;
|
244
|
+
}
|
245
|
+
|
246
|
+
static VALUE
|
247
|
+
encoder_close(VALUE self)
|
248
|
+
{
|
249
|
+
struct encoder *p = get_encoder(self);
|
250
|
+
|
251
|
+
if (rb_type_p(p->srcbuf, RUBY_T_STRING) && RSTRING_LEN(p->srcbuf) > 0) {
|
252
|
+
encoder_write_encode(self, p, RSTRING_PTR(p->srcbuf), RSTRING_LEN(p->srcbuf));
|
253
|
+
rb_str_set_len(p->srcbuf, 0);
|
254
|
+
}
|
255
|
+
|
256
|
+
p->closed = 1;
|
257
|
+
|
258
|
+
return Qnil;
|
259
|
+
}
|
260
|
+
|
261
|
+
static VALUE
|
262
|
+
encoder_closed_p(VALUE self)
|
263
|
+
{
|
264
|
+
return get_encoder(self)->closed ? Qtrue : Qfalse;
|
265
|
+
}
|
266
|
+
|
267
|
+
/*
|
268
|
+
* @overload encode(src, maxdest = nil, dest = "", **opts)
|
269
|
+
* @overload encode(src, dest, **opts)
|
270
|
+
*
|
271
|
+
* @return [String]
|
272
|
+
* dest as decompression data
|
273
|
+
* @param [String] src
|
274
|
+
* @param [Integer] maxdest
|
275
|
+
* @param [String] dest
|
276
|
+
* @option opts [Integer] :blocksize ((16 << 20))
|
277
|
+
* @option opts :format (Bzip3::V1_FILE_FORMAT)
|
278
|
+
* Bzip3::V1_FILE_FORMAT, Bzip3::V1_FRAME_FORMAT
|
279
|
+
*/
|
280
|
+
static VALUE
|
281
|
+
encoder_s_encode(int argc, VALUE argv[], VALUE mod)
|
282
|
+
{
|
283
|
+
size_t insize, outsize;
|
284
|
+
struct { VALUE src, maxdest, dest, opts; } args;
|
285
|
+
switch (rb_scan_args(argc, argv, "12:", &args.src, &args.maxdest, &args.dest, &args.opts)) {
|
286
|
+
case 1:
|
287
|
+
insize = RSTRING_LEN(args.src);
|
288
|
+
outsize = bz3_bound(insize);
|
289
|
+
args.dest = rb_str_buf_new(outsize);
|
290
|
+
break;
|
291
|
+
case 2:
|
292
|
+
insize = RSTRING_LEN(args.src);
|
293
|
+
|
294
|
+
if (rb_type_p(args.maxdest, RUBY_T_FIXNUM) || rb_type_p(args.maxdest, RUBY_T_BIGNUM)) {
|
295
|
+
outsize = NUM2SIZET(args.maxdest);
|
296
|
+
args.dest = rb_str_buf_new(outsize);
|
297
|
+
} else {
|
298
|
+
args.dest = args.maxdest;
|
299
|
+
outsize = bz3_bound(insize);
|
300
|
+
rb_str_modify(args.dest);
|
301
|
+
rb_str_set_len(args.dest, 0);
|
302
|
+
rb_str_modify_expand(args.dest, outsize);
|
303
|
+
}
|
304
|
+
|
305
|
+
break;
|
306
|
+
case 3:
|
307
|
+
insize = RSTRING_LEN(args.src);
|
308
|
+
outsize = NUM2SIZET(args.maxdest);
|
309
|
+
rb_str_modify(args.dest);
|
310
|
+
rb_str_set_len(args.dest, 0);
|
311
|
+
rb_str_modify_expand(args.dest, outsize);
|
312
|
+
|
313
|
+
break;
|
314
|
+
}
|
315
|
+
|
316
|
+
enum { numkw = 2 };
|
317
|
+
ID idtab[numkw] = { rb_intern("blocksize"), rb_intern("format") };
|
318
|
+
union { struct { VALUE blocksize, format; }; VALUE vect[numkw]; } opts;
|
319
|
+
rb_get_kwargs(args.opts, idtab, 0, numkw, opts.vect);
|
320
|
+
|
321
|
+
uint32_t blocksize = aux_conv_to_blocksize(opts.blocksize);
|
322
|
+
int status = aux_oneshot_encode(aux_conv_to_format(opts.format), blocksize,
|
323
|
+
RSTRING_PTR(args.src), RSTRING_PTR(args.dest),
|
324
|
+
insize, &outsize);
|
325
|
+
extbzip3_check_error(status);
|
326
|
+
rb_str_set_len(args.dest, outsize);
|
327
|
+
|
328
|
+
return args.dest;
|
329
|
+
}
|
330
|
+
|
331
|
+
void
|
332
|
+
extbzip3_init_encoder(VALUE bzip3_module)
|
333
|
+
{
|
334
|
+
VALUE encoder_class = rb_define_class_under(bzip3_module, "Encoder", rb_cObject);
|
335
|
+
rb_define_alloc_func(encoder_class, encoder_allocate);
|
336
|
+
rb_define_singleton_method(encoder_class, "encode", encoder_s_encode, -1);
|
337
|
+
rb_define_method(encoder_class, "initialize", encoder_initialize, -1);
|
338
|
+
rb_define_method(encoder_class, "outport", encoder_outport, 0);
|
339
|
+
rb_define_method(encoder_class, "write", encoder_write, 1);
|
340
|
+
rb_define_method(encoder_class, "flush", encoder_flush, 0);
|
341
|
+
rb_define_method(encoder_class, "close", encoder_close, 0);
|
342
|
+
rb_define_method(encoder_class, "closed?", encoder_closed_p, 0);
|
343
|
+
rb_define_alias(encoder_class, "<<", "write");
|
344
|
+
}
|
data/ext/extconf.rb
ADDED
@@ -0,0 +1,43 @@
|
|
1
|
+
#!ruby
|
2
|
+
|
3
|
+
require "mkmf"
|
4
|
+
|
5
|
+
using Module.new {
|
6
|
+
refine Object do
|
7
|
+
def has_function_modifier?(modifier_code)
|
8
|
+
try_compile(<<~CODE)
|
9
|
+
#{modifier_code}
|
10
|
+
void
|
11
|
+
func1(void) {
|
12
|
+
}
|
13
|
+
CODE
|
14
|
+
end
|
15
|
+
end
|
16
|
+
}
|
17
|
+
|
18
|
+
MakeMakefile::CONFIG["optflags"] = "-O0 -g3" if ENV["RUBY_EXTBZIP3_DEBUG"].to_i > 0
|
19
|
+
|
20
|
+
have_header("libbz3.h") or abort "need libbz3.h header file"
|
21
|
+
have_library("bzip3") or abort "need libbzip3 library"
|
22
|
+
|
23
|
+
if RbConfig::CONFIG["arch"] =~ /mingw/i
|
24
|
+
#$LDFLAGS << " -static-libgcc" if try_ldflags("-static-libgcc")
|
25
|
+
else
|
26
|
+
if try_compile(<<~"VISIBILITY")
|
27
|
+
__attribute__((visibility("hidden"))) int conftest(void) { return 0; }
|
28
|
+
VISIBILITY
|
29
|
+
|
30
|
+
if try_cflags("-fvisibility=hidden")
|
31
|
+
$CFLAGS << " -fvisibility=hidden"
|
32
|
+
$defs << %(-DEXTBZIP3_API='__attribute__((visibility("default")))')
|
33
|
+
end
|
34
|
+
end
|
35
|
+
end
|
36
|
+
|
37
|
+
mod = %w(__attribute__((__noreturn__)) __declspec(noreturn) [[noreturn]] _Noreturn).find { |m|
|
38
|
+
has_function_modifier?(m)
|
39
|
+
}
|
40
|
+
$defs << %(-DRBEXT_NORETURN='#{mod}')
|
41
|
+
|
42
|
+
create_header
|
43
|
+
create_makefile File.join(RUBY_VERSION.slice(/\d+\.\d+/), "extbzip3")
|
data/gemstub.rb
ADDED
@@ -0,0 +1,17 @@
|
|
1
|
+
require_relative "lib/extbzip3/version"
|
2
|
+
|
3
|
+
GEMSTUB = Gem::Specification.new do |s|
|
4
|
+
s.name = "extbzip3"
|
5
|
+
s.version = Bzip3::VERSION
|
6
|
+
s.summary = "ruby bindings for bzip3 (bz3)"
|
7
|
+
s.description = <<~DESCRIPT
|
8
|
+
unoficial ruby bindings for bzip3 (bz3) <https://github.com/kspalaiologos/bzip3>.
|
9
|
+
DESCRIPT
|
10
|
+
s.homepage = "https://github.com/dearblue/ruby-extbzip3"
|
11
|
+
s.licenses = %w(BSD-2-Clause LGPL-3.0+ Apache-2.0)
|
12
|
+
s.author = "dearblue"
|
13
|
+
s.email = "dearblue@users.osdn.me"
|
14
|
+
|
15
|
+
#s.required_ruby_version = ">= 2.0"
|
16
|
+
s.add_development_dependency "rake", "~> 0"
|
17
|
+
end
|
@@ -0,0 +1,90 @@
|
|
1
|
+
module Bzip3
|
2
|
+
remove_const :Decoder rescue nil
|
3
|
+
|
4
|
+
class Decoder
|
5
|
+
def initialize(inport, blocksize = 16 << 20)
|
6
|
+
@bzip3 = BlockProcessor.new(blocksize)
|
7
|
+
@inport = inport
|
8
|
+
@readbuf = nil
|
9
|
+
@destbuf = nil
|
10
|
+
@closed = false
|
11
|
+
@eof = false
|
12
|
+
|
13
|
+
self
|
14
|
+
end
|
15
|
+
|
16
|
+
def read(size = nil, buf = "".b)
|
17
|
+
buf ||= "".b
|
18
|
+
buf[0..-1] = "".b
|
19
|
+
|
20
|
+
return buf if size == 0
|
21
|
+
|
22
|
+
size &&= 0 | Integer(0 + size)
|
23
|
+
|
24
|
+
@readbuf ||= "".b
|
25
|
+
|
26
|
+
while true
|
27
|
+
if @destbuf
|
28
|
+
if size && @destbuf.bytesize >= size
|
29
|
+
buf << @destbuf.byteslice(0, size)
|
30
|
+
@destbuf[0...size] = "".b
|
31
|
+
break
|
32
|
+
else
|
33
|
+
buf << @destbuf
|
34
|
+
size -= @destbuf.bytesize if size
|
35
|
+
@destbuf[0..-1] = "".b
|
36
|
+
end
|
37
|
+
else
|
38
|
+
@destbuf = "".b
|
39
|
+
|
40
|
+
(sig, bs) = @inport.read(9)&.unpack("a5V")
|
41
|
+
raise "意図しない EOF" unless bs
|
42
|
+
raise "シグネチャが違う" unless sig == "BZ3v1"
|
43
|
+
raise "おかしなブロックサイズ" unless ((65 << 10) .. (511 << 20)).include? bs
|
44
|
+
raise "ブロックサイズがでかすぎ" unless bs <= @bzip3.blocksize
|
45
|
+
end
|
46
|
+
|
47
|
+
unless b1 = @inport.read(8)
|
48
|
+
@eof = true
|
49
|
+
break
|
50
|
+
end
|
51
|
+
raise "意図しない EOF" if b1.bytesize < 8
|
52
|
+
if b1.byteslice(0, 5) == "BZ3v1"
|
53
|
+
b2 = @inport.read(1)
|
54
|
+
if b2 && b2.bytesize > 0
|
55
|
+
b1 << b2
|
56
|
+
bs = b1.unpack1("@5V")
|
57
|
+
raise "ブロックサイズがでかすぎ" unless bs <= @bzip3.blocksize
|
58
|
+
next
|
59
|
+
end
|
60
|
+
end
|
61
|
+
(packedsize, originsize) = b1.unpack("VV")
|
62
|
+
raise "元のデータがデカすぎ" unless originsize <= @bzip3.blocksize
|
63
|
+
raise "意図しない EOF" unless @inport.read(packedsize, @readbuf)
|
64
|
+
raise "大きさがあってない" unless @readbuf.bytesize == packedsize
|
65
|
+
@bzip3.decode(@readbuf, @destbuf, originsize)
|
66
|
+
end
|
67
|
+
|
68
|
+
buf.empty? ? nil : buf
|
69
|
+
end
|
70
|
+
|
71
|
+
def close
|
72
|
+
@closed = true
|
73
|
+
@bzip3 = nil
|
74
|
+
@readbuf = nil
|
75
|
+
@destbuf = nil
|
76
|
+
|
77
|
+
self
|
78
|
+
end
|
79
|
+
|
80
|
+
def closed?
|
81
|
+
@closed
|
82
|
+
end
|
83
|
+
|
84
|
+
def eof?
|
85
|
+
@eof
|
86
|
+
end
|
87
|
+
|
88
|
+
alias :eof :eof?
|
89
|
+
end
|
90
|
+
end
|
@@ -0,0 +1,38 @@
|
|
1
|
+
# This file is for additional documents
|
2
|
+
|
3
|
+
0 / 0
|
4
|
+
|
5
|
+
#
|
6
|
+
# Bzip3 module.
|
7
|
+
#
|
8
|
+
module Bzip3
|
9
|
+
#
|
10
|
+
# Decoder class.
|
11
|
+
#
|
12
|
+
class Decoder
|
13
|
+
end
|
14
|
+
|
15
|
+
#
|
16
|
+
# Encoder class.
|
17
|
+
#
|
18
|
+
class Encoder
|
19
|
+
end
|
20
|
+
end
|
21
|
+
|
22
|
+
class BasicObject
|
23
|
+
# 自身を出力ストリームと見立てて bzip3 を行うエンコーダオブジェクトを生成します。
|
24
|
+
def to_bzip3
|
25
|
+
end
|
26
|
+
|
27
|
+
# 自身を入力ストリームと見立てて bunzip3 を行うデコーダオブジェクトを生成します。
|
28
|
+
def bunzip3
|
29
|
+
end
|
30
|
+
end
|
31
|
+
|
32
|
+
class String
|
33
|
+
def to_bzip3
|
34
|
+
end
|
35
|
+
|
36
|
+
def bunzip3
|
37
|
+
end
|
38
|
+
end
|
data/lib/extbzip3.rb
ADDED
@@ -0,0 +1,65 @@
|
|
1
|
+
ver = RUBY_VERSION.slice(/\d+\.\d+/)
|
2
|
+
soname = File.basename(__FILE__, ".rb") << ".so"
|
3
|
+
require File.join(ver, soname)
|
4
|
+
|
5
|
+
module Bzip3
|
6
|
+
refine String do
|
7
|
+
def to_bzip3(*args, **opts)
|
8
|
+
Bzip3::Encoder.encode(self, *args, **opts)
|
9
|
+
end
|
10
|
+
|
11
|
+
def bunzip3(*args, **opts)
|
12
|
+
Bzip3::Decoder.decode(self, *args, **opts)
|
13
|
+
end
|
14
|
+
end
|
15
|
+
|
16
|
+
refine BasicObject do
|
17
|
+
def to_bzip3(*args, **opts, &block)
|
18
|
+
Bzip3::Encoder.open(self, *args, **opts, &block)
|
19
|
+
end
|
20
|
+
|
21
|
+
def bunzip3(*args, **opts, &block)
|
22
|
+
Bzip3::Decoder.open(self, *args, **opts, &block)
|
23
|
+
end
|
24
|
+
end
|
25
|
+
|
26
|
+
class << Bzip3
|
27
|
+
using Bzip3
|
28
|
+
|
29
|
+
def encode(src, *args, **opts, &block)
|
30
|
+
src.to_bzip3(*args, **opts, &block)
|
31
|
+
end
|
32
|
+
|
33
|
+
def decode(src, *args, **opts, &block)
|
34
|
+
src.bunzip3(*args, **opts, &block)
|
35
|
+
end
|
36
|
+
end
|
37
|
+
|
38
|
+
class << Decoder
|
39
|
+
def open(*args, **opts, &block)
|
40
|
+
bz3 = new(*args, **opts)
|
41
|
+
return bz3 unless block
|
42
|
+
|
43
|
+
begin
|
44
|
+
yield bz3
|
45
|
+
ensure
|
46
|
+
bz3.close unless bz3.closed?
|
47
|
+
end
|
48
|
+
end
|
49
|
+
end
|
50
|
+
|
51
|
+
class << Encoder
|
52
|
+
def open(*args, **opts, &block)
|
53
|
+
bz3 = new(*args, **opts)
|
54
|
+
return bz3 unless block
|
55
|
+
|
56
|
+
begin
|
57
|
+
yield bz3
|
58
|
+
ensure
|
59
|
+
bz3.close unless bz3.closed?
|
60
|
+
end
|
61
|
+
end
|
62
|
+
end
|
63
|
+
|
64
|
+
Bzip3 = self
|
65
|
+
end
|
data/test/test_bzip3.rb
ADDED
@@ -0,0 +1,77 @@
|
|
1
|
+
#!ruby
|
2
|
+
|
3
|
+
require "test-unit"
|
4
|
+
require "extbzip3"
|
5
|
+
|
6
|
+
SAMPLES = File.join(__dir__, "../sampledata")
|
7
|
+
|
8
|
+
class << SAMPLES
|
9
|
+
def load_file(path)
|
10
|
+
File.binread File.join(self, path)
|
11
|
+
end
|
12
|
+
|
13
|
+
def open_file(path, *args, **opts, &block)
|
14
|
+
File.open File.join(self, path), *args, **opts, &block
|
15
|
+
end
|
16
|
+
end
|
17
|
+
|
18
|
+
SAMPLES.freeze
|
19
|
+
|
20
|
+
class TestBzip3 < Test::Unit::TestCase
|
21
|
+
def test_oneshot
|
22
|
+
assert_equal "123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ\n",
|
23
|
+
Bzip3.decode(SAMPLES.load_file("single.bz3"))
|
24
|
+
|
25
|
+
assert_raise RuntimeError do
|
26
|
+
Bzip3.decode(SAMPLES.load_file("single.bz3-frame"))
|
27
|
+
end
|
28
|
+
|
29
|
+
assert_raise RuntimeError do
|
30
|
+
Bzip3.decode(SAMPLES.load_file("single.bz3-frame"), format: Bzip3::V1_FILE_FORMAT)
|
31
|
+
end
|
32
|
+
|
33
|
+
assert_equal "123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ\nZYXWVUTSRQPONMLKJIHGFEDCBA987654321\n",
|
34
|
+
Bzip3.decode(SAMPLES.load_file("double.bz3"))
|
35
|
+
|
36
|
+
assert_equal "123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ\n",
|
37
|
+
Bzip3.decode(SAMPLES.load_file("double.bz3"), concat: false)
|
38
|
+
|
39
|
+
assert_raise RuntimeError do
|
40
|
+
Bzip3.decode(SAMPLES.load_file("single+junks.bz3"))
|
41
|
+
end
|
42
|
+
end
|
43
|
+
|
44
|
+
def test_oneshot_frame
|
45
|
+
assert_equal "123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ\n",
|
46
|
+
Bzip3.decode(SAMPLES.load_file("single.bz3-frame"), format: Bzip3::V1_FRAME_FORMAT)
|
47
|
+
|
48
|
+
assert_raise RuntimeError do
|
49
|
+
Bzip3.decode(SAMPLES.load_file("single.bz3"), format: Bzip3::V1_FRAME_FORMAT)
|
50
|
+
end
|
51
|
+
end
|
52
|
+
|
53
|
+
def test_stream
|
54
|
+
io = SAMPLES.open_file("single.bz3")
|
55
|
+
assert_kind_of Bzip3::Decoder, Bzip3.decode(io)
|
56
|
+
assert_equal "123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ\n", Bzip3.decode(io).read
|
57
|
+
io.rewind
|
58
|
+
assert_equal "OK",
|
59
|
+
Bzip3.decode(io) { |bz3|
|
60
|
+
assert_equal "", bz3.read(0, "")
|
61
|
+
assert_equal "12345", bz3.read(5, "")
|
62
|
+
assert_equal "6789AB", bz3.read(6)
|
63
|
+
assert_equal "", bz3.read(0)
|
64
|
+
assert_equal "CDEFGHIJKLMNOPQRSTUVWXYZ\n", bz3.read
|
65
|
+
assert_equal "", bz3.read(0)
|
66
|
+
assert_equal nil, bz3.read
|
67
|
+
"OK"
|
68
|
+
}
|
69
|
+
|
70
|
+
if defined? Ractor
|
71
|
+
assert_equal "123456789ABCDEFGHIJKLMNOPQRSTUVWXYZ\n", Ractor.new {
|
72
|
+
io2 = SAMPLES.open_file("single.bz3")
|
73
|
+
Bzip3.decode(io2).read
|
74
|
+
}.take
|
75
|
+
end
|
76
|
+
end
|
77
|
+
end
|