json 2.7.2 → 2.10.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/BSDL +22 -0
- data/CHANGES.md +98 -17
- data/LEGAL +8 -0
- data/README.md +68 -216
- data/ext/json/ext/fbuffer/fbuffer.h +110 -92
- data/ext/json/ext/generator/extconf.rb +8 -2
- data/ext/json/ext/generator/generator.c +952 -833
- data/ext/json/ext/parser/extconf.rb +7 -27
- data/ext/json/ext/parser/parser.c +1207 -1940
- data/json.gemspec +44 -49
- data/lib/json/add/bigdecimal.rb +2 -2
- data/lib/json/add/complex.rb +1 -1
- data/lib/json/add/core.rb +1 -1
- data/lib/json/add/date.rb +1 -1
- data/lib/json/add/date_time.rb +1 -1
- data/lib/json/add/exception.rb +1 -1
- data/lib/json/add/ostruct.rb +1 -1
- data/lib/json/add/range.rb +1 -1
- data/lib/json/add/rational.rb +1 -1
- data/lib/json/add/regexp.rb +1 -1
- data/lib/json/add/struct.rb +1 -1
- data/lib/json/add/symbol.rb +8 -4
- data/lib/json/add/time.rb +3 -10
- data/lib/json/common.rb +401 -106
- data/lib/json/ext/generator/state.rb +106 -0
- data/lib/json/ext.rb +34 -4
- data/lib/json/generic_object.rb +1 -1
- data/lib/json/{pure → truffle_ruby}/generator.rb +322 -145
- data/lib/json/version.rb +3 -7
- data/lib/json.rb +16 -21
- metadata +15 -22
- data/ext/json/ext/generator/depend +0 -1
- data/ext/json/ext/generator/generator.h +0 -177
- data/ext/json/ext/parser/depend +0 -1
- data/ext/json/ext/parser/parser.h +0 -96
- data/ext/json/ext/parser/parser.rl +0 -971
- data/ext/json/extconf.rb +0 -3
- data/lib/json/pure/parser.rb +0 -337
- data/lib/json/pure.rb +0 -15
- /data/{LICENSE → COPYING} +0 -0
@@ -1,30 +1,346 @@
|
|
1
|
-
|
2
|
-
#
|
3
|
-
#include "../fbuffer/fbuffer.h"
|
4
|
-
#include "parser.h"
|
5
|
-
|
6
|
-
#if defined HAVE_RUBY_ENCODING_H
|
7
|
-
# define EXC_ENCODING rb_utf8_encoding(),
|
8
|
-
# ifndef HAVE_RB_ENC_RAISE
|
9
|
-
static void
|
10
|
-
enc_raise(rb_encoding *enc, VALUE exc, const char *fmt, ...)
|
11
|
-
{
|
12
|
-
va_list args;
|
13
|
-
VALUE mesg;
|
1
|
+
#include "ruby.h"
|
2
|
+
#include "ruby/encoding.h"
|
14
3
|
|
15
|
-
|
16
|
-
|
17
|
-
va_end(args);
|
4
|
+
/* shims */
|
5
|
+
/* This is the fallback definition from Ruby 3.4 */
|
18
6
|
|
19
|
-
|
20
|
-
|
21
|
-
#
|
7
|
+
#ifndef RBIMPL_STDBOOL_H
|
8
|
+
#if defined(__cplusplus)
|
9
|
+
# if defined(HAVE_STDBOOL_H) && (__cplusplus >= 201103L)
|
10
|
+
# include <cstdbool>
|
22
11
|
# endif
|
12
|
+
#elif defined(HAVE_STDBOOL_H)
|
13
|
+
# include <stdbool.h>
|
14
|
+
#elif !defined(HAVE__BOOL)
|
15
|
+
typedef unsigned char _Bool;
|
16
|
+
# define bool _Bool
|
17
|
+
# define true ((_Bool)+1)
|
18
|
+
# define false ((_Bool)+0)
|
19
|
+
# define __bool_true_false_are_defined
|
20
|
+
#endif
|
21
|
+
#endif
|
22
|
+
|
23
|
+
#ifndef RB_UNLIKELY
|
24
|
+
#define RB_UNLIKELY(expr) expr
|
25
|
+
#endif
|
26
|
+
|
27
|
+
#ifndef RB_LIKELY
|
28
|
+
#define RB_LIKELY(expr) expr
|
29
|
+
#endif
|
30
|
+
|
31
|
+
static VALUE mJSON, eNestingError, Encoding_UTF_8;
|
32
|
+
static VALUE CNaN, CInfinity, CMinusInfinity;
|
33
|
+
|
34
|
+
static ID i_json_creatable_p, i_json_create, i_create_id,
|
35
|
+
i_chr, i_deep_const_get, i_match, i_aset, i_aref,
|
36
|
+
i_leftshift, i_new, i_try_convert, i_uminus, i_encode;
|
37
|
+
|
38
|
+
static VALUE sym_max_nesting, sym_allow_nan, sym_allow_trailing_comma, sym_symbolize_names, sym_freeze,
|
39
|
+
sym_create_additions, sym_create_id, sym_object_class, sym_array_class,
|
40
|
+
sym_decimal_class, sym_match_string;
|
41
|
+
|
42
|
+
static int binary_encindex;
|
43
|
+
static int utf8_encindex;
|
44
|
+
|
45
|
+
#ifdef HAVE_RB_CATEGORY_WARN
|
46
|
+
# define json_deprecated(message) rb_category_warn(RB_WARN_CATEGORY_DEPRECATED, message)
|
23
47
|
#else
|
24
|
-
# define
|
25
|
-
# define rb_enc_raise rb_raise
|
48
|
+
# define json_deprecated(message) rb_warn(message)
|
26
49
|
#endif
|
27
50
|
|
51
|
+
static const char deprecated_create_additions_warning[] =
|
52
|
+
"JSON.load implicit support for `create_additions: true` is deprecated "
|
53
|
+
"and will be removed in 3.0, use JSON.unsafe_load or explicitly "
|
54
|
+
"pass `create_additions: true`";
|
55
|
+
|
56
|
+
#ifndef HAVE_RB_HASH_BULK_INSERT
|
57
|
+
// For TruffleRuby
|
58
|
+
void
|
59
|
+
rb_hash_bulk_insert(long count, const VALUE *pairs, VALUE hash)
|
60
|
+
{
|
61
|
+
long index = 0;
|
62
|
+
while (index < count) {
|
63
|
+
VALUE name = pairs[index++];
|
64
|
+
VALUE value = pairs[index++];
|
65
|
+
rb_hash_aset(hash, name, value);
|
66
|
+
}
|
67
|
+
RB_GC_GUARD(hash);
|
68
|
+
}
|
69
|
+
#endif
|
70
|
+
|
71
|
+
#ifndef HAVE_RB_HASH_NEW_CAPA
|
72
|
+
#define rb_hash_new_capa(n) rb_hash_new()
|
73
|
+
#endif
|
74
|
+
|
75
|
+
|
76
|
+
/* name cache */
|
77
|
+
|
78
|
+
#include <string.h>
|
79
|
+
#include <ctype.h>
|
80
|
+
|
81
|
+
// Object names are likely to be repeated, and are frozen.
|
82
|
+
// As such we can re-use them if we keep a cache of the ones we've seen so far,
|
83
|
+
// and save much more expensive lookups into the global fstring table.
|
84
|
+
// This cache implementation is deliberately simple, as we're optimizing for compactness,
|
85
|
+
// to be able to fit safely on the stack.
|
86
|
+
// As such, binary search into a sorted array gives a good tradeoff between compactness and
|
87
|
+
// performance.
|
88
|
+
#define JSON_RVALUE_CACHE_CAPA 63
|
89
|
+
typedef struct rvalue_cache_struct {
|
90
|
+
int length;
|
91
|
+
VALUE entries[JSON_RVALUE_CACHE_CAPA];
|
92
|
+
} rvalue_cache;
|
93
|
+
|
94
|
+
static rb_encoding *enc_utf8;
|
95
|
+
|
96
|
+
#define JSON_RVALUE_CACHE_MAX_ENTRY_LENGTH 55
|
97
|
+
|
98
|
+
static inline VALUE build_interned_string(const char *str, const long length)
|
99
|
+
{
|
100
|
+
# ifdef HAVE_RB_ENC_INTERNED_STR
|
101
|
+
return rb_enc_interned_str(str, length, enc_utf8);
|
102
|
+
# else
|
103
|
+
VALUE rstring = rb_utf8_str_new(str, length);
|
104
|
+
return rb_funcall(rb_str_freeze(rstring), i_uminus, 0);
|
105
|
+
# endif
|
106
|
+
}
|
107
|
+
|
108
|
+
static inline VALUE build_symbol(const char *str, const long length)
|
109
|
+
{
|
110
|
+
return rb_str_intern(build_interned_string(str, length));
|
111
|
+
}
|
112
|
+
|
113
|
+
static void rvalue_cache_insert_at(rvalue_cache *cache, int index, VALUE rstring)
|
114
|
+
{
|
115
|
+
MEMMOVE(&cache->entries[index + 1], &cache->entries[index], VALUE, cache->length - index);
|
116
|
+
cache->length++;
|
117
|
+
cache->entries[index] = rstring;
|
118
|
+
}
|
119
|
+
|
120
|
+
static inline int rstring_cache_cmp(const char *str, const long length, VALUE rstring)
|
121
|
+
{
|
122
|
+
long rstring_length = RSTRING_LEN(rstring);
|
123
|
+
if (length == rstring_length) {
|
124
|
+
return memcmp(str, RSTRING_PTR(rstring), length);
|
125
|
+
} else {
|
126
|
+
return (int)(length - rstring_length);
|
127
|
+
}
|
128
|
+
}
|
129
|
+
|
130
|
+
static VALUE rstring_cache_fetch(rvalue_cache *cache, const char *str, const long length)
|
131
|
+
{
|
132
|
+
if (RB_UNLIKELY(length > JSON_RVALUE_CACHE_MAX_ENTRY_LENGTH)) {
|
133
|
+
// Common names aren't likely to be very long. So we just don't
|
134
|
+
// cache names above an arbitrary threshold.
|
135
|
+
return Qfalse;
|
136
|
+
}
|
137
|
+
|
138
|
+
if (RB_UNLIKELY(!isalpha((unsigned char)str[0]))) {
|
139
|
+
// Simple heuristic, if the first character isn't a letter,
|
140
|
+
// we're much less likely to see this string again.
|
141
|
+
// We mostly want to cache strings that are likely to be repeated.
|
142
|
+
return Qfalse;
|
143
|
+
}
|
144
|
+
|
145
|
+
int low = 0;
|
146
|
+
int high = cache->length - 1;
|
147
|
+
int mid = 0;
|
148
|
+
int last_cmp = 0;
|
149
|
+
|
150
|
+
while (low <= high) {
|
151
|
+
mid = (high + low) >> 1;
|
152
|
+
VALUE entry = cache->entries[mid];
|
153
|
+
last_cmp = rstring_cache_cmp(str, length, entry);
|
154
|
+
|
155
|
+
if (last_cmp == 0) {
|
156
|
+
return entry;
|
157
|
+
} else if (last_cmp > 0) {
|
158
|
+
low = mid + 1;
|
159
|
+
} else {
|
160
|
+
high = mid - 1;
|
161
|
+
}
|
162
|
+
}
|
163
|
+
|
164
|
+
if (RB_UNLIKELY(memchr(str, '\\', length))) {
|
165
|
+
// We assume the overwhelming majority of names don't need to be escaped.
|
166
|
+
// But if they do, we have to fallback to the slow path.
|
167
|
+
return Qfalse;
|
168
|
+
}
|
169
|
+
|
170
|
+
VALUE rstring = build_interned_string(str, length);
|
171
|
+
|
172
|
+
if (cache->length < JSON_RVALUE_CACHE_CAPA) {
|
173
|
+
if (last_cmp > 0) {
|
174
|
+
mid += 1;
|
175
|
+
}
|
176
|
+
|
177
|
+
rvalue_cache_insert_at(cache, mid, rstring);
|
178
|
+
}
|
179
|
+
return rstring;
|
180
|
+
}
|
181
|
+
|
182
|
+
static VALUE rsymbol_cache_fetch(rvalue_cache *cache, const char *str, const long length)
|
183
|
+
{
|
184
|
+
if (RB_UNLIKELY(length > JSON_RVALUE_CACHE_MAX_ENTRY_LENGTH)) {
|
185
|
+
// Common names aren't likely to be very long. So we just don't
|
186
|
+
// cache names above an arbitrary threshold.
|
187
|
+
return Qfalse;
|
188
|
+
}
|
189
|
+
|
190
|
+
if (RB_UNLIKELY(!isalpha((unsigned char)str[0]))) {
|
191
|
+
// Simple heuristic, if the first character isn't a letter,
|
192
|
+
// we're much less likely to see this string again.
|
193
|
+
// We mostly want to cache strings that are likely to be repeated.
|
194
|
+
return Qfalse;
|
195
|
+
}
|
196
|
+
|
197
|
+
int low = 0;
|
198
|
+
int high = cache->length - 1;
|
199
|
+
int mid = 0;
|
200
|
+
int last_cmp = 0;
|
201
|
+
|
202
|
+
while (low <= high) {
|
203
|
+
mid = (high + low) >> 1;
|
204
|
+
VALUE entry = cache->entries[mid];
|
205
|
+
last_cmp = rstring_cache_cmp(str, length, rb_sym2str(entry));
|
206
|
+
|
207
|
+
if (last_cmp == 0) {
|
208
|
+
return entry;
|
209
|
+
} else if (last_cmp > 0) {
|
210
|
+
low = mid + 1;
|
211
|
+
} else {
|
212
|
+
high = mid - 1;
|
213
|
+
}
|
214
|
+
}
|
215
|
+
|
216
|
+
if (RB_UNLIKELY(memchr(str, '\\', length))) {
|
217
|
+
// We assume the overwhelming majority of names don't need to be escaped.
|
218
|
+
// But if they do, we have to fallback to the slow path.
|
219
|
+
return Qfalse;
|
220
|
+
}
|
221
|
+
|
222
|
+
VALUE rsymbol = build_symbol(str, length);
|
223
|
+
|
224
|
+
if (cache->length < JSON_RVALUE_CACHE_CAPA) {
|
225
|
+
if (last_cmp > 0) {
|
226
|
+
mid += 1;
|
227
|
+
}
|
228
|
+
|
229
|
+
rvalue_cache_insert_at(cache, mid, rsymbol);
|
230
|
+
}
|
231
|
+
return rsymbol;
|
232
|
+
}
|
233
|
+
|
234
|
+
/* rvalue stack */
|
235
|
+
|
236
|
+
#define RVALUE_STACK_INITIAL_CAPA 128
|
237
|
+
|
238
|
+
enum rvalue_stack_type {
|
239
|
+
RVALUE_STACK_HEAP_ALLOCATED = 0,
|
240
|
+
RVALUE_STACK_STACK_ALLOCATED = 1,
|
241
|
+
};
|
242
|
+
|
243
|
+
typedef struct rvalue_stack_struct {
|
244
|
+
enum rvalue_stack_type type;
|
245
|
+
long capa;
|
246
|
+
long head;
|
247
|
+
VALUE *ptr;
|
248
|
+
} rvalue_stack;
|
249
|
+
|
250
|
+
static rvalue_stack *rvalue_stack_spill(rvalue_stack *old_stack, VALUE *handle, rvalue_stack **stack_ref);
|
251
|
+
|
252
|
+
static rvalue_stack *rvalue_stack_grow(rvalue_stack *stack, VALUE *handle, rvalue_stack **stack_ref)
|
253
|
+
{
|
254
|
+
long required = stack->capa * 2;
|
255
|
+
|
256
|
+
if (stack->type == RVALUE_STACK_STACK_ALLOCATED) {
|
257
|
+
stack = rvalue_stack_spill(stack, handle, stack_ref);
|
258
|
+
} else {
|
259
|
+
REALLOC_N(stack->ptr, VALUE, required);
|
260
|
+
stack->capa = required;
|
261
|
+
}
|
262
|
+
return stack;
|
263
|
+
}
|
264
|
+
|
265
|
+
static VALUE rvalue_stack_push(rvalue_stack *stack, VALUE value, VALUE *handle, rvalue_stack **stack_ref)
|
266
|
+
{
|
267
|
+
if (RB_UNLIKELY(stack->head >= stack->capa)) {
|
268
|
+
stack = rvalue_stack_grow(stack, handle, stack_ref);
|
269
|
+
}
|
270
|
+
stack->ptr[stack->head] = value;
|
271
|
+
stack->head++;
|
272
|
+
return value;
|
273
|
+
}
|
274
|
+
|
275
|
+
static inline VALUE *rvalue_stack_peek(rvalue_stack *stack, long count)
|
276
|
+
{
|
277
|
+
return stack->ptr + (stack->head - count);
|
278
|
+
}
|
279
|
+
|
280
|
+
static inline void rvalue_stack_pop(rvalue_stack *stack, long count)
|
281
|
+
{
|
282
|
+
stack->head -= count;
|
283
|
+
}
|
284
|
+
|
285
|
+
static void rvalue_stack_mark(void *ptr)
|
286
|
+
{
|
287
|
+
rvalue_stack *stack = (rvalue_stack *)ptr;
|
288
|
+
long index;
|
289
|
+
for (index = 0; index < stack->head; index++) {
|
290
|
+
rb_gc_mark(stack->ptr[index]);
|
291
|
+
}
|
292
|
+
}
|
293
|
+
|
294
|
+
static void rvalue_stack_free(void *ptr)
|
295
|
+
{
|
296
|
+
rvalue_stack *stack = (rvalue_stack *)ptr;
|
297
|
+
if (stack) {
|
298
|
+
ruby_xfree(stack->ptr);
|
299
|
+
ruby_xfree(stack);
|
300
|
+
}
|
301
|
+
}
|
302
|
+
|
303
|
+
static size_t rvalue_stack_memsize(const void *ptr)
|
304
|
+
{
|
305
|
+
const rvalue_stack *stack = (const rvalue_stack *)ptr;
|
306
|
+
return sizeof(rvalue_stack) + sizeof(VALUE) * stack->capa;
|
307
|
+
}
|
308
|
+
|
309
|
+
static const rb_data_type_t JSON_Parser_rvalue_stack_type = {
|
310
|
+
"JSON::Ext::Parser/rvalue_stack",
|
311
|
+
{
|
312
|
+
.dmark = rvalue_stack_mark,
|
313
|
+
.dfree = rvalue_stack_free,
|
314
|
+
.dsize = rvalue_stack_memsize,
|
315
|
+
},
|
316
|
+
0, 0,
|
317
|
+
RUBY_TYPED_FREE_IMMEDIATELY,
|
318
|
+
};
|
319
|
+
|
320
|
+
static rvalue_stack *rvalue_stack_spill(rvalue_stack *old_stack, VALUE *handle, rvalue_stack **stack_ref)
|
321
|
+
{
|
322
|
+
rvalue_stack *stack;
|
323
|
+
*handle = TypedData_Make_Struct(0, rvalue_stack, &JSON_Parser_rvalue_stack_type, stack);
|
324
|
+
*stack_ref = stack;
|
325
|
+
MEMCPY(stack, old_stack, rvalue_stack, 1);
|
326
|
+
|
327
|
+
stack->capa = old_stack->capa << 1;
|
328
|
+
stack->ptr = ALLOC_N(VALUE, stack->capa);
|
329
|
+
stack->type = RVALUE_STACK_HEAP_ALLOCATED;
|
330
|
+
MEMCPY(stack->ptr, old_stack->ptr, VALUE, old_stack->head);
|
331
|
+
return stack;
|
332
|
+
}
|
333
|
+
|
334
|
+
static void rvalue_stack_eagerly_release(VALUE handle)
|
335
|
+
{
|
336
|
+
if (handle) {
|
337
|
+
rvalue_stack *stack;
|
338
|
+
TypedData_Get_Struct(handle, rvalue_stack, &JSON_Parser_rvalue_stack_type, stack);
|
339
|
+
RTYPEDDATA_DATA(handle) = NULL;
|
340
|
+
rvalue_stack_free(stack);
|
341
|
+
}
|
342
|
+
}
|
343
|
+
|
28
344
|
/* unicode */
|
29
345
|
|
30
346
|
static const signed char digit_values[256] = {
|
@@ -44,26 +360,28 @@ static const signed char digit_values[256] = {
|
|
44
360
|
-1, -1, -1, -1, -1, -1, -1
|
45
361
|
};
|
46
362
|
|
47
|
-
static
|
363
|
+
static uint32_t unescape_unicode(const unsigned char *p)
|
48
364
|
{
|
365
|
+
const uint32_t replacement_char = 0xFFFD;
|
366
|
+
|
49
367
|
signed char b;
|
50
|
-
|
368
|
+
uint32_t result = 0;
|
51
369
|
b = digit_values[p[0]];
|
52
|
-
if (b < 0) return
|
370
|
+
if (b < 0) return replacement_char;
|
53
371
|
result = (result << 4) | (unsigned char)b;
|
54
372
|
b = digit_values[p[1]];
|
55
|
-
if (b < 0) return
|
373
|
+
if (b < 0) return replacement_char;
|
56
374
|
result = (result << 4) | (unsigned char)b;
|
57
375
|
b = digit_values[p[2]];
|
58
|
-
if (b < 0) return
|
376
|
+
if (b < 0) return replacement_char;
|
59
377
|
result = (result << 4) | (unsigned char)b;
|
60
378
|
b = digit_values[p[3]];
|
61
|
-
if (b < 0) return
|
379
|
+
if (b < 0) return replacement_char;
|
62
380
|
result = (result << 4) | (unsigned char)b;
|
63
381
|
return result;
|
64
382
|
}
|
65
383
|
|
66
|
-
static int convert_UTF32_to_UTF8(char *buf,
|
384
|
+
static int convert_UTF32_to_UTF8(char *buf, uint32_t ch)
|
67
385
|
{
|
68
386
|
int len = 1;
|
69
387
|
if (ch <= 0x7F) {
|
@@ -89,1677 +407,762 @@ static int convert_UTF32_to_UTF8(char *buf, UTF32 ch)
|
|
89
407
|
return len;
|
90
408
|
}
|
91
409
|
|
92
|
-
|
93
|
-
|
410
|
+
typedef struct JSON_ParserStruct {
|
411
|
+
VALUE create_id;
|
412
|
+
VALUE object_class;
|
413
|
+
VALUE array_class;
|
414
|
+
VALUE decimal_class;
|
415
|
+
ID decimal_method_id;
|
416
|
+
VALUE match_string;
|
417
|
+
int max_nesting;
|
418
|
+
bool allow_nan;
|
419
|
+
bool allow_trailing_comma;
|
420
|
+
bool parsing_name;
|
421
|
+
bool symbolize_names;
|
422
|
+
bool freeze;
|
423
|
+
bool create_additions;
|
424
|
+
bool deprecated_create_additions;
|
425
|
+
} JSON_ParserConfig;
|
426
|
+
|
427
|
+
typedef struct JSON_ParserStateStruct {
|
428
|
+
VALUE stack_handle;
|
429
|
+
const char *cursor;
|
430
|
+
const char *end;
|
431
|
+
rvalue_stack *stack;
|
432
|
+
rvalue_cache name_cache;
|
433
|
+
int in_array;
|
434
|
+
int current_nesting;
|
435
|
+
} JSON_ParserState;
|
436
|
+
|
437
|
+
#define GET_PARSER_CONFIG \
|
438
|
+
JSON_ParserConfig *config; \
|
439
|
+
TypedData_Get_Struct(self, JSON_ParserConfig, &JSON_ParserConfig_type, config)
|
440
|
+
|
441
|
+
static const rb_data_type_t JSON_ParserConfig_type;
|
442
|
+
|
443
|
+
#ifndef HAVE_STRNLEN
|
444
|
+
static size_t strnlen(const char *s, size_t maxlen)
|
445
|
+
{
|
446
|
+
char *p;
|
447
|
+
return ((p = memchr(s, '\0', maxlen)) ? p - s : maxlen);
|
448
|
+
}
|
449
|
+
#endif
|
94
450
|
|
95
|
-
|
96
|
-
|
97
|
-
|
98
|
-
|
99
|
-
|
451
|
+
#define PARSE_ERROR_FRAGMENT_LEN 32
|
452
|
+
#ifdef RBIMPL_ATTR_NORETURN
|
453
|
+
RBIMPL_ATTR_NORETURN()
|
454
|
+
#endif
|
455
|
+
static void raise_parse_error(const char *format, const char *start)
|
456
|
+
{
|
457
|
+
char buffer[PARSE_ERROR_FRAGMENT_LEN + 1];
|
100
458
|
|
459
|
+
size_t len = start ? strnlen(start, PARSE_ERROR_FRAGMENT_LEN) : 0;
|
460
|
+
const char *ptr = start;
|
101
461
|
|
102
|
-
|
462
|
+
if (len == PARSE_ERROR_FRAGMENT_LEN) {
|
463
|
+
MEMCPY(buffer, start, char, PARSE_ERROR_FRAGMENT_LEN);
|
464
|
+
buffer[PARSE_ERROR_FRAGMENT_LEN] = '\0';
|
465
|
+
ptr = buffer;
|
466
|
+
}
|
103
467
|
|
468
|
+
rb_enc_raise(enc_utf8, rb_path2class("JSON::ParserError"), format, ptr);
|
469
|
+
}
|
104
470
|
|
471
|
+
static const bool whitespace[256] = {
|
472
|
+
[' '] = 1,
|
473
|
+
['\t'] = 1,
|
474
|
+
['\n'] = 1,
|
475
|
+
['\r'] = 1,
|
476
|
+
['/'] = 1,
|
477
|
+
};
|
105
478
|
|
106
|
-
|
107
|
-
|
108
|
-
|
109
|
-
|
479
|
+
static void
|
480
|
+
json_eat_comments(JSON_ParserState *state)
|
481
|
+
{
|
482
|
+
if (state->cursor + 1 < state->end) {
|
483
|
+
switch(state->cursor[1]) {
|
484
|
+
case '/': {
|
485
|
+
state->cursor = memchr(state->cursor, '\n', state->end - state->cursor);
|
486
|
+
if (!state->cursor) {
|
487
|
+
state->cursor = state->end;
|
488
|
+
} else {
|
489
|
+
state->cursor++;
|
490
|
+
}
|
491
|
+
break;
|
492
|
+
}
|
493
|
+
case '*': {
|
494
|
+
state->cursor += 2;
|
495
|
+
while (true) {
|
496
|
+
state->cursor = memchr(state->cursor, '*', state->end - state->cursor);
|
497
|
+
if (!state->cursor) {
|
498
|
+
state->cursor = state->end;
|
499
|
+
raise_parse_error("unexpected end of input, expected closing '*/'", state->cursor);
|
500
|
+
} else {
|
501
|
+
state->cursor++;
|
502
|
+
if (state->cursor < state->end && *state->cursor == '/') {
|
503
|
+
state->cursor++;
|
504
|
+
break;
|
505
|
+
}
|
506
|
+
}
|
507
|
+
}
|
508
|
+
break;
|
509
|
+
}
|
510
|
+
default:
|
511
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
512
|
+
break;
|
513
|
+
}
|
514
|
+
} else {
|
515
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
516
|
+
}
|
517
|
+
}
|
110
518
|
|
111
|
-
|
519
|
+
static inline void
|
520
|
+
json_eat_whitespace(JSON_ParserState *state)
|
521
|
+
{
|
522
|
+
while (state->cursor < state->end && RB_UNLIKELY(whitespace[(unsigned char)*state->cursor])) {
|
523
|
+
if (RB_LIKELY(*state->cursor != '/')) {
|
524
|
+
state->cursor++;
|
525
|
+
} else {
|
526
|
+
json_eat_comments(state);
|
527
|
+
}
|
528
|
+
}
|
529
|
+
}
|
112
530
|
|
531
|
+
static inline VALUE build_string(const char *start, const char *end, bool intern, bool symbolize)
|
532
|
+
{
|
533
|
+
if (symbolize) {
|
534
|
+
intern = true;
|
535
|
+
}
|
536
|
+
VALUE result;
|
537
|
+
# ifdef HAVE_RB_ENC_INTERNED_STR
|
538
|
+
if (intern) {
|
539
|
+
result = rb_enc_interned_str(start, (long)(end - start), enc_utf8);
|
540
|
+
} else {
|
541
|
+
result = rb_utf8_str_new(start, (long)(end - start));
|
542
|
+
}
|
543
|
+
# else
|
544
|
+
result = rb_utf8_str_new(start, (long)(end - start));
|
545
|
+
if (intern) {
|
546
|
+
result = rb_funcall(rb_str_freeze(result), i_uminus, 0);
|
547
|
+
}
|
548
|
+
# endif
|
113
549
|
|
114
|
-
|
550
|
+
if (symbolize) {
|
551
|
+
result = rb_str_intern(result);
|
552
|
+
}
|
115
553
|
|
554
|
+
return result;
|
555
|
+
}
|
116
556
|
|
117
|
-
static
|
557
|
+
static inline VALUE json_string_fastpath(JSON_ParserState *state, const char *string, const char *stringEnd, bool is_name, bool intern, bool symbolize)
|
118
558
|
{
|
119
|
-
|
120
|
-
VALUE last_name = Qnil;
|
121
|
-
VALUE object_class = json->object_class;
|
559
|
+
size_t bufferSize = stringEnd - string;
|
122
560
|
|
123
|
-
if (
|
124
|
-
|
125
|
-
|
561
|
+
if (is_name && state->in_array) {
|
562
|
+
VALUE cached_key;
|
563
|
+
if (RB_UNLIKELY(symbolize)) {
|
564
|
+
cached_key = rsymbol_cache_fetch(&state->name_cache, string, bufferSize);
|
565
|
+
} else {
|
566
|
+
cached_key = rstring_cache_fetch(&state->name_cache, string, bufferSize);
|
567
|
+
}
|
126
568
|
|
127
|
-
|
128
|
-
|
129
|
-
|
130
|
-
#line 131 "parser.c"
|
131
|
-
{
|
132
|
-
cs = JSON_object_start;
|
133
|
-
}
|
134
|
-
|
135
|
-
#line 182 "parser.rl"
|
136
|
-
|
137
|
-
#line 138 "parser.c"
|
138
|
-
{
|
139
|
-
if ( p == pe )
|
140
|
-
goto _test_eof;
|
141
|
-
switch ( cs )
|
142
|
-
{
|
143
|
-
case 1:
|
144
|
-
if ( (*p) == 123 )
|
145
|
-
goto st2;
|
146
|
-
goto st0;
|
147
|
-
st0:
|
148
|
-
cs = 0;
|
149
|
-
goto _out;
|
150
|
-
st2:
|
151
|
-
if ( ++p == pe )
|
152
|
-
goto _test_eof2;
|
153
|
-
case 2:
|
154
|
-
switch( (*p) ) {
|
155
|
-
case 13: goto st2;
|
156
|
-
case 32: goto st2;
|
157
|
-
case 34: goto tr2;
|
158
|
-
case 47: goto st23;
|
159
|
-
case 125: goto tr4;
|
160
|
-
}
|
161
|
-
if ( 9 <= (*p) && (*p) <= 10 )
|
162
|
-
goto st2;
|
163
|
-
goto st0;
|
164
|
-
tr2:
|
165
|
-
#line 149 "parser.rl"
|
166
|
-
{
|
167
|
-
char *np;
|
168
|
-
json->parsing_name = 1;
|
169
|
-
np = JSON_parse_string(json, p, pe, &last_name);
|
170
|
-
json->parsing_name = 0;
|
171
|
-
if (np == NULL) { p--; {p++; cs = 3; goto _out;} } else {p = (( np))-1;}
|
569
|
+
if (RB_LIKELY(cached_key)) {
|
570
|
+
return cached_key;
|
571
|
+
}
|
172
572
|
}
|
173
|
-
|
174
|
-
|
175
|
-
|
176
|
-
|
177
|
-
|
178
|
-
|
179
|
-
|
180
|
-
|
181
|
-
|
182
|
-
|
183
|
-
|
184
|
-
|
185
|
-
|
186
|
-
|
187
|
-
|
188
|
-
|
189
|
-
if ( ++p == pe )
|
190
|
-
goto _test_eof4;
|
191
|
-
case 4:
|
192
|
-
switch( (*p) ) {
|
193
|
-
case 42: goto st5;
|
194
|
-
case 47: goto st7;
|
195
|
-
}
|
196
|
-
goto st0;
|
197
|
-
st5:
|
198
|
-
if ( ++p == pe )
|
199
|
-
goto _test_eof5;
|
200
|
-
case 5:
|
201
|
-
if ( (*p) == 42 )
|
202
|
-
goto st6;
|
203
|
-
goto st5;
|
204
|
-
st6:
|
205
|
-
if ( ++p == pe )
|
206
|
-
goto _test_eof6;
|
207
|
-
case 6:
|
208
|
-
switch( (*p) ) {
|
209
|
-
case 42: goto st6;
|
210
|
-
case 47: goto st3;
|
211
|
-
}
|
212
|
-
goto st5;
|
213
|
-
st7:
|
214
|
-
if ( ++p == pe )
|
215
|
-
goto _test_eof7;
|
216
|
-
case 7:
|
217
|
-
if ( (*p) == 10 )
|
218
|
-
goto st3;
|
219
|
-
goto st7;
|
220
|
-
st8:
|
221
|
-
if ( ++p == pe )
|
222
|
-
goto _test_eof8;
|
223
|
-
case 8:
|
224
|
-
switch( (*p) ) {
|
225
|
-
case 13: goto st8;
|
226
|
-
case 32: goto st8;
|
227
|
-
case 34: goto tr11;
|
228
|
-
case 45: goto tr11;
|
229
|
-
case 47: goto st19;
|
230
|
-
case 73: goto tr11;
|
231
|
-
case 78: goto tr11;
|
232
|
-
case 91: goto tr11;
|
233
|
-
case 102: goto tr11;
|
234
|
-
case 110: goto tr11;
|
235
|
-
case 116: goto tr11;
|
236
|
-
case 123: goto tr11;
|
237
|
-
}
|
238
|
-
if ( (*p) > 10 ) {
|
239
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
240
|
-
goto tr11;
|
241
|
-
} else if ( (*p) >= 9 )
|
242
|
-
goto st8;
|
243
|
-
goto st0;
|
244
|
-
tr11:
|
245
|
-
#line 133 "parser.rl"
|
246
|
-
{
|
247
|
-
VALUE v = Qnil;
|
248
|
-
char *np = JSON_parse_value(json, p, pe, &v, current_nesting);
|
249
|
-
if (np == NULL) {
|
250
|
-
p--; {p++; cs = 9; goto _out;}
|
573
|
+
|
574
|
+
return build_string(string, stringEnd, intern, symbolize);
|
575
|
+
}
|
576
|
+
|
577
|
+
static VALUE json_string_unescape(JSON_ParserState *state, const char *string, const char *stringEnd, bool is_name, bool intern, bool symbolize)
|
578
|
+
{
|
579
|
+
size_t bufferSize = stringEnd - string;
|
580
|
+
const char *p = string, *pe = string, *unescape, *bufferStart;
|
581
|
+
char *buffer;
|
582
|
+
int unescape_len;
|
583
|
+
char buf[4];
|
584
|
+
|
585
|
+
if (is_name && state->in_array) {
|
586
|
+
VALUE cached_key;
|
587
|
+
if (RB_UNLIKELY(symbolize)) {
|
588
|
+
cached_key = rsymbol_cache_fetch(&state->name_cache, string, bufferSize);
|
251
589
|
} else {
|
252
|
-
|
253
|
-
|
254
|
-
|
255
|
-
|
256
|
-
|
257
|
-
}
|
258
|
-
{p = (( np))-1;}
|
590
|
+
cached_key = rstring_cache_fetch(&state->name_cache, string, bufferSize);
|
591
|
+
}
|
592
|
+
|
593
|
+
if (RB_LIKELY(cached_key)) {
|
594
|
+
return cached_key;
|
259
595
|
}
|
260
596
|
}
|
261
|
-
|
262
|
-
|
263
|
-
|
264
|
-
|
265
|
-
|
266
|
-
|
267
|
-
|
268
|
-
|
269
|
-
|
270
|
-
|
271
|
-
|
272
|
-
|
273
|
-
|
274
|
-
|
275
|
-
|
276
|
-
|
277
|
-
|
278
|
-
|
279
|
-
|
280
|
-
|
281
|
-
|
282
|
-
|
283
|
-
|
284
|
-
|
285
|
-
|
286
|
-
|
287
|
-
|
288
|
-
|
289
|
-
|
290
|
-
|
291
|
-
|
292
|
-
|
293
|
-
case
|
294
|
-
|
295
|
-
|
296
|
-
|
297
|
-
|
298
|
-
|
299
|
-
|
300
|
-
|
301
|
-
|
302
|
-
|
303
|
-
|
304
|
-
|
305
|
-
|
306
|
-
|
307
|
-
|
308
|
-
|
309
|
-
|
310
|
-
|
311
|
-
|
312
|
-
|
313
|
-
|
314
|
-
|
315
|
-
|
316
|
-
|
317
|
-
|
318
|
-
|
319
|
-
|
320
|
-
|
321
|
-
|
322
|
-
|
323
|
-
|
324
|
-
|
325
|
-
|
326
|
-
|
327
|
-
|
328
|
-
|
329
|
-
}
|
330
|
-
goto st0;
|
331
|
-
st16:
|
332
|
-
if ( ++p == pe )
|
333
|
-
goto _test_eof16;
|
334
|
-
case 16:
|
335
|
-
if ( (*p) == 42 )
|
336
|
-
goto st17;
|
337
|
-
goto st16;
|
338
|
-
st17:
|
339
|
-
if ( ++p == pe )
|
340
|
-
goto _test_eof17;
|
341
|
-
case 17:
|
342
|
-
switch( (*p) ) {
|
343
|
-
case 42: goto st17;
|
344
|
-
case 47: goto st9;
|
345
|
-
}
|
346
|
-
goto st16;
|
347
|
-
st18:
|
348
|
-
if ( ++p == pe )
|
349
|
-
goto _test_eof18;
|
350
|
-
case 18:
|
351
|
-
if ( (*p) == 10 )
|
352
|
-
goto st9;
|
353
|
-
goto st18;
|
354
|
-
tr4:
|
355
|
-
#line 157 "parser.rl"
|
356
|
-
{ p--; {p++; cs = 27; goto _out;} }
|
357
|
-
goto st27;
|
358
|
-
st27:
|
359
|
-
if ( ++p == pe )
|
360
|
-
goto _test_eof27;
|
361
|
-
case 27:
|
362
|
-
#line 363 "parser.c"
|
363
|
-
goto st0;
|
364
|
-
st19:
|
365
|
-
if ( ++p == pe )
|
366
|
-
goto _test_eof19;
|
367
|
-
case 19:
|
368
|
-
switch( (*p) ) {
|
369
|
-
case 42: goto st20;
|
370
|
-
case 47: goto st22;
|
371
|
-
}
|
372
|
-
goto st0;
|
373
|
-
st20:
|
374
|
-
if ( ++p == pe )
|
375
|
-
goto _test_eof20;
|
376
|
-
case 20:
|
377
|
-
if ( (*p) == 42 )
|
378
|
-
goto st21;
|
379
|
-
goto st20;
|
380
|
-
st21:
|
381
|
-
if ( ++p == pe )
|
382
|
-
goto _test_eof21;
|
383
|
-
case 21:
|
384
|
-
switch( (*p) ) {
|
385
|
-
case 42: goto st21;
|
386
|
-
case 47: goto st8;
|
387
|
-
}
|
388
|
-
goto st20;
|
389
|
-
st22:
|
390
|
-
if ( ++p == pe )
|
391
|
-
goto _test_eof22;
|
392
|
-
case 22:
|
393
|
-
if ( (*p) == 10 )
|
394
|
-
goto st8;
|
395
|
-
goto st22;
|
396
|
-
st23:
|
397
|
-
if ( ++p == pe )
|
398
|
-
goto _test_eof23;
|
399
|
-
case 23:
|
400
|
-
switch( (*p) ) {
|
401
|
-
case 42: goto st24;
|
402
|
-
case 47: goto st26;
|
403
|
-
}
|
404
|
-
goto st0;
|
405
|
-
st24:
|
406
|
-
if ( ++p == pe )
|
407
|
-
goto _test_eof24;
|
408
|
-
case 24:
|
409
|
-
if ( (*p) == 42 )
|
410
|
-
goto st25;
|
411
|
-
goto st24;
|
412
|
-
st25:
|
413
|
-
if ( ++p == pe )
|
414
|
-
goto _test_eof25;
|
415
|
-
case 25:
|
416
|
-
switch( (*p) ) {
|
417
|
-
case 42: goto st25;
|
418
|
-
case 47: goto st2;
|
419
|
-
}
|
420
|
-
goto st24;
|
421
|
-
st26:
|
422
|
-
if ( ++p == pe )
|
423
|
-
goto _test_eof26;
|
424
|
-
case 26:
|
425
|
-
if ( (*p) == 10 )
|
426
|
-
goto st2;
|
427
|
-
goto st26;
|
428
|
-
}
|
429
|
-
_test_eof2: cs = 2; goto _test_eof;
|
430
|
-
_test_eof3: cs = 3; goto _test_eof;
|
431
|
-
_test_eof4: cs = 4; goto _test_eof;
|
432
|
-
_test_eof5: cs = 5; goto _test_eof;
|
433
|
-
_test_eof6: cs = 6; goto _test_eof;
|
434
|
-
_test_eof7: cs = 7; goto _test_eof;
|
435
|
-
_test_eof8: cs = 8; goto _test_eof;
|
436
|
-
_test_eof9: cs = 9; goto _test_eof;
|
437
|
-
_test_eof10: cs = 10; goto _test_eof;
|
438
|
-
_test_eof11: cs = 11; goto _test_eof;
|
439
|
-
_test_eof12: cs = 12; goto _test_eof;
|
440
|
-
_test_eof13: cs = 13; goto _test_eof;
|
441
|
-
_test_eof14: cs = 14; goto _test_eof;
|
442
|
-
_test_eof15: cs = 15; goto _test_eof;
|
443
|
-
_test_eof16: cs = 16; goto _test_eof;
|
444
|
-
_test_eof17: cs = 17; goto _test_eof;
|
445
|
-
_test_eof18: cs = 18; goto _test_eof;
|
446
|
-
_test_eof27: cs = 27; goto _test_eof;
|
447
|
-
_test_eof19: cs = 19; goto _test_eof;
|
448
|
-
_test_eof20: cs = 20; goto _test_eof;
|
449
|
-
_test_eof21: cs = 21; goto _test_eof;
|
450
|
-
_test_eof22: cs = 22; goto _test_eof;
|
451
|
-
_test_eof23: cs = 23; goto _test_eof;
|
452
|
-
_test_eof24: cs = 24; goto _test_eof;
|
453
|
-
_test_eof25: cs = 25; goto _test_eof;
|
454
|
-
_test_eof26: cs = 26; goto _test_eof;
|
455
|
-
|
456
|
-
_test_eof: {}
|
457
|
-
_out: {}
|
458
|
-
}
|
459
|
-
|
460
|
-
#line 183 "parser.rl"
|
461
|
-
|
462
|
-
if (cs >= JSON_object_first_final) {
|
463
|
-
if (json->create_additions) {
|
464
|
-
VALUE klassname;
|
465
|
-
if (NIL_P(json->object_class)) {
|
466
|
-
klassname = rb_hash_aref(*result, json->create_id);
|
467
|
-
} else {
|
468
|
-
klassname = rb_funcall(*result, i_aref, 1, json->create_id);
|
469
|
-
}
|
470
|
-
if (!NIL_P(klassname)) {
|
471
|
-
VALUE klass = rb_funcall(mJSON, i_deep_const_get, 1, klassname);
|
472
|
-
if (RTEST(rb_funcall(klass, i_json_creatable_p, 0))) {
|
473
|
-
*result = rb_funcall(klass, i_json_create, 1, *result);
|
597
|
+
|
598
|
+
VALUE result = rb_str_buf_new(bufferSize);
|
599
|
+
rb_enc_associate_index(result, utf8_encindex);
|
600
|
+
buffer = RSTRING_PTR(result);
|
601
|
+
bufferStart = buffer;
|
602
|
+
|
603
|
+
while ((pe = memchr(pe, '\\', stringEnd - pe))) {
|
604
|
+
unescape = (char *) "?";
|
605
|
+
unescape_len = 1;
|
606
|
+
if (pe > p) {
|
607
|
+
MEMCPY(buffer, p, char, pe - p);
|
608
|
+
buffer += pe - p;
|
609
|
+
}
|
610
|
+
switch (*++pe) {
|
611
|
+
case 'n':
|
612
|
+
unescape = (char *) "\n";
|
613
|
+
break;
|
614
|
+
case 'r':
|
615
|
+
unescape = (char *) "\r";
|
616
|
+
break;
|
617
|
+
case 't':
|
618
|
+
unescape = (char *) "\t";
|
619
|
+
break;
|
620
|
+
case '"':
|
621
|
+
unescape = (char *) "\"";
|
622
|
+
break;
|
623
|
+
case '\\':
|
624
|
+
unescape = (char *) "\\";
|
625
|
+
break;
|
626
|
+
case 'b':
|
627
|
+
unescape = (char *) "\b";
|
628
|
+
break;
|
629
|
+
case 'f':
|
630
|
+
unescape = (char *) "\f";
|
631
|
+
break;
|
632
|
+
case 'u':
|
633
|
+
if (pe > stringEnd - 5) {
|
634
|
+
raise_parse_error("incomplete unicode character escape sequence at '%s'", p);
|
635
|
+
} else {
|
636
|
+
uint32_t ch = unescape_unicode((unsigned char *) ++pe);
|
637
|
+
pe += 3;
|
638
|
+
/* To handle values above U+FFFF, we take a sequence of
|
639
|
+
* \uXXXX escapes in the U+D800..U+DBFF then
|
640
|
+
* U+DC00..U+DFFF ranges, take the low 10 bits from each
|
641
|
+
* to make a 20-bit number, then add 0x10000 to get the
|
642
|
+
* final codepoint.
|
643
|
+
*
|
644
|
+
* See Unicode 15: 3.8 "Surrogates", 5.3 "Handling
|
645
|
+
* Surrogate Pairs in UTF-16", and 23.6 "Surrogates
|
646
|
+
* Area".
|
647
|
+
*/
|
648
|
+
if ((ch & 0xFC00) == 0xD800) {
|
649
|
+
pe++;
|
650
|
+
if (pe > stringEnd - 6) {
|
651
|
+
raise_parse_error("incomplete surrogate pair at '%s'", p);
|
652
|
+
}
|
653
|
+
if (pe[0] == '\\' && pe[1] == 'u') {
|
654
|
+
uint32_t sur = unescape_unicode((unsigned char *) pe + 2);
|
655
|
+
ch = (((ch & 0x3F) << 10) | ((((ch >> 6) & 0xF) + 1) << 16)
|
656
|
+
| (sur & 0x3FF));
|
657
|
+
pe += 5;
|
658
|
+
} else {
|
659
|
+
unescape = (char *) "?";
|
660
|
+
break;
|
661
|
+
}
|
662
|
+
}
|
663
|
+
unescape_len = convert_UTF32_to_UTF8(buf, ch);
|
664
|
+
unescape = buf;
|
474
665
|
}
|
475
|
-
|
666
|
+
break;
|
667
|
+
default:
|
668
|
+
p = pe;
|
669
|
+
continue;
|
476
670
|
}
|
477
|
-
|
478
|
-
|
479
|
-
|
671
|
+
MEMCPY(buffer, unescape, char, unescape_len);
|
672
|
+
buffer += unescape_len;
|
673
|
+
p = ++pe;
|
480
674
|
}
|
481
|
-
}
|
482
675
|
|
676
|
+
if (stringEnd > p) {
|
677
|
+
MEMCPY(buffer, p, char, stringEnd - p);
|
678
|
+
buffer += stringEnd - p;
|
679
|
+
}
|
680
|
+
rb_str_set_len(result, buffer - bufferStart);
|
483
681
|
|
682
|
+
if (symbolize) {
|
683
|
+
result = rb_str_intern(result);
|
684
|
+
} else if (intern) {
|
685
|
+
result = rb_funcall(rb_str_freeze(result), i_uminus, 0);
|
686
|
+
}
|
484
687
|
|
485
|
-
|
486
|
-
|
487
|
-
enum {JSON_value_first_final = 29};
|
488
|
-
enum {JSON_value_error = 0};
|
688
|
+
return result;
|
689
|
+
}
|
489
690
|
|
490
|
-
|
691
|
+
#define MAX_FAST_INTEGER_SIZE 18
|
692
|
+
static inline VALUE fast_decode_integer(const char *p, const char *pe)
|
693
|
+
{
|
694
|
+
bool negative = false;
|
695
|
+
if (*p == '-') {
|
696
|
+
negative = true;
|
697
|
+
p++;
|
698
|
+
}
|
491
699
|
|
700
|
+
long long memo = 0;
|
701
|
+
while (p < pe) {
|
702
|
+
memo *= 10;
|
703
|
+
memo += *p - '0';
|
704
|
+
p++;
|
705
|
+
}
|
492
706
|
|
493
|
-
|
707
|
+
if (negative) {
|
708
|
+
memo = -memo;
|
709
|
+
}
|
710
|
+
return LL2NUM(memo);
|
711
|
+
}
|
494
712
|
|
713
|
+
static VALUE json_decode_large_integer(const char *start, long len)
|
714
|
+
{
|
715
|
+
VALUE buffer_v;
|
716
|
+
char *buffer = RB_ALLOCV_N(char, buffer_v, len + 1);
|
717
|
+
MEMCPY(buffer, start, char, len);
|
718
|
+
buffer[len] = '\0';
|
719
|
+
VALUE number = rb_cstr2inum(buffer, 10);
|
720
|
+
RB_ALLOCV_END(buffer_v);
|
721
|
+
return number;
|
722
|
+
}
|
495
723
|
|
496
|
-
static
|
724
|
+
static inline VALUE
|
725
|
+
json_decode_integer(const char *start, const char *end)
|
497
726
|
{
|
498
|
-
|
499
|
-
|
500
|
-
|
501
|
-
#line 502 "parser.c"
|
502
|
-
{
|
503
|
-
cs = JSON_value_start;
|
504
|
-
}
|
505
|
-
|
506
|
-
#line 290 "parser.rl"
|
507
|
-
|
508
|
-
#line 509 "parser.c"
|
509
|
-
{
|
510
|
-
if ( p == pe )
|
511
|
-
goto _test_eof;
|
512
|
-
switch ( cs )
|
513
|
-
{
|
514
|
-
st1:
|
515
|
-
if ( ++p == pe )
|
516
|
-
goto _test_eof1;
|
517
|
-
case 1:
|
518
|
-
switch( (*p) ) {
|
519
|
-
case 13: goto st1;
|
520
|
-
case 32: goto st1;
|
521
|
-
case 34: goto tr2;
|
522
|
-
case 45: goto tr3;
|
523
|
-
case 47: goto st6;
|
524
|
-
case 73: goto st10;
|
525
|
-
case 78: goto st17;
|
526
|
-
case 91: goto tr7;
|
527
|
-
case 102: goto st19;
|
528
|
-
case 110: goto st23;
|
529
|
-
case 116: goto st26;
|
530
|
-
case 123: goto tr11;
|
531
|
-
}
|
532
|
-
if ( (*p) > 10 ) {
|
533
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
534
|
-
goto tr3;
|
535
|
-
} else if ( (*p) >= 9 )
|
536
|
-
goto st1;
|
537
|
-
goto st0;
|
538
|
-
st0:
|
539
|
-
cs = 0;
|
540
|
-
goto _out;
|
541
|
-
tr2:
|
542
|
-
#line 235 "parser.rl"
|
543
|
-
{
|
544
|
-
char *np = JSON_parse_string(json, p, pe, result);
|
545
|
-
if (np == NULL) { p--; {p++; cs = 29; goto _out;} } else {p = (( np))-1;}
|
546
|
-
}
|
547
|
-
goto st29;
|
548
|
-
tr3:
|
549
|
-
#line 240 "parser.rl"
|
550
|
-
{
|
551
|
-
char *np;
|
552
|
-
if(pe > p + 8 && !strncmp(MinusInfinity, p, 9)) {
|
553
|
-
if (json->allow_nan) {
|
554
|
-
*result = CMinusInfinity;
|
555
|
-
{p = (( p + 10))-1;}
|
556
|
-
p--; {p++; cs = 29; goto _out;}
|
557
|
-
} else {
|
558
|
-
rb_enc_raise(EXC_ENCODING eParserError, "unexpected token at '%s'", p);
|
559
|
-
}
|
727
|
+
long len = end - start;
|
728
|
+
if (RB_LIKELY(len < MAX_FAST_INTEGER_SIZE)) {
|
729
|
+
return fast_decode_integer(start, end);
|
560
730
|
}
|
561
|
-
|
562
|
-
|
563
|
-
|
564
|
-
|
565
|
-
|
731
|
+
return json_decode_large_integer(start, len);
|
732
|
+
}
|
733
|
+
|
734
|
+
static VALUE json_decode_large_float(const char *start, long len)
|
735
|
+
{
|
736
|
+
VALUE buffer_v;
|
737
|
+
char *buffer = RB_ALLOCV_N(char, buffer_v, len + 1);
|
738
|
+
MEMCPY(buffer, start, char, len);
|
739
|
+
buffer[len] = '\0';
|
740
|
+
VALUE number = DBL2NUM(rb_cstr_to_dbl(buffer, 1));
|
741
|
+
RB_ALLOCV_END(buffer_v);
|
742
|
+
return number;
|
743
|
+
}
|
744
|
+
|
745
|
+
static VALUE json_decode_float(JSON_ParserConfig *config, const char *start, const char *end)
|
746
|
+
{
|
747
|
+
long len = end - start;
|
748
|
+
|
749
|
+
if (RB_UNLIKELY(config->decimal_class)) {
|
750
|
+
VALUE text = rb_str_new(start, len);
|
751
|
+
return rb_funcallv(config->decimal_class, config->decimal_method_id, 1, &text);
|
752
|
+
} else if (RB_LIKELY(len < 64)) {
|
753
|
+
char buffer[64];
|
754
|
+
MEMCPY(buffer, start, char, len);
|
755
|
+
buffer[len] = '\0';
|
756
|
+
return DBL2NUM(rb_cstr_to_dbl(buffer, 1));
|
757
|
+
} else {
|
758
|
+
return json_decode_large_float(start, len);
|
566
759
|
}
|
567
|
-
|
568
|
-
|
569
|
-
|
570
|
-
|
571
|
-
|
572
|
-
|
573
|
-
|
760
|
+
}
|
761
|
+
|
762
|
+
static inline VALUE json_decode_array(JSON_ParserState *state, JSON_ParserConfig *config, long count)
|
763
|
+
{
|
764
|
+
VALUE array;
|
765
|
+
if (RB_UNLIKELY(config->array_class)) {
|
766
|
+
array = rb_class_new_instance(0, 0, config->array_class);
|
767
|
+
VALUE *items = rvalue_stack_peek(state->stack, count);
|
768
|
+
long index;
|
769
|
+
for (index = 0; index < count; index++) {
|
770
|
+
rb_funcall(array, i_leftshift, 1, items[index]);
|
771
|
+
}
|
772
|
+
} else {
|
773
|
+
array = rb_ary_new_from_values(count, rvalue_stack_peek(state->stack, count));
|
574
774
|
}
|
575
|
-
|
576
|
-
|
577
|
-
|
578
|
-
|
579
|
-
|
580
|
-
np = JSON_parse_object(json, p, pe, result, current_nesting + 1);
|
581
|
-
if (np == NULL) { p--; {p++; cs = 29; goto _out;} } else {p = (( np))-1;}
|
775
|
+
|
776
|
+
rvalue_stack_pop(state->stack, count);
|
777
|
+
|
778
|
+
if (config->freeze) {
|
779
|
+
RB_OBJ_FREEZE(array);
|
582
780
|
}
|
583
|
-
|
584
|
-
|
585
|
-
|
586
|
-
|
587
|
-
|
588
|
-
|
589
|
-
|
590
|
-
|
781
|
+
|
782
|
+
return array;
|
783
|
+
}
|
784
|
+
|
785
|
+
static inline VALUE json_decode_object(JSON_ParserState *state, JSON_ParserConfig *config, long count)
|
786
|
+
{
|
787
|
+
VALUE object;
|
788
|
+
if (RB_UNLIKELY(config->object_class)) {
|
789
|
+
object = rb_class_new_instance(0, 0, config->object_class);
|
790
|
+
long index = 0;
|
791
|
+
VALUE *items = rvalue_stack_peek(state->stack, count);
|
792
|
+
while (index < count) {
|
793
|
+
VALUE name = items[index++];
|
794
|
+
VALUE value = items[index++];
|
795
|
+
rb_funcall(object, i_aset, 2, name, value);
|
591
796
|
}
|
797
|
+
} else {
|
798
|
+
object = rb_hash_new_capa(count);
|
799
|
+
rb_hash_bulk_insert(count, rvalue_stack_peek(state->stack, count), object);
|
592
800
|
}
|
593
|
-
|
594
|
-
|
595
|
-
|
596
|
-
|
597
|
-
|
598
|
-
|
801
|
+
|
802
|
+
rvalue_stack_pop(state->stack, count);
|
803
|
+
|
804
|
+
if (RB_UNLIKELY(config->create_additions)) {
|
805
|
+
VALUE klassname;
|
806
|
+
if (config->object_class) {
|
807
|
+
klassname = rb_funcall(object, i_aref, 1, config->create_id);
|
599
808
|
} else {
|
600
|
-
|
809
|
+
klassname = rb_hash_aref(object, config->create_id);
|
810
|
+
}
|
811
|
+
if (!NIL_P(klassname)) {
|
812
|
+
VALUE klass = rb_funcall(mJSON, i_deep_const_get, 1, klassname);
|
813
|
+
if (RTEST(rb_funcall(klass, i_json_creatable_p, 0))) {
|
814
|
+
if (config->deprecated_create_additions) {
|
815
|
+
json_deprecated(deprecated_create_additions_warning);
|
816
|
+
}
|
817
|
+
object = rb_funcall(klass, i_json_create, 1, object);
|
818
|
+
}
|
601
819
|
}
|
602
820
|
}
|
603
|
-
|
604
|
-
|
605
|
-
|
606
|
-
{
|
607
|
-
*result = Qfalse;
|
608
|
-
}
|
609
|
-
goto st29;
|
610
|
-
tr34:
|
611
|
-
#line 212 "parser.rl"
|
612
|
-
{
|
613
|
-
*result = Qnil;
|
614
|
-
}
|
615
|
-
goto st29;
|
616
|
-
tr37:
|
617
|
-
#line 218 "parser.rl"
|
618
|
-
{
|
619
|
-
*result = Qtrue;
|
821
|
+
|
822
|
+
if (config->freeze) {
|
823
|
+
RB_OBJ_FREEZE(object);
|
620
824
|
}
|
621
|
-
|
622
|
-
|
623
|
-
|
624
|
-
|
625
|
-
|
626
|
-
|
627
|
-
|
628
|
-
|
629
|
-
|
630
|
-
|
631
|
-
|
632
|
-
case 47: goto st2;
|
633
|
-
}
|
634
|
-
if ( 9 <= (*p) && (*p) <= 10 )
|
635
|
-
goto st29;
|
636
|
-
goto st0;
|
637
|
-
st2:
|
638
|
-
if ( ++p == pe )
|
639
|
-
goto _test_eof2;
|
640
|
-
case 2:
|
641
|
-
switch( (*p) ) {
|
642
|
-
case 42: goto st3;
|
643
|
-
case 47: goto st5;
|
644
|
-
}
|
645
|
-
goto st0;
|
646
|
-
st3:
|
647
|
-
if ( ++p == pe )
|
648
|
-
goto _test_eof3;
|
649
|
-
case 3:
|
650
|
-
if ( (*p) == 42 )
|
651
|
-
goto st4;
|
652
|
-
goto st3;
|
653
|
-
st4:
|
654
|
-
if ( ++p == pe )
|
655
|
-
goto _test_eof4;
|
656
|
-
case 4:
|
657
|
-
switch( (*p) ) {
|
658
|
-
case 42: goto st4;
|
659
|
-
case 47: goto st29;
|
660
|
-
}
|
661
|
-
goto st3;
|
662
|
-
st5:
|
663
|
-
if ( ++p == pe )
|
664
|
-
goto _test_eof5;
|
665
|
-
case 5:
|
666
|
-
if ( (*p) == 10 )
|
667
|
-
goto st29;
|
668
|
-
goto st5;
|
669
|
-
st6:
|
670
|
-
if ( ++p == pe )
|
671
|
-
goto _test_eof6;
|
672
|
-
case 6:
|
673
|
-
switch( (*p) ) {
|
674
|
-
case 42: goto st7;
|
675
|
-
case 47: goto st9;
|
676
|
-
}
|
677
|
-
goto st0;
|
678
|
-
st7:
|
679
|
-
if ( ++p == pe )
|
680
|
-
goto _test_eof7;
|
681
|
-
case 7:
|
682
|
-
if ( (*p) == 42 )
|
683
|
-
goto st8;
|
684
|
-
goto st7;
|
685
|
-
st8:
|
686
|
-
if ( ++p == pe )
|
687
|
-
goto _test_eof8;
|
688
|
-
case 8:
|
689
|
-
switch( (*p) ) {
|
690
|
-
case 42: goto st8;
|
691
|
-
case 47: goto st1;
|
692
|
-
}
|
693
|
-
goto st7;
|
694
|
-
st9:
|
695
|
-
if ( ++p == pe )
|
696
|
-
goto _test_eof9;
|
697
|
-
case 9:
|
698
|
-
if ( (*p) == 10 )
|
699
|
-
goto st1;
|
700
|
-
goto st9;
|
701
|
-
st10:
|
702
|
-
if ( ++p == pe )
|
703
|
-
goto _test_eof10;
|
704
|
-
case 10:
|
705
|
-
if ( (*p) == 110 )
|
706
|
-
goto st11;
|
707
|
-
goto st0;
|
708
|
-
st11:
|
709
|
-
if ( ++p == pe )
|
710
|
-
goto _test_eof11;
|
711
|
-
case 11:
|
712
|
-
if ( (*p) == 102 )
|
713
|
-
goto st12;
|
714
|
-
goto st0;
|
715
|
-
st12:
|
716
|
-
if ( ++p == pe )
|
717
|
-
goto _test_eof12;
|
718
|
-
case 12:
|
719
|
-
if ( (*p) == 105 )
|
720
|
-
goto st13;
|
721
|
-
goto st0;
|
722
|
-
st13:
|
723
|
-
if ( ++p == pe )
|
724
|
-
goto _test_eof13;
|
725
|
-
case 13:
|
726
|
-
if ( (*p) == 110 )
|
727
|
-
goto st14;
|
728
|
-
goto st0;
|
729
|
-
st14:
|
730
|
-
if ( ++p == pe )
|
731
|
-
goto _test_eof14;
|
732
|
-
case 14:
|
733
|
-
if ( (*p) == 105 )
|
734
|
-
goto st15;
|
735
|
-
goto st0;
|
736
|
-
st15:
|
737
|
-
if ( ++p == pe )
|
738
|
-
goto _test_eof15;
|
739
|
-
case 15:
|
740
|
-
if ( (*p) == 116 )
|
741
|
-
goto st16;
|
742
|
-
goto st0;
|
743
|
-
st16:
|
744
|
-
if ( ++p == pe )
|
745
|
-
goto _test_eof16;
|
746
|
-
case 16:
|
747
|
-
if ( (*p) == 121 )
|
748
|
-
goto tr25;
|
749
|
-
goto st0;
|
750
|
-
st17:
|
751
|
-
if ( ++p == pe )
|
752
|
-
goto _test_eof17;
|
753
|
-
case 17:
|
754
|
-
if ( (*p) == 97 )
|
755
|
-
goto st18;
|
756
|
-
goto st0;
|
757
|
-
st18:
|
758
|
-
if ( ++p == pe )
|
759
|
-
goto _test_eof18;
|
760
|
-
case 18:
|
761
|
-
if ( (*p) == 78 )
|
762
|
-
goto tr27;
|
763
|
-
goto st0;
|
764
|
-
st19:
|
765
|
-
if ( ++p == pe )
|
766
|
-
goto _test_eof19;
|
767
|
-
case 19:
|
768
|
-
if ( (*p) == 97 )
|
769
|
-
goto st20;
|
770
|
-
goto st0;
|
771
|
-
st20:
|
772
|
-
if ( ++p == pe )
|
773
|
-
goto _test_eof20;
|
774
|
-
case 20:
|
775
|
-
if ( (*p) == 108 )
|
776
|
-
goto st21;
|
777
|
-
goto st0;
|
778
|
-
st21:
|
779
|
-
if ( ++p == pe )
|
780
|
-
goto _test_eof21;
|
781
|
-
case 21:
|
782
|
-
if ( (*p) == 115 )
|
783
|
-
goto st22;
|
784
|
-
goto st0;
|
785
|
-
st22:
|
786
|
-
if ( ++p == pe )
|
787
|
-
goto _test_eof22;
|
788
|
-
case 22:
|
789
|
-
if ( (*p) == 101 )
|
790
|
-
goto tr31;
|
791
|
-
goto st0;
|
792
|
-
st23:
|
793
|
-
if ( ++p == pe )
|
794
|
-
goto _test_eof23;
|
795
|
-
case 23:
|
796
|
-
if ( (*p) == 117 )
|
797
|
-
goto st24;
|
798
|
-
goto st0;
|
799
|
-
st24:
|
800
|
-
if ( ++p == pe )
|
801
|
-
goto _test_eof24;
|
802
|
-
case 24:
|
803
|
-
if ( (*p) == 108 )
|
804
|
-
goto st25;
|
805
|
-
goto st0;
|
806
|
-
st25:
|
807
|
-
if ( ++p == pe )
|
808
|
-
goto _test_eof25;
|
809
|
-
case 25:
|
810
|
-
if ( (*p) == 108 )
|
811
|
-
goto tr34;
|
812
|
-
goto st0;
|
813
|
-
st26:
|
814
|
-
if ( ++p == pe )
|
815
|
-
goto _test_eof26;
|
816
|
-
case 26:
|
817
|
-
if ( (*p) == 114 )
|
818
|
-
goto st27;
|
819
|
-
goto st0;
|
820
|
-
st27:
|
821
|
-
if ( ++p == pe )
|
822
|
-
goto _test_eof27;
|
823
|
-
case 27:
|
824
|
-
if ( (*p) == 117 )
|
825
|
-
goto st28;
|
826
|
-
goto st0;
|
827
|
-
st28:
|
828
|
-
if ( ++p == pe )
|
829
|
-
goto _test_eof28;
|
830
|
-
case 28:
|
831
|
-
if ( (*p) == 101 )
|
832
|
-
goto tr37;
|
833
|
-
goto st0;
|
834
|
-
}
|
835
|
-
_test_eof1: cs = 1; goto _test_eof;
|
836
|
-
_test_eof29: cs = 29; goto _test_eof;
|
837
|
-
_test_eof2: cs = 2; goto _test_eof;
|
838
|
-
_test_eof3: cs = 3; goto _test_eof;
|
839
|
-
_test_eof4: cs = 4; goto _test_eof;
|
840
|
-
_test_eof5: cs = 5; goto _test_eof;
|
841
|
-
_test_eof6: cs = 6; goto _test_eof;
|
842
|
-
_test_eof7: cs = 7; goto _test_eof;
|
843
|
-
_test_eof8: cs = 8; goto _test_eof;
|
844
|
-
_test_eof9: cs = 9; goto _test_eof;
|
845
|
-
_test_eof10: cs = 10; goto _test_eof;
|
846
|
-
_test_eof11: cs = 11; goto _test_eof;
|
847
|
-
_test_eof12: cs = 12; goto _test_eof;
|
848
|
-
_test_eof13: cs = 13; goto _test_eof;
|
849
|
-
_test_eof14: cs = 14; goto _test_eof;
|
850
|
-
_test_eof15: cs = 15; goto _test_eof;
|
851
|
-
_test_eof16: cs = 16; goto _test_eof;
|
852
|
-
_test_eof17: cs = 17; goto _test_eof;
|
853
|
-
_test_eof18: cs = 18; goto _test_eof;
|
854
|
-
_test_eof19: cs = 19; goto _test_eof;
|
855
|
-
_test_eof20: cs = 20; goto _test_eof;
|
856
|
-
_test_eof21: cs = 21; goto _test_eof;
|
857
|
-
_test_eof22: cs = 22; goto _test_eof;
|
858
|
-
_test_eof23: cs = 23; goto _test_eof;
|
859
|
-
_test_eof24: cs = 24; goto _test_eof;
|
860
|
-
_test_eof25: cs = 25; goto _test_eof;
|
861
|
-
_test_eof26: cs = 26; goto _test_eof;
|
862
|
-
_test_eof27: cs = 27; goto _test_eof;
|
863
|
-
_test_eof28: cs = 28; goto _test_eof;
|
864
|
-
|
865
|
-
_test_eof: {}
|
866
|
-
_out: {}
|
867
|
-
}
|
868
|
-
|
869
|
-
#line 291 "parser.rl"
|
870
|
-
|
871
|
-
if (json->freeze) {
|
872
|
-
OBJ_FREEZE(*result);
|
825
|
+
|
826
|
+
return object;
|
827
|
+
}
|
828
|
+
|
829
|
+
static int match_i(VALUE regexp, VALUE klass, VALUE memo)
|
830
|
+
{
|
831
|
+
if (regexp == Qundef) return ST_STOP;
|
832
|
+
if (RTEST(rb_funcall(klass, i_json_creatable_p, 0)) &&
|
833
|
+
RTEST(rb_funcall(regexp, i_match, 1, rb_ary_entry(memo, 0)))) {
|
834
|
+
rb_ary_push(memo, klass);
|
835
|
+
return ST_STOP;
|
873
836
|
}
|
837
|
+
return ST_CONTINUE;
|
838
|
+
}
|
874
839
|
|
875
|
-
|
876
|
-
|
840
|
+
static inline VALUE json_decode_string(JSON_ParserState *state, JSON_ParserConfig *config, const char *start, const char *end, bool escaped, bool is_name)
|
841
|
+
{
|
842
|
+
VALUE string;
|
843
|
+
bool intern = is_name || config->freeze;
|
844
|
+
bool symbolize = is_name && config->symbolize_names;
|
845
|
+
if (escaped) {
|
846
|
+
string = json_string_unescape(state, start, end, is_name, intern, symbolize);
|
877
847
|
} else {
|
878
|
-
|
848
|
+
string = json_string_fastpath(state, start, end, is_name, intern, symbolize);
|
879
849
|
}
|
880
|
-
}
|
881
850
|
|
851
|
+
if (RB_UNLIKELY(config->create_additions && RTEST(config->match_string))) {
|
852
|
+
VALUE klass;
|
853
|
+
VALUE memo = rb_ary_new2(2);
|
854
|
+
rb_ary_push(memo, string);
|
855
|
+
rb_hash_foreach(config->match_string, match_i, memo);
|
856
|
+
klass = rb_ary_entry(memo, 1);
|
857
|
+
if (RTEST(klass)) {
|
858
|
+
string = rb_funcall(klass, i_json_create, 1, string);
|
859
|
+
}
|
860
|
+
}
|
882
861
|
|
883
|
-
|
884
|
-
|
885
|
-
enum {JSON_integer_first_final = 3};
|
886
|
-
enum {JSON_integer_error = 0};
|
862
|
+
return string;
|
863
|
+
}
|
887
864
|
|
888
|
-
|
865
|
+
#define PUSH(result) rvalue_stack_push(state->stack, result, &state->stack_handle, &state->stack)
|
866
|
+
|
867
|
+
static const bool string_scan[256] = {
|
868
|
+
// ASCII Control Characters
|
869
|
+
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
870
|
+
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
|
871
|
+
// ASCII Characters
|
872
|
+
0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // '"'
|
873
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
874
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
875
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, // '\\'
|
876
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
877
|
+
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
|
878
|
+
};
|
889
879
|
|
880
|
+
static inline VALUE json_parse_string(JSON_ParserState *state, JSON_ParserConfig *config, bool is_name)
|
881
|
+
{
|
882
|
+
state->cursor++;
|
883
|
+
const char *start = state->cursor;
|
884
|
+
bool escaped = false;
|
885
|
+
|
886
|
+
while (state->cursor < state->end) {
|
887
|
+
if (RB_UNLIKELY(string_scan[(unsigned char)*state->cursor])) {
|
888
|
+
switch (*state->cursor) {
|
889
|
+
case '"': {
|
890
|
+
VALUE string = json_decode_string(state, config, start, state->cursor, escaped, is_name);
|
891
|
+
state->cursor++;
|
892
|
+
return PUSH(string);
|
893
|
+
}
|
894
|
+
case '\\': {
|
895
|
+
state->cursor++;
|
896
|
+
escaped = true;
|
897
|
+
if ((unsigned char)*state->cursor < 0x20) {
|
898
|
+
raise_parse_error("invalid ASCII control character in string: %s", state->cursor);
|
899
|
+
}
|
900
|
+
break;
|
901
|
+
}
|
902
|
+
default:
|
903
|
+
raise_parse_error("invalid ASCII control character in string: %s", state->cursor);
|
904
|
+
break;
|
905
|
+
}
|
906
|
+
}
|
890
907
|
|
891
|
-
|
908
|
+
state->cursor++;
|
909
|
+
}
|
892
910
|
|
911
|
+
raise_parse_error("unexpected end of input, expected closing \"", state->cursor);
|
912
|
+
return Qfalse;
|
913
|
+
}
|
893
914
|
|
894
|
-
static
|
915
|
+
static VALUE json_parse_any(JSON_ParserState *state, JSON_ParserConfig *config)
|
895
916
|
{
|
896
|
-
|
897
|
-
|
898
|
-
|
899
|
-
#line 900 "parser.c"
|
900
|
-
{
|
901
|
-
cs = JSON_integer_start;
|
902
|
-
}
|
903
|
-
|
904
|
-
#line 318 "parser.rl"
|
905
|
-
json->memo = p;
|
906
|
-
|
907
|
-
#line 908 "parser.c"
|
908
|
-
{
|
909
|
-
if ( p == pe )
|
910
|
-
goto _test_eof;
|
911
|
-
switch ( cs )
|
912
|
-
{
|
913
|
-
case 1:
|
914
|
-
switch( (*p) ) {
|
915
|
-
case 45: goto st2;
|
916
|
-
case 48: goto st3;
|
917
|
-
}
|
918
|
-
if ( 49 <= (*p) && (*p) <= 57 )
|
919
|
-
goto st5;
|
920
|
-
goto st0;
|
921
|
-
st0:
|
922
|
-
cs = 0;
|
923
|
-
goto _out;
|
924
|
-
st2:
|
925
|
-
if ( ++p == pe )
|
926
|
-
goto _test_eof2;
|
927
|
-
case 2:
|
928
|
-
if ( (*p) == 48 )
|
929
|
-
goto st3;
|
930
|
-
if ( 49 <= (*p) && (*p) <= 57 )
|
931
|
-
goto st5;
|
932
|
-
goto st0;
|
933
|
-
st3:
|
934
|
-
if ( ++p == pe )
|
935
|
-
goto _test_eof3;
|
936
|
-
case 3:
|
937
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
938
|
-
goto st0;
|
939
|
-
goto tr4;
|
940
|
-
tr4:
|
941
|
-
#line 308 "parser.rl"
|
942
|
-
{ p--; {p++; cs = 4; goto _out;} }
|
943
|
-
goto st4;
|
944
|
-
st4:
|
945
|
-
if ( ++p == pe )
|
946
|
-
goto _test_eof4;
|
947
|
-
case 4:
|
948
|
-
#line 949 "parser.c"
|
949
|
-
goto st0;
|
950
|
-
st5:
|
951
|
-
if ( ++p == pe )
|
952
|
-
goto _test_eof5;
|
953
|
-
case 5:
|
954
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
955
|
-
goto st5;
|
956
|
-
goto tr4;
|
957
|
-
}
|
958
|
-
_test_eof2: cs = 2; goto _test_eof;
|
959
|
-
_test_eof3: cs = 3; goto _test_eof;
|
960
|
-
_test_eof4: cs = 4; goto _test_eof;
|
961
|
-
_test_eof5: cs = 5; goto _test_eof;
|
962
|
-
|
963
|
-
_test_eof: {}
|
964
|
-
_out: {}
|
965
|
-
}
|
966
|
-
|
967
|
-
#line 320 "parser.rl"
|
968
|
-
|
969
|
-
if (cs >= JSON_integer_first_final) {
|
970
|
-
long len = p - json->memo;
|
971
|
-
fbuffer_clear(json->fbuffer);
|
972
|
-
fbuffer_append(json->fbuffer, json->memo, len);
|
973
|
-
fbuffer_append_char(json->fbuffer, '\0');
|
974
|
-
*result = rb_cstr2inum(FBUFFER_PTR(json->fbuffer), 10);
|
975
|
-
return p + 1;
|
976
|
-
} else {
|
977
|
-
return NULL;
|
917
|
+
json_eat_whitespace(state);
|
918
|
+
if (state->cursor >= state->end) {
|
919
|
+
raise_parse_error("unexpected end of input", state->cursor);
|
978
920
|
}
|
979
|
-
}
|
980
|
-
|
981
921
|
|
982
|
-
|
983
|
-
|
984
|
-
|
985
|
-
|
986
|
-
|
987
|
-
|
922
|
+
switch (*state->cursor) {
|
923
|
+
case 'n':
|
924
|
+
if ((state->end - state->cursor >= 4) && (memcmp(state->cursor, "null", 4) == 0)) {
|
925
|
+
state->cursor += 4;
|
926
|
+
return PUSH(Qnil);
|
927
|
+
}
|
988
928
|
|
929
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
930
|
+
break;
|
931
|
+
case 't':
|
932
|
+
if ((state->end - state->cursor >= 4) && (memcmp(state->cursor, "true", 4) == 0)) {
|
933
|
+
state->cursor += 4;
|
934
|
+
return PUSH(Qtrue);
|
935
|
+
}
|
989
936
|
|
990
|
-
|
937
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
938
|
+
break;
|
939
|
+
case 'f':
|
940
|
+
// Note: memcmp with a small power of two compile to an integer comparison
|
941
|
+
if ((state->end - state->cursor >= 5) && (memcmp(state->cursor + 1, "alse", 4) == 0)) {
|
942
|
+
state->cursor += 5;
|
943
|
+
return PUSH(Qfalse);
|
944
|
+
}
|
991
945
|
|
946
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
947
|
+
break;
|
948
|
+
case 'N':
|
949
|
+
// Note: memcmp with a small power of two compile to an integer comparison
|
950
|
+
if (config->allow_nan && (state->end - state->cursor >= 3) && (memcmp(state->cursor + 1, "aN", 2) == 0)) {
|
951
|
+
state->cursor += 3;
|
952
|
+
return PUSH(CNaN);
|
953
|
+
}
|
992
954
|
|
993
|
-
|
994
|
-
|
995
|
-
|
996
|
-
|
997
|
-
|
998
|
-
|
999
|
-
{
|
1000
|
-
cs = JSON_float_start;
|
1001
|
-
}
|
1002
|
-
|
1003
|
-
#line 352 "parser.rl"
|
1004
|
-
json->memo = p;
|
1005
|
-
|
1006
|
-
#line 1007 "parser.c"
|
1007
|
-
{
|
1008
|
-
if ( p == pe )
|
1009
|
-
goto _test_eof;
|
1010
|
-
switch ( cs )
|
1011
|
-
{
|
1012
|
-
case 1:
|
1013
|
-
switch( (*p) ) {
|
1014
|
-
case 45: goto st2;
|
1015
|
-
case 48: goto st3;
|
1016
|
-
}
|
1017
|
-
if ( 49 <= (*p) && (*p) <= 57 )
|
1018
|
-
goto st7;
|
1019
|
-
goto st0;
|
1020
|
-
st0:
|
1021
|
-
cs = 0;
|
1022
|
-
goto _out;
|
1023
|
-
st2:
|
1024
|
-
if ( ++p == pe )
|
1025
|
-
goto _test_eof2;
|
1026
|
-
case 2:
|
1027
|
-
if ( (*p) == 48 )
|
1028
|
-
goto st3;
|
1029
|
-
if ( 49 <= (*p) && (*p) <= 57 )
|
1030
|
-
goto st7;
|
1031
|
-
goto st0;
|
1032
|
-
st3:
|
1033
|
-
if ( ++p == pe )
|
1034
|
-
goto _test_eof3;
|
1035
|
-
case 3:
|
1036
|
-
switch( (*p) ) {
|
1037
|
-
case 46: goto st4;
|
1038
|
-
case 69: goto st5;
|
1039
|
-
case 101: goto st5;
|
1040
|
-
}
|
1041
|
-
goto st0;
|
1042
|
-
st4:
|
1043
|
-
if ( ++p == pe )
|
1044
|
-
goto _test_eof4;
|
1045
|
-
case 4:
|
1046
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1047
|
-
goto st8;
|
1048
|
-
goto st0;
|
1049
|
-
st8:
|
1050
|
-
if ( ++p == pe )
|
1051
|
-
goto _test_eof8;
|
1052
|
-
case 8:
|
1053
|
-
switch( (*p) ) {
|
1054
|
-
case 69: goto st5;
|
1055
|
-
case 101: goto st5;
|
1056
|
-
}
|
1057
|
-
if ( (*p) > 46 ) {
|
1058
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1059
|
-
goto st8;
|
1060
|
-
} else if ( (*p) >= 45 )
|
1061
|
-
goto st0;
|
1062
|
-
goto tr9;
|
1063
|
-
tr9:
|
1064
|
-
#line 339 "parser.rl"
|
1065
|
-
{ p--; {p++; cs = 9; goto _out;} }
|
1066
|
-
goto st9;
|
1067
|
-
st9:
|
1068
|
-
if ( ++p == pe )
|
1069
|
-
goto _test_eof9;
|
1070
|
-
case 9:
|
1071
|
-
#line 1072 "parser.c"
|
1072
|
-
goto st0;
|
1073
|
-
st5:
|
1074
|
-
if ( ++p == pe )
|
1075
|
-
goto _test_eof5;
|
1076
|
-
case 5:
|
1077
|
-
switch( (*p) ) {
|
1078
|
-
case 43: goto st6;
|
1079
|
-
case 45: goto st6;
|
1080
|
-
}
|
1081
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1082
|
-
goto st10;
|
1083
|
-
goto st0;
|
1084
|
-
st6:
|
1085
|
-
if ( ++p == pe )
|
1086
|
-
goto _test_eof6;
|
1087
|
-
case 6:
|
1088
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1089
|
-
goto st10;
|
1090
|
-
goto st0;
|
1091
|
-
st10:
|
1092
|
-
if ( ++p == pe )
|
1093
|
-
goto _test_eof10;
|
1094
|
-
case 10:
|
1095
|
-
switch( (*p) ) {
|
1096
|
-
case 69: goto st0;
|
1097
|
-
case 101: goto st0;
|
1098
|
-
}
|
1099
|
-
if ( (*p) > 46 ) {
|
1100
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1101
|
-
goto st10;
|
1102
|
-
} else if ( (*p) >= 45 )
|
1103
|
-
goto st0;
|
1104
|
-
goto tr9;
|
1105
|
-
st7:
|
1106
|
-
if ( ++p == pe )
|
1107
|
-
goto _test_eof7;
|
1108
|
-
case 7:
|
1109
|
-
switch( (*p) ) {
|
1110
|
-
case 46: goto st4;
|
1111
|
-
case 69: goto st5;
|
1112
|
-
case 101: goto st5;
|
1113
|
-
}
|
1114
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1115
|
-
goto st7;
|
1116
|
-
goto st0;
|
1117
|
-
}
|
1118
|
-
_test_eof2: cs = 2; goto _test_eof;
|
1119
|
-
_test_eof3: cs = 3; goto _test_eof;
|
1120
|
-
_test_eof4: cs = 4; goto _test_eof;
|
1121
|
-
_test_eof8: cs = 8; goto _test_eof;
|
1122
|
-
_test_eof9: cs = 9; goto _test_eof;
|
1123
|
-
_test_eof5: cs = 5; goto _test_eof;
|
1124
|
-
_test_eof6: cs = 6; goto _test_eof;
|
1125
|
-
_test_eof10: cs = 10; goto _test_eof;
|
1126
|
-
_test_eof7: cs = 7; goto _test_eof;
|
1127
|
-
|
1128
|
-
_test_eof: {}
|
1129
|
-
_out: {}
|
1130
|
-
}
|
1131
|
-
|
1132
|
-
#line 354 "parser.rl"
|
1133
|
-
|
1134
|
-
if (cs >= JSON_float_first_final) {
|
1135
|
-
VALUE mod = Qnil;
|
1136
|
-
ID method_id = 0;
|
1137
|
-
if (rb_respond_to(json->decimal_class, i_try_convert)) {
|
1138
|
-
mod = json->decimal_class;
|
1139
|
-
method_id = i_try_convert;
|
1140
|
-
} else if (rb_respond_to(json->decimal_class, i_new)) {
|
1141
|
-
mod = json->decimal_class;
|
1142
|
-
method_id = i_new;
|
1143
|
-
} else if (RB_TYPE_P(json->decimal_class, T_CLASS)) {
|
1144
|
-
VALUE name = rb_class_name(json->decimal_class);
|
1145
|
-
const char *name_cstr = RSTRING_PTR(name);
|
1146
|
-
const char *last_colon = strrchr(name_cstr, ':');
|
1147
|
-
if (last_colon) {
|
1148
|
-
const char *mod_path_end = last_colon - 1;
|
1149
|
-
VALUE mod_path = rb_str_substr(name, 0, mod_path_end - name_cstr);
|
1150
|
-
mod = rb_path_to_class(mod_path);
|
1151
|
-
|
1152
|
-
const char *method_name_beg = last_colon + 1;
|
1153
|
-
long before_len = method_name_beg - name_cstr;
|
1154
|
-
long len = RSTRING_LEN(name) - before_len;
|
1155
|
-
VALUE method_name = rb_str_substr(name, before_len, len);
|
1156
|
-
method_id = SYM2ID(rb_str_intern(method_name));
|
1157
|
-
} else {
|
1158
|
-
mod = rb_mKernel;
|
1159
|
-
method_id = SYM2ID(rb_str_intern(name));
|
955
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
956
|
+
break;
|
957
|
+
case 'I':
|
958
|
+
if (config->allow_nan && (state->end - state->cursor >= 8) && (memcmp(state->cursor, "Infinity", 8) == 0)) {
|
959
|
+
state->cursor += 8;
|
960
|
+
return PUSH(CInfinity);
|
1160
961
|
}
|
1161
|
-
}
|
1162
962
|
|
1163
|
-
|
1164
|
-
|
1165
|
-
|
1166
|
-
|
963
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
964
|
+
break;
|
965
|
+
case '-':
|
966
|
+
// Note: memcmp with a small power of two compile to an integer comparison
|
967
|
+
if ((state->end - state->cursor >= 9) && (memcmp(state->cursor + 1, "Infinity", 8) == 0)) {
|
968
|
+
if (config->allow_nan) {
|
969
|
+
state->cursor += 9;
|
970
|
+
return PUSH(CMinusInfinity);
|
971
|
+
} else {
|
972
|
+
raise_parse_error("unexpected token at '%s'", state->cursor);
|
973
|
+
}
|
974
|
+
}
|
975
|
+
// Fallthrough
|
976
|
+
case '0': case '1': case '2': case '3': case '4': case '5': case '6': case '7': case '8': case '9': {
|
977
|
+
bool integer = true;
|
1167
978
|
|
1168
|
-
|
1169
|
-
|
1170
|
-
|
1171
|
-
} else {
|
1172
|
-
*result = DBL2NUM(rb_cstr_to_dbl(FBUFFER_PTR(json->fbuffer), 1));
|
1173
|
-
}
|
979
|
+
// /\A-?(0|[1-9]\d*)(\.\d+)?([Ee][-+]?\d+)?/
|
980
|
+
const char *start = state->cursor;
|
981
|
+
state->cursor++;
|
1174
982
|
|
1175
|
-
|
1176
|
-
|
1177
|
-
|
1178
|
-
}
|
1179
|
-
}
|
983
|
+
while ((state->cursor < state->end) && (*state->cursor >= '0') && (*state->cursor <= '9')) {
|
984
|
+
state->cursor++;
|
985
|
+
}
|
1180
986
|
|
987
|
+
long integer_length = state->cursor - start;
|
1181
988
|
|
989
|
+
if (RB_UNLIKELY(start[0] == '0' && integer_length > 1)) {
|
990
|
+
raise_parse_error("invalid number: %s", start);
|
991
|
+
} else if (RB_UNLIKELY(integer_length > 2 && start[0] == '-' && start[1] == '0')) {
|
992
|
+
raise_parse_error("invalid number: %s", start);
|
993
|
+
} else if (RB_UNLIKELY(integer_length == 1 && start[0] == '-')) {
|
994
|
+
raise_parse_error("invalid number: %s", start);
|
995
|
+
}
|
1182
996
|
|
1183
|
-
|
1184
|
-
|
1185
|
-
|
1186
|
-
enum {JSON_array_error = 0};
|
997
|
+
if ((state->cursor < state->end) && (*state->cursor == '.')) {
|
998
|
+
integer = false;
|
999
|
+
state->cursor++;
|
1187
1000
|
|
1188
|
-
|
1001
|
+
if (state->cursor == state->end || *state->cursor < '0' || *state->cursor > '9') {
|
1002
|
+
raise_parse_error("invalid number: %s", state->cursor);
|
1003
|
+
}
|
1189
1004
|
|
1005
|
+
while ((state->cursor < state->end) && (*state->cursor >= '0') && (*state->cursor <= '9')) {
|
1006
|
+
state->cursor++;
|
1007
|
+
}
|
1008
|
+
}
|
1190
1009
|
|
1191
|
-
|
1010
|
+
if ((state->cursor < state->end) && ((*state->cursor == 'e') || (*state->cursor == 'E'))) {
|
1011
|
+
integer = false;
|
1012
|
+
state->cursor++;
|
1013
|
+
if ((state->cursor < state->end) && ((*state->cursor == '+') || (*state->cursor == '-'))) {
|
1014
|
+
state->cursor++;
|
1015
|
+
}
|
1192
1016
|
|
1017
|
+
if (state->cursor == state->end || *state->cursor < '0' || *state->cursor > '9') {
|
1018
|
+
raise_parse_error("invalid number: %s", state->cursor);
|
1019
|
+
}
|
1193
1020
|
|
1194
|
-
|
1195
|
-
|
1196
|
-
|
1197
|
-
|
1021
|
+
while ((state->cursor < state->end) && (*state->cursor >= '0') && (*state->cursor <= '9')) {
|
1022
|
+
state->cursor++;
|
1023
|
+
}
|
1024
|
+
}
|
1198
1025
|
|
1199
|
-
|
1200
|
-
|
1201
|
-
}
|
1202
|
-
*result = NIL_P(array_class) ? rb_ary_new() : rb_class_new_instance(0, 0, array_class);
|
1203
|
-
|
1204
|
-
|
1205
|
-
#line 1206 "parser.c"
|
1206
|
-
{
|
1207
|
-
cs = JSON_array_start;
|
1208
|
-
}
|
1209
|
-
|
1210
|
-
#line 445 "parser.rl"
|
1211
|
-
|
1212
|
-
#line 1213 "parser.c"
|
1213
|
-
{
|
1214
|
-
if ( p == pe )
|
1215
|
-
goto _test_eof;
|
1216
|
-
switch ( cs )
|
1217
|
-
{
|
1218
|
-
case 1:
|
1219
|
-
if ( (*p) == 91 )
|
1220
|
-
goto st2;
|
1221
|
-
goto st0;
|
1222
|
-
st0:
|
1223
|
-
cs = 0;
|
1224
|
-
goto _out;
|
1225
|
-
st2:
|
1226
|
-
if ( ++p == pe )
|
1227
|
-
goto _test_eof2;
|
1228
|
-
case 2:
|
1229
|
-
switch( (*p) ) {
|
1230
|
-
case 13: goto st2;
|
1231
|
-
case 32: goto st2;
|
1232
|
-
case 34: goto tr2;
|
1233
|
-
case 45: goto tr2;
|
1234
|
-
case 47: goto st13;
|
1235
|
-
case 73: goto tr2;
|
1236
|
-
case 78: goto tr2;
|
1237
|
-
case 91: goto tr2;
|
1238
|
-
case 93: goto tr4;
|
1239
|
-
case 102: goto tr2;
|
1240
|
-
case 110: goto tr2;
|
1241
|
-
case 116: goto tr2;
|
1242
|
-
case 123: goto tr2;
|
1243
|
-
}
|
1244
|
-
if ( (*p) > 10 ) {
|
1245
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1246
|
-
goto tr2;
|
1247
|
-
} else if ( (*p) >= 9 )
|
1248
|
-
goto st2;
|
1249
|
-
goto st0;
|
1250
|
-
tr2:
|
1251
|
-
#line 409 "parser.rl"
|
1252
|
-
{
|
1253
|
-
VALUE v = Qnil;
|
1254
|
-
char *np = JSON_parse_value(json, p, pe, &v, current_nesting);
|
1255
|
-
if (np == NULL) {
|
1256
|
-
p--; {p++; cs = 3; goto _out;}
|
1257
|
-
} else {
|
1258
|
-
if (NIL_P(json->array_class)) {
|
1259
|
-
rb_ary_push(*result, v);
|
1260
|
-
} else {
|
1261
|
-
rb_funcall(*result, i_leftshift, 1, v);
|
1026
|
+
if (integer) {
|
1027
|
+
return PUSH(json_decode_integer(start, state->cursor));
|
1262
1028
|
}
|
1263
|
-
|
1029
|
+
return PUSH(json_decode_float(config, start, state->cursor));
|
1264
1030
|
}
|
1265
|
-
|
1266
|
-
|
1267
|
-
|
1268
|
-
|
1269
|
-
|
1270
|
-
case
|
1271
|
-
|
1272
|
-
|
1273
|
-
|
1274
|
-
|
1275
|
-
|
1276
|
-
|
1277
|
-
|
1278
|
-
|
1279
|
-
|
1280
|
-
|
1281
|
-
|
1282
|
-
|
1283
|
-
|
1284
|
-
|
1285
|
-
|
1286
|
-
switch( (*p) ) {
|
1287
|
-
case 13: goto st4;
|
1288
|
-
case 32: goto st4;
|
1289
|
-
case 34: goto tr2;
|
1290
|
-
case 45: goto tr2;
|
1291
|
-
case 47: goto st5;
|
1292
|
-
case 73: goto tr2;
|
1293
|
-
case 78: goto tr2;
|
1294
|
-
case 91: goto tr2;
|
1295
|
-
case 102: goto tr2;
|
1296
|
-
case 110: goto tr2;
|
1297
|
-
case 116: goto tr2;
|
1298
|
-
case 123: goto tr2;
|
1299
|
-
}
|
1300
|
-
if ( (*p) > 10 ) {
|
1301
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1302
|
-
goto tr2;
|
1303
|
-
} else if ( (*p) >= 9 )
|
1304
|
-
goto st4;
|
1305
|
-
goto st0;
|
1306
|
-
st5:
|
1307
|
-
if ( ++p == pe )
|
1308
|
-
goto _test_eof5;
|
1309
|
-
case 5:
|
1310
|
-
switch( (*p) ) {
|
1311
|
-
case 42: goto st6;
|
1312
|
-
case 47: goto st8;
|
1313
|
-
}
|
1314
|
-
goto st0;
|
1315
|
-
st6:
|
1316
|
-
if ( ++p == pe )
|
1317
|
-
goto _test_eof6;
|
1318
|
-
case 6:
|
1319
|
-
if ( (*p) == 42 )
|
1320
|
-
goto st7;
|
1321
|
-
goto st6;
|
1322
|
-
st7:
|
1323
|
-
if ( ++p == pe )
|
1324
|
-
goto _test_eof7;
|
1325
|
-
case 7:
|
1326
|
-
switch( (*p) ) {
|
1327
|
-
case 42: goto st7;
|
1328
|
-
case 47: goto st4;
|
1329
|
-
}
|
1330
|
-
goto st6;
|
1331
|
-
st8:
|
1332
|
-
if ( ++p == pe )
|
1333
|
-
goto _test_eof8;
|
1334
|
-
case 8:
|
1335
|
-
if ( (*p) == 10 )
|
1336
|
-
goto st4;
|
1337
|
-
goto st8;
|
1338
|
-
st9:
|
1339
|
-
if ( ++p == pe )
|
1340
|
-
goto _test_eof9;
|
1341
|
-
case 9:
|
1342
|
-
switch( (*p) ) {
|
1343
|
-
case 42: goto st10;
|
1344
|
-
case 47: goto st12;
|
1345
|
-
}
|
1346
|
-
goto st0;
|
1347
|
-
st10:
|
1348
|
-
if ( ++p == pe )
|
1349
|
-
goto _test_eof10;
|
1350
|
-
case 10:
|
1351
|
-
if ( (*p) == 42 )
|
1352
|
-
goto st11;
|
1353
|
-
goto st10;
|
1354
|
-
st11:
|
1355
|
-
if ( ++p == pe )
|
1356
|
-
goto _test_eof11;
|
1357
|
-
case 11:
|
1358
|
-
switch( (*p) ) {
|
1359
|
-
case 42: goto st11;
|
1360
|
-
case 47: goto st3;
|
1361
|
-
}
|
1362
|
-
goto st10;
|
1363
|
-
st12:
|
1364
|
-
if ( ++p == pe )
|
1365
|
-
goto _test_eof12;
|
1366
|
-
case 12:
|
1367
|
-
if ( (*p) == 10 )
|
1368
|
-
goto st3;
|
1369
|
-
goto st12;
|
1370
|
-
tr4:
|
1371
|
-
#line 424 "parser.rl"
|
1372
|
-
{ p--; {p++; cs = 17; goto _out;} }
|
1373
|
-
goto st17;
|
1374
|
-
st17:
|
1375
|
-
if ( ++p == pe )
|
1376
|
-
goto _test_eof17;
|
1377
|
-
case 17:
|
1378
|
-
#line 1379 "parser.c"
|
1379
|
-
goto st0;
|
1380
|
-
st13:
|
1381
|
-
if ( ++p == pe )
|
1382
|
-
goto _test_eof13;
|
1383
|
-
case 13:
|
1384
|
-
switch( (*p) ) {
|
1385
|
-
case 42: goto st14;
|
1386
|
-
case 47: goto st16;
|
1387
|
-
}
|
1388
|
-
goto st0;
|
1389
|
-
st14:
|
1390
|
-
if ( ++p == pe )
|
1391
|
-
goto _test_eof14;
|
1392
|
-
case 14:
|
1393
|
-
if ( (*p) == 42 )
|
1394
|
-
goto st15;
|
1395
|
-
goto st14;
|
1396
|
-
st15:
|
1397
|
-
if ( ++p == pe )
|
1398
|
-
goto _test_eof15;
|
1399
|
-
case 15:
|
1400
|
-
switch( (*p) ) {
|
1401
|
-
case 42: goto st15;
|
1402
|
-
case 47: goto st2;
|
1403
|
-
}
|
1404
|
-
goto st14;
|
1405
|
-
st16:
|
1406
|
-
if ( ++p == pe )
|
1407
|
-
goto _test_eof16;
|
1408
|
-
case 16:
|
1409
|
-
if ( (*p) == 10 )
|
1410
|
-
goto st2;
|
1411
|
-
goto st16;
|
1412
|
-
}
|
1413
|
-
_test_eof2: cs = 2; goto _test_eof;
|
1414
|
-
_test_eof3: cs = 3; goto _test_eof;
|
1415
|
-
_test_eof4: cs = 4; goto _test_eof;
|
1416
|
-
_test_eof5: cs = 5; goto _test_eof;
|
1417
|
-
_test_eof6: cs = 6; goto _test_eof;
|
1418
|
-
_test_eof7: cs = 7; goto _test_eof;
|
1419
|
-
_test_eof8: cs = 8; goto _test_eof;
|
1420
|
-
_test_eof9: cs = 9; goto _test_eof;
|
1421
|
-
_test_eof10: cs = 10; goto _test_eof;
|
1422
|
-
_test_eof11: cs = 11; goto _test_eof;
|
1423
|
-
_test_eof12: cs = 12; goto _test_eof;
|
1424
|
-
_test_eof17: cs = 17; goto _test_eof;
|
1425
|
-
_test_eof13: cs = 13; goto _test_eof;
|
1426
|
-
_test_eof14: cs = 14; goto _test_eof;
|
1427
|
-
_test_eof15: cs = 15; goto _test_eof;
|
1428
|
-
_test_eof16: cs = 16; goto _test_eof;
|
1429
|
-
|
1430
|
-
_test_eof: {}
|
1431
|
-
_out: {}
|
1432
|
-
}
|
1433
|
-
|
1434
|
-
#line 446 "parser.rl"
|
1435
|
-
|
1436
|
-
if(cs >= JSON_array_first_final) {
|
1437
|
-
return p + 1;
|
1438
|
-
} else {
|
1439
|
-
rb_enc_raise(EXC_ENCODING eParserError, "unexpected token at '%s'", p);
|
1440
|
-
return NULL;
|
1441
|
-
}
|
1442
|
-
}
|
1031
|
+
case '"': {
|
1032
|
+
// %r{\A"[^"\\\t\n\x00]*(?:\\[bfnrtu\\/"][^"\\]*)*"}
|
1033
|
+
return json_parse_string(state, config, false);
|
1034
|
+
break;
|
1035
|
+
}
|
1036
|
+
case '[': {
|
1037
|
+
state->cursor++;
|
1038
|
+
json_eat_whitespace(state);
|
1039
|
+
long stack_head = state->stack->head;
|
1040
|
+
|
1041
|
+
if ((state->cursor < state->end) && (*state->cursor == ']')) {
|
1042
|
+
state->cursor++;
|
1043
|
+
return PUSH(json_decode_array(state, config, 0));
|
1044
|
+
} else {
|
1045
|
+
state->current_nesting++;
|
1046
|
+
if (RB_UNLIKELY(config->max_nesting && (config->max_nesting < state->current_nesting))) {
|
1047
|
+
rb_raise(eNestingError, "nesting of %d is too deep", state->current_nesting);
|
1048
|
+
}
|
1049
|
+
state->in_array++;
|
1050
|
+
json_parse_any(state, config);
|
1051
|
+
}
|
1443
1052
|
|
1444
|
-
|
1445
|
-
|
1446
|
-
{
|
1447
|
-
VALUE result = Qnil;
|
1448
|
-
size_t bufferSize = stringEnd - string;
|
1449
|
-
char *p = string, *pe = string, *unescape, *bufferStart, *buffer;
|
1450
|
-
int unescape_len;
|
1451
|
-
char buf[4];
|
1053
|
+
while (true) {
|
1054
|
+
json_eat_whitespace(state);
|
1452
1055
|
|
1453
|
-
|
1454
|
-
|
1455
|
-
|
1456
|
-
|
1457
|
-
|
1458
|
-
|
1459
|
-
|
1460
|
-
|
1461
|
-
bufferStart = buffer = ALLOCA_N(char, bufferSize ? bufferSize : 1);
|
1462
|
-
# else
|
1463
|
-
bufferStart = buffer = ALLOCA_N(char, bufferSize);
|
1464
|
-
# endif
|
1465
|
-
}
|
1056
|
+
if (state->cursor < state->end) {
|
1057
|
+
if (*state->cursor == ']') {
|
1058
|
+
state->cursor++;
|
1059
|
+
long count = state->stack->head - stack_head;
|
1060
|
+
state->current_nesting--;
|
1061
|
+
state->in_array--;
|
1062
|
+
return PUSH(json_decode_array(state, config, count));
|
1063
|
+
}
|
1466
1064
|
|
1467
|
-
|
1468
|
-
|
1469
|
-
|
1470
|
-
|
1471
|
-
|
1472
|
-
|
1473
|
-
buffer += pe - p;
|
1474
|
-
}
|
1475
|
-
switch (*++pe) {
|
1476
|
-
case 'n':
|
1477
|
-
unescape = (char *) "\n";
|
1478
|
-
break;
|
1479
|
-
case 'r':
|
1480
|
-
unescape = (char *) "\r";
|
1481
|
-
break;
|
1482
|
-
case 't':
|
1483
|
-
unescape = (char *) "\t";
|
1484
|
-
break;
|
1485
|
-
case '"':
|
1486
|
-
unescape = (char *) "\"";
|
1487
|
-
break;
|
1488
|
-
case '\\':
|
1489
|
-
unescape = (char *) "\\";
|
1490
|
-
break;
|
1491
|
-
case 'b':
|
1492
|
-
unescape = (char *) "\b";
|
1493
|
-
break;
|
1494
|
-
case 'f':
|
1495
|
-
unescape = (char *) "\f";
|
1496
|
-
break;
|
1497
|
-
case 'u':
|
1498
|
-
if (pe > stringEnd - 4) {
|
1499
|
-
if (bufferSize > MAX_STACK_BUFFER_SIZE) {
|
1500
|
-
ruby_xfree(bufferStart);
|
1501
|
-
}
|
1502
|
-
rb_enc_raise(
|
1503
|
-
EXC_ENCODING eParserError,
|
1504
|
-
"incomplete unicode character escape sequence at '%s'", p
|
1505
|
-
);
|
1506
|
-
} else {
|
1507
|
-
UTF32 ch = unescape_unicode((unsigned char *) ++pe);
|
1508
|
-
pe += 3;
|
1509
|
-
if (UNI_SUR_HIGH_START == (ch & 0xFC00)) {
|
1510
|
-
pe++;
|
1511
|
-
if (pe > stringEnd - 6) {
|
1512
|
-
if (bufferSize > MAX_STACK_BUFFER_SIZE) {
|
1513
|
-
ruby_xfree(bufferStart);
|
1514
|
-
}
|
1515
|
-
rb_enc_raise(
|
1516
|
-
EXC_ENCODING eParserError,
|
1517
|
-
"incomplete surrogate pair at '%s'", p
|
1518
|
-
);
|
1519
|
-
}
|
1520
|
-
if (pe[0] == '\\' && pe[1] == 'u') {
|
1521
|
-
UTF32 sur = unescape_unicode((unsigned char *) pe + 2);
|
1522
|
-
ch = (((ch & 0x3F) << 10) | ((((ch >> 6) & 0xF) + 1) << 16)
|
1523
|
-
| (sur & 0x3FF));
|
1524
|
-
pe += 5;
|
1525
|
-
} else {
|
1526
|
-
unescape = (char *) "?";
|
1527
|
-
break;
|
1065
|
+
if (*state->cursor == ',') {
|
1066
|
+
state->cursor++;
|
1067
|
+
if (config->allow_trailing_comma) {
|
1068
|
+
json_eat_whitespace(state);
|
1069
|
+
if ((state->cursor < state->end) && (*state->cursor == ']')) {
|
1070
|
+
continue;
|
1528
1071
|
}
|
1529
1072
|
}
|
1530
|
-
|
1531
|
-
|
1073
|
+
json_parse_any(state, config);
|
1074
|
+
continue;
|
1532
1075
|
}
|
1533
|
-
|
1534
|
-
|
1535
|
-
|
1536
|
-
continue;
|
1076
|
+
}
|
1077
|
+
|
1078
|
+
raise_parse_error("expected ',' or ']' after array value", state->cursor);
|
1537
1079
|
}
|
1538
|
-
|
1539
|
-
buffer += unescape_len;
|
1540
|
-
p = ++pe;
|
1541
|
-
} else {
|
1542
|
-
pe++;
|
1080
|
+
break;
|
1543
1081
|
}
|
1544
|
-
|
1082
|
+
case '{': {
|
1083
|
+
state->cursor++;
|
1084
|
+
json_eat_whitespace(state);
|
1085
|
+
long stack_head = state->stack->head;
|
1086
|
+
|
1087
|
+
if ((state->cursor < state->end) && (*state->cursor == '}')) {
|
1088
|
+
state->cursor++;
|
1089
|
+
return PUSH(json_decode_object(state, config, 0));
|
1090
|
+
} else {
|
1091
|
+
state->current_nesting++;
|
1092
|
+
if (RB_UNLIKELY(config->max_nesting && (config->max_nesting < state->current_nesting))) {
|
1093
|
+
rb_raise(eNestingError, "nesting of %d is too deep", state->current_nesting);
|
1094
|
+
}
|
1545
1095
|
|
1546
|
-
|
1547
|
-
|
1548
|
-
|
1549
|
-
|
1096
|
+
if (*state->cursor != '"') {
|
1097
|
+
raise_parse_error("expected object key, got '%s", state->cursor);
|
1098
|
+
}
|
1099
|
+
json_parse_string(state, config, true);
|
1550
1100
|
|
1551
|
-
|
1552
|
-
|
1553
|
-
|
1554
|
-
|
1555
|
-
|
1556
|
-
}
|
1557
|
-
if (bufferSize > MAX_STACK_BUFFER_SIZE) {
|
1558
|
-
ruby_xfree(bufferStart);
|
1559
|
-
}
|
1560
|
-
# else
|
1561
|
-
result = rb_utf8_str_new(bufferStart, (long)(buffer - bufferStart));
|
1101
|
+
json_eat_whitespace(state);
|
1102
|
+
if ((state->cursor >= state->end) || (*state->cursor != ':')) {
|
1103
|
+
raise_parse_error("expected ':' after object key", state->cursor);
|
1104
|
+
}
|
1105
|
+
state->cursor++;
|
1562
1106
|
|
1563
|
-
|
1564
|
-
|
1565
|
-
}
|
1107
|
+
json_parse_any(state, config);
|
1108
|
+
}
|
1566
1109
|
|
1567
|
-
|
1568
|
-
|
1569
|
-
// Starting from MRI 2.8 it is preferable to freeze the string
|
1570
|
-
// before deduplication so that it can be interned directly
|
1571
|
-
// otherwise it would be duplicated first which is wasteful.
|
1572
|
-
result = rb_funcall(rb_str_freeze(result), i_uminus, 0);
|
1573
|
-
# elif STR_UMINUS_DEDUPE
|
1574
|
-
// MRI 2.5 and older do not deduplicate strings that are already
|
1575
|
-
// frozen.
|
1576
|
-
result = rb_funcall(result, i_uminus, 0);
|
1577
|
-
# else
|
1578
|
-
result = rb_str_freeze(result);
|
1579
|
-
# endif
|
1580
|
-
}
|
1581
|
-
# endif
|
1110
|
+
while (true) {
|
1111
|
+
json_eat_whitespace(state);
|
1582
1112
|
|
1583
|
-
|
1584
|
-
|
1585
|
-
|
1113
|
+
if (state->cursor < state->end) {
|
1114
|
+
if (*state->cursor == '}') {
|
1115
|
+
state->cursor++;
|
1116
|
+
state->current_nesting--;
|
1117
|
+
long count = state->stack->head - stack_head;
|
1118
|
+
return PUSH(json_decode_object(state, config, count));
|
1119
|
+
}
|
1586
1120
|
|
1587
|
-
|
1588
|
-
|
1121
|
+
if (*state->cursor == ',') {
|
1122
|
+
state->cursor++;
|
1123
|
+
json_eat_whitespace(state);
|
1589
1124
|
|
1125
|
+
if (config->allow_trailing_comma) {
|
1126
|
+
if ((state->cursor < state->end) && (*state->cursor == '}')) {
|
1127
|
+
continue;
|
1128
|
+
}
|
1129
|
+
}
|
1590
1130
|
|
1591
|
-
|
1592
|
-
|
1593
|
-
|
1594
|
-
|
1131
|
+
if (*state->cursor != '"') {
|
1132
|
+
raise_parse_error("expected object key, got: '%s'", state->cursor);
|
1133
|
+
}
|
1134
|
+
json_parse_string(state, config, true);
|
1595
1135
|
|
1596
|
-
|
1136
|
+
json_eat_whitespace(state);
|
1137
|
+
if ((state->cursor >= state->end) || (*state->cursor != ':')) {
|
1138
|
+
raise_parse_error("expected ':' after object key, got: '%s", state->cursor);
|
1139
|
+
}
|
1140
|
+
state->cursor++;
|
1597
1141
|
|
1142
|
+
json_parse_any(state, config);
|
1598
1143
|
|
1599
|
-
|
1144
|
+
continue;
|
1145
|
+
}
|
1146
|
+
}
|
1600
1147
|
|
1148
|
+
raise_parse_error("expected ',' or '}' after object value, got: '%s'", state->cursor);
|
1149
|
+
}
|
1150
|
+
break;
|
1151
|
+
}
|
1601
1152
|
|
1602
|
-
|
1603
|
-
|
1604
|
-
|
1605
|
-
if (regexp == Qundef) return ST_STOP;
|
1606
|
-
if (RTEST(rb_funcall(klass, i_json_creatable_p, 0)) &&
|
1607
|
-
RTEST(rb_funcall(regexp, i_match, 1, rb_ary_entry(memo, 0)))) {
|
1608
|
-
rb_ary_push(memo, klass);
|
1609
|
-
return ST_STOP;
|
1153
|
+
default:
|
1154
|
+
raise_parse_error("unexpected character: '%s'", state->cursor);
|
1155
|
+
break;
|
1610
1156
|
}
|
1611
|
-
|
1157
|
+
|
1158
|
+
raise_parse_error("unreacheable: '%s'", state->cursor);
|
1612
1159
|
}
|
1613
1160
|
|
1614
|
-
static
|
1161
|
+
static void json_ensure_eof(JSON_ParserState *state)
|
1615
1162
|
{
|
1616
|
-
|
1617
|
-
|
1618
|
-
|
1619
|
-
|
1620
|
-
#line 1621 "parser.c"
|
1621
|
-
{
|
1622
|
-
cs = JSON_string_start;
|
1623
|
-
}
|
1624
|
-
|
1625
|
-
#line 640 "parser.rl"
|
1626
|
-
json->memo = p;
|
1627
|
-
|
1628
|
-
#line 1629 "parser.c"
|
1629
|
-
{
|
1630
|
-
if ( p == pe )
|
1631
|
-
goto _test_eof;
|
1632
|
-
switch ( cs )
|
1633
|
-
{
|
1634
|
-
case 1:
|
1635
|
-
if ( (*p) == 34 )
|
1636
|
-
goto st2;
|
1637
|
-
goto st0;
|
1638
|
-
st0:
|
1639
|
-
cs = 0;
|
1640
|
-
goto _out;
|
1641
|
-
st2:
|
1642
|
-
if ( ++p == pe )
|
1643
|
-
goto _test_eof2;
|
1644
|
-
case 2:
|
1645
|
-
switch( (*p) ) {
|
1646
|
-
case 34: goto tr2;
|
1647
|
-
case 92: goto st3;
|
1648
|
-
}
|
1649
|
-
if ( 0 <= (signed char)(*(p)) && (*(p)) <= 31 )
|
1650
|
-
goto st0;
|
1651
|
-
goto st2;
|
1652
|
-
tr2:
|
1653
|
-
#line 607 "parser.rl"
|
1654
|
-
{
|
1655
|
-
*result = json_string_unescape(json->memo + 1, p, json->parsing_name || json-> freeze, json->parsing_name && json->symbolize_names);
|
1656
|
-
if (NIL_P(*result)) {
|
1657
|
-
p--;
|
1658
|
-
{p++; cs = 8; goto _out;}
|
1659
|
-
} else {
|
1660
|
-
{p = (( p + 1))-1;}
|
1661
|
-
}
|
1662
|
-
}
|
1663
|
-
#line 617 "parser.rl"
|
1664
|
-
{ p--; {p++; cs = 8; goto _out;} }
|
1665
|
-
goto st8;
|
1666
|
-
st8:
|
1667
|
-
if ( ++p == pe )
|
1668
|
-
goto _test_eof8;
|
1669
|
-
case 8:
|
1670
|
-
#line 1671 "parser.c"
|
1671
|
-
goto st0;
|
1672
|
-
st3:
|
1673
|
-
if ( ++p == pe )
|
1674
|
-
goto _test_eof3;
|
1675
|
-
case 3:
|
1676
|
-
if ( (*p) == 117 )
|
1677
|
-
goto st4;
|
1678
|
-
if ( 0 <= (signed char)(*(p)) && (*(p)) <= 31 )
|
1679
|
-
goto st0;
|
1680
|
-
goto st2;
|
1681
|
-
st4:
|
1682
|
-
if ( ++p == pe )
|
1683
|
-
goto _test_eof4;
|
1684
|
-
case 4:
|
1685
|
-
if ( (*p) < 65 ) {
|
1686
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1687
|
-
goto st5;
|
1688
|
-
} else if ( (*p) > 70 ) {
|
1689
|
-
if ( 97 <= (*p) && (*p) <= 102 )
|
1690
|
-
goto st5;
|
1691
|
-
} else
|
1692
|
-
goto st5;
|
1693
|
-
goto st0;
|
1694
|
-
st5:
|
1695
|
-
if ( ++p == pe )
|
1696
|
-
goto _test_eof5;
|
1697
|
-
case 5:
|
1698
|
-
if ( (*p) < 65 ) {
|
1699
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1700
|
-
goto st6;
|
1701
|
-
} else if ( (*p) > 70 ) {
|
1702
|
-
if ( 97 <= (*p) && (*p) <= 102 )
|
1703
|
-
goto st6;
|
1704
|
-
} else
|
1705
|
-
goto st6;
|
1706
|
-
goto st0;
|
1707
|
-
st6:
|
1708
|
-
if ( ++p == pe )
|
1709
|
-
goto _test_eof6;
|
1710
|
-
case 6:
|
1711
|
-
if ( (*p) < 65 ) {
|
1712
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1713
|
-
goto st7;
|
1714
|
-
} else if ( (*p) > 70 ) {
|
1715
|
-
if ( 97 <= (*p) && (*p) <= 102 )
|
1716
|
-
goto st7;
|
1717
|
-
} else
|
1718
|
-
goto st7;
|
1719
|
-
goto st0;
|
1720
|
-
st7:
|
1721
|
-
if ( ++p == pe )
|
1722
|
-
goto _test_eof7;
|
1723
|
-
case 7:
|
1724
|
-
if ( (*p) < 65 ) {
|
1725
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1726
|
-
goto st2;
|
1727
|
-
} else if ( (*p) > 70 ) {
|
1728
|
-
if ( 97 <= (*p) && (*p) <= 102 )
|
1729
|
-
goto st2;
|
1730
|
-
} else
|
1731
|
-
goto st2;
|
1732
|
-
goto st0;
|
1733
|
-
}
|
1734
|
-
_test_eof2: cs = 2; goto _test_eof;
|
1735
|
-
_test_eof8: cs = 8; goto _test_eof;
|
1736
|
-
_test_eof3: cs = 3; goto _test_eof;
|
1737
|
-
_test_eof4: cs = 4; goto _test_eof;
|
1738
|
-
_test_eof5: cs = 5; goto _test_eof;
|
1739
|
-
_test_eof6: cs = 6; goto _test_eof;
|
1740
|
-
_test_eof7: cs = 7; goto _test_eof;
|
1741
|
-
|
1742
|
-
_test_eof: {}
|
1743
|
-
_out: {}
|
1744
|
-
}
|
1745
|
-
|
1746
|
-
#line 642 "parser.rl"
|
1747
|
-
|
1748
|
-
if (json->create_additions && RTEST(match_string = json->match_string)) {
|
1749
|
-
VALUE klass;
|
1750
|
-
VALUE memo = rb_ary_new2(2);
|
1751
|
-
rb_ary_push(memo, *result);
|
1752
|
-
rb_hash_foreach(match_string, match_i, memo);
|
1753
|
-
klass = rb_ary_entry(memo, 1);
|
1754
|
-
if (RTEST(klass)) {
|
1755
|
-
*result = rb_funcall(klass, i_json_create, 1, *result);
|
1756
|
-
}
|
1757
|
-
}
|
1758
|
-
|
1759
|
-
if (cs >= JSON_string_first_final) {
|
1760
|
-
return p + 1;
|
1761
|
-
} else {
|
1762
|
-
return NULL;
|
1163
|
+
json_eat_whitespace(state);
|
1164
|
+
if (state->cursor != state->end) {
|
1165
|
+
raise_parse_error("unexpected token at end of stream '%s'", state->cursor);
|
1763
1166
|
}
|
1764
1167
|
}
|
1765
1168
|
|
@@ -1777,24 +1180,104 @@ case 7:
|
|
1777
1180
|
|
1778
1181
|
static VALUE convert_encoding(VALUE source)
|
1779
1182
|
{
|
1780
|
-
|
1781
|
-
|
1782
|
-
if (
|
1783
|
-
if (OBJ_FROZEN(source)) {
|
1784
|
-
source = rb_str_dup(source);
|
1785
|
-
}
|
1786
|
-
FORCE_UTF8(source);
|
1787
|
-
} else {
|
1788
|
-
source = rb_str_conv_enc(source, rb_enc_get(source), rb_utf8_encoding());
|
1789
|
-
}
|
1790
|
-
#endif
|
1183
|
+
int encindex = RB_ENCODING_GET(source);
|
1184
|
+
|
1185
|
+
if (RB_LIKELY(encindex == utf8_encindex)) {
|
1791
1186
|
return source;
|
1187
|
+
}
|
1188
|
+
|
1189
|
+
if (encindex == binary_encindex) {
|
1190
|
+
// For historical reasons, we silently reinterpret binary strings as UTF-8
|
1191
|
+
return rb_enc_associate_index(rb_str_dup(source), utf8_encindex);
|
1192
|
+
}
|
1193
|
+
|
1194
|
+
return rb_funcall(source, i_encode, 1, Encoding_UTF_8);
|
1195
|
+
}
|
1196
|
+
|
1197
|
+
static int parser_config_init_i(VALUE key, VALUE val, VALUE data)
|
1198
|
+
{
|
1199
|
+
JSON_ParserConfig *config = (JSON_ParserConfig *)data;
|
1200
|
+
|
1201
|
+
if (key == sym_max_nesting) { config->max_nesting = RTEST(val) ? FIX2INT(val) : 0; }
|
1202
|
+
else if (key == sym_allow_nan) { config->allow_nan = RTEST(val); }
|
1203
|
+
else if (key == sym_allow_trailing_comma) { config->allow_trailing_comma = RTEST(val); }
|
1204
|
+
else if (key == sym_symbolize_names) { config->symbolize_names = RTEST(val); }
|
1205
|
+
else if (key == sym_freeze) { config->freeze = RTEST(val); }
|
1206
|
+
else if (key == sym_create_id) { config->create_id = RTEST(val) ? val : Qfalse; }
|
1207
|
+
else if (key == sym_object_class) { config->object_class = RTEST(val) ? val : Qfalse; }
|
1208
|
+
else if (key == sym_array_class) { config->array_class = RTEST(val) ? val : Qfalse; }
|
1209
|
+
else if (key == sym_match_string) { config->match_string = RTEST(val) ? val : Qfalse; }
|
1210
|
+
else if (key == sym_decimal_class) {
|
1211
|
+
if (RTEST(val)) {
|
1212
|
+
if (rb_respond_to(val, i_try_convert)) {
|
1213
|
+
config->decimal_class = val;
|
1214
|
+
config->decimal_method_id = i_try_convert;
|
1215
|
+
} else if (rb_respond_to(val, i_new)) {
|
1216
|
+
config->decimal_class = val;
|
1217
|
+
config->decimal_method_id = i_new;
|
1218
|
+
} else if (RB_TYPE_P(val, T_CLASS)) {
|
1219
|
+
VALUE name = rb_class_name(val);
|
1220
|
+
const char *name_cstr = RSTRING_PTR(name);
|
1221
|
+
const char *last_colon = strrchr(name_cstr, ':');
|
1222
|
+
if (last_colon) {
|
1223
|
+
const char *mod_path_end = last_colon - 1;
|
1224
|
+
VALUE mod_path = rb_str_substr(name, 0, mod_path_end - name_cstr);
|
1225
|
+
config->decimal_class = rb_path_to_class(mod_path);
|
1226
|
+
|
1227
|
+
const char *method_name_beg = last_colon + 1;
|
1228
|
+
long before_len = method_name_beg - name_cstr;
|
1229
|
+
long len = RSTRING_LEN(name) - before_len;
|
1230
|
+
VALUE method_name = rb_str_substr(name, before_len, len);
|
1231
|
+
config->decimal_method_id = SYM2ID(rb_str_intern(method_name));
|
1232
|
+
} else {
|
1233
|
+
config->decimal_class = rb_mKernel;
|
1234
|
+
config->decimal_method_id = SYM2ID(rb_str_intern(name));
|
1235
|
+
}
|
1236
|
+
}
|
1237
|
+
}
|
1238
|
+
}
|
1239
|
+
else if (key == sym_create_additions) {
|
1240
|
+
if (NIL_P(val)) {
|
1241
|
+
config->create_additions = true;
|
1242
|
+
config->deprecated_create_additions = true;
|
1243
|
+
} else {
|
1244
|
+
config->create_additions = RTEST(val);
|
1245
|
+
config->deprecated_create_additions = false;
|
1246
|
+
}
|
1247
|
+
}
|
1248
|
+
|
1249
|
+
return ST_CONTINUE;
|
1250
|
+
}
|
1251
|
+
|
1252
|
+
static void parser_config_init(JSON_ParserConfig *config, VALUE opts)
|
1253
|
+
{
|
1254
|
+
config->max_nesting = 100;
|
1255
|
+
|
1256
|
+
if (!NIL_P(opts)) {
|
1257
|
+
Check_Type(opts, T_HASH);
|
1258
|
+
if (RHASH_SIZE(opts) > 0) {
|
1259
|
+
// We assume in most cases few keys are set so it's faster to go over
|
1260
|
+
// the provided keys than to check all possible keys.
|
1261
|
+
rb_hash_foreach(opts, parser_config_init_i, (VALUE)config);
|
1262
|
+
|
1263
|
+
if (config->symbolize_names && config->create_additions) {
|
1264
|
+
rb_raise(rb_eArgError,
|
1265
|
+
"options :symbolize_names and :create_additions cannot be "
|
1266
|
+
" used in conjunction");
|
1267
|
+
}
|
1268
|
+
|
1269
|
+
if (config->create_additions && !config->create_id) {
|
1270
|
+
config->create_id = rb_funcall(mJSON, i_create_id, 0);
|
1271
|
+
}
|
1272
|
+
}
|
1273
|
+
|
1274
|
+
}
|
1792
1275
|
}
|
1793
1276
|
|
1794
1277
|
/*
|
1795
|
-
* call-seq: new(
|
1278
|
+
* call-seq: new(opts => {})
|
1796
1279
|
*
|
1797
|
-
* Creates a new JSON::Ext::
|
1280
|
+
* Creates a new JSON::Ext::ParserConfig instance.
|
1798
1281
|
*
|
1799
1282
|
* It will be configured by the _opts_ hash. _opts_ can have the following
|
1800
1283
|
* keys:
|
@@ -1813,340 +1296,122 @@ static VALUE convert_encoding(VALUE source)
|
|
1813
1296
|
* * *create_additions*: If set to false, the Parser doesn't create
|
1814
1297
|
* additions even if a matching class and create_id was found. This option
|
1815
1298
|
* defaults to false.
|
1816
|
-
* * *object_class*: Defaults to Hash
|
1817
|
-
*
|
1299
|
+
* * *object_class*: Defaults to Hash. If another type is provided, it will be used
|
1300
|
+
* instead of Hash to represent JSON objects. The type must respond to
|
1301
|
+
* +new+ without arguments, and return an object that responds to +[]=+.
|
1302
|
+
* * *array_class*: Defaults to Array. If another type is provided, it will be used
|
1303
|
+
* instead of Array to represent JSON arrays. The type must respond to
|
1304
|
+
* +new+ without arguments, and return an object that responds to +<<+.
|
1305
|
+
* * *decimal_class*: Specifies which class to use instead of the default
|
1306
|
+
* (Float) when parsing decimal numbers. This class must accept a single
|
1307
|
+
* string argument in its constructor.
|
1818
1308
|
*/
|
1819
|
-
static VALUE
|
1309
|
+
static VALUE cParserConfig_initialize(VALUE self, VALUE opts)
|
1820
1310
|
{
|
1821
|
-
|
1822
|
-
|
1311
|
+
GET_PARSER_CONFIG;
|
1312
|
+
|
1313
|
+
parser_config_init(config, opts);
|
1314
|
+
|
1315
|
+
RB_OBJ_WRITTEN(self, Qundef, config->create_id);
|
1316
|
+
RB_OBJ_WRITTEN(self, Qundef, config->object_class);
|
1317
|
+
RB_OBJ_WRITTEN(self, Qundef, config->array_class);
|
1318
|
+
RB_OBJ_WRITTEN(self, Qundef, config->decimal_class);
|
1319
|
+
RB_OBJ_WRITTEN(self, Qundef, config->match_string);
|
1823
1320
|
|
1824
|
-
if (json->Vsource) {
|
1825
|
-
rb_raise(rb_eTypeError, "already initialized instance");
|
1826
|
-
}
|
1827
|
-
rb_scan_args(argc, argv, "1:", &source, &opts);
|
1828
|
-
if (!NIL_P(opts)) {
|
1829
|
-
VALUE tmp = ID2SYM(i_max_nesting);
|
1830
|
-
if (option_given_p(opts, tmp)) {
|
1831
|
-
VALUE max_nesting = rb_hash_aref(opts, tmp);
|
1832
|
-
if (RTEST(max_nesting)) {
|
1833
|
-
Check_Type(max_nesting, T_FIXNUM);
|
1834
|
-
json->max_nesting = FIX2INT(max_nesting);
|
1835
|
-
} else {
|
1836
|
-
json->max_nesting = 0;
|
1837
|
-
}
|
1838
|
-
} else {
|
1839
|
-
json->max_nesting = 100;
|
1840
|
-
}
|
1841
|
-
tmp = ID2SYM(i_allow_nan);
|
1842
|
-
if (option_given_p(opts, tmp)) {
|
1843
|
-
json->allow_nan = RTEST(rb_hash_aref(opts, tmp)) ? 1 : 0;
|
1844
|
-
} else {
|
1845
|
-
json->allow_nan = 0;
|
1846
|
-
}
|
1847
|
-
tmp = ID2SYM(i_symbolize_names);
|
1848
|
-
if (option_given_p(opts, tmp)) {
|
1849
|
-
json->symbolize_names = RTEST(rb_hash_aref(opts, tmp)) ? 1 : 0;
|
1850
|
-
} else {
|
1851
|
-
json->symbolize_names = 0;
|
1852
|
-
}
|
1853
|
-
tmp = ID2SYM(i_freeze);
|
1854
|
-
if (option_given_p(opts, tmp)) {
|
1855
|
-
json->freeze = RTEST(rb_hash_aref(opts, tmp)) ? 1 : 0;
|
1856
|
-
} else {
|
1857
|
-
json->freeze = 0;
|
1858
|
-
}
|
1859
|
-
tmp = ID2SYM(i_create_additions);
|
1860
|
-
if (option_given_p(opts, tmp)) {
|
1861
|
-
json->create_additions = RTEST(rb_hash_aref(opts, tmp));
|
1862
|
-
} else {
|
1863
|
-
json->create_additions = 0;
|
1864
|
-
}
|
1865
|
-
if (json->symbolize_names && json->create_additions) {
|
1866
|
-
rb_raise(rb_eArgError,
|
1867
|
-
"options :symbolize_names and :create_additions cannot be "
|
1868
|
-
" used in conjunction");
|
1869
|
-
}
|
1870
|
-
tmp = ID2SYM(i_create_id);
|
1871
|
-
if (option_given_p(opts, tmp)) {
|
1872
|
-
json->create_id = rb_hash_aref(opts, tmp);
|
1873
|
-
} else {
|
1874
|
-
json->create_id = rb_funcall(mJSON, i_create_id, 0);
|
1875
|
-
}
|
1876
|
-
tmp = ID2SYM(i_object_class);
|
1877
|
-
if (option_given_p(opts, tmp)) {
|
1878
|
-
json->object_class = rb_hash_aref(opts, tmp);
|
1879
|
-
} else {
|
1880
|
-
json->object_class = Qnil;
|
1881
|
-
}
|
1882
|
-
tmp = ID2SYM(i_array_class);
|
1883
|
-
if (option_given_p(opts, tmp)) {
|
1884
|
-
json->array_class = rb_hash_aref(opts, tmp);
|
1885
|
-
} else {
|
1886
|
-
json->array_class = Qnil;
|
1887
|
-
}
|
1888
|
-
tmp = ID2SYM(i_decimal_class);
|
1889
|
-
if (option_given_p(opts, tmp)) {
|
1890
|
-
json->decimal_class = rb_hash_aref(opts, tmp);
|
1891
|
-
} else {
|
1892
|
-
json->decimal_class = Qnil;
|
1893
|
-
}
|
1894
|
-
tmp = ID2SYM(i_match_string);
|
1895
|
-
if (option_given_p(opts, tmp)) {
|
1896
|
-
VALUE match_string = rb_hash_aref(opts, tmp);
|
1897
|
-
json->match_string = RTEST(match_string) ? match_string : Qnil;
|
1898
|
-
} else {
|
1899
|
-
json->match_string = Qnil;
|
1900
|
-
}
|
1901
|
-
} else {
|
1902
|
-
json->max_nesting = 100;
|
1903
|
-
json->allow_nan = 0;
|
1904
|
-
json->create_additions = 0;
|
1905
|
-
json->create_id = Qnil;
|
1906
|
-
json->object_class = Qnil;
|
1907
|
-
json->array_class = Qnil;
|
1908
|
-
json->decimal_class = Qnil;
|
1909
|
-
}
|
1910
|
-
source = convert_encoding(StringValue(source));
|
1911
|
-
StringValue(source);
|
1912
|
-
json->len = RSTRING_LEN(source);
|
1913
|
-
json->source = RSTRING_PTR(source);;
|
1914
|
-
json->Vsource = source;
|
1915
1321
|
return self;
|
1916
1322
|
}
|
1917
1323
|
|
1324
|
+
static VALUE cParser_parse(JSON_ParserConfig *config, VALUE Vsource)
|
1325
|
+
{
|
1326
|
+
Vsource = convert_encoding(StringValue(Vsource));
|
1327
|
+
StringValue(Vsource);
|
1328
|
+
|
1329
|
+
VALUE rvalue_stack_buffer[RVALUE_STACK_INITIAL_CAPA];
|
1330
|
+
rvalue_stack stack = {
|
1331
|
+
.type = RVALUE_STACK_STACK_ALLOCATED,
|
1332
|
+
.ptr = rvalue_stack_buffer,
|
1333
|
+
.capa = RVALUE_STACK_INITIAL_CAPA,
|
1334
|
+
};
|
1918
1335
|
|
1919
|
-
|
1920
|
-
|
1921
|
-
|
1922
|
-
|
1336
|
+
JSON_ParserState _state = {
|
1337
|
+
.cursor = RSTRING_PTR(Vsource),
|
1338
|
+
.end = RSTRING_END(Vsource),
|
1339
|
+
.stack = &stack,
|
1340
|
+
};
|
1341
|
+
JSON_ParserState *state = &_state;
|
1923
1342
|
|
1924
|
-
|
1343
|
+
VALUE result = json_parse_any(state, config);
|
1925
1344
|
|
1345
|
+
// This may be skipped in case of exception, but
|
1346
|
+
// it won't cause a leak.
|
1347
|
+
rvalue_stack_eagerly_release(state->stack_handle);
|
1926
1348
|
|
1927
|
-
|
1349
|
+
json_ensure_eof(state);
|
1928
1350
|
|
1351
|
+
return result;
|
1352
|
+
}
|
1929
1353
|
|
1930
1354
|
/*
|
1931
|
-
* call-seq: parse()
|
1355
|
+
* call-seq: parse(source)
|
1932
1356
|
*
|
1933
1357
|
* Parses the current JSON text _source_ and returns the complete data
|
1934
1358
|
* structure as a result.
|
1935
1359
|
* It raises JSON::ParserError if it fails to parse.
|
1936
1360
|
*/
|
1937
|
-
static VALUE
|
1361
|
+
static VALUE cParserConfig_parse(VALUE self, VALUE Vsource)
|
1938
1362
|
{
|
1939
|
-
|
1940
|
-
|
1941
|
-
|
1942
|
-
|
1943
|
-
|
1944
|
-
|
1945
|
-
|
1946
|
-
|
1947
|
-
|
1948
|
-
|
1949
|
-
|
1950
|
-
|
1951
|
-
|
1952
|
-
|
1953
|
-
|
1954
|
-
#line 1955 "parser.c"
|
1955
|
-
{
|
1956
|
-
if ( p == pe )
|
1957
|
-
goto _test_eof;
|
1958
|
-
switch ( cs )
|
1959
|
-
{
|
1960
|
-
st1:
|
1961
|
-
if ( ++p == pe )
|
1962
|
-
goto _test_eof1;
|
1963
|
-
case 1:
|
1964
|
-
switch( (*p) ) {
|
1965
|
-
case 13: goto st1;
|
1966
|
-
case 32: goto st1;
|
1967
|
-
case 34: goto tr2;
|
1968
|
-
case 45: goto tr2;
|
1969
|
-
case 47: goto st6;
|
1970
|
-
case 73: goto tr2;
|
1971
|
-
case 78: goto tr2;
|
1972
|
-
case 91: goto tr2;
|
1973
|
-
case 102: goto tr2;
|
1974
|
-
case 110: goto tr2;
|
1975
|
-
case 116: goto tr2;
|
1976
|
-
case 123: goto tr2;
|
1977
|
-
}
|
1978
|
-
if ( (*p) > 10 ) {
|
1979
|
-
if ( 48 <= (*p) && (*p) <= 57 )
|
1980
|
-
goto tr2;
|
1981
|
-
} else if ( (*p) >= 9 )
|
1982
|
-
goto st1;
|
1983
|
-
goto st0;
|
1984
|
-
st0:
|
1985
|
-
cs = 0;
|
1986
|
-
goto _out;
|
1987
|
-
tr2:
|
1988
|
-
#line 820 "parser.rl"
|
1989
|
-
{
|
1990
|
-
char *np = JSON_parse_value(json, p, pe, &result, 0);
|
1991
|
-
if (np == NULL) { p--; {p++; cs = 10; goto _out;} } else {p = (( np))-1;}
|
1992
|
-
}
|
1993
|
-
goto st10;
|
1994
|
-
st10:
|
1995
|
-
if ( ++p == pe )
|
1996
|
-
goto _test_eof10;
|
1997
|
-
case 10:
|
1998
|
-
#line 1999 "parser.c"
|
1999
|
-
switch( (*p) ) {
|
2000
|
-
case 13: goto st10;
|
2001
|
-
case 32: goto st10;
|
2002
|
-
case 47: goto st2;
|
2003
|
-
}
|
2004
|
-
if ( 9 <= (*p) && (*p) <= 10 )
|
2005
|
-
goto st10;
|
2006
|
-
goto st0;
|
2007
|
-
st2:
|
2008
|
-
if ( ++p == pe )
|
2009
|
-
goto _test_eof2;
|
2010
|
-
case 2:
|
2011
|
-
switch( (*p) ) {
|
2012
|
-
case 42: goto st3;
|
2013
|
-
case 47: goto st5;
|
2014
|
-
}
|
2015
|
-
goto st0;
|
2016
|
-
st3:
|
2017
|
-
if ( ++p == pe )
|
2018
|
-
goto _test_eof3;
|
2019
|
-
case 3:
|
2020
|
-
if ( (*p) == 42 )
|
2021
|
-
goto st4;
|
2022
|
-
goto st3;
|
2023
|
-
st4:
|
2024
|
-
if ( ++p == pe )
|
2025
|
-
goto _test_eof4;
|
2026
|
-
case 4:
|
2027
|
-
switch( (*p) ) {
|
2028
|
-
case 42: goto st4;
|
2029
|
-
case 47: goto st10;
|
2030
|
-
}
|
2031
|
-
goto st3;
|
2032
|
-
st5:
|
2033
|
-
if ( ++p == pe )
|
2034
|
-
goto _test_eof5;
|
2035
|
-
case 5:
|
2036
|
-
if ( (*p) == 10 )
|
2037
|
-
goto st10;
|
2038
|
-
goto st5;
|
2039
|
-
st6:
|
2040
|
-
if ( ++p == pe )
|
2041
|
-
goto _test_eof6;
|
2042
|
-
case 6:
|
2043
|
-
switch( (*p) ) {
|
2044
|
-
case 42: goto st7;
|
2045
|
-
case 47: goto st9;
|
2046
|
-
}
|
2047
|
-
goto st0;
|
2048
|
-
st7:
|
2049
|
-
if ( ++p == pe )
|
2050
|
-
goto _test_eof7;
|
2051
|
-
case 7:
|
2052
|
-
if ( (*p) == 42 )
|
2053
|
-
goto st8;
|
2054
|
-
goto st7;
|
2055
|
-
st8:
|
2056
|
-
if ( ++p == pe )
|
2057
|
-
goto _test_eof8;
|
2058
|
-
case 8:
|
2059
|
-
switch( (*p) ) {
|
2060
|
-
case 42: goto st8;
|
2061
|
-
case 47: goto st1;
|
2062
|
-
}
|
2063
|
-
goto st7;
|
2064
|
-
st9:
|
2065
|
-
if ( ++p == pe )
|
2066
|
-
goto _test_eof9;
|
2067
|
-
case 9:
|
2068
|
-
if ( (*p) == 10 )
|
2069
|
-
goto st1;
|
2070
|
-
goto st9;
|
2071
|
-
}
|
2072
|
-
_test_eof1: cs = 1; goto _test_eof;
|
2073
|
-
_test_eof10: cs = 10; goto _test_eof;
|
2074
|
-
_test_eof2: cs = 2; goto _test_eof;
|
2075
|
-
_test_eof3: cs = 3; goto _test_eof;
|
2076
|
-
_test_eof4: cs = 4; goto _test_eof;
|
2077
|
-
_test_eof5: cs = 5; goto _test_eof;
|
2078
|
-
_test_eof6: cs = 6; goto _test_eof;
|
2079
|
-
_test_eof7: cs = 7; goto _test_eof;
|
2080
|
-
_test_eof8: cs = 8; goto _test_eof;
|
2081
|
-
_test_eof9: cs = 9; goto _test_eof;
|
2082
|
-
|
2083
|
-
_test_eof: {}
|
2084
|
-
_out: {}
|
2085
|
-
}
|
2086
|
-
|
2087
|
-
#line 848 "parser.rl"
|
2088
|
-
|
2089
|
-
if (cs >= JSON_first_final && p == pe) {
|
2090
|
-
return result;
|
2091
|
-
} else {
|
2092
|
-
rb_enc_raise(EXC_ENCODING eParserError, "unexpected token at '%s'", p);
|
2093
|
-
return Qnil;
|
2094
|
-
}
|
1363
|
+
GET_PARSER_CONFIG;
|
1364
|
+
return cParser_parse(config, Vsource);
|
1365
|
+
}
|
1366
|
+
|
1367
|
+
static VALUE cParser_m_parse(VALUE klass, VALUE Vsource, VALUE opts)
|
1368
|
+
{
|
1369
|
+
Vsource = convert_encoding(StringValue(Vsource));
|
1370
|
+
StringValue(Vsource);
|
1371
|
+
|
1372
|
+
JSON_ParserConfig _config = {0};
|
1373
|
+
JSON_ParserConfig *config = &_config;
|
1374
|
+
parser_config_init(config, opts);
|
1375
|
+
|
1376
|
+
return cParser_parse(config, Vsource);
|
2095
1377
|
}
|
2096
1378
|
|
2097
|
-
static void
|
1379
|
+
static void JSON_ParserConfig_mark(void *ptr)
|
2098
1380
|
{
|
2099
|
-
|
2100
|
-
|
2101
|
-
|
2102
|
-
|
2103
|
-
|
2104
|
-
|
2105
|
-
rb_gc_mark_maybe(json->match_string);
|
1381
|
+
JSON_ParserConfig *config = ptr;
|
1382
|
+
rb_gc_mark(config->create_id);
|
1383
|
+
rb_gc_mark(config->object_class);
|
1384
|
+
rb_gc_mark(config->array_class);
|
1385
|
+
rb_gc_mark(config->decimal_class);
|
1386
|
+
rb_gc_mark(config->match_string);
|
2106
1387
|
}
|
2107
1388
|
|
2108
|
-
static void
|
1389
|
+
static void JSON_ParserConfig_free(void *ptr)
|
2109
1390
|
{
|
2110
|
-
|
2111
|
-
|
2112
|
-
ruby_xfree(json);
|
1391
|
+
JSON_ParserConfig *config = ptr;
|
1392
|
+
ruby_xfree(config);
|
2113
1393
|
}
|
2114
1394
|
|
2115
|
-
static size_t
|
1395
|
+
static size_t JSON_ParserConfig_memsize(const void *ptr)
|
2116
1396
|
{
|
2117
|
-
|
2118
|
-
return sizeof(*json) + FBUFFER_CAPA(json->fbuffer);
|
1397
|
+
return sizeof(JSON_ParserConfig);
|
2119
1398
|
}
|
2120
1399
|
|
2121
|
-
|
2122
|
-
|
2123
|
-
|
2124
|
-
|
2125
|
-
|
1400
|
+
static const rb_data_type_t JSON_ParserConfig_type = {
|
1401
|
+
"JSON::Ext::Parser/ParserConfig",
|
1402
|
+
{
|
1403
|
+
JSON_ParserConfig_mark,
|
1404
|
+
JSON_ParserConfig_free,
|
1405
|
+
JSON_ParserConfig_memsize,
|
1406
|
+
},
|
2126
1407
|
0, 0,
|
2127
|
-
RUBY_TYPED_FREE_IMMEDIATELY,
|
2128
|
-
#endif
|
1408
|
+
RUBY_TYPED_FREE_IMMEDIATELY | RUBY_TYPED_WB_PROTECTED,
|
2129
1409
|
};
|
2130
|
-
#endif
|
2131
1410
|
|
2132
1411
|
static VALUE cJSON_parser_s_allocate(VALUE klass)
|
2133
1412
|
{
|
2134
|
-
|
2135
|
-
|
2136
|
-
json->fbuffer = fbuffer_alloc(0);
|
2137
|
-
return obj;
|
2138
|
-
}
|
2139
|
-
|
2140
|
-
/*
|
2141
|
-
* call-seq: source()
|
2142
|
-
*
|
2143
|
-
* Returns a copy of the current _source_ string, that was used to construct
|
2144
|
-
* this Parser.
|
2145
|
-
*/
|
2146
|
-
static VALUE cParser_source(VALUE self)
|
2147
|
-
{
|
2148
|
-
GET_PARSER;
|
2149
|
-
return rb_str_dup(json->Vsource);
|
1413
|
+
JSON_ParserConfig *config;
|
1414
|
+
return TypedData_Make_Struct(klass, JSON_ParserConfig, &JSON_ParserConfig_type, config);
|
2150
1415
|
}
|
2151
1416
|
|
2152
1417
|
void Init_parser(void)
|
@@ -2158,16 +1423,16 @@ void Init_parser(void)
|
|
2158
1423
|
#undef rb_intern
|
2159
1424
|
rb_require("json/common");
|
2160
1425
|
mJSON = rb_define_module("JSON");
|
2161
|
-
mExt = rb_define_module_under(mJSON, "Ext");
|
2162
|
-
|
2163
|
-
eParserError = rb_path2class("JSON::ParserError");
|
1426
|
+
VALUE mExt = rb_define_module_under(mJSON, "Ext");
|
1427
|
+
VALUE cParserConfig = rb_define_class_under(mExt, "ParserConfig", rb_cObject);
|
2164
1428
|
eNestingError = rb_path2class("JSON::NestingError");
|
2165
|
-
rb_gc_register_mark_object(eParserError);
|
2166
1429
|
rb_gc_register_mark_object(eNestingError);
|
2167
|
-
rb_define_alloc_func(
|
2168
|
-
rb_define_method(
|
2169
|
-
rb_define_method(
|
2170
|
-
|
1430
|
+
rb_define_alloc_func(cParserConfig, cJSON_parser_s_allocate);
|
1431
|
+
rb_define_method(cParserConfig, "initialize", cParserConfig_initialize, 1);
|
1432
|
+
rb_define_method(cParserConfig, "parse", cParserConfig_parse, 1);
|
1433
|
+
|
1434
|
+
VALUE cParser = rb_define_class_under(mExt, "Parser", rb_cObject);
|
1435
|
+
rb_define_singleton_method(cParser, "parse", cParser_m_parse, 2);
|
2171
1436
|
|
2172
1437
|
CNaN = rb_const_get(mJSON, rb_intern("NaN"));
|
2173
1438
|
rb_gc_register_mark_object(CNaN);
|
@@ -2178,34 +1443,36 @@ void Init_parser(void)
|
|
2178
1443
|
CMinusInfinity = rb_const_get(mJSON, rb_intern("MinusInfinity"));
|
2179
1444
|
rb_gc_register_mark_object(CMinusInfinity);
|
2180
1445
|
|
1446
|
+
rb_global_variable(&Encoding_UTF_8);
|
1447
|
+
Encoding_UTF_8 = rb_const_get(rb_path2class("Encoding"), rb_intern("UTF_8"));
|
1448
|
+
|
1449
|
+
sym_max_nesting = ID2SYM(rb_intern("max_nesting"));
|
1450
|
+
sym_allow_nan = ID2SYM(rb_intern("allow_nan"));
|
1451
|
+
sym_allow_trailing_comma = ID2SYM(rb_intern("allow_trailing_comma"));
|
1452
|
+
sym_symbolize_names = ID2SYM(rb_intern("symbolize_names"));
|
1453
|
+
sym_freeze = ID2SYM(rb_intern("freeze"));
|
1454
|
+
sym_create_additions = ID2SYM(rb_intern("create_additions"));
|
1455
|
+
sym_create_id = ID2SYM(rb_intern("create_id"));
|
1456
|
+
sym_object_class = ID2SYM(rb_intern("object_class"));
|
1457
|
+
sym_array_class = ID2SYM(rb_intern("array_class"));
|
1458
|
+
sym_decimal_class = ID2SYM(rb_intern("decimal_class"));
|
1459
|
+
sym_match_string = ID2SYM(rb_intern("match_string"));
|
1460
|
+
|
1461
|
+
i_create_id = rb_intern("create_id");
|
2181
1462
|
i_json_creatable_p = rb_intern("json_creatable?");
|
2182
1463
|
i_json_create = rb_intern("json_create");
|
2183
|
-
i_create_id = rb_intern("create_id");
|
2184
|
-
i_create_additions = rb_intern("create_additions");
|
2185
1464
|
i_chr = rb_intern("chr");
|
2186
|
-
i_max_nesting = rb_intern("max_nesting");
|
2187
|
-
i_allow_nan = rb_intern("allow_nan");
|
2188
|
-
i_symbolize_names = rb_intern("symbolize_names");
|
2189
|
-
i_object_class = rb_intern("object_class");
|
2190
|
-
i_array_class = rb_intern("array_class");
|
2191
|
-
i_decimal_class = rb_intern("decimal_class");
|
2192
1465
|
i_match = rb_intern("match");
|
2193
|
-
i_match_string = rb_intern("match_string");
|
2194
|
-
i_key_p = rb_intern("key?");
|
2195
1466
|
i_deep_const_get = rb_intern("deep_const_get");
|
2196
1467
|
i_aset = rb_intern("[]=");
|
2197
1468
|
i_aref = rb_intern("[]");
|
2198
1469
|
i_leftshift = rb_intern("<<");
|
2199
1470
|
i_new = rb_intern("new");
|
2200
1471
|
i_try_convert = rb_intern("try_convert");
|
2201
|
-
i_freeze = rb_intern("freeze");
|
2202
1472
|
i_uminus = rb_intern("-@");
|
2203
|
-
|
1473
|
+
i_encode = rb_intern("encode");
|
2204
1474
|
|
2205
|
-
|
2206
|
-
|
2207
|
-
|
2208
|
-
|
2209
|
-
* indent-tabs-mode: nil
|
2210
|
-
* End:
|
2211
|
-
*/
|
1475
|
+
binary_encindex = rb_ascii8bit_encindex();
|
1476
|
+
utf8_encindex = rb_utf8_encindex();
|
1477
|
+
enc_utf8 = rb_utf8_encoding();
|
1478
|
+
}
|