oj 3.7.12
Sign up to get free protection for your applications and to get access to all the features.
- checksums.yaml +7 -0
- data/LICENSE +21 -0
- data/README.md +96 -0
- data/ext/oj/buf.h +103 -0
- data/ext/oj/cache8.c +107 -0
- data/ext/oj/cache8.h +48 -0
- data/ext/oj/circarray.c +68 -0
- data/ext/oj/circarray.h +23 -0
- data/ext/oj/code.c +235 -0
- data/ext/oj/code.h +42 -0
- data/ext/oj/compat.c +299 -0
- data/ext/oj/custom.c +1188 -0
- data/ext/oj/dump.c +1232 -0
- data/ext/oj/dump.h +94 -0
- data/ext/oj/dump_compat.c +973 -0
- data/ext/oj/dump_leaf.c +252 -0
- data/ext/oj/dump_object.c +837 -0
- data/ext/oj/dump_strict.c +433 -0
- data/ext/oj/encode.h +45 -0
- data/ext/oj/err.c +57 -0
- data/ext/oj/err.h +70 -0
- data/ext/oj/extconf.rb +47 -0
- data/ext/oj/fast.c +1771 -0
- data/ext/oj/hash.c +163 -0
- data/ext/oj/hash.h +46 -0
- data/ext/oj/hash_test.c +512 -0
- data/ext/oj/mimic_json.c +873 -0
- data/ext/oj/object.c +771 -0
- data/ext/oj/odd.c +231 -0
- data/ext/oj/odd.h +44 -0
- data/ext/oj/oj.c +1694 -0
- data/ext/oj/oj.h +381 -0
- data/ext/oj/parse.c +1085 -0
- data/ext/oj/parse.h +111 -0
- data/ext/oj/rails.c +1485 -0
- data/ext/oj/rails.h +21 -0
- data/ext/oj/reader.c +231 -0
- data/ext/oj/reader.h +151 -0
- data/ext/oj/resolve.c +102 -0
- data/ext/oj/resolve.h +14 -0
- data/ext/oj/rxclass.c +147 -0
- data/ext/oj/rxclass.h +27 -0
- data/ext/oj/saj.c +714 -0
- data/ext/oj/scp.c +224 -0
- data/ext/oj/sparse.c +910 -0
- data/ext/oj/stream_writer.c +363 -0
- data/ext/oj/strict.c +212 -0
- data/ext/oj/string_writer.c +512 -0
- data/ext/oj/trace.c +79 -0
- data/ext/oj/trace.h +28 -0
- data/ext/oj/util.c +136 -0
- data/ext/oj/util.h +19 -0
- data/ext/oj/val_stack.c +118 -0
- data/ext/oj/val_stack.h +185 -0
- data/ext/oj/wab.c +631 -0
- data/lib/oj.rb +21 -0
- data/lib/oj/active_support_helper.rb +41 -0
- data/lib/oj/bag.rb +88 -0
- data/lib/oj/easy_hash.rb +52 -0
- data/lib/oj/error.rb +22 -0
- data/lib/oj/json.rb +176 -0
- data/lib/oj/mimic.rb +267 -0
- data/lib/oj/saj.rb +66 -0
- data/lib/oj/schandler.rb +142 -0
- data/lib/oj/state.rb +131 -0
- data/lib/oj/version.rb +5 -0
- data/pages/Advanced.md +22 -0
- data/pages/Compatibility.md +25 -0
- data/pages/Custom.md +23 -0
- data/pages/Encoding.md +65 -0
- data/pages/JsonGem.md +79 -0
- data/pages/Modes.md +154 -0
- data/pages/Options.md +266 -0
- data/pages/Rails.md +116 -0
- data/pages/Security.md +20 -0
- data/pages/WAB.md +13 -0
- data/test/_test_active.rb +76 -0
- data/test/_test_active_mimic.rb +96 -0
- data/test/_test_mimic_rails.rb +126 -0
- data/test/activerecord/result_test.rb +27 -0
- data/test/activesupport4/decoding_test.rb +108 -0
- data/test/activesupport4/encoding_test.rb +531 -0
- data/test/activesupport4/test_helper.rb +41 -0
- data/test/activesupport5/decoding_test.rb +125 -0
- data/test/activesupport5/encoding_test.rb +485 -0
- data/test/activesupport5/encoding_test_cases.rb +90 -0
- data/test/activesupport5/test_helper.rb +50 -0
- data/test/activesupport5/time_zone_test_helpers.rb +24 -0
- data/test/big.rb +15 -0
- data/test/files.rb +29 -0
- data/test/foo.rb +33 -0
- data/test/helper.rb +26 -0
- data/test/isolated/shared.rb +308 -0
- data/test/isolated/test_mimic_after.rb +13 -0
- data/test/isolated/test_mimic_alone.rb +12 -0
- data/test/isolated/test_mimic_as_json.rb +45 -0
- data/test/isolated/test_mimic_before.rb +13 -0
- data/test/isolated/test_mimic_define.rb +28 -0
- data/test/isolated/test_mimic_rails_after.rb +22 -0
- data/test/isolated/test_mimic_rails_before.rb +21 -0
- data/test/isolated/test_mimic_redefine.rb +15 -0
- data/test/json_gem/json_addition_test.rb +216 -0
- data/test/json_gem/json_common_interface_test.rb +148 -0
- data/test/json_gem/json_encoding_test.rb +107 -0
- data/test/json_gem/json_ext_parser_test.rb +20 -0
- data/test/json_gem/json_fixtures_test.rb +35 -0
- data/test/json_gem/json_generator_test.rb +383 -0
- data/test/json_gem/json_generic_object_test.rb +90 -0
- data/test/json_gem/json_parser_test.rb +470 -0
- data/test/json_gem/json_string_matching_test.rb +42 -0
- data/test/json_gem/test_helper.rb +18 -0
- data/test/mem.rb +35 -0
- data/test/perf.rb +107 -0
- data/test/perf_compat.rb +130 -0
- data/test/perf_fast.rb +164 -0
- data/test/perf_file.rb +64 -0
- data/test/perf_object.rb +138 -0
- data/test/perf_saj.rb +109 -0
- data/test/perf_scp.rb +151 -0
- data/test/perf_simple.rb +287 -0
- data/test/perf_strict.rb +145 -0
- data/test/perf_wab.rb +131 -0
- data/test/sample.rb +54 -0
- data/test/sample/change.rb +14 -0
- data/test/sample/dir.rb +19 -0
- data/test/sample/doc.rb +36 -0
- data/test/sample/file.rb +48 -0
- data/test/sample/group.rb +16 -0
- data/test/sample/hasprops.rb +16 -0
- data/test/sample/layer.rb +12 -0
- data/test/sample/line.rb +20 -0
- data/test/sample/oval.rb +10 -0
- data/test/sample/rect.rb +10 -0
- data/test/sample/shape.rb +35 -0
- data/test/sample/text.rb +20 -0
- data/test/sample_json.rb +37 -0
- data/test/test_compat.rb +509 -0
- data/test/test_custom.rb +406 -0
- data/test/test_debian.rb +53 -0
- data/test/test_fast.rb +470 -0
- data/test/test_file.rb +239 -0
- data/test/test_gc.rb +49 -0
- data/test/test_hash.rb +29 -0
- data/test/test_integer_range.rb +73 -0
- data/test/test_null.rb +376 -0
- data/test/test_object.rb +1018 -0
- data/test/test_saj.rb +186 -0
- data/test/test_scp.rb +433 -0
- data/test/test_strict.rb +410 -0
- data/test/test_various.rb +739 -0
- data/test/test_wab.rb +307 -0
- data/test/test_writer.rb +380 -0
- data/test/tests.rb +24 -0
- data/test/tests_mimic.rb +14 -0
- data/test/tests_mimic_addition.rb +7 -0
- metadata +359 -0
data/ext/oj/oj.h
ADDED
@@ -0,0 +1,381 @@
|
|
1
|
+
/* oj.h
|
2
|
+
* Copyright (c) 2011, Peter Ohler
|
3
|
+
* All rights reserved.
|
4
|
+
*/
|
5
|
+
|
6
|
+
#ifndef OJ_H
|
7
|
+
#define OJ_H
|
8
|
+
|
9
|
+
#if defined(cplusplus)
|
10
|
+
extern "C" {
|
11
|
+
#if 0
|
12
|
+
} /* satisfy cc-mode */
|
13
|
+
#endif
|
14
|
+
#endif
|
15
|
+
|
16
|
+
#define RSTRING_NOT_MODIFIED
|
17
|
+
|
18
|
+
#include "ruby.h"
|
19
|
+
#include "ruby/encoding.h"
|
20
|
+
|
21
|
+
#include <stdint.h>
|
22
|
+
#include <stdbool.h>
|
23
|
+
|
24
|
+
#if HAVE_LIBPTHREAD
|
25
|
+
#include <pthread.h>
|
26
|
+
#endif
|
27
|
+
#include "cache8.h"
|
28
|
+
|
29
|
+
#ifdef RUBINIUS_RUBY
|
30
|
+
#undef T_RATIONAL
|
31
|
+
#undef T_COMPLEX
|
32
|
+
enum st_retval {ST_CONTINUE = 0, ST_STOP = 1, ST_DELETE = 2, ST_CHECK};
|
33
|
+
#else
|
34
|
+
#include "ruby/st.h"
|
35
|
+
#endif
|
36
|
+
|
37
|
+
#include "rxclass.h"
|
38
|
+
#include "err.h"
|
39
|
+
|
40
|
+
#define INF_VAL "3.0e14159265358979323846"
|
41
|
+
#define NINF_VAL "-3.0e14159265358979323846"
|
42
|
+
#define NAN_VAL "3.3e14159265358979323846"
|
43
|
+
|
44
|
+
typedef enum {
|
45
|
+
Yes = 'y',
|
46
|
+
No = 'n',
|
47
|
+
NotSet = 0
|
48
|
+
} YesNo;
|
49
|
+
|
50
|
+
typedef enum {
|
51
|
+
StrictMode = 's',
|
52
|
+
ObjectMode = 'o',
|
53
|
+
NullMode = 'n',
|
54
|
+
CompatMode = 'c',
|
55
|
+
RailsMode = 'r',
|
56
|
+
CustomMode = 'C',
|
57
|
+
WabMode = 'w',
|
58
|
+
} Mode;
|
59
|
+
|
60
|
+
typedef enum {
|
61
|
+
UnixTime = 'u',
|
62
|
+
UnixZTime = 'z',
|
63
|
+
XmlTime = 'x',
|
64
|
+
RubyTime = 'r'
|
65
|
+
} TimeFormat;
|
66
|
+
|
67
|
+
typedef enum {
|
68
|
+
NLEsc = 'n',
|
69
|
+
JSONEsc = 'j',
|
70
|
+
XSSEsc = 'x',
|
71
|
+
ASCIIEsc = 'a',
|
72
|
+
JXEsc = 'g', // json gem
|
73
|
+
RailsXEsc = 'r', // rails xss mode
|
74
|
+
RailsEsc = 'R', // rails non escape
|
75
|
+
} Encoding;
|
76
|
+
|
77
|
+
typedef enum {
|
78
|
+
BigDec = 'b',
|
79
|
+
FloatDec = 'f',
|
80
|
+
AutoDec = 'a'
|
81
|
+
} BigLoad;
|
82
|
+
|
83
|
+
typedef enum {
|
84
|
+
ArrayNew = 'A',
|
85
|
+
ArrayType = 'a',
|
86
|
+
ObjectNew = 'O',
|
87
|
+
ObjectType = 'o',
|
88
|
+
} DumpType;
|
89
|
+
|
90
|
+
typedef enum {
|
91
|
+
AutoNan = 'a',
|
92
|
+
NullNan = 'n',
|
93
|
+
HugeNan = 'h',
|
94
|
+
WordNan = 'w',
|
95
|
+
RaiseNan = 'r',
|
96
|
+
} NanDump;
|
97
|
+
|
98
|
+
typedef enum {
|
99
|
+
STRING_IO = 'c',
|
100
|
+
STREAM_IO = 's',
|
101
|
+
FILE_IO = 'f',
|
102
|
+
} StreamWriterType;
|
103
|
+
|
104
|
+
typedef enum {
|
105
|
+
CALLER_DUMP = 'd',
|
106
|
+
CALLER_TO_JSON = 't',
|
107
|
+
CALLER_GENERATE = 'g',
|
108
|
+
// Add the fast versions if necessary. Maybe unparse as well if needed.
|
109
|
+
} DumpCaller;
|
110
|
+
|
111
|
+
typedef struct _dumpOpts {
|
112
|
+
bool use;
|
113
|
+
char indent_str[16];
|
114
|
+
char before_sep[16];
|
115
|
+
char after_sep[16];
|
116
|
+
char hash_nl[16];
|
117
|
+
char array_nl[16];
|
118
|
+
uint8_t indent_size;
|
119
|
+
uint8_t before_size;
|
120
|
+
uint8_t after_size;
|
121
|
+
uint8_t hash_size;
|
122
|
+
uint8_t array_size;
|
123
|
+
char nan_dump; // NanDump
|
124
|
+
bool omit_nil;
|
125
|
+
int max_depth;
|
126
|
+
} *DumpOpts;
|
127
|
+
|
128
|
+
typedef struct _options {
|
129
|
+
int indent; // indention for dump, default 2
|
130
|
+
char circular; // YesNo
|
131
|
+
char auto_define; // YesNo
|
132
|
+
char sym_key; // YesNo
|
133
|
+
char escape_mode; // Escape_Mode
|
134
|
+
char mode; // Mode
|
135
|
+
char class_cache; // YesNo
|
136
|
+
char time_format; // TimeFormat
|
137
|
+
char bigdec_as_num; // YesNo
|
138
|
+
char bigdec_load; // BigLoad
|
139
|
+
char to_hash; // YesNo
|
140
|
+
char to_json; // YesNo
|
141
|
+
char as_json; // YesNo
|
142
|
+
char nilnil; // YesNo
|
143
|
+
char empty_string; // YesNo
|
144
|
+
char allow_gc; // allow GC during parse
|
145
|
+
char quirks_mode; // allow single JSON values instead of documents
|
146
|
+
char allow_invalid; // YesNo - allow invalid unicode
|
147
|
+
char create_ok; // YesNo allow create_id
|
148
|
+
char allow_nan; // YEsyNo for parsing only
|
149
|
+
char trace; // YesNo
|
150
|
+
int64_t integer_range_min; // dump numbers outside range as string
|
151
|
+
int64_t integer_range_max;
|
152
|
+
const char *create_id; // 0 or string
|
153
|
+
size_t create_id_len; // length of create_id
|
154
|
+
int sec_prec; // second precision when dumping time
|
155
|
+
char float_prec; // float precision, linked to float_fmt
|
156
|
+
char float_fmt[7]; // float format for dumping, if empty use Ruby
|
157
|
+
VALUE hash_class; // class to use in place of Hash on load
|
158
|
+
VALUE array_class; // class to use in place of Array on load
|
159
|
+
struct _dumpOpts dump_opts;
|
160
|
+
struct _rxClass str_rx;
|
161
|
+
VALUE *ignore; // Qnil terminated array of classes or NULL
|
162
|
+
} *Options;
|
163
|
+
|
164
|
+
struct _out;
|
165
|
+
typedef void (*DumpFunc)(VALUE obj, int depth, struct _out *out, bool as_ok);
|
166
|
+
|
167
|
+
// rails optimize
|
168
|
+
typedef struct _rOpt {
|
169
|
+
VALUE clas;
|
170
|
+
bool on;
|
171
|
+
DumpFunc dump;
|
172
|
+
} *ROpt;
|
173
|
+
|
174
|
+
typedef struct _rOptTable {
|
175
|
+
int len;
|
176
|
+
int alen;
|
177
|
+
ROpt table;
|
178
|
+
} *ROptTable;
|
179
|
+
|
180
|
+
typedef struct _out {
|
181
|
+
char *buf;
|
182
|
+
char *end;
|
183
|
+
char *cur;
|
184
|
+
Cache8 circ_cache;
|
185
|
+
slot_t circ_cnt;
|
186
|
+
int indent;
|
187
|
+
int depth; // used by dump_hash
|
188
|
+
Options opts;
|
189
|
+
uint32_t hash_cnt;
|
190
|
+
bool allocated;
|
191
|
+
bool omit_nil;
|
192
|
+
int argc;
|
193
|
+
VALUE *argv;
|
194
|
+
DumpCaller caller; // used for the mimic json only
|
195
|
+
ROptTable ropts;
|
196
|
+
} *Out;
|
197
|
+
|
198
|
+
typedef struct _strWriter {
|
199
|
+
struct _out out;
|
200
|
+
struct _options opts;
|
201
|
+
int depth;
|
202
|
+
char *types; // DumpType
|
203
|
+
char *types_end;
|
204
|
+
int keyWritten;
|
205
|
+
|
206
|
+
} *StrWriter;
|
207
|
+
|
208
|
+
typedef struct _streamWriter {
|
209
|
+
struct _strWriter sw;
|
210
|
+
StreamWriterType type;
|
211
|
+
VALUE stream;
|
212
|
+
int fd;
|
213
|
+
int flush_limit; // indicator of when to flush
|
214
|
+
} *StreamWriter;
|
215
|
+
|
216
|
+
enum {
|
217
|
+
NO_VAL = 0x00,
|
218
|
+
STR_VAL = 0x01,
|
219
|
+
COL_VAL = 0x02,
|
220
|
+
RUBY_VAL = 0x03
|
221
|
+
};
|
222
|
+
|
223
|
+
typedef struct _leaf {
|
224
|
+
struct _leaf *next;
|
225
|
+
union {
|
226
|
+
const char *key; // hash key
|
227
|
+
size_t index; // array index, 0 is not set
|
228
|
+
};
|
229
|
+
union {
|
230
|
+
char *str; // pointer to location in json string or allocated
|
231
|
+
struct _leaf *elements; // array and hash elements
|
232
|
+
VALUE value;
|
233
|
+
};
|
234
|
+
uint8_t rtype;
|
235
|
+
uint8_t parent_type;
|
236
|
+
uint8_t value_type;
|
237
|
+
} *Leaf;
|
238
|
+
|
239
|
+
extern VALUE oj_saj_parse(int argc, VALUE *argv, VALUE self);
|
240
|
+
extern VALUE oj_sc_parse(int argc, VALUE *argv, VALUE self);
|
241
|
+
|
242
|
+
extern VALUE oj_strict_parse(int argc, VALUE *argv, VALUE self);
|
243
|
+
extern VALUE oj_strict_sparse(int argc, VALUE *argv, VALUE self);
|
244
|
+
extern VALUE oj_compat_parse(int argc, VALUE *argv, VALUE self);
|
245
|
+
extern VALUE oj_compat_load(int argc, VALUE *argv, VALUE self);
|
246
|
+
extern VALUE oj_object_parse(int argc, VALUE *argv, VALUE self);
|
247
|
+
extern VALUE oj_custom_parse(int argc, VALUE *argv, VALUE self);
|
248
|
+
extern VALUE oj_wab_parse(int argc, VALUE *argv, VALUE self);
|
249
|
+
|
250
|
+
extern VALUE oj_strict_parse_cstr(int argc, VALUE *argv, char *json, size_t len);
|
251
|
+
extern VALUE oj_compat_parse_cstr(int argc, VALUE *argv, char *json, size_t len);
|
252
|
+
extern VALUE oj_object_parse_cstr(int argc, VALUE *argv, char *json, size_t len);
|
253
|
+
extern VALUE oj_custom_parse_cstr(int argc, VALUE *argv, char *json, size_t len);
|
254
|
+
|
255
|
+
extern void oj_parse_options(VALUE ropts, Options copts);
|
256
|
+
|
257
|
+
extern void oj_dump_obj_to_json(VALUE obj, Options copts, Out out);
|
258
|
+
extern void oj_dump_obj_to_json_using_params(VALUE obj, Options copts, Out out, int argc, VALUE *argv);
|
259
|
+
extern void oj_write_obj_to_file(VALUE obj, const char *path, Options copts);
|
260
|
+
extern void oj_write_obj_to_stream(VALUE obj, VALUE stream, Options copts);
|
261
|
+
extern void oj_dump_leaf_to_json(Leaf leaf, Options copts, Out out);
|
262
|
+
extern void oj_write_leaf_to_file(Leaf leaf, const char *path, Options copts);
|
263
|
+
|
264
|
+
extern void oj_str_writer_push_key(StrWriter sw, const char *key);
|
265
|
+
extern void oj_str_writer_push_object(StrWriter sw, const char *key);
|
266
|
+
extern void oj_str_writer_push_array(StrWriter sw, const char *key);
|
267
|
+
extern void oj_str_writer_push_value(StrWriter sw, VALUE val, const char *key);
|
268
|
+
extern void oj_str_writer_push_json(StrWriter sw, const char *json, const char *key);
|
269
|
+
extern void oj_str_writer_pop(StrWriter sw);
|
270
|
+
extern void oj_str_writer_pop_all(StrWriter sw);
|
271
|
+
|
272
|
+
extern void oj_init_doc(void);
|
273
|
+
extern void oj_string_writer_init();
|
274
|
+
extern void oj_stream_writer_init();
|
275
|
+
extern void oj_str_writer_init(StrWriter sw, int buf_size);
|
276
|
+
extern VALUE oj_define_mimic_json(int argc, VALUE *argv, VALUE self);
|
277
|
+
extern VALUE oj_mimic_generate(int argc, VALUE *argv, VALUE self);
|
278
|
+
extern VALUE oj_mimic_pretty_generate(int argc, VALUE *argv, VALUE self);
|
279
|
+
extern void oj_parse_mimic_dump_options(VALUE ropts, Options copts);
|
280
|
+
|
281
|
+
extern VALUE oj_mimic_parse(int argc, VALUE *argv, VALUE self);
|
282
|
+
extern VALUE oj_get_json_err_class(const char *err_classname);
|
283
|
+
extern void oj_parse_opt_match_string(RxClass rc, VALUE ropts);
|
284
|
+
|
285
|
+
extern VALUE oj_rails_encode(int argc, VALUE *argv, VALUE self);
|
286
|
+
|
287
|
+
extern VALUE Oj;
|
288
|
+
extern struct _options oj_default_options;
|
289
|
+
extern rb_encoding *oj_utf8_encoding;
|
290
|
+
|
291
|
+
extern VALUE oj_bag_class;
|
292
|
+
extern VALUE oj_bigdecimal_class;
|
293
|
+
extern VALUE oj_cstack_class;
|
294
|
+
extern VALUE oj_date_class;
|
295
|
+
extern VALUE oj_datetime_class;
|
296
|
+
extern VALUE oj_doc_class;
|
297
|
+
extern VALUE oj_enumerable_class;
|
298
|
+
extern VALUE oj_json_generator_error_class;
|
299
|
+
extern VALUE oj_json_parser_error_class;
|
300
|
+
extern VALUE oj_stream_writer_class;
|
301
|
+
extern VALUE oj_string_writer_class;
|
302
|
+
extern VALUE oj_stringio_class;
|
303
|
+
extern VALUE oj_struct_class;
|
304
|
+
|
305
|
+
extern VALUE oj_allow_nan_sym;
|
306
|
+
extern VALUE oj_array_class_sym;
|
307
|
+
extern VALUE oj_array_nl_sym;
|
308
|
+
extern VALUE oj_ascii_only_sym;
|
309
|
+
extern VALUE oj_create_additions_sym;
|
310
|
+
extern VALUE oj_hash_class_sym;
|
311
|
+
extern VALUE oj_indent_sym;
|
312
|
+
extern VALUE oj_max_nesting_sym;
|
313
|
+
extern VALUE oj_object_class_sym;
|
314
|
+
extern VALUE oj_object_nl_sym;
|
315
|
+
extern VALUE oj_quirks_mode_sym;
|
316
|
+
extern VALUE oj_space_before_sym;
|
317
|
+
extern VALUE oj_space_sym;
|
318
|
+
extern VALUE oj_trace_sym;
|
319
|
+
|
320
|
+
extern VALUE oj_slash_string;
|
321
|
+
|
322
|
+
extern ID oj_add_value_id;
|
323
|
+
extern ID oj_array_append_id;
|
324
|
+
extern ID oj_array_end_id;
|
325
|
+
extern ID oj_array_start_id;
|
326
|
+
extern ID oj_as_json_id;
|
327
|
+
extern ID oj_begin_id;
|
328
|
+
extern ID oj_bigdecimal_id;
|
329
|
+
extern ID oj_end_id;
|
330
|
+
extern ID oj_error_id;
|
331
|
+
extern ID oj_exclude_end_id;
|
332
|
+
extern ID oj_file_id;
|
333
|
+
extern ID oj_fileno_id;
|
334
|
+
extern ID oj_ftype_id;
|
335
|
+
extern ID oj_has_key_id;
|
336
|
+
extern ID oj_hash_end_id;
|
337
|
+
extern ID oj_hash_key_id;
|
338
|
+
extern ID oj_hash_set_id;
|
339
|
+
extern ID oj_hash_start_id;
|
340
|
+
extern ID oj_iconv_id;
|
341
|
+
extern ID oj_instance_variables_id;
|
342
|
+
extern ID oj_json_create_id;
|
343
|
+
extern ID oj_length_id;
|
344
|
+
extern ID oj_new_id;
|
345
|
+
extern ID oj_parse_id;
|
346
|
+
extern ID oj_pos_id;
|
347
|
+
extern ID oj_read_id;
|
348
|
+
extern ID oj_readpartial_id;
|
349
|
+
extern ID oj_replace_id;
|
350
|
+
extern ID oj_stat_id;
|
351
|
+
extern ID oj_string_id;
|
352
|
+
extern ID oj_to_h_id;
|
353
|
+
extern ID oj_to_hash_id;
|
354
|
+
extern ID oj_to_json_id;
|
355
|
+
extern ID oj_to_s_id;
|
356
|
+
extern ID oj_to_sym_id;
|
357
|
+
extern ID oj_to_time_id;
|
358
|
+
extern ID oj_tv_nsec_id;
|
359
|
+
extern ID oj_tv_sec_id;
|
360
|
+
extern ID oj_tv_usec_id;
|
361
|
+
extern ID oj_utc_id;
|
362
|
+
extern ID oj_utc_offset_id;
|
363
|
+
extern ID oj_utcq_id;
|
364
|
+
extern ID oj_write_id;
|
365
|
+
|
366
|
+
extern bool oj_use_hash_alt;
|
367
|
+
extern bool oj_use_array_alt;
|
368
|
+
|
369
|
+
#if HAVE_LIBPTHREAD
|
370
|
+
extern pthread_mutex_t oj_cache_mutex;
|
371
|
+
#else
|
372
|
+
extern VALUE oj_cache_mutex;
|
373
|
+
#endif
|
374
|
+
|
375
|
+
#if defined(cplusplus)
|
376
|
+
#if 0
|
377
|
+
{ /* satisfy cc-mode */
|
378
|
+
#endif
|
379
|
+
} /* extern "C" { */
|
380
|
+
#endif
|
381
|
+
#endif /* OJ_H */
|
data/ext/oj/parse.c
ADDED
@@ -0,0 +1,1085 @@
|
|
1
|
+
/* parse.c
|
2
|
+
* Copyright (c) 2013, Peter Ohler
|
3
|
+
* All rights reserved.
|
4
|
+
*/
|
5
|
+
|
6
|
+
#include <stdlib.h>
|
7
|
+
#include <stdio.h>
|
8
|
+
#include <string.h>
|
9
|
+
#include <unistd.h>
|
10
|
+
#include <math.h>
|
11
|
+
|
12
|
+
#include "oj.h"
|
13
|
+
#include "encode.h"
|
14
|
+
#include "parse.h"
|
15
|
+
#include "buf.h"
|
16
|
+
#include "val_stack.h"
|
17
|
+
#include "rxclass.h"
|
18
|
+
|
19
|
+
// Workaround in case INFINITY is not defined in math.h or if the OS is CentOS
|
20
|
+
#define OJ_INFINITY (1.0/0.0)
|
21
|
+
|
22
|
+
//#define EXP_MAX 1023
|
23
|
+
#define EXP_MAX 100000
|
24
|
+
#define DEC_MAX 15
|
25
|
+
|
26
|
+
static void
|
27
|
+
next_non_white(ParseInfo pi) {
|
28
|
+
for (; 1; pi->cur++) {
|
29
|
+
switch(*pi->cur) {
|
30
|
+
case ' ':
|
31
|
+
case '\t':
|
32
|
+
case '\f':
|
33
|
+
case '\n':
|
34
|
+
case '\r':
|
35
|
+
break;
|
36
|
+
default:
|
37
|
+
return;
|
38
|
+
}
|
39
|
+
}
|
40
|
+
}
|
41
|
+
|
42
|
+
static void
|
43
|
+
skip_comment(ParseInfo pi) {
|
44
|
+
if ('*' == *pi->cur) {
|
45
|
+
pi->cur++;
|
46
|
+
for (; pi->cur < pi->end; pi->cur++) {
|
47
|
+
if ('*' == *pi->cur && '/' == *(pi->cur + 1)) {
|
48
|
+
pi->cur += 2;
|
49
|
+
return;
|
50
|
+
} else if (pi->end <= pi->cur) {
|
51
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "comment not terminated");
|
52
|
+
return;
|
53
|
+
}
|
54
|
+
}
|
55
|
+
} else if ('/' == *pi->cur) {
|
56
|
+
for (; 1; pi->cur++) {
|
57
|
+
switch (*pi->cur) {
|
58
|
+
case '\n':
|
59
|
+
case '\r':
|
60
|
+
case '\f':
|
61
|
+
case '\0':
|
62
|
+
return;
|
63
|
+
default:
|
64
|
+
break;
|
65
|
+
}
|
66
|
+
}
|
67
|
+
} else {
|
68
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "invalid comment format");
|
69
|
+
}
|
70
|
+
}
|
71
|
+
|
72
|
+
static void
|
73
|
+
add_value(ParseInfo pi, VALUE rval) {
|
74
|
+
Val parent = stack_peek(&pi->stack);
|
75
|
+
|
76
|
+
if (0 == parent) { // simple add
|
77
|
+
pi->add_value(pi, rval);
|
78
|
+
} else {
|
79
|
+
switch (parent->next) {
|
80
|
+
case NEXT_ARRAY_NEW:
|
81
|
+
case NEXT_ARRAY_ELEMENT:
|
82
|
+
pi->array_append_value(pi, rval);
|
83
|
+
parent->next = NEXT_ARRAY_COMMA;
|
84
|
+
break;
|
85
|
+
case NEXT_HASH_VALUE:
|
86
|
+
pi->hash_set_value(pi, parent, rval);
|
87
|
+
if (0 != parent->key && 0 < parent->klen && (parent->key < pi->json || pi->cur < parent->key)) {
|
88
|
+
xfree((char*)parent->key);
|
89
|
+
parent->key = 0;
|
90
|
+
}
|
91
|
+
parent->next = NEXT_HASH_COMMA;
|
92
|
+
break;
|
93
|
+
case NEXT_HASH_NEW:
|
94
|
+
case NEXT_HASH_KEY:
|
95
|
+
case NEXT_HASH_COMMA:
|
96
|
+
case NEXT_NONE:
|
97
|
+
case NEXT_ARRAY_COMMA:
|
98
|
+
case NEXT_HASH_COLON:
|
99
|
+
default:
|
100
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected %s", oj_stack_next_string(parent->next));
|
101
|
+
break;
|
102
|
+
}
|
103
|
+
}
|
104
|
+
}
|
105
|
+
|
106
|
+
static void
|
107
|
+
read_null(ParseInfo pi) {
|
108
|
+
if ('u' == *pi->cur++ && 'l' == *pi->cur++ && 'l' == *pi->cur++) {
|
109
|
+
add_value(pi, Qnil);
|
110
|
+
} else {
|
111
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected null");
|
112
|
+
}
|
113
|
+
}
|
114
|
+
|
115
|
+
static void
|
116
|
+
read_true(ParseInfo pi) {
|
117
|
+
if ('r' == *pi->cur++ && 'u' == *pi->cur++ && 'e' == *pi->cur++) {
|
118
|
+
add_value(pi, Qtrue);
|
119
|
+
} else {
|
120
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected true");
|
121
|
+
}
|
122
|
+
}
|
123
|
+
|
124
|
+
static void
|
125
|
+
read_false(ParseInfo pi) {
|
126
|
+
if ('a' == *pi->cur++ && 'l' == *pi->cur++ && 's' == *pi->cur++ && 'e' == *pi->cur++) {
|
127
|
+
add_value(pi, Qfalse);
|
128
|
+
} else {
|
129
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected false");
|
130
|
+
}
|
131
|
+
}
|
132
|
+
|
133
|
+
static uint32_t
|
134
|
+
read_hex(ParseInfo pi, const char *h) {
|
135
|
+
uint32_t b = 0;
|
136
|
+
int i;
|
137
|
+
|
138
|
+
for (i = 0; i < 4; i++, h++) {
|
139
|
+
b = b << 4;
|
140
|
+
if ('0' <= *h && *h <= '9') {
|
141
|
+
b += *h - '0';
|
142
|
+
} else if ('A' <= *h && *h <= 'F') {
|
143
|
+
b += *h - 'A' + 10;
|
144
|
+
} else if ('a' <= *h && *h <= 'f') {
|
145
|
+
b += *h - 'a' + 10;
|
146
|
+
} else {
|
147
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "invalid hex character");
|
148
|
+
return 0;
|
149
|
+
}
|
150
|
+
}
|
151
|
+
return b;
|
152
|
+
}
|
153
|
+
|
154
|
+
static void
|
155
|
+
unicode_to_chars(ParseInfo pi, Buf buf, uint32_t code) {
|
156
|
+
if (0x0000007F >= code) {
|
157
|
+
buf_append(buf, (char)code);
|
158
|
+
} else if (0x000007FF >= code) {
|
159
|
+
buf_append(buf, 0xC0 | (code >> 6));
|
160
|
+
buf_append(buf, 0x80 | (0x3F & code));
|
161
|
+
} else if (0x0000FFFF >= code) {
|
162
|
+
buf_append(buf, 0xE0 | (code >> 12));
|
163
|
+
buf_append(buf, 0x80 | ((code >> 6) & 0x3F));
|
164
|
+
buf_append(buf, 0x80 | (0x3F & code));
|
165
|
+
} else if (0x001FFFFF >= code) {
|
166
|
+
buf_append(buf, 0xF0 | (code >> 18));
|
167
|
+
buf_append(buf, 0x80 | ((code >> 12) & 0x3F));
|
168
|
+
buf_append(buf, 0x80 | ((code >> 6) & 0x3F));
|
169
|
+
buf_append(buf, 0x80 | (0x3F & code));
|
170
|
+
} else if (0x03FFFFFF >= code) {
|
171
|
+
buf_append(buf, 0xF8 | (code >> 24));
|
172
|
+
buf_append(buf, 0x80 | ((code >> 18) & 0x3F));
|
173
|
+
buf_append(buf, 0x80 | ((code >> 12) & 0x3F));
|
174
|
+
buf_append(buf, 0x80 | ((code >> 6) & 0x3F));
|
175
|
+
buf_append(buf, 0x80 | (0x3F & code));
|
176
|
+
} else if (0x7FFFFFFF >= code) {
|
177
|
+
buf_append(buf, 0xFC | (code >> 30));
|
178
|
+
buf_append(buf, 0x80 | ((code >> 24) & 0x3F));
|
179
|
+
buf_append(buf, 0x80 | ((code >> 18) & 0x3F));
|
180
|
+
buf_append(buf, 0x80 | ((code >> 12) & 0x3F));
|
181
|
+
buf_append(buf, 0x80 | ((code >> 6) & 0x3F));
|
182
|
+
buf_append(buf, 0x80 | (0x3F & code));
|
183
|
+
} else {
|
184
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "invalid Unicode character");
|
185
|
+
}
|
186
|
+
}
|
187
|
+
|
188
|
+
// entered at /
|
189
|
+
static void
|
190
|
+
read_escaped_str(ParseInfo pi, const char *start) {
|
191
|
+
struct _buf buf;
|
192
|
+
const char *s;
|
193
|
+
int cnt = (int)(pi->cur - start);
|
194
|
+
uint32_t code;
|
195
|
+
Val parent = stack_peek(&pi->stack);
|
196
|
+
|
197
|
+
buf_init(&buf);
|
198
|
+
if (0 < cnt) {
|
199
|
+
buf_append_string(&buf, start, cnt);
|
200
|
+
}
|
201
|
+
for (s = pi->cur; '"' != *s; s++) {
|
202
|
+
if (s >= pi->end) {
|
203
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "quoted string not terminated");
|
204
|
+
buf_cleanup(&buf);
|
205
|
+
return;
|
206
|
+
} else if ('\\' == *s) {
|
207
|
+
s++;
|
208
|
+
switch (*s) {
|
209
|
+
case 'n': buf_append(&buf, '\n'); break;
|
210
|
+
case 'r': buf_append(&buf, '\r'); break;
|
211
|
+
case 't': buf_append(&buf, '\t'); break;
|
212
|
+
case 'f': buf_append(&buf, '\f'); break;
|
213
|
+
case 'b': buf_append(&buf, '\b'); break;
|
214
|
+
case '"': buf_append(&buf, '"'); break;
|
215
|
+
case '/': buf_append(&buf, '/'); break;
|
216
|
+
case '\\': buf_append(&buf, '\\'); break;
|
217
|
+
case '\'':
|
218
|
+
// The json gem claims this is not an error despite the
|
219
|
+
// ECMA-404 indicating it is not valid.
|
220
|
+
if (CompatMode == pi->options.mode) {
|
221
|
+
buf_append(&buf, '\'');
|
222
|
+
} else {
|
223
|
+
pi->cur = s;
|
224
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "invalid escaped character");
|
225
|
+
buf_cleanup(&buf);
|
226
|
+
return;
|
227
|
+
}
|
228
|
+
break;
|
229
|
+
case 'u':
|
230
|
+
s++;
|
231
|
+
if (0 == (code = read_hex(pi, s)) && err_has(&pi->err)) {
|
232
|
+
buf_cleanup(&buf);
|
233
|
+
return;
|
234
|
+
}
|
235
|
+
s += 3;
|
236
|
+
if (0x0000D800 <= code && code <= 0x0000DFFF) {
|
237
|
+
uint32_t c1 = (code - 0x0000D800) & 0x000003FF;
|
238
|
+
uint32_t c2;
|
239
|
+
|
240
|
+
s++;
|
241
|
+
if ('\\' != *s || 'u' != *(s + 1)) {
|
242
|
+
if (Yes == pi->options.allow_invalid) {
|
243
|
+
s--;
|
244
|
+
unicode_to_chars(pi, &buf, code);
|
245
|
+
break;
|
246
|
+
}
|
247
|
+
pi->cur = s;
|
248
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "invalid escaped character");
|
249
|
+
buf_cleanup(&buf);
|
250
|
+
return;
|
251
|
+
}
|
252
|
+
s += 2;
|
253
|
+
if (0 == (c2 = read_hex(pi, s)) && err_has(&pi->err)) {
|
254
|
+
buf_cleanup(&buf);
|
255
|
+
return;
|
256
|
+
}
|
257
|
+
s += 3;
|
258
|
+
c2 = (c2 - 0x0000DC00) & 0x000003FF;
|
259
|
+
code = ((c1 << 10) | c2) + 0x00010000;
|
260
|
+
}
|
261
|
+
unicode_to_chars(pi, &buf, code);
|
262
|
+
if (err_has(&pi->err)) {
|
263
|
+
buf_cleanup(&buf);
|
264
|
+
return;
|
265
|
+
}
|
266
|
+
break;
|
267
|
+
default:
|
268
|
+
pi->cur = s;
|
269
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "invalid escaped character");
|
270
|
+
buf_cleanup(&buf);
|
271
|
+
return;
|
272
|
+
}
|
273
|
+
} else {
|
274
|
+
buf_append(&buf, *s);
|
275
|
+
}
|
276
|
+
}
|
277
|
+
if (0 == parent) {
|
278
|
+
pi->add_cstr(pi, buf.head, buf_len(&buf), start);
|
279
|
+
} else {
|
280
|
+
switch (parent->next) {
|
281
|
+
case NEXT_ARRAY_NEW:
|
282
|
+
case NEXT_ARRAY_ELEMENT:
|
283
|
+
pi->array_append_cstr(pi, buf.head, buf_len(&buf), start);
|
284
|
+
parent->next = NEXT_ARRAY_COMMA;
|
285
|
+
break;
|
286
|
+
case NEXT_HASH_NEW:
|
287
|
+
case NEXT_HASH_KEY:
|
288
|
+
if (Qundef == (parent->key_val = pi->hash_key(pi, buf.head, buf_len(&buf)))) {
|
289
|
+
parent->klen = buf_len(&buf);
|
290
|
+
parent->key = malloc(parent->klen + 1);
|
291
|
+
memcpy((char*)parent->key, buf.head, parent->klen);
|
292
|
+
*(char*)(parent->key + parent->klen) = '\0';
|
293
|
+
} else {
|
294
|
+
parent->key = "";
|
295
|
+
parent->klen = 0;
|
296
|
+
}
|
297
|
+
parent->k1 = *start;
|
298
|
+
parent->next = NEXT_HASH_COLON;
|
299
|
+
break;
|
300
|
+
case NEXT_HASH_VALUE:
|
301
|
+
pi->hash_set_cstr(pi, parent, buf.head, buf_len(&buf), start);
|
302
|
+
if (0 != parent->key && 0 < parent->klen && (parent->key < pi->json || pi->cur < parent->key)) {
|
303
|
+
xfree((char*)parent->key);
|
304
|
+
parent->key = 0;
|
305
|
+
}
|
306
|
+
parent->next = NEXT_HASH_COMMA;
|
307
|
+
break;
|
308
|
+
case NEXT_HASH_COMMA:
|
309
|
+
case NEXT_NONE:
|
310
|
+
case NEXT_ARRAY_COMMA:
|
311
|
+
case NEXT_HASH_COLON:
|
312
|
+
default:
|
313
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected %s, not a string", oj_stack_next_string(parent->next));
|
314
|
+
break;
|
315
|
+
}
|
316
|
+
}
|
317
|
+
pi->cur = s + 1;
|
318
|
+
buf_cleanup(&buf);
|
319
|
+
}
|
320
|
+
|
321
|
+
static void
|
322
|
+
read_str(ParseInfo pi) {
|
323
|
+
const char *str = pi->cur;
|
324
|
+
Val parent = stack_peek(&pi->stack);
|
325
|
+
|
326
|
+
for (; '"' != *pi->cur; pi->cur++) {
|
327
|
+
if (pi->end <= pi->cur) {
|
328
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "quoted string not terminated");
|
329
|
+
return;
|
330
|
+
} else if ('\0' == *pi->cur) {
|
331
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "NULL byte in string");
|
332
|
+
return;
|
333
|
+
} else if ('\\' == *pi->cur) {
|
334
|
+
read_escaped_str(pi, str);
|
335
|
+
return;
|
336
|
+
}
|
337
|
+
}
|
338
|
+
if (0 == parent) { // simple add
|
339
|
+
pi->add_cstr(pi, str, pi->cur - str, str);
|
340
|
+
} else {
|
341
|
+
switch (parent->next) {
|
342
|
+
case NEXT_ARRAY_NEW:
|
343
|
+
case NEXT_ARRAY_ELEMENT:
|
344
|
+
pi->array_append_cstr(pi, str, pi->cur - str, str);
|
345
|
+
parent->next = NEXT_ARRAY_COMMA;
|
346
|
+
break;
|
347
|
+
case NEXT_HASH_NEW:
|
348
|
+
case NEXT_HASH_KEY:
|
349
|
+
if (Qundef == (parent->key_val = pi->hash_key(pi, str, pi->cur - str))) {
|
350
|
+
parent->key = str;
|
351
|
+
parent->klen = pi->cur - str;
|
352
|
+
} else {
|
353
|
+
parent->key = "";
|
354
|
+
parent->klen = 0;
|
355
|
+
}
|
356
|
+
parent->k1 = *str;
|
357
|
+
parent->next = NEXT_HASH_COLON;
|
358
|
+
break;
|
359
|
+
case NEXT_HASH_VALUE:
|
360
|
+
pi->hash_set_cstr(pi, parent, str, pi->cur - str, str);
|
361
|
+
if (0 != parent->key && 0 < parent->klen && (parent->key < pi->json || pi->cur < parent->key)) {
|
362
|
+
xfree((char*)parent->key);
|
363
|
+
parent->key = 0;
|
364
|
+
}
|
365
|
+
parent->next = NEXT_HASH_COMMA;
|
366
|
+
break;
|
367
|
+
case NEXT_HASH_COMMA:
|
368
|
+
case NEXT_NONE:
|
369
|
+
case NEXT_ARRAY_COMMA:
|
370
|
+
case NEXT_HASH_COLON:
|
371
|
+
default:
|
372
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected %s, not a string", oj_stack_next_string(parent->next));
|
373
|
+
break;
|
374
|
+
}
|
375
|
+
}
|
376
|
+
pi->cur++; // move past "
|
377
|
+
}
|
378
|
+
|
379
|
+
static void
|
380
|
+
read_num(ParseInfo pi) {
|
381
|
+
struct _numInfo ni;
|
382
|
+
Val parent = stack_peek(&pi->stack);
|
383
|
+
|
384
|
+
ni.str = pi->cur;
|
385
|
+
ni.i = 0;
|
386
|
+
ni.num = 0;
|
387
|
+
ni.div = 1;
|
388
|
+
ni.di = 0;
|
389
|
+
ni.len = 0;
|
390
|
+
ni.exp = 0;
|
391
|
+
ni.big = 0;
|
392
|
+
ni.infinity = 0;
|
393
|
+
ni.nan = 0;
|
394
|
+
ni.neg = 0;
|
395
|
+
ni.hasExp = 0;
|
396
|
+
ni.no_big = (FloatDec == pi->options.bigdec_load);
|
397
|
+
|
398
|
+
if ('-' == *pi->cur) {
|
399
|
+
pi->cur++;
|
400
|
+
ni.neg = 1;
|
401
|
+
} else if ('+' == *pi->cur) {
|
402
|
+
pi->cur++;
|
403
|
+
}
|
404
|
+
if ('I' == *pi->cur) {
|
405
|
+
if (No == pi->options.allow_nan || 0 != strncmp("Infinity", pi->cur, 8)) {
|
406
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "not a number or other value");
|
407
|
+
return;
|
408
|
+
}
|
409
|
+
pi->cur += 8;
|
410
|
+
ni.infinity = 1;
|
411
|
+
} else if ('N' == *pi->cur || 'n' == *pi->cur) {
|
412
|
+
if ('a' != pi->cur[1] || ('N' != pi->cur[2] && 'n' != pi->cur[2])) {
|
413
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "not a number or other value");
|
414
|
+
return;
|
415
|
+
}
|
416
|
+
pi->cur += 3;
|
417
|
+
ni.nan = 1;
|
418
|
+
} else {
|
419
|
+
int dec_cnt = 0;
|
420
|
+
bool zero1 = false;
|
421
|
+
|
422
|
+
for (; '0' <= *pi->cur && *pi->cur <= '9'; pi->cur++) {
|
423
|
+
if (0 == ni.i && '0' == *pi->cur) {
|
424
|
+
zero1 = true;
|
425
|
+
}
|
426
|
+
if (0 < ni.i) {
|
427
|
+
dec_cnt++;
|
428
|
+
}
|
429
|
+
if (!ni.big) {
|
430
|
+
int d = (*pi->cur - '0');
|
431
|
+
|
432
|
+
if (0 < d) {
|
433
|
+
if (zero1 && CompatMode == pi->options.mode) {
|
434
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "not a number");
|
435
|
+
return;
|
436
|
+
}
|
437
|
+
zero1 = false;
|
438
|
+
}
|
439
|
+
ni.i = ni.i * 10 + d;
|
440
|
+
if (INT64_MAX <= ni.i || DEC_MAX < dec_cnt) {
|
441
|
+
ni.big = 1;
|
442
|
+
}
|
443
|
+
}
|
444
|
+
}
|
445
|
+
if ('.' == *pi->cur) {
|
446
|
+
pi->cur++;
|
447
|
+
// A trailing . is not a valid decimal but if encountered allow it
|
448
|
+
// except when mimicing the JSON gem.
|
449
|
+
if (CompatMode == pi->options.mode) {
|
450
|
+
if (*pi->cur < '0' || '9' < *pi->cur) {
|
451
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "not a number");
|
452
|
+
return;
|
453
|
+
}
|
454
|
+
}
|
455
|
+
for (; '0' <= *pi->cur && *pi->cur <= '9'; pi->cur++) {
|
456
|
+
int d = (*pi->cur - '0');
|
457
|
+
|
458
|
+
if (0 < ni.num || 0 < ni.i) {
|
459
|
+
dec_cnt++;
|
460
|
+
}
|
461
|
+
ni.num = ni.num * 10 + d;
|
462
|
+
ni.div *= 10;
|
463
|
+
ni.di++;
|
464
|
+
if (INT64_MAX <= ni.div || DEC_MAX < dec_cnt) {
|
465
|
+
ni.big = 1;
|
466
|
+
}
|
467
|
+
}
|
468
|
+
}
|
469
|
+
if ('e' == *pi->cur || 'E' == *pi->cur) {
|
470
|
+
int eneg = 0;
|
471
|
+
|
472
|
+
ni.hasExp = 1;
|
473
|
+
pi->cur++;
|
474
|
+
if ('-' == *pi->cur) {
|
475
|
+
pi->cur++;
|
476
|
+
eneg = 1;
|
477
|
+
} else if ('+' == *pi->cur) {
|
478
|
+
pi->cur++;
|
479
|
+
}
|
480
|
+
for (; '0' <= *pi->cur && *pi->cur <= '9'; pi->cur++) {
|
481
|
+
ni.exp = ni.exp * 10 + (*pi->cur - '0');
|
482
|
+
if (EXP_MAX <= ni.exp) {
|
483
|
+
ni.big = 1;
|
484
|
+
}
|
485
|
+
}
|
486
|
+
if (eneg) {
|
487
|
+
ni.exp = -ni.exp;
|
488
|
+
}
|
489
|
+
}
|
490
|
+
ni.len = pi->cur - ni.str;
|
491
|
+
}
|
492
|
+
// Check for special reserved values for Infinity and NaN.
|
493
|
+
if (ni.big) {
|
494
|
+
if (0 == strcasecmp(INF_VAL, ni.str)) {
|
495
|
+
ni.infinity = 1;
|
496
|
+
} else if (0 == strcasecmp(NINF_VAL, ni.str)) {
|
497
|
+
ni.infinity = 1;
|
498
|
+
ni.neg = 1;
|
499
|
+
} else if (0 == strcasecmp(NAN_VAL, ni.str)) {
|
500
|
+
ni.nan = 1;
|
501
|
+
}
|
502
|
+
}
|
503
|
+
if (BigDec == pi->options.bigdec_load) {
|
504
|
+
ni.big = 1;
|
505
|
+
}
|
506
|
+
if (0 == parent) {
|
507
|
+
pi->add_num(pi, &ni);
|
508
|
+
} else {
|
509
|
+
switch (parent->next) {
|
510
|
+
case NEXT_ARRAY_NEW:
|
511
|
+
case NEXT_ARRAY_ELEMENT:
|
512
|
+
pi->array_append_num(pi, &ni);
|
513
|
+
parent->next = NEXT_ARRAY_COMMA;
|
514
|
+
break;
|
515
|
+
case NEXT_HASH_VALUE:
|
516
|
+
pi->hash_set_num(pi, parent, &ni);
|
517
|
+
if (0 != parent->key && 0 < parent->klen && (parent->key < pi->json || pi->cur < parent->key)) {
|
518
|
+
xfree((char*)parent->key);
|
519
|
+
parent->key = 0;
|
520
|
+
}
|
521
|
+
parent->next = NEXT_HASH_COMMA;
|
522
|
+
break;
|
523
|
+
default:
|
524
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected %s", oj_stack_next_string(parent->next));
|
525
|
+
break;
|
526
|
+
}
|
527
|
+
}
|
528
|
+
}
|
529
|
+
|
530
|
+
static void
|
531
|
+
array_start(ParseInfo pi) {
|
532
|
+
volatile VALUE v = pi->start_array(pi);
|
533
|
+
|
534
|
+
stack_push(&pi->stack, v, NEXT_ARRAY_NEW);
|
535
|
+
}
|
536
|
+
|
537
|
+
static void
|
538
|
+
array_end(ParseInfo pi) {
|
539
|
+
Val array = stack_pop(&pi->stack);
|
540
|
+
|
541
|
+
if (0 == array) {
|
542
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected array close");
|
543
|
+
} else if (NEXT_ARRAY_COMMA != array->next && NEXT_ARRAY_NEW != array->next) {
|
544
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected %s, not an array close", oj_stack_next_string(array->next));
|
545
|
+
} else {
|
546
|
+
pi->end_array(pi);
|
547
|
+
add_value(pi, array->val);
|
548
|
+
}
|
549
|
+
}
|
550
|
+
|
551
|
+
static void
|
552
|
+
hash_start(ParseInfo pi) {
|
553
|
+
volatile VALUE v = pi->start_hash(pi);
|
554
|
+
|
555
|
+
stack_push(&pi->stack, v, NEXT_HASH_NEW);
|
556
|
+
}
|
557
|
+
|
558
|
+
static void
|
559
|
+
hash_end(ParseInfo pi) {
|
560
|
+
volatile Val hash = stack_peek(&pi->stack);
|
561
|
+
|
562
|
+
// leave hash on stack until just before
|
563
|
+
if (0 == hash) {
|
564
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected hash close");
|
565
|
+
} else if (NEXT_HASH_COMMA != hash->next && NEXT_HASH_NEW != hash->next) {
|
566
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "expected %s, not a hash close", oj_stack_next_string(hash->next));
|
567
|
+
} else {
|
568
|
+
pi->end_hash(pi);
|
569
|
+
stack_pop(&pi->stack);
|
570
|
+
add_value(pi, hash->val);
|
571
|
+
}
|
572
|
+
}
|
573
|
+
|
574
|
+
static void
|
575
|
+
comma(ParseInfo pi) {
|
576
|
+
Val parent = stack_peek(&pi->stack);
|
577
|
+
|
578
|
+
if (0 == parent) {
|
579
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected comma");
|
580
|
+
} else if (NEXT_ARRAY_COMMA == parent->next) {
|
581
|
+
parent->next = NEXT_ARRAY_ELEMENT;
|
582
|
+
} else if (NEXT_HASH_COMMA == parent->next) {
|
583
|
+
parent->next = NEXT_HASH_KEY;
|
584
|
+
} else {
|
585
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected comma");
|
586
|
+
}
|
587
|
+
}
|
588
|
+
|
589
|
+
static void
|
590
|
+
colon(ParseInfo pi) {
|
591
|
+
Val parent = stack_peek(&pi->stack);
|
592
|
+
|
593
|
+
if (0 != parent && NEXT_HASH_COLON == parent->next) {
|
594
|
+
parent->next = NEXT_HASH_VALUE;
|
595
|
+
} else {
|
596
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected colon");
|
597
|
+
}
|
598
|
+
}
|
599
|
+
|
600
|
+
void
|
601
|
+
oj_parse2(ParseInfo pi) {
|
602
|
+
int first = 1;
|
603
|
+
long start = 0;
|
604
|
+
|
605
|
+
pi->cur = pi->json;
|
606
|
+
err_init(&pi->err);
|
607
|
+
while (1) {
|
608
|
+
if (0 < pi->max_depth && pi->max_depth <= pi->stack.tail - pi->stack.head - 1) {
|
609
|
+
VALUE err_clas = oj_get_json_err_class("NestingError");
|
610
|
+
|
611
|
+
oj_set_error_at(pi, err_clas, __FILE__, __LINE__, "Too deeply nested.");
|
612
|
+
pi->err_class = err_clas;
|
613
|
+
return;
|
614
|
+
}
|
615
|
+
next_non_white(pi);
|
616
|
+
if (!first && '\0' != *pi->cur) {
|
617
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected characters after the JSON document");
|
618
|
+
}
|
619
|
+
|
620
|
+
// If no tokens are consumed (i.e. empty string), throw a parse error
|
621
|
+
// this is the behavior of JSON.parse in both Ruby and JS.
|
622
|
+
if (No == pi->options.empty_string && 1 == first && '\0' == *pi->cur) {
|
623
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected character");
|
624
|
+
}
|
625
|
+
|
626
|
+
switch (*pi->cur++) {
|
627
|
+
case '{':
|
628
|
+
hash_start(pi);
|
629
|
+
break;
|
630
|
+
case '}':
|
631
|
+
hash_end(pi);
|
632
|
+
break;
|
633
|
+
case ':':
|
634
|
+
colon(pi);
|
635
|
+
break;
|
636
|
+
case '[':
|
637
|
+
array_start(pi);
|
638
|
+
break;
|
639
|
+
case ']':
|
640
|
+
array_end(pi);
|
641
|
+
break;
|
642
|
+
case ',':
|
643
|
+
comma(pi);
|
644
|
+
break;
|
645
|
+
case '"':
|
646
|
+
read_str(pi);
|
647
|
+
break;
|
648
|
+
//case '+':
|
649
|
+
case '+':
|
650
|
+
if (CompatMode == pi->options.mode) {
|
651
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected character");
|
652
|
+
return;
|
653
|
+
}
|
654
|
+
pi->cur--;
|
655
|
+
read_num(pi);
|
656
|
+
break;
|
657
|
+
case '-':
|
658
|
+
case '0':
|
659
|
+
case '1':
|
660
|
+
case '2':
|
661
|
+
case '3':
|
662
|
+
case '4':
|
663
|
+
case '5':
|
664
|
+
case '6':
|
665
|
+
case '7':
|
666
|
+
case '8':
|
667
|
+
case '9':
|
668
|
+
pi->cur--;
|
669
|
+
read_num(pi);
|
670
|
+
break;
|
671
|
+
case 'I':
|
672
|
+
case 'N':
|
673
|
+
if (Yes == pi->options.allow_nan) {
|
674
|
+
pi->cur--;
|
675
|
+
read_num(pi);
|
676
|
+
} else {
|
677
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected character");
|
678
|
+
}
|
679
|
+
break;
|
680
|
+
case 't':
|
681
|
+
read_true(pi);
|
682
|
+
break;
|
683
|
+
case 'f':
|
684
|
+
read_false(pi);
|
685
|
+
break;
|
686
|
+
case 'n':
|
687
|
+
if ('u' == *pi->cur) {
|
688
|
+
read_null(pi);
|
689
|
+
} else {
|
690
|
+
pi->cur--;
|
691
|
+
read_num(pi);
|
692
|
+
}
|
693
|
+
break;
|
694
|
+
case '/':
|
695
|
+
skip_comment(pi);
|
696
|
+
if (first) {
|
697
|
+
continue;
|
698
|
+
}
|
699
|
+
break;
|
700
|
+
case '\0':
|
701
|
+
pi->cur--;
|
702
|
+
return;
|
703
|
+
default:
|
704
|
+
oj_set_error_at(pi, oj_parse_error_class, __FILE__, __LINE__, "unexpected character");
|
705
|
+
return;
|
706
|
+
}
|
707
|
+
if (err_has(&pi->err)) {
|
708
|
+
return;
|
709
|
+
}
|
710
|
+
if (stack_empty(&pi->stack)) {
|
711
|
+
if (Qundef != pi->proc) {
|
712
|
+
VALUE args[3];
|
713
|
+
long len = (pi->cur - pi->json) - start;
|
714
|
+
|
715
|
+
*args = stack_head_val(&pi->stack);
|
716
|
+
args[1] = LONG2NUM(start);
|
717
|
+
args[2] = LONG2NUM(len);
|
718
|
+
|
719
|
+
if (Qnil == pi->proc) {
|
720
|
+
rb_yield_values2(3, args);
|
721
|
+
} else {
|
722
|
+
rb_proc_call_with_block(pi->proc, 3, args, Qnil);
|
723
|
+
}
|
724
|
+
} else if (!pi->has_callbacks) {
|
725
|
+
first = 0;
|
726
|
+
}
|
727
|
+
start = pi->cur - pi->json;
|
728
|
+
}
|
729
|
+
}
|
730
|
+
}
|
731
|
+
|
732
|
+
static VALUE
|
733
|
+
rescue_big_decimal(VALUE str) {
|
734
|
+
rb_raise(oj_parse_error_class, "Invalid value for BigDecimal()");
|
735
|
+
return Qnil;
|
736
|
+
}
|
737
|
+
|
738
|
+
static VALUE
|
739
|
+
parse_big_decimal(VALUE str) {
|
740
|
+
return rb_funcall(rb_cObject, oj_bigdecimal_id, 1, str);
|
741
|
+
}
|
742
|
+
|
743
|
+
VALUE
|
744
|
+
oj_num_as_value(NumInfo ni) {
|
745
|
+
volatile VALUE rnum = Qnil;
|
746
|
+
|
747
|
+
if (ni->infinity) {
|
748
|
+
if (ni->neg) {
|
749
|
+
rnum = rb_float_new(-OJ_INFINITY);
|
750
|
+
} else {
|
751
|
+
rnum = rb_float_new(OJ_INFINITY);
|
752
|
+
}
|
753
|
+
} else if (ni->nan) {
|
754
|
+
rnum = rb_float_new(0.0/0.0);
|
755
|
+
} else if (1 == ni->div && 0 == ni->exp) { // fixnum
|
756
|
+
if (ni->big) {
|
757
|
+
if (256 > ni->len) {
|
758
|
+
char buf[256];
|
759
|
+
|
760
|
+
memcpy(buf, ni->str, ni->len);
|
761
|
+
buf[ni->len] = '\0';
|
762
|
+
rnum = rb_cstr_to_inum(buf, 10, 0);
|
763
|
+
} else {
|
764
|
+
char *buf = ALLOC_N(char, ni->len + 1);
|
765
|
+
|
766
|
+
memcpy(buf, ni->str, ni->len);
|
767
|
+
buf[ni->len] = '\0';
|
768
|
+
rnum = rb_cstr_to_inum(buf, 10, 0);
|
769
|
+
xfree(buf);
|
770
|
+
}
|
771
|
+
} else {
|
772
|
+
if (ni->neg) {
|
773
|
+
rnum = rb_ll2inum(-ni->i);
|
774
|
+
} else {
|
775
|
+
rnum = rb_ll2inum(ni->i);
|
776
|
+
}
|
777
|
+
}
|
778
|
+
} else { // decimal
|
779
|
+
if (ni->big) {
|
780
|
+
volatile VALUE bd = rb_str_new(ni->str, ni->len);
|
781
|
+
|
782
|
+
rnum = rb_rescue2(parse_big_decimal, bd, rescue_big_decimal, bd, rb_eException, 0);
|
783
|
+
if (ni->no_big) {
|
784
|
+
rnum = rb_funcall(rnum, rb_intern("to_f"), 0);
|
785
|
+
}
|
786
|
+
} else {
|
787
|
+
// All these machinations are to get rounding to work better.
|
788
|
+
long double d = (long double)ni->i * (long double)ni->div + (long double)ni->num;
|
789
|
+
int x = (int)((int64_t)ni->exp - ni->di);
|
790
|
+
|
791
|
+
// Rounding sometimes cuts off the last digit even if there are only
|
792
|
+
// 15 digits. This attempts to fix those few cases where this
|
793
|
+
// occurs.
|
794
|
+
if ((long double)INT64_MAX > d && (int64_t)d != (ni->i * ni->div + ni->num)) {
|
795
|
+
volatile VALUE bd = rb_str_new(ni->str, ni->len);
|
796
|
+
|
797
|
+
rnum = rb_rescue2(parse_big_decimal, bd, rescue_big_decimal, bd, rb_eException, 0);
|
798
|
+
if (ni->no_big) {
|
799
|
+
rnum = rb_funcall(rnum, rb_intern("to_f"), 0);
|
800
|
+
}
|
801
|
+
} else {
|
802
|
+
d = roundl(d);
|
803
|
+
if (0 < x) {
|
804
|
+
d *= powl(10.0L, x);
|
805
|
+
} else if (0 > x) {
|
806
|
+
d /= powl(10.0L, -x);
|
807
|
+
}
|
808
|
+
if (ni->neg) {
|
809
|
+
d = -d;
|
810
|
+
}
|
811
|
+
rnum = rb_float_new((double)d);
|
812
|
+
}
|
813
|
+
}
|
814
|
+
}
|
815
|
+
return rnum;
|
816
|
+
}
|
817
|
+
|
818
|
+
void
|
819
|
+
oj_set_error_at(ParseInfo pi, VALUE err_clas, const char* file, int line, const char *format, ...) {
|
820
|
+
va_list ap;
|
821
|
+
char msg[256];
|
822
|
+
char *p = msg;
|
823
|
+
char *end = p + sizeof(msg) - 2;
|
824
|
+
char *start;
|
825
|
+
Val vp;
|
826
|
+
|
827
|
+
va_start(ap, format);
|
828
|
+
p += vsnprintf(msg, sizeof(msg) - 1, format, ap);
|
829
|
+
va_end(ap);
|
830
|
+
pi->err.clas = err_clas;
|
831
|
+
if (p + 3 < end) {
|
832
|
+
*p++ = ' ';
|
833
|
+
*p++ = '(';
|
834
|
+
start = p;
|
835
|
+
for (vp = pi->stack.head; vp < pi->stack.tail; vp++) {
|
836
|
+
if (end <= p + 1 + vp->klen) {
|
837
|
+
break;
|
838
|
+
}
|
839
|
+
if (NULL != vp->key) {
|
840
|
+
if (start < p) {
|
841
|
+
*p++ = '.';
|
842
|
+
}
|
843
|
+
memcpy(p, vp->key, vp->klen);
|
844
|
+
p += vp->klen;
|
845
|
+
} else {
|
846
|
+
if (RUBY_T_ARRAY == rb_type(vp->val)) {
|
847
|
+
if (end <= p + 12) {
|
848
|
+
break;
|
849
|
+
}
|
850
|
+
p += snprintf(p, end - p, "[%ld]", RARRAY_LEN(vp->val));
|
851
|
+
}
|
852
|
+
}
|
853
|
+
}
|
854
|
+
*p++ = ')';
|
855
|
+
}
|
856
|
+
*p = '\0';
|
857
|
+
if (0 == pi->json) {
|
858
|
+
oj_err_set(&pi->err, err_clas, "%s at line %d, column %d [%s:%d]", msg, pi->rd.line, pi->rd.col, file, line);
|
859
|
+
} else {
|
860
|
+
_oj_err_set_with_location(&pi->err, err_clas, msg, pi->json, pi->cur - 1, file, line);
|
861
|
+
}
|
862
|
+
}
|
863
|
+
|
864
|
+
static VALUE
|
865
|
+
protect_parse(VALUE pip) {
|
866
|
+
oj_parse2((ParseInfo)pip);
|
867
|
+
|
868
|
+
return Qnil;
|
869
|
+
}
|
870
|
+
|
871
|
+
extern int oj_utf8_index;
|
872
|
+
|
873
|
+
static void
|
874
|
+
oj_pi_set_input_str(ParseInfo pi, volatile VALUE *inputp) {
|
875
|
+
rb_encoding *enc = rb_to_encoding(rb_obj_encoding(*inputp));
|
876
|
+
|
877
|
+
if (rb_utf8_encoding() != enc) {
|
878
|
+
*inputp = rb_str_conv_enc(*inputp, enc, rb_utf8_encoding());
|
879
|
+
}
|
880
|
+
pi->json = rb_string_value_ptr((VALUE*)inputp);
|
881
|
+
pi->end = pi->json + RSTRING_LEN(*inputp);
|
882
|
+
}
|
883
|
+
|
884
|
+
VALUE
|
885
|
+
oj_pi_parse(int argc, VALUE *argv, ParseInfo pi, char *json, size_t len, int yieldOk) {
|
886
|
+
char *buf = 0;
|
887
|
+
volatile VALUE input;
|
888
|
+
volatile VALUE wrapped_stack;
|
889
|
+
volatile VALUE result = Qnil;
|
890
|
+
int line = 0;
|
891
|
+
int free_json = 0;
|
892
|
+
|
893
|
+
if (argc < 1) {
|
894
|
+
rb_raise(rb_eArgError, "Wrong number of arguments to parse.");
|
895
|
+
}
|
896
|
+
input = argv[0];
|
897
|
+
if (2 <= argc) {
|
898
|
+
if (T_HASH == rb_type(argv[1])) {
|
899
|
+
oj_parse_options(argv[1], &pi->options);
|
900
|
+
} else if (3 <= argc && T_HASH == rb_type(argv[2])) {
|
901
|
+
oj_parse_options(argv[2], &pi->options);
|
902
|
+
}
|
903
|
+
}
|
904
|
+
if (yieldOk && rb_block_given_p()) {
|
905
|
+
pi->proc = Qnil;
|
906
|
+
} else {
|
907
|
+
pi->proc = Qundef;
|
908
|
+
}
|
909
|
+
if (0 != json) {
|
910
|
+
pi->json = json;
|
911
|
+
pi->end = json + len;
|
912
|
+
free_json = 1;
|
913
|
+
} else if (T_STRING == rb_type(input)) {
|
914
|
+
if (CompatMode == pi->options.mode) {
|
915
|
+
if (No == pi->options.nilnil && 0 == RSTRING_LEN(input)) {
|
916
|
+
rb_raise(oj_json_parser_error_class, "An empty string is not a valid JSON string.");
|
917
|
+
}
|
918
|
+
}
|
919
|
+
oj_pi_set_input_str(pi, &input);
|
920
|
+
} else if (Qnil == input) {
|
921
|
+
if (Yes == pi->options.nilnil) {
|
922
|
+
return Qnil;
|
923
|
+
} else {
|
924
|
+
rb_raise(rb_eTypeError, "Nil is not a valid JSON source.");
|
925
|
+
}
|
926
|
+
} else {
|
927
|
+
VALUE clas = rb_obj_class(input);
|
928
|
+
volatile VALUE s;
|
929
|
+
|
930
|
+
if (oj_stringio_class == clas) {
|
931
|
+
s = rb_funcall2(input, oj_string_id, 0, 0);
|
932
|
+
oj_pi_set_input_str(pi, &s);
|
933
|
+
#if !IS_WINDOWS
|
934
|
+
} else if (rb_cFile == clas && 0 == FIX2INT(rb_funcall(input, oj_pos_id, 0))) {
|
935
|
+
int fd = FIX2INT(rb_funcall(input, oj_fileno_id, 0));
|
936
|
+
ssize_t cnt;
|
937
|
+
size_t len = lseek(fd, 0, SEEK_END);
|
938
|
+
|
939
|
+
lseek(fd, 0, SEEK_SET);
|
940
|
+
buf = ALLOC_N(char, len + 1);
|
941
|
+
pi->json = buf;
|
942
|
+
pi->end = buf + len;
|
943
|
+
if (0 >= (cnt = read(fd, (char*)pi->json, len)) || cnt != (ssize_t)len) {
|
944
|
+
if (0 != buf) {
|
945
|
+
xfree(buf);
|
946
|
+
}
|
947
|
+
rb_raise(rb_eIOError, "failed to read from IO Object.");
|
948
|
+
}
|
949
|
+
((char*)pi->json)[len] = '\0';
|
950
|
+
/* skip UTF-8 BOM if present */
|
951
|
+
if (0xEF == (uint8_t)*pi->json && 0xBB == (uint8_t)pi->json[1] && 0xBF == (uint8_t)pi->json[2]) {
|
952
|
+
pi->cur += 3;
|
953
|
+
}
|
954
|
+
#endif
|
955
|
+
} else if (rb_respond_to(input, oj_read_id)) {
|
956
|
+
// use stream parser instead
|
957
|
+
return oj_pi_sparse(argc, argv, pi, 0);
|
958
|
+
} else {
|
959
|
+
rb_raise(rb_eArgError, "parse() expected a String or IO Object.");
|
960
|
+
}
|
961
|
+
}
|
962
|
+
if (Yes == pi->options.circular) {
|
963
|
+
pi->circ_array = oj_circ_array_new();
|
964
|
+
} else {
|
965
|
+
pi->circ_array = 0;
|
966
|
+
}
|
967
|
+
if (No == pi->options.allow_gc) {
|
968
|
+
rb_gc_disable();
|
969
|
+
}
|
970
|
+
// GC can run at any time. When it runs any Object created by C will be
|
971
|
+
// freed. We protect against this by wrapping the value stack in a ruby
|
972
|
+
// data object and poviding a mark function for ruby objects on the
|
973
|
+
// value stack (while it is in scope).
|
974
|
+
wrapped_stack = oj_stack_init(&pi->stack);
|
975
|
+
rb_protect(protect_parse, (VALUE)pi, &line);
|
976
|
+
if (Qundef == pi->stack.head->val && !empty_ok(&pi->options)) {
|
977
|
+
if (No == pi->options.nilnil || (CompatMode == pi->options.mode && 0 < pi->cur - pi->json)) {
|
978
|
+
oj_set_error_at(pi, oj_json_parser_error_class, __FILE__, __LINE__, "Empty input");
|
979
|
+
}
|
980
|
+
}
|
981
|
+
result = stack_head_val(&pi->stack);
|
982
|
+
DATA_PTR(wrapped_stack) = 0;
|
983
|
+
if (No == pi->options.allow_gc) {
|
984
|
+
rb_gc_enable();
|
985
|
+
}
|
986
|
+
if (!err_has(&pi->err)) {
|
987
|
+
// If the stack is not empty then the JSON terminated early.
|
988
|
+
Val v;
|
989
|
+
VALUE err_class = oj_parse_error_class;
|
990
|
+
|
991
|
+
if (0 != line) {
|
992
|
+
VALUE ec = rb_obj_class(rb_errinfo());
|
993
|
+
|
994
|
+
if (rb_eArgError != ec && 0 != ec) {
|
995
|
+
err_class = ec;
|
996
|
+
}
|
997
|
+
if (rb_eIOError != ec) {
|
998
|
+
goto CLEANUP;
|
999
|
+
}
|
1000
|
+
}
|
1001
|
+
if (NULL != (v = stack_peek(&pi->stack))) {
|
1002
|
+
switch (v->next) {
|
1003
|
+
case NEXT_ARRAY_NEW:
|
1004
|
+
case NEXT_ARRAY_ELEMENT:
|
1005
|
+
case NEXT_ARRAY_COMMA:
|
1006
|
+
oj_set_error_at(pi, err_class, __FILE__, __LINE__, "Array not terminated");
|
1007
|
+
break;
|
1008
|
+
case NEXT_HASH_NEW:
|
1009
|
+
case NEXT_HASH_KEY:
|
1010
|
+
case NEXT_HASH_COLON:
|
1011
|
+
case NEXT_HASH_VALUE:
|
1012
|
+
case NEXT_HASH_COMMA:
|
1013
|
+
oj_set_error_at(pi, err_class, __FILE__, __LINE__, "Hash/Object not terminated");
|
1014
|
+
break;
|
1015
|
+
default:
|
1016
|
+
oj_set_error_at(pi, err_class, __FILE__, __LINE__, "not terminated");
|
1017
|
+
}
|
1018
|
+
}
|
1019
|
+
}
|
1020
|
+
CLEANUP:
|
1021
|
+
// proceed with cleanup
|
1022
|
+
if (0 != pi->circ_array) {
|
1023
|
+
oj_circ_array_free(pi->circ_array);
|
1024
|
+
}
|
1025
|
+
if (0 != buf) {
|
1026
|
+
xfree(buf);
|
1027
|
+
} else if (free_json) {
|
1028
|
+
xfree(json);
|
1029
|
+
}
|
1030
|
+
stack_cleanup(&pi->stack);
|
1031
|
+
if (pi->str_rx.head != oj_default_options.str_rx.head) {
|
1032
|
+
oj_rxclass_cleanup(&pi->str_rx);
|
1033
|
+
}
|
1034
|
+
if (err_has(&pi->err)) {
|
1035
|
+
rb_set_errinfo(Qnil);
|
1036
|
+
if (Qnil != pi->err_class) {
|
1037
|
+
pi->err.clas = pi->err_class;
|
1038
|
+
}
|
1039
|
+
if (CompatMode == pi->options.mode) {
|
1040
|
+
// The json gem requires the error message be UTF-8 encoded. In
|
1041
|
+
// additional the complete JSON source must be returned. There
|
1042
|
+
// does not seem to be a size limit.
|
1043
|
+
VALUE msg = oj_encode(rb_str_new2(pi->err.msg));
|
1044
|
+
VALUE args[1];
|
1045
|
+
|
1046
|
+
if (NULL != pi->json) {
|
1047
|
+
msg = rb_str_append(msg, oj_encode(rb_str_new2(" in '")));
|
1048
|
+
msg = rb_str_append(msg, oj_encode(rb_str_new2(pi->json)));
|
1049
|
+
}
|
1050
|
+
args[0] = msg;
|
1051
|
+
rb_exc_raise(rb_class_new_instance(1, args, pi->err.clas));
|
1052
|
+
} else {
|
1053
|
+
oj_err_raise(&pi->err);
|
1054
|
+
}
|
1055
|
+
} else if (0 != line) {
|
1056
|
+
rb_jump_tag(line);
|
1057
|
+
}
|
1058
|
+
if (pi->options.quirks_mode == No) {
|
1059
|
+
switch (rb_type(result)) {
|
1060
|
+
case T_NIL:
|
1061
|
+
case T_TRUE:
|
1062
|
+
case T_FALSE:
|
1063
|
+
case T_FIXNUM:
|
1064
|
+
case T_FLOAT:
|
1065
|
+
case T_CLASS:
|
1066
|
+
case T_STRING:
|
1067
|
+
case T_SYMBOL: {
|
1068
|
+
struct _err err;
|
1069
|
+
|
1070
|
+
if (Qnil == pi->err_class) {
|
1071
|
+
err.clas = oj_parse_error_class;
|
1072
|
+
} else {
|
1073
|
+
err.clas = pi->err_class;
|
1074
|
+
}
|
1075
|
+
snprintf(err.msg, sizeof(err.msg), "unexpected non-document value");
|
1076
|
+
oj_err_raise(&err);
|
1077
|
+
break;
|
1078
|
+
}
|
1079
|
+
default:
|
1080
|
+
// okay
|
1081
|
+
break;
|
1082
|
+
}
|
1083
|
+
}
|
1084
|
+
return result;
|
1085
|
+
}
|