yajl-ruby 0.5.5

Sign up to get free protection for your applications and to get access to all the features.

Potentially problematic release.


This version of yajl-ruby might be problematic. Click here for more details.

Files changed (129) hide show
  1. data/.gitignore +5 -0
  2. data/CHANGELOG.md +164 -0
  3. data/MIT-LICENSE +20 -0
  4. data/README.rdoc +264 -0
  5. data/Rakefile +29 -0
  6. data/VERSION.yml +4 -0
  7. data/benchmark/encode.rb +46 -0
  8. data/benchmark/encode_json_and_marshal.rb +35 -0
  9. data/benchmark/encode_json_and_yaml.rb +47 -0
  10. data/benchmark/http.rb +30 -0
  11. data/benchmark/parse.rb +49 -0
  12. data/benchmark/parse_json_and_marshal.rb +47 -0
  13. data/benchmark/parse_json_and_yaml.rb +56 -0
  14. data/benchmark/parse_stream.rb +48 -0
  15. data/benchmark/subjects/contacts.json +1 -0
  16. data/benchmark/subjects/contacts.marshal_dump +0 -0
  17. data/benchmark/subjects/contacts.yml +114685 -0
  18. data/benchmark/subjects/item.json +1 -0
  19. data/benchmark/subjects/ohai.json +1216 -0
  20. data/benchmark/subjects/twitter_search.json +1 -0
  21. data/benchmark/subjects/twitter_stream.json +430 -0
  22. data/benchmark/subjects/unicode.json +1 -0
  23. data/examples/http/twitter_search_api.rb +15 -0
  24. data/examples/http/twitter_stream_api.rb +25 -0
  25. data/examples/parsing/from_file.rb +14 -0
  26. data/examples/parsing/from_stdin.rb +9 -0
  27. data/examples/parsing/from_string.rb +15 -0
  28. data/ext/api/yajl_common.h +85 -0
  29. data/ext/api/yajl_gen.h +123 -0
  30. data/ext/api/yajl_parse.h +182 -0
  31. data/ext/extconf.rb +8 -0
  32. data/ext/yajl.c +157 -0
  33. data/ext/yajl_alloc.c +65 -0
  34. data/ext/yajl_alloc.h +50 -0
  35. data/ext/yajl_buf.c +119 -0
  36. data/ext/yajl_buf.h +73 -0
  37. data/ext/yajl_bytestack.h +85 -0
  38. data/ext/yajl_encode.c +179 -0
  39. data/ext/yajl_encode.h +44 -0
  40. data/ext/yajl_ext.c +774 -0
  41. data/ext/yajl_ext.h +74 -0
  42. data/ext/yajl_gen.c +290 -0
  43. data/ext/yajl_lex.c +744 -0
  44. data/ext/yajl_lex.h +135 -0
  45. data/ext/yajl_parser.c +447 -0
  46. data/ext/yajl_parser.h +79 -0
  47. data/lib/yajl.rb +80 -0
  48. data/lib/yajl/bzip2.rb +11 -0
  49. data/lib/yajl/bzip2/stream_reader.rb +29 -0
  50. data/lib/yajl/bzip2/stream_writer.rb +15 -0
  51. data/lib/yajl/deflate.rb +6 -0
  52. data/lib/yajl/deflate/stream_reader.rb +37 -0
  53. data/lib/yajl/deflate/stream_writer.rb +21 -0
  54. data/lib/yajl/gzip.rb +6 -0
  55. data/lib/yajl/gzip/stream_reader.rb +28 -0
  56. data/lib/yajl/gzip/stream_writer.rb +14 -0
  57. data/lib/yajl/http_stream.rb +101 -0
  58. data/lib/yajl/json_gem.rb +69 -0
  59. data/spec/encoding/encoding_spec.rb +186 -0
  60. data/spec/http/fixtures/http.bzip2.dump +0 -0
  61. data/spec/http/fixtures/http.deflate.dump +0 -0
  62. data/spec/http/fixtures/http.gzip.dump +0 -0
  63. data/spec/http/fixtures/http.raw.dump +12 -0
  64. data/spec/http/http_spec.rb +94 -0
  65. data/spec/json_gem_compatibility/compatibility_spec.rb +170 -0
  66. data/spec/parsing/active_support_spec.rb +68 -0
  67. data/spec/parsing/chunked_spec.rb +98 -0
  68. data/spec/parsing/fixtures/fail.15.json +1 -0
  69. data/spec/parsing/fixtures/fail.16.json +1 -0
  70. data/spec/parsing/fixtures/fail.17.json +1 -0
  71. data/spec/parsing/fixtures/fail.26.json +1 -0
  72. data/spec/parsing/fixtures/fail11.json +1 -0
  73. data/spec/parsing/fixtures/fail12.json +1 -0
  74. data/spec/parsing/fixtures/fail13.json +1 -0
  75. data/spec/parsing/fixtures/fail14.json +1 -0
  76. data/spec/parsing/fixtures/fail19.json +1 -0
  77. data/spec/parsing/fixtures/fail20.json +1 -0
  78. data/spec/parsing/fixtures/fail21.json +1 -0
  79. data/spec/parsing/fixtures/fail22.json +1 -0
  80. data/spec/parsing/fixtures/fail23.json +1 -0
  81. data/spec/parsing/fixtures/fail24.json +1 -0
  82. data/spec/parsing/fixtures/fail25.json +1 -0
  83. data/spec/parsing/fixtures/fail27.json +2 -0
  84. data/spec/parsing/fixtures/fail28.json +2 -0
  85. data/spec/parsing/fixtures/fail3.json +1 -0
  86. data/spec/parsing/fixtures/fail4.json +1 -0
  87. data/spec/parsing/fixtures/fail5.json +1 -0
  88. data/spec/parsing/fixtures/fail6.json +1 -0
  89. data/spec/parsing/fixtures/fail9.json +1 -0
  90. data/spec/parsing/fixtures/pass.array.json +6 -0
  91. data/spec/parsing/fixtures/pass.codepoints_from_unicode_org.json +1 -0
  92. data/spec/parsing/fixtures/pass.contacts.json +1 -0
  93. data/spec/parsing/fixtures/pass.db100.xml.json +1 -0
  94. data/spec/parsing/fixtures/pass.db1000.xml.json +1 -0
  95. data/spec/parsing/fixtures/pass.dc_simple_with_comments.json +11 -0
  96. data/spec/parsing/fixtures/pass.deep_arrays.json +1 -0
  97. data/spec/parsing/fixtures/pass.difficult_json_c_test_case.json +1 -0
  98. data/spec/parsing/fixtures/pass.difficult_json_c_test_case_with_comments.json +1 -0
  99. data/spec/parsing/fixtures/pass.doubles.json +1 -0
  100. data/spec/parsing/fixtures/pass.empty_array.json +1 -0
  101. data/spec/parsing/fixtures/pass.empty_string.json +1 -0
  102. data/spec/parsing/fixtures/pass.escaped_bulgarian.json +4 -0
  103. data/spec/parsing/fixtures/pass.escaped_foobar.json +1 -0
  104. data/spec/parsing/fixtures/pass.item.json +1 -0
  105. data/spec/parsing/fixtures/pass.json-org-sample1.json +23 -0
  106. data/spec/parsing/fixtures/pass.json-org-sample2.json +11 -0
  107. data/spec/parsing/fixtures/pass.json-org-sample3.json +26 -0
  108. data/spec/parsing/fixtures/pass.json-org-sample4-nows.json +88 -0
  109. data/spec/parsing/fixtures/pass.json-org-sample4.json +89 -0
  110. data/spec/parsing/fixtures/pass.json-org-sample5.json +27 -0
  111. data/spec/parsing/fixtures/pass.map-spain.xml.json +1 -0
  112. data/spec/parsing/fixtures/pass.ns-invoice100.xml.json +1 -0
  113. data/spec/parsing/fixtures/pass.ns-soap.xml.json +1 -0
  114. data/spec/parsing/fixtures/pass.numbers-fp-4k.json +6 -0
  115. data/spec/parsing/fixtures/pass.numbers-fp-64k.json +61 -0
  116. data/spec/parsing/fixtures/pass.numbers-int-4k.json +11 -0
  117. data/spec/parsing/fixtures/pass.numbers-int-64k.json +154 -0
  118. data/spec/parsing/fixtures/pass.twitter-search.json +1 -0
  119. data/spec/parsing/fixtures/pass.twitter-search2.json +1 -0
  120. data/spec/parsing/fixtures/pass.unicode.json +3315 -0
  121. data/spec/parsing/fixtures/pass.yelp.json +1 -0
  122. data/spec/parsing/fixtures/pass1.json +56 -0
  123. data/spec/parsing/fixtures/pass2.json +1 -0
  124. data/spec/parsing/fixtures/pass3.json +6 -0
  125. data/spec/parsing/fixtures_spec.rb +45 -0
  126. data/spec/parsing/one_off_spec.rb +58 -0
  127. data/spec/spec_helper.rb +11 -0
  128. data/yajl-ruby.gemspec +176 -0
  129. metadata +196 -0
data/ext/yajl_lex.h ADDED
@@ -0,0 +1,135 @@
1
+ /*
2
+ * Copyright 2007-2009, Lloyd Hilaiel.
3
+ *
4
+ * Redistribution and use in source and binary forms, with or without
5
+ * modification, are permitted provided that the following conditions are
6
+ * met:
7
+ *
8
+ * 1. Redistributions of source code must retain the above copyright
9
+ * notice, this list of conditions and the following disclaimer.
10
+ *
11
+ * 2. Redistributions in binary form must reproduce the above copyright
12
+ * notice, this list of conditions and the following disclaimer in
13
+ * the documentation and/or other materials provided with the
14
+ * distribution.
15
+ *
16
+ * 3. Neither the name of Lloyd Hilaiel nor the names of its
17
+ * contributors may be used to endorse or promote products derived
18
+ * from this software without specific prior written permission.
19
+ *
20
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
21
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
22
+ * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
23
+ * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
24
+ * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
25
+ * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
26
+ * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
28
+ * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
29
+ * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30
+ * POSSIBILITY OF SUCH DAMAGE.
31
+ */
32
+
33
+ #ifndef __YAJL_LEX_H__
34
+ #define __YAJL_LEX_H__
35
+
36
+ #include "api/yajl_common.h"
37
+
38
+ typedef enum {
39
+ yajl_tok_bool,
40
+ yajl_tok_colon,
41
+ yajl_tok_comma,
42
+ yajl_tok_eof,
43
+ yajl_tok_error,
44
+ yajl_tok_left_brace,
45
+ yajl_tok_left_bracket,
46
+ yajl_tok_null,
47
+ yajl_tok_right_brace,
48
+ yajl_tok_right_bracket,
49
+
50
+ /* we differentiate between integers and doubles to allow the
51
+ * parser to interpret the number without re-scanning */
52
+ yajl_tok_integer,
53
+ yajl_tok_double,
54
+
55
+ /* we differentiate between strings which require further processing,
56
+ * and strings that do not */
57
+ yajl_tok_string,
58
+ yajl_tok_string_with_escapes,
59
+
60
+ /* comment tokens are not currently returned to the parser, ever */
61
+ yajl_tok_comment
62
+ } yajl_tok;
63
+
64
+ typedef struct yajl_lexer_t * yajl_lexer;
65
+
66
+ yajl_lexer yajl_lex_alloc(yajl_alloc_funcs * alloc,
67
+ unsigned int allowComments,
68
+ unsigned int validateUTF8);
69
+
70
+ yajl_lexer yajl_lex_realloc(yajl_lexer orig);
71
+
72
+ void yajl_lex_free(yajl_lexer lexer);
73
+
74
+ /**
75
+ * run/continue a lex. "offset" is an input/output parameter.
76
+ * It should be initialized to zero for a
77
+ * new chunk of target text, and upon subsequent calls with the same
78
+ * target text should be passed with the value of the previous invocation.
79
+ *
80
+ * the client may be interested in the value of offset when an error is
81
+ * returned from the lexer. This allows the client to render useful
82
+ * error messages.
83
+ *
84
+ * When you pass the next chunk of data, offset should be reinitialized
85
+ * to zero.
86
+ *
87
+ * Finally, the output buffer is usually just a pointer into the jsonText,
88
+ * however in cases where the entity being lexed spans multiple chunks,
89
+ * the lexer will buffer the entity and the data returned will be
90
+ * a pointer into that buffer.
91
+ *
92
+ * This behavior is abstracted from client code except for the performance
93
+ * implications which require that the client choose a reasonable chunk
94
+ * size to get adequate performance.
95
+ */
96
+ yajl_tok yajl_lex_lex(yajl_lexer lexer, const unsigned char * jsonText,
97
+ unsigned int jsonTextLen, unsigned int * offset,
98
+ const unsigned char ** outBuf, unsigned int * outLen);
99
+
100
+ /** have a peek at the next token, but don't move the lexer forward */
101
+ yajl_tok yajl_lex_peek(yajl_lexer lexer, const unsigned char * jsonText,
102
+ unsigned int jsonTextLen, unsigned int offset);
103
+
104
+
105
+ typedef enum {
106
+ yajl_lex_e_ok = 0,
107
+ yajl_lex_string_invalid_utf8,
108
+ yajl_lex_string_invalid_escaped_char,
109
+ yajl_lex_string_invalid_json_char,
110
+ yajl_lex_string_invalid_hex_char,
111
+ yajl_lex_invalid_char,
112
+ yajl_lex_invalid_string,
113
+ yajl_lex_missing_integer_after_decimal,
114
+ yajl_lex_missing_integer_after_exponent,
115
+ yajl_lex_missing_integer_after_minus,
116
+ yajl_lex_unallowed_comment
117
+ } yajl_lex_error;
118
+
119
+ const char * yajl_lex_error_to_string(yajl_lex_error error);
120
+
121
+ /** allows access to more specific information about the lexical
122
+ * error when yajl_lex_lex returns yajl_tok_error. */
123
+ yajl_lex_error yajl_lex_get_error(yajl_lexer lexer);
124
+
125
+ /** get the current offset into the most recently lexed json string. */
126
+ unsigned int yajl_lex_current_offset(yajl_lexer lexer);
127
+
128
+ /** get the number of lines lexed by this lexer instance */
129
+ unsigned int yajl_lex_current_line(yajl_lexer lexer);
130
+
131
+ /** get the number of chars lexed by this lexer instance since the last
132
+ * \n or \r */
133
+ unsigned int yajl_lex_current_char(yajl_lexer lexer);
134
+
135
+ #endif
data/ext/yajl_parser.c ADDED
@@ -0,0 +1,447 @@
1
+ /*
2
+ * Copyright 2007-2009, Lloyd Hilaiel.
3
+ *
4
+ * Redistribution and use in source and binary forms, with or without
5
+ * modification, are permitted provided that the following conditions are
6
+ * met:
7
+ *
8
+ * 1. Redistributions of source code must retain the above copyright
9
+ * notice, this list of conditions and the following disclaimer.
10
+ *
11
+ * 2. Redistributions in binary form must reproduce the above copyright
12
+ * notice, this list of conditions and the following disclaimer in
13
+ * the documentation and/or other materials provided with the
14
+ * distribution.
15
+ *
16
+ * 3. Neither the name of Lloyd Hilaiel nor the names of its
17
+ * contributors may be used to endorse or promote products derived
18
+ * from this software without specific prior written permission.
19
+ *
20
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
21
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
22
+ * WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
23
+ * DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT,
24
+ * INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES
25
+ * (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
26
+ * SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
27
+ * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,
28
+ * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING
29
+ * IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
30
+ * POSSIBILITY OF SUCH DAMAGE.
31
+ */
32
+
33
+ #include "yajl_lex.h"
34
+ #include "yajl_parser.h"
35
+ #include "yajl_encode.h"
36
+ #include "yajl_bytestack.h"
37
+
38
+ #include <stdlib.h>
39
+ #include <limits.h>
40
+ #include <errno.h>
41
+ #include <stdio.h>
42
+ #include <string.h>
43
+ #include <ctype.h>
44
+ #include <assert.h>
45
+ #include <math.h>
46
+
47
+ unsigned char *
48
+ yajl_render_error_string(yajl_handle hand, const unsigned char * jsonText,
49
+ unsigned int jsonTextLen, int verbose)
50
+ {
51
+ unsigned int offset = hand->errorOffset;
52
+ unsigned char * str;
53
+ const char * errorType = NULL;
54
+ const char * errorText = NULL;
55
+ char text[72];
56
+ const char * arrow = " (right here) ------^\n";
57
+
58
+ if (yajl_bs_current(hand->stateStack) == yajl_state_parse_error) {
59
+ errorType = "parse";
60
+ errorText = hand->parseError;
61
+ } else if (yajl_bs_current(hand->stateStack) == yajl_state_lexical_error) {
62
+ errorType = "lexical";
63
+ errorText = yajl_lex_error_to_string(yajl_lex_get_error(hand->lexer));
64
+ } else {
65
+ errorType = "unknown";
66
+ }
67
+
68
+ {
69
+ unsigned int memneeded = 0;
70
+ memneeded += strlen(errorType);
71
+ memneeded += strlen(" error");
72
+ if (errorText != NULL) {
73
+ memneeded += strlen(": ");
74
+ memneeded += strlen(errorText);
75
+ }
76
+ str = (unsigned char *) YA_MALLOC(&(hand->alloc), memneeded + 2);
77
+ str[0] = 0;
78
+ strcat((char *) str, errorType);
79
+ strcat((char *) str, " error");
80
+ if (errorText != NULL) {
81
+ strcat((char *) str, ": ");
82
+ strcat((char *) str, errorText);
83
+ }
84
+ strcat((char *) str, "\n");
85
+ }
86
+
87
+ /* now we append as many spaces as needed to make sure the error
88
+ * falls at char 41, if verbose was specified */
89
+ if (verbose) {
90
+ unsigned int start, end, i;
91
+ unsigned int spacesNeeded;
92
+
93
+ spacesNeeded = (offset < 30 ? 40 - offset : 10);
94
+ start = (offset >= 30 ? offset - 30 : 0);
95
+ end = (offset + 30 > jsonTextLen ? jsonTextLen : offset + 30);
96
+
97
+ for (i=0;i<spacesNeeded;i++) text[i] = ' ';
98
+
99
+ for (;start < end;start++, i++) {
100
+ if (jsonText[start] != '\n' && jsonText[start] != '\r')
101
+ {
102
+ text[i] = jsonText[start];
103
+ }
104
+ else
105
+ {
106
+ text[i] = ' ';
107
+ }
108
+ }
109
+ assert(i <= 71);
110
+ text[i++] = '\n';
111
+ text[i] = 0;
112
+ {
113
+ char * newStr = (char *)
114
+ YA_MALLOC(&(hand->alloc), (strlen((char *) str) +
115
+ strlen((char *) text) +
116
+ strlen(arrow) + 1));
117
+ newStr[0] = 0;
118
+ strcat((char *) newStr, (char *) str);
119
+ strcat((char *) newStr, text);
120
+ strcat((char *) newStr, arrow);
121
+ YA_FREE(&(hand->alloc), str);
122
+ str = (unsigned char *) newStr;
123
+ }
124
+ }
125
+ return str;
126
+ }
127
+
128
+ /* check for client cancelation */
129
+ #define _CC_CHK(x) \
130
+ if (!(x)) { \
131
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error); \
132
+ hand->parseError = \
133
+ "client cancelled parse via callback return value"; \
134
+ return yajl_status_client_canceled; \
135
+ }
136
+
137
+
138
+ yajl_status
139
+ yajl_do_parse(yajl_handle hand, unsigned int * offset,
140
+ const unsigned char * jsonText, unsigned int jsonTextLen)
141
+ {
142
+ yajl_tok tok;
143
+ const unsigned char * buf;
144
+ unsigned int bufLen;
145
+
146
+ around_again:
147
+ switch (yajl_bs_current(hand->stateStack)) {
148
+ case yajl_state_parse_complete:
149
+ return yajl_status_ok;
150
+ case yajl_state_lexical_error:
151
+ case yajl_state_parse_error:
152
+ hand->errorOffset = *offset;
153
+ return yajl_status_error;
154
+ case yajl_state_start:
155
+ case yajl_state_map_need_val:
156
+ case yajl_state_array_need_val:
157
+ case yajl_state_array_start: {
158
+ /* for arrays and maps, we advance the state for this
159
+ * depth, then push the state of the next depth.
160
+ * If an error occurs during the parsing of the nesting
161
+ * entity, the state at this level will not matter.
162
+ * a state that needs pushing will be anything other
163
+ * than state_start */
164
+ yajl_state stateToPush = yajl_state_start;
165
+
166
+ tok = yajl_lex_lex(hand->lexer, jsonText, jsonTextLen,
167
+ offset, &buf, &bufLen);
168
+
169
+ switch (tok) {
170
+ case yajl_tok_eof:
171
+ return yajl_status_insufficient_data;
172
+ case yajl_tok_error:
173
+ yajl_bs_set(hand->stateStack, yajl_state_lexical_error);
174
+ goto around_again;
175
+ case yajl_tok_string:
176
+ if (hand->callbacks && hand->callbacks->yajl_string) {
177
+ _CC_CHK(hand->callbacks->yajl_string(hand->ctx,
178
+ buf, bufLen));
179
+ }
180
+ break;
181
+ case yajl_tok_string_with_escapes:
182
+ if (hand->callbacks && hand->callbacks->yajl_string) {
183
+ yajl_buf_clear(hand->decodeBuf);
184
+ yajl_string_decode(hand->decodeBuf, buf, bufLen);
185
+ _CC_CHK(hand->callbacks->yajl_string(
186
+ hand->ctx, yajl_buf_data(hand->decodeBuf),
187
+ yajl_buf_len(hand->decodeBuf)));
188
+ }
189
+ break;
190
+ case yajl_tok_bool:
191
+ if (hand->callbacks && hand->callbacks->yajl_boolean) {
192
+ _CC_CHK(hand->callbacks->yajl_boolean(hand->ctx,
193
+ *buf == 't'));
194
+ }
195
+ break;
196
+ case yajl_tok_null:
197
+ if (hand->callbacks && hand->callbacks->yajl_null) {
198
+ _CC_CHK(hand->callbacks->yajl_null(hand->ctx));
199
+ }
200
+ break;
201
+ case yajl_tok_left_bracket:
202
+ if (hand->callbacks && hand->callbacks->yajl_start_map) {
203
+ _CC_CHK(hand->callbacks->yajl_start_map(hand->ctx));
204
+ }
205
+ stateToPush = yajl_state_map_start;
206
+ break;
207
+ case yajl_tok_left_brace:
208
+ if (hand->callbacks && hand->callbacks->yajl_start_array) {
209
+ _CC_CHK(hand->callbacks->yajl_start_array(hand->ctx));
210
+ }
211
+ stateToPush = yajl_state_array_start;
212
+ break;
213
+ case yajl_tok_integer:
214
+ /*
215
+ * note. strtol does not respect the length of
216
+ * the lexical token. in a corner case where the
217
+ * lexed number is an integer with a trailing zero,
218
+ * immediately followed by the end of buffer,
219
+ * strtol could run off into oblivion and cause a
220
+ * crash. for this reason we copy the integer
221
+ * (and doubles), into our parse buffer (the same
222
+ * one used for unescaping strings), before
223
+ * calling strtol. yajl_buf ensures null padding,
224
+ * so we're safe.
225
+ */
226
+ if (hand->callbacks) {
227
+ if (hand->callbacks->yajl_number) {
228
+ _CC_CHK(hand->callbacks->yajl_number(
229
+ hand->ctx,(const char *) buf, bufLen));
230
+ } else if (hand->callbacks->yajl_integer) {
231
+ long int i = 0;
232
+ yajl_buf_clear(hand->decodeBuf);
233
+ yajl_buf_append(hand->decodeBuf, buf, bufLen);
234
+ buf = yajl_buf_data(hand->decodeBuf);
235
+ i = strtol((const char *) buf, NULL, 10);
236
+ if ((i == LONG_MIN || i == LONG_MAX) &&
237
+ errno == ERANGE)
238
+ {
239
+ yajl_bs_set(hand->stateStack,
240
+ yajl_state_parse_error);
241
+ hand->parseError = "integer overflow" ;
242
+ /* try to restore error offset */
243
+ if (*offset >= bufLen) *offset -= bufLen;
244
+ else *offset = 0;
245
+ goto around_again;
246
+ }
247
+ _CC_CHK(hand->callbacks->yajl_integer(hand->ctx,
248
+ i));
249
+ }
250
+ }
251
+ break;
252
+ case yajl_tok_double:
253
+ if (hand->callbacks) {
254
+ if (hand->callbacks->yajl_number) {
255
+ _CC_CHK(hand->callbacks->yajl_number(
256
+ hand->ctx, (const char *) buf, bufLen));
257
+ } else if (hand->callbacks->yajl_double) {
258
+ double d = 0.0;
259
+ yajl_buf_clear(hand->decodeBuf);
260
+ yajl_buf_append(hand->decodeBuf, buf, bufLen);
261
+ buf = yajl_buf_data(hand->decodeBuf);
262
+ d = strtod((char *) buf, NULL);
263
+ if ((d == HUGE_VAL || d == -HUGE_VAL) &&
264
+ errno == ERANGE)
265
+ {
266
+ yajl_bs_set(hand->stateStack,
267
+ yajl_state_parse_error);
268
+ hand->parseError = "numeric (floating point) "
269
+ "overflow";
270
+ /* try to restore error offset */
271
+ if (*offset >= bufLen) *offset -= bufLen;
272
+ else *offset = 0;
273
+ goto around_again;
274
+ }
275
+ _CC_CHK(hand->callbacks->yajl_double(hand->ctx,
276
+ d));
277
+ }
278
+ }
279
+ break;
280
+ case yajl_tok_right_brace: {
281
+ if (yajl_bs_current(hand->stateStack) ==
282
+ yajl_state_array_start)
283
+ {
284
+ if (hand->callbacks &&
285
+ hand->callbacks->yajl_end_array)
286
+ {
287
+ _CC_CHK(hand->callbacks->yajl_end_array(hand->ctx));
288
+ }
289
+ yajl_bs_pop(hand->stateStack);
290
+ goto around_again;
291
+ }
292
+ /* intentional fall-through */
293
+ }
294
+ case yajl_tok_colon:
295
+ case yajl_tok_comma:
296
+ case yajl_tok_right_bracket:
297
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error);
298
+ hand->parseError =
299
+ "unallowed token at this point in JSON text";
300
+ goto around_again;
301
+ default:
302
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error);
303
+ hand->parseError = "invalid token, internal error";
304
+ goto around_again;
305
+ }
306
+ /* got a value. transition depends on the state we're in. */
307
+ {
308
+ yajl_state s = yajl_bs_current(hand->stateStack);
309
+ if (s == yajl_state_start) {
310
+ // HACK: is this even safe to do?
311
+ // yajl_bs_set(hand->stateStack, yajl_state_parse_complete);
312
+ yajl_reset_parser(hand);
313
+ } else if (s == yajl_state_map_need_val) {
314
+ yajl_bs_set(hand->stateStack, yajl_state_map_got_val);
315
+ } else {
316
+ yajl_bs_set(hand->stateStack, yajl_state_array_got_val);
317
+ }
318
+ }
319
+ if (stateToPush != yajl_state_start) {
320
+ yajl_bs_push(hand->stateStack, stateToPush);
321
+ }
322
+
323
+ goto around_again;
324
+ }
325
+ case yajl_state_map_start:
326
+ case yajl_state_map_need_key: {
327
+ /* only difference between these two states is that in
328
+ * start '}' is valid, whereas in need_key, we've parsed
329
+ * a comma, and a string key _must_ follow */
330
+ tok = yajl_lex_lex(hand->lexer, jsonText, jsonTextLen,
331
+ offset, &buf, &bufLen);
332
+ switch (tok) {
333
+ case yajl_tok_eof:
334
+ return yajl_status_insufficient_data;
335
+ case yajl_tok_error:
336
+ yajl_bs_set(hand->stateStack, yajl_state_lexical_error);
337
+ goto around_again;
338
+ case yajl_tok_string_with_escapes:
339
+ if (hand->callbacks && hand->callbacks->yajl_map_key) {
340
+ yajl_buf_clear(hand->decodeBuf);
341
+ yajl_string_decode(hand->decodeBuf, buf, bufLen);
342
+ buf = yajl_buf_data(hand->decodeBuf);
343
+ bufLen = yajl_buf_len(hand->decodeBuf);
344
+ }
345
+ /* intentional fall-through */
346
+ case yajl_tok_string:
347
+ if (hand->callbacks && hand->callbacks->yajl_map_key) {
348
+ _CC_CHK(hand->callbacks->yajl_map_key(hand->ctx, buf,
349
+ bufLen));
350
+ }
351
+ yajl_bs_set(hand->stateStack, yajl_state_map_sep);
352
+ goto around_again;
353
+ case yajl_tok_right_bracket:
354
+ if (yajl_bs_current(hand->stateStack) ==
355
+ yajl_state_map_start)
356
+ {
357
+ if (hand->callbacks && hand->callbacks->yajl_end_map) {
358
+ _CC_CHK(hand->callbacks->yajl_end_map(hand->ctx));
359
+ }
360
+ yajl_bs_pop(hand->stateStack);
361
+ goto around_again;
362
+ }
363
+ default:
364
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error);
365
+ hand->parseError =
366
+ "invalid object key (must be a string)";
367
+ goto around_again;
368
+ }
369
+ }
370
+ case yajl_state_map_sep: {
371
+ tok = yajl_lex_lex(hand->lexer, jsonText, jsonTextLen,
372
+ offset, &buf, &bufLen);
373
+ switch (tok) {
374
+ case yajl_tok_colon:
375
+ yajl_bs_set(hand->stateStack, yajl_state_map_need_val);
376
+ goto around_again;
377
+ case yajl_tok_eof:
378
+ return yajl_status_insufficient_data;
379
+ case yajl_tok_error:
380
+ yajl_bs_set(hand->stateStack, yajl_state_lexical_error);
381
+ goto around_again;
382
+ default:
383
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error);
384
+ hand->parseError = "object key and value must "
385
+ "be separated by a colon (':')";
386
+ goto around_again;
387
+ }
388
+ }
389
+ case yajl_state_map_got_val: {
390
+ tok = yajl_lex_lex(hand->lexer, jsonText, jsonTextLen,
391
+ offset, &buf, &bufLen);
392
+ switch (tok) {
393
+ case yajl_tok_right_bracket:
394
+ if (hand->callbacks && hand->callbacks->yajl_end_map) {
395
+ _CC_CHK(hand->callbacks->yajl_end_map(hand->ctx));
396
+ }
397
+ yajl_bs_pop(hand->stateStack);
398
+ goto around_again;
399
+ case yajl_tok_comma:
400
+ yajl_bs_set(hand->stateStack, yajl_state_map_need_key);
401
+ goto around_again;
402
+ case yajl_tok_eof:
403
+ return yajl_status_insufficient_data;
404
+ case yajl_tok_error:
405
+ yajl_bs_set(hand->stateStack, yajl_state_lexical_error);
406
+ goto around_again;
407
+ default:
408
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error);
409
+ hand->parseError = "after key and value, inside map, "
410
+ "I expect ',' or '}'";
411
+ /* try to restore error offset */
412
+ if (*offset >= bufLen) *offset -= bufLen;
413
+ else *offset = 0;
414
+ goto around_again;
415
+ }
416
+ }
417
+ case yajl_state_array_got_val: {
418
+ tok = yajl_lex_lex(hand->lexer, jsonText, jsonTextLen,
419
+ offset, &buf, &bufLen);
420
+ switch (tok) {
421
+ case yajl_tok_right_brace:
422
+ if (hand->callbacks && hand->callbacks->yajl_end_array) {
423
+ _CC_CHK(hand->callbacks->yajl_end_array(hand->ctx));
424
+ }
425
+ yajl_bs_pop(hand->stateStack);
426
+ goto around_again;
427
+ case yajl_tok_comma:
428
+ yajl_bs_set(hand->stateStack, yajl_state_array_need_val);
429
+ goto around_again;
430
+ case yajl_tok_eof:
431
+ return yajl_status_insufficient_data;
432
+ case yajl_tok_error:
433
+ yajl_bs_set(hand->stateStack, yajl_state_lexical_error);
434
+ goto around_again;
435
+ default:
436
+ yajl_bs_set(hand->stateStack, yajl_state_parse_error);
437
+ hand->parseError =
438
+ "after array element, I expect ',' or ']'";
439
+ goto around_again;
440
+ }
441
+ }
442
+ }
443
+
444
+ abort();
445
+ return yajl_status_error;
446
+ }
447
+