jbarnette-johnson 1.0.0.200806240111 → 1.0.0.200807291507

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (269) hide show
  1. data/MANIFEST +1 -0
  2. data/Rakefile +3 -10
  3. data/bin/johnson +2 -1
  4. data/ext/spidermonkey/context.c +3 -4
  5. data/ext/spidermonkey/context.h +1 -1
  6. data/ext/spidermonkey/conversions.c +39 -33
  7. data/ext/spidermonkey/debugger.c +5 -5
  8. data/ext/spidermonkey/immutable_node.c.erb +11 -11
  9. data/ext/spidermonkey/jroot.h +4 -4
  10. data/ext/spidermonkey/js_land_proxy.c +9 -8
  11. data/ext/spidermonkey/ruby_land_proxy.c +5 -4
  12. data/ext/spidermonkey/runtime.c +1 -1
  13. data/johnson.gemspec +36 -0
  14. data/lib/hoe.rb +0 -7
  15. data/lib/johnson/cli/options.rb +10 -4
  16. data/lib/johnson/spidermonkey/runtime.rb +2 -2
  17. data/lib/johnson/version.rb +4 -2
  18. data/lib/johnson.rb +1 -0
  19. data/test/johnson/runtime_test.rb +11 -0
  20. data/test/johnson/spidermonkey/ruby_land_proxy_test.rb +6 -0
  21. data/vendor/spidermonkey/.cvsignore +9 -0
  22. data/vendor/spidermonkey/Makefile.in +462 -0
  23. data/vendor/spidermonkey/Makefile.ref +364 -0
  24. data/vendor/spidermonkey/README.html +820 -0
  25. data/vendor/spidermonkey/SpiderMonkey.rsp +12 -0
  26. data/vendor/spidermonkey/Y.js +19 -0
  27. data/vendor/spidermonkey/build.mk +43 -0
  28. data/vendor/spidermonkey/config/AIX4.1.mk +65 -0
  29. data/vendor/spidermonkey/config/AIX4.2.mk +64 -0
  30. data/vendor/spidermonkey/config/AIX4.3.mk +65 -0
  31. data/vendor/spidermonkey/config/Darwin.mk +83 -0
  32. data/vendor/spidermonkey/config/Darwin1.3.mk +81 -0
  33. data/vendor/spidermonkey/config/Darwin1.4.mk +41 -0
  34. data/vendor/spidermonkey/config/Darwin5.2.mk +81 -0
  35. data/vendor/spidermonkey/config/Darwin5.3.mk +81 -0
  36. data/vendor/spidermonkey/config/HP-UXB.10.10.mk +77 -0
  37. data/vendor/spidermonkey/config/HP-UXB.10.20.mk +77 -0
  38. data/vendor/spidermonkey/config/HP-UXB.11.00.mk +80 -0
  39. data/vendor/spidermonkey/config/IRIX.mk +87 -0
  40. data/vendor/spidermonkey/config/IRIX5.3.mk +44 -0
  41. data/vendor/spidermonkey/config/IRIX6.1.mk +44 -0
  42. data/vendor/spidermonkey/config/IRIX6.2.mk +44 -0
  43. data/vendor/spidermonkey/config/IRIX6.3.mk +44 -0
  44. data/vendor/spidermonkey/config/IRIX6.5.mk +44 -0
  45. data/vendor/spidermonkey/config/Linux_All.mk +103 -0
  46. data/vendor/spidermonkey/config/Mac_OS10.0.mk +82 -0
  47. data/vendor/spidermonkey/config/OSF1V4.0.mk +72 -0
  48. data/vendor/spidermonkey/config/OSF1V5.0.mk +69 -0
  49. data/vendor/spidermonkey/config/SunOS4.1.4.mk +101 -0
  50. data/vendor/spidermonkey/config/SunOS5.10.mk +50 -0
  51. data/vendor/spidermonkey/config/SunOS5.3.mk +91 -0
  52. data/vendor/spidermonkey/config/SunOS5.4.mk +92 -0
  53. data/vendor/spidermonkey/config/SunOS5.5.1.mk +44 -0
  54. data/vendor/spidermonkey/config/SunOS5.5.mk +87 -0
  55. data/vendor/spidermonkey/config/SunOS5.6.mk +89 -0
  56. data/vendor/spidermonkey/config/SunOS5.7.mk +44 -0
  57. data/vendor/spidermonkey/config/SunOS5.8.mk +44 -0
  58. data/vendor/spidermonkey/config/SunOS5.9.mk +44 -0
  59. data/vendor/spidermonkey/config/WINNT4.0.mk +117 -0
  60. data/vendor/spidermonkey/config/WINNT5.0.mk +117 -0
  61. data/vendor/spidermonkey/config/WINNT5.1.mk +117 -0
  62. data/vendor/spidermonkey/config/WINNT5.2.mk +117 -0
  63. data/vendor/spidermonkey/config/WINNT6.0.mk +117 -0
  64. data/vendor/spidermonkey/config/dgux.mk +64 -0
  65. data/vendor/spidermonkey/config.mk +192 -0
  66. data/vendor/spidermonkey/editline/Makefile.ref +144 -0
  67. data/vendor/spidermonkey/editline/README +83 -0
  68. data/vendor/spidermonkey/editline/editline.3 +175 -0
  69. data/vendor/spidermonkey/editline/editline.c +1369 -0
  70. data/vendor/spidermonkey/editline/editline.h +135 -0
  71. data/vendor/spidermonkey/editline/sysunix.c +182 -0
  72. data/vendor/spidermonkey/editline/unix.h +82 -0
  73. data/vendor/spidermonkey/fdlibm/.cvsignore +7 -0
  74. data/vendor/spidermonkey/fdlibm/Makefile.in +127 -0
  75. data/vendor/spidermonkey/fdlibm/Makefile.ref +192 -0
  76. data/vendor/spidermonkey/fdlibm/e_acos.c +147 -0
  77. data/vendor/spidermonkey/fdlibm/e_acosh.c +105 -0
  78. data/vendor/spidermonkey/fdlibm/e_asin.c +156 -0
  79. data/vendor/spidermonkey/fdlibm/e_atan2.c +165 -0
  80. data/vendor/spidermonkey/fdlibm/e_atanh.c +110 -0
  81. data/vendor/spidermonkey/fdlibm/e_cosh.c +133 -0
  82. data/vendor/spidermonkey/fdlibm/e_exp.c +202 -0
  83. data/vendor/spidermonkey/fdlibm/e_fmod.c +184 -0
  84. data/vendor/spidermonkey/fdlibm/e_gamma.c +71 -0
  85. data/vendor/spidermonkey/fdlibm/e_gamma_r.c +70 -0
  86. data/vendor/spidermonkey/fdlibm/e_hypot.c +173 -0
  87. data/vendor/spidermonkey/fdlibm/e_j0.c +524 -0
  88. data/vendor/spidermonkey/fdlibm/e_j1.c +523 -0
  89. data/vendor/spidermonkey/fdlibm/e_jn.c +315 -0
  90. data/vendor/spidermonkey/fdlibm/e_lgamma.c +71 -0
  91. data/vendor/spidermonkey/fdlibm/e_lgamma_r.c +347 -0
  92. data/vendor/spidermonkey/fdlibm/e_log.c +184 -0
  93. data/vendor/spidermonkey/fdlibm/e_log10.c +134 -0
  94. data/vendor/spidermonkey/fdlibm/e_pow.c +386 -0
  95. data/vendor/spidermonkey/fdlibm/e_rem_pio2.c +222 -0
  96. data/vendor/spidermonkey/fdlibm/e_remainder.c +120 -0
  97. data/vendor/spidermonkey/fdlibm/e_scalb.c +89 -0
  98. data/vendor/spidermonkey/fdlibm/e_sinh.c +122 -0
  99. data/vendor/spidermonkey/fdlibm/e_sqrt.c +497 -0
  100. data/vendor/spidermonkey/fdlibm/fdlibm.h +273 -0
  101. data/vendor/spidermonkey/fdlibm/fdlibm.mak +1453 -0
  102. data/vendor/spidermonkey/fdlibm/fdlibm.mdp +0 -0
  103. data/vendor/spidermonkey/fdlibm/k_cos.c +135 -0
  104. data/vendor/spidermonkey/fdlibm/k_rem_pio2.c +354 -0
  105. data/vendor/spidermonkey/fdlibm/k_sin.c +114 -0
  106. data/vendor/spidermonkey/fdlibm/k_standard.c +785 -0
  107. data/vendor/spidermonkey/fdlibm/k_tan.c +170 -0
  108. data/vendor/spidermonkey/fdlibm/s_asinh.c +101 -0
  109. data/vendor/spidermonkey/fdlibm/s_atan.c +175 -0
  110. data/vendor/spidermonkey/fdlibm/s_cbrt.c +133 -0
  111. data/vendor/spidermonkey/fdlibm/s_ceil.c +120 -0
  112. data/vendor/spidermonkey/fdlibm/s_copysign.c +72 -0
  113. data/vendor/spidermonkey/fdlibm/s_cos.c +118 -0
  114. data/vendor/spidermonkey/fdlibm/s_erf.c +356 -0
  115. data/vendor/spidermonkey/fdlibm/s_expm1.c +267 -0
  116. data/vendor/spidermonkey/fdlibm/s_fabs.c +70 -0
  117. data/vendor/spidermonkey/fdlibm/s_finite.c +71 -0
  118. data/vendor/spidermonkey/fdlibm/s_floor.c +121 -0
  119. data/vendor/spidermonkey/fdlibm/s_frexp.c +99 -0
  120. data/vendor/spidermonkey/fdlibm/s_ilogb.c +85 -0
  121. data/vendor/spidermonkey/fdlibm/s_isnan.c +74 -0
  122. data/vendor/spidermonkey/fdlibm/s_ldexp.c +66 -0
  123. data/vendor/spidermonkey/fdlibm/s_lib_version.c +73 -0
  124. data/vendor/spidermonkey/fdlibm/s_log1p.c +211 -0
  125. data/vendor/spidermonkey/fdlibm/s_logb.c +79 -0
  126. data/vendor/spidermonkey/fdlibm/s_matherr.c +64 -0
  127. data/vendor/spidermonkey/fdlibm/s_modf.c +132 -0
  128. data/vendor/spidermonkey/fdlibm/s_nextafter.c +124 -0
  129. data/vendor/spidermonkey/fdlibm/s_rint.c +131 -0
  130. data/vendor/spidermonkey/fdlibm/s_scalbn.c +107 -0
  131. data/vendor/spidermonkey/fdlibm/s_signgam.c +40 -0
  132. data/vendor/spidermonkey/fdlibm/s_significand.c +68 -0
  133. data/vendor/spidermonkey/fdlibm/s_sin.c +118 -0
  134. data/vendor/spidermonkey/fdlibm/s_tan.c +112 -0
  135. data/vendor/spidermonkey/fdlibm/s_tanh.c +122 -0
  136. data/vendor/spidermonkey/fdlibm/w_acos.c +78 -0
  137. data/vendor/spidermonkey/fdlibm/w_acosh.c +78 -0
  138. data/vendor/spidermonkey/fdlibm/w_asin.c +80 -0
  139. data/vendor/spidermonkey/fdlibm/w_atan2.c +79 -0
  140. data/vendor/spidermonkey/fdlibm/w_atanh.c +81 -0
  141. data/vendor/spidermonkey/fdlibm/w_cosh.c +77 -0
  142. data/vendor/spidermonkey/fdlibm/w_exp.c +88 -0
  143. data/vendor/spidermonkey/fdlibm/w_fmod.c +78 -0
  144. data/vendor/spidermonkey/fdlibm/w_gamma.c +85 -0
  145. data/vendor/spidermonkey/fdlibm/w_gamma_r.c +81 -0
  146. data/vendor/spidermonkey/fdlibm/w_hypot.c +78 -0
  147. data/vendor/spidermonkey/fdlibm/w_j0.c +105 -0
  148. data/vendor/spidermonkey/fdlibm/w_j1.c +106 -0
  149. data/vendor/spidermonkey/fdlibm/w_jn.c +128 -0
  150. data/vendor/spidermonkey/fdlibm/w_lgamma.c +85 -0
  151. data/vendor/spidermonkey/fdlibm/w_lgamma_r.c +81 -0
  152. data/vendor/spidermonkey/fdlibm/w_log.c +78 -0
  153. data/vendor/spidermonkey/fdlibm/w_log10.c +81 -0
  154. data/vendor/spidermonkey/fdlibm/w_pow.c +99 -0
  155. data/vendor/spidermonkey/fdlibm/w_remainder.c +77 -0
  156. data/vendor/spidermonkey/fdlibm/w_scalb.c +95 -0
  157. data/vendor/spidermonkey/fdlibm/w_sinh.c +77 -0
  158. data/vendor/spidermonkey/fdlibm/w_sqrt.c +77 -0
  159. data/vendor/spidermonkey/javascript-trace.d +73 -0
  160. data/vendor/spidermonkey/js.c +3951 -0
  161. data/vendor/spidermonkey/js.mak +4438 -0
  162. data/vendor/spidermonkey/js.mdp +0 -0
  163. data/vendor/spidermonkey/js.msg +307 -0
  164. data/vendor/spidermonkey/js.pkg +2 -0
  165. data/vendor/spidermonkey/js3240.rc +79 -0
  166. data/vendor/spidermonkey/jsOS240.def +654 -0
  167. data/vendor/spidermonkey/jsapi.c +5836 -0
  168. data/vendor/spidermonkey/jsapi.h +2624 -0
  169. data/vendor/spidermonkey/jsarena.c +450 -0
  170. data/vendor/spidermonkey/jsarena.h +318 -0
  171. data/vendor/spidermonkey/jsarray.c +2988 -0
  172. data/vendor/spidermonkey/jsarray.h +124 -0
  173. data/vendor/spidermonkey/jsatom.c +1045 -0
  174. data/vendor/spidermonkey/jsatom.h +442 -0
  175. data/vendor/spidermonkey/jsbit.h +253 -0
  176. data/vendor/spidermonkey/jsbool.c +176 -0
  177. data/vendor/spidermonkey/jsbool.h +73 -0
  178. data/vendor/spidermonkey/jsclist.h +139 -0
  179. data/vendor/spidermonkey/jscntxt.c +1348 -0
  180. data/vendor/spidermonkey/jscntxt.h +1120 -0
  181. data/vendor/spidermonkey/jscompat.h +57 -0
  182. data/vendor/spidermonkey/jsconfig.h +248 -0
  183. data/vendor/spidermonkey/jsconfig.mk +181 -0
  184. data/vendor/spidermonkey/jscpucfg.c +383 -0
  185. data/vendor/spidermonkey/jscpucfg.h +212 -0
  186. data/vendor/spidermonkey/jsdate.c +2398 -0
  187. data/vendor/spidermonkey/jsdate.h +124 -0
  188. data/vendor/spidermonkey/jsdbgapi.c +1799 -0
  189. data/vendor/spidermonkey/jsdbgapi.h +464 -0
  190. data/vendor/spidermonkey/jsdhash.c +868 -0
  191. data/vendor/spidermonkey/jsdhash.h +592 -0
  192. data/vendor/spidermonkey/jsdtoa.c +3167 -0
  193. data/vendor/spidermonkey/jsdtoa.h +130 -0
  194. data/vendor/spidermonkey/jsdtracef.c +317 -0
  195. data/vendor/spidermonkey/jsdtracef.h +77 -0
  196. data/vendor/spidermonkey/jsemit.c +6909 -0
  197. data/vendor/spidermonkey/jsemit.h +741 -0
  198. data/vendor/spidermonkey/jsexn.c +1371 -0
  199. data/vendor/spidermonkey/jsexn.h +96 -0
  200. data/vendor/spidermonkey/jsfile.c +2736 -0
  201. data/vendor/spidermonkey/jsfile.h +56 -0
  202. data/vendor/spidermonkey/jsfile.msg +90 -0
  203. data/vendor/spidermonkey/jsfun.c +2634 -0
  204. data/vendor/spidermonkey/jsfun.h +254 -0
  205. data/vendor/spidermonkey/jsgc.c +3554 -0
  206. data/vendor/spidermonkey/jsgc.h +403 -0
  207. data/vendor/spidermonkey/jshash.c +476 -0
  208. data/vendor/spidermonkey/jshash.h +151 -0
  209. data/vendor/spidermonkey/jsify.pl +485 -0
  210. data/vendor/spidermonkey/jsinterp.c +6981 -0
  211. data/vendor/spidermonkey/jsinterp.h +521 -0
  212. data/vendor/spidermonkey/jsinvoke.c +43 -0
  213. data/vendor/spidermonkey/jsiter.c +1067 -0
  214. data/vendor/spidermonkey/jsiter.h +122 -0
  215. data/vendor/spidermonkey/jskeyword.tbl +124 -0
  216. data/vendor/spidermonkey/jskwgen.c +460 -0
  217. data/vendor/spidermonkey/jslibmath.h +266 -0
  218. data/vendor/spidermonkey/jslock.c +1309 -0
  219. data/vendor/spidermonkey/jslock.h +313 -0
  220. data/vendor/spidermonkey/jslocko.asm +60 -0
  221. data/vendor/spidermonkey/jslog2.c +94 -0
  222. data/vendor/spidermonkey/jslong.c +264 -0
  223. data/vendor/spidermonkey/jslong.h +412 -0
  224. data/vendor/spidermonkey/jsmath.c +568 -0
  225. data/vendor/spidermonkey/jsmath.h +57 -0
  226. data/vendor/spidermonkey/jsnum.c +1228 -0
  227. data/vendor/spidermonkey/jsnum.h +283 -0
  228. data/vendor/spidermonkey/jsobj.c +5266 -0
  229. data/vendor/spidermonkey/jsobj.h +709 -0
  230. data/vendor/spidermonkey/jsopcode.c +5245 -0
  231. data/vendor/spidermonkey/jsopcode.h +394 -0
  232. data/vendor/spidermonkey/jsopcode.tbl +523 -0
  233. data/vendor/spidermonkey/jsotypes.h +202 -0
  234. data/vendor/spidermonkey/jsparse.c +6680 -0
  235. data/vendor/spidermonkey/jsparse.h +511 -0
  236. data/vendor/spidermonkey/jsprf.c +1262 -0
  237. data/vendor/spidermonkey/jsprf.h +150 -0
  238. data/vendor/spidermonkey/jsproto.tbl +128 -0
  239. data/vendor/spidermonkey/jsprvtd.h +267 -0
  240. data/vendor/spidermonkey/jspubtd.h +744 -0
  241. data/vendor/spidermonkey/jsregexp.c +4352 -0
  242. data/vendor/spidermonkey/jsregexp.h +183 -0
  243. data/vendor/spidermonkey/jsreops.tbl +145 -0
  244. data/vendor/spidermonkey/jsscan.c +2003 -0
  245. data/vendor/spidermonkey/jsscan.h +387 -0
  246. data/vendor/spidermonkey/jsscope.c +1948 -0
  247. data/vendor/spidermonkey/jsscope.h +418 -0
  248. data/vendor/spidermonkey/jsscript.c +1832 -0
  249. data/vendor/spidermonkey/jsscript.h +287 -0
  250. data/vendor/spidermonkey/jsshell.msg +50 -0
  251. data/vendor/spidermonkey/jsstddef.h +83 -0
  252. data/vendor/spidermonkey/jsstr.c +5004 -0
  253. data/vendor/spidermonkey/jsstr.h +641 -0
  254. data/vendor/spidermonkey/jstypes.h +475 -0
  255. data/vendor/spidermonkey/jsutil.c +345 -0
  256. data/vendor/spidermonkey/jsutil.h +157 -0
  257. data/vendor/spidermonkey/jsxdrapi.c +800 -0
  258. data/vendor/spidermonkey/jsxdrapi.h +218 -0
  259. data/vendor/spidermonkey/jsxml.c +8471 -0
  260. data/vendor/spidermonkey/jsxml.h +349 -0
  261. data/vendor/spidermonkey/lock_SunOS.s +119 -0
  262. data/vendor/spidermonkey/perfect.js +39 -0
  263. data/vendor/spidermonkey/plify_jsdhash.sed +36 -0
  264. data/vendor/spidermonkey/prmjtime.c +846 -0
  265. data/vendor/spidermonkey/prmjtime.h +103 -0
  266. data/vendor/spidermonkey/resource.h +15 -0
  267. data/vendor/spidermonkey/rules.mk +197 -0
  268. data/vendor/spidermonkey/win32.order +384 -0
  269. metadata +4 -3
@@ -0,0 +1,183 @@
1
+ /* -*- Mode: C; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 4 -*-
2
+ *
3
+ * ***** BEGIN LICENSE BLOCK *****
4
+ * Version: MPL 1.1/GPL 2.0/LGPL 2.1
5
+ *
6
+ * The contents of this file are subject to the Mozilla Public License Version
7
+ * 1.1 (the "License"); you may not use this file except in compliance with
8
+ * the License. You may obtain a copy of the License at
9
+ * http://www.mozilla.org/MPL/
10
+ *
11
+ * Software distributed under the License is distributed on an "AS IS" basis,
12
+ * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
13
+ * for the specific language governing rights and limitations under the
14
+ * License.
15
+ *
16
+ * The Original Code is Mozilla Communicator client code, released
17
+ * March 31, 1998.
18
+ *
19
+ * The Initial Developer of the Original Code is
20
+ * Netscape Communications Corporation.
21
+ * Portions created by the Initial Developer are Copyright (C) 1998
22
+ * the Initial Developer. All Rights Reserved.
23
+ *
24
+ * Contributor(s):
25
+ *
26
+ * Alternatively, the contents of this file may be used under the terms of
27
+ * either of the GNU General Public License Version 2 or later (the "GPL"),
28
+ * or the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
29
+ * in which case the provisions of the GPL or the LGPL are applicable instead
30
+ * of those above. If you wish to allow use of your version of this file only
31
+ * under the terms of either the GPL or the LGPL, and not to allow others to
32
+ * use your version of this file under the terms of the MPL, indicate your
33
+ * decision by deleting the provisions above and replace them with the notice
34
+ * and other provisions required by the GPL or the LGPL. If you do not delete
35
+ * the provisions above, a recipient may use your version of this file under
36
+ * the terms of any one of the MPL, the GPL or the LGPL.
37
+ *
38
+ * ***** END LICENSE BLOCK ***** */
39
+
40
+ #ifndef jsregexp_h___
41
+ #define jsregexp_h___
42
+ /*
43
+ * JS regular expression interface.
44
+ */
45
+ #include <stddef.h>
46
+ #include "jspubtd.h"
47
+ #include "jsstr.h"
48
+
49
+ #ifdef JS_THREADSAFE
50
+ #include "jsdhash.h"
51
+ #endif
52
+
53
+ JS_BEGIN_EXTERN_C
54
+
55
+ struct JSRegExpStatics {
56
+ JSString *input; /* input string to match (perl $_, GC root) */
57
+ JSBool multiline; /* whether input contains newlines (perl $*) */
58
+ uint16 parenCount; /* number of valid elements in parens[] */
59
+ uint16 moreLength; /* number of allocated elements in moreParens */
60
+ JSSubString parens[9]; /* last set of parens matched (perl $1, $2) */
61
+ JSSubString *moreParens; /* null or realloc'd vector for $10, etc. */
62
+ JSSubString lastMatch; /* last string matched (perl $&) */
63
+ JSSubString lastParen; /* last paren matched (perl $+) */
64
+ JSSubString leftContext; /* input to left of last match (perl $`) */
65
+ JSSubString rightContext; /* input to right of last match (perl $') */
66
+ };
67
+
68
+ /*
69
+ * This struct holds a bitmap representation of a class from a regexp.
70
+ * There's a list of these referenced by the classList field in the JSRegExp
71
+ * struct below. The initial state has startIndex set to the offset in the
72
+ * original regexp source of the beginning of the class contents. The first
73
+ * use of the class converts the source representation into a bitmap.
74
+ *
75
+ */
76
+ typedef struct RECharSet {
77
+ JSPackedBool converted;
78
+ JSPackedBool sense;
79
+ uint16 length;
80
+ union {
81
+ uint8 *bits;
82
+ struct {
83
+ size_t startIndex;
84
+ size_t length;
85
+ } src;
86
+ } u;
87
+ } RECharSet;
88
+
89
+ /*
90
+ * This macro is safe because moreParens is guaranteed to be allocated and big
91
+ * enough to hold parenCount, or else be null when parenCount is 0.
92
+ */
93
+ #define REGEXP_PAREN_SUBSTRING(res, num) \
94
+ (((jsuint)(num) < (jsuint)(res)->parenCount) \
95
+ ? ((jsuint)(num) < 9) \
96
+ ? &(res)->parens[num] \
97
+ : &(res)->moreParens[(num) - 9] \
98
+ : &js_EmptySubString)
99
+
100
+ typedef struct RENode RENode;
101
+
102
+ struct JSRegExp {
103
+ jsrefcount nrefs; /* reference count */
104
+ uint16 flags; /* flags, see jsapi.h's JSREG_* defines */
105
+ size_t parenCount; /* number of parenthesized submatches */
106
+ size_t classCount; /* count [...] bitmaps */
107
+ RECharSet *classList; /* list of [...] bitmaps */
108
+ JSString *source; /* locked source string, sans // */
109
+ jsbytecode program[1]; /* regular expression bytecode */
110
+ };
111
+
112
+ extern JSRegExp *
113
+ js_NewRegExp(JSContext *cx, JSTokenStream *ts,
114
+ JSString *str, uintN flags, JSBool flat);
115
+
116
+ extern JSRegExp *
117
+ js_NewRegExpOpt(JSContext *cx, JSString *str, JSString *opt, JSBool flat);
118
+
119
+ #define HOLD_REGEXP(cx, re) JS_ATOMIC_INCREMENT(&(re)->nrefs)
120
+ #define DROP_REGEXP(cx, re) js_DestroyRegExp(cx, re)
121
+
122
+ extern void
123
+ js_DestroyRegExp(JSContext *cx, JSRegExp *re);
124
+
125
+ /*
126
+ * Execute re on input str at *indexp, returning null in *rval on mismatch.
127
+ * On match, return true if test is true, otherwise return an array object.
128
+ * Update *indexp and cx->regExpStatics always on match.
129
+ */
130
+ extern JSBool
131
+ js_ExecuteRegExp(JSContext *cx, JSRegExp *re, JSString *str, size_t *indexp,
132
+ JSBool test, jsval *rval);
133
+
134
+ /*
135
+ * These two add and remove GC roots, respectively, so their calls must be
136
+ * well-ordered.
137
+ */
138
+ extern JSBool
139
+ js_InitRegExpStatics(JSContext *cx, JSRegExpStatics *res);
140
+
141
+ extern void
142
+ js_FreeRegExpStatics(JSContext *cx, JSRegExpStatics *res);
143
+
144
+ #define JSVAL_IS_REGEXP(cx, v) \
145
+ (JSVAL_IS_OBJECT(v) && JSVAL_TO_OBJECT(v) && \
146
+ OBJ_GET_CLASS(cx, JSVAL_TO_OBJECT(v)) == &js_RegExpClass)
147
+
148
+ extern JSClass js_RegExpClass;
149
+
150
+ extern JSObject *
151
+ js_InitRegExpClass(JSContext *cx, JSObject *obj);
152
+
153
+ /*
154
+ * Export js_regexp_toString to the decompiler.
155
+ */
156
+ extern JSBool
157
+ js_regexp_toString(JSContext *cx, JSObject *obj, jsval *vp);
158
+
159
+ /*
160
+ * Create, serialize/deserialize, or clone a RegExp object.
161
+ */
162
+ extern JSObject *
163
+ js_NewRegExpObject(JSContext *cx, JSTokenStream *ts,
164
+ jschar *chars, size_t length, uintN flags);
165
+
166
+ extern JSBool
167
+ js_XDRRegExp(JSXDRState *xdr, JSObject **objp);
168
+
169
+ extern JSObject *
170
+ js_CloneRegExpObject(JSContext *cx, JSObject *obj, JSObject *parent);
171
+
172
+ /*
173
+ * Get and set the per-object (clone or clone-parent) lastIndex slot.
174
+ */
175
+ extern JSBool
176
+ js_GetLastIndex(JSContext *cx, JSObject *obj, jsdouble *lastIndex);
177
+
178
+ extern JSBool
179
+ js_SetLastIndex(JSContext *cx, JSObject *obj, jsdouble lastIndex);
180
+
181
+ JS_END_EXTERN_C
182
+
183
+ #endif /* jsregexp_h___ */
@@ -0,0 +1,145 @@
1
+ /* -*- Mode: C; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 4 -*-
2
+ * vim: set ts=8 sw=4 et tw=0 ft=C:
3
+ *
4
+ * ***** BEGIN LICENSE BLOCK *****
5
+ * Version: MPL 1.1/GPL 2.0/LGPL 2.1
6
+ *
7
+ * The contents of this file are subject to the Mozilla Public License Version
8
+ * 1.1 (the "license"); you may not use this file except in compliance with
9
+ * the License. You may obtain a copy of the License at
10
+ * http://www.mozilla.org/MPL/
11
+ *
12
+ * Software distributed under the License is distributed on an "as is" basis,
13
+ * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
14
+ * for the specific language governing rights and limitations under the
15
+ * License.
16
+ *
17
+ * The Original Code is Mozilla Communicator client code, released
18
+ * March 31, 1998.
19
+ *
20
+ * The Initial Developer of the Original Code is
21
+ * Netscape Communications Corporation.
22
+ * Portions created by the Initial Developer are Copyright (C) 1998
23
+ * the Initial Developer. All Rights Reserved.
24
+ *
25
+ * Contributor(s):
26
+ *
27
+ * Alternatively, the contentsof this file are subject to the Mozilla Public License Version
28
+ * 1.1 (the "license"); you may not use this file except in compliance with
29
+ * the License. You may obtain a copy of thter (the "lgpl"),
30
+ * in which case the provisions of the GPL or the LGPL are applicable instead
31
+ * of those above. If you wish to allow use of your version of this file only
32
+ * under the terms of either the GPL or the LGPL, and not to allow others to
33
+ * use your version of this file under the terms of the MPL, indicate your
34
+ * decision by deleting the provisions above and replace them with the notice
35
+ * and other provisions required by the GPL or the LGPL. If you do not delete
36
+ * the provisions above, a recipient may use your version of this file under
37
+ * the terms of any one of the MPL, the GPL or the LGPL.
38
+ *
39
+ * ***** END LICENSE BLOCK ***** */
40
+
41
+
42
+ /* Note : contiguity of 'simple opcodes' is important for SimpleMatch() */
43
+
44
+ /* match rest of input against rest of r.e. */
45
+ REOP_DEF(REOP_EMPTY, "empty")
46
+ /* beginning of input (or line if multiline) */
47
+ REOP_DEF(REOP_BOL, "bol")
48
+ /* end of input (or line if multiline) */
49
+ REOP_DEF(REOP_EOL, "eol")
50
+ /* match "" at word boundary */
51
+ REOP_DEF(REOP_WBDRY, "wbdry")
52
+ /* match "" at word non-boundary */
53
+ REOP_DEF(REOP_WNONBDRY, "wnonbdry")
54
+ /* stands for any character */
55
+ REOP_DEF(REOP_DOT, "dot")
56
+ /* match a digit char: [0-9] */
57
+ REOP_DEF(REOP_DIGIT, "digit")
58
+ /* match a non-digit char: [^0-9] */
59
+ REOP_DEF(REOP_NONDIGIT, "nondigit")
60
+ /* match an alphanumeric char: [0-9a-z_A-Z] */
61
+ REOP_DEF(REOP_ALNUM, "alnum")
62
+ /* match a non-alphanumeric char: [^0-9a-z_A-Z] */
63
+ REOP_DEF(REOP_NONALNUM, "nonalnum")
64
+ /* match a whitespace char */
65
+ REOP_DEF(REOP_SPACE, "space")
66
+ /* match a non-whitespace char */
67
+ REOP_DEF(REOP_NONSPACE, "nonspace")
68
+ /* back-reference (e.g., \1) to a parenthetical */
69
+ REOP_DEF(REOP_BACKREF, "backref")
70
+ /* match a flat string */
71
+ REOP_DEF(REOP_FLAT, "flat")
72
+ /* match a single char */
73
+ REOP_DEF(REOP_FLAT1, "flat1")
74
+ /* case-independent REOP_FLAT */
75
+ REOP_DEF(REOP_FLATi, "flati")
76
+ /* case-independent REOP_FLAT1 */
77
+ REOP_DEF(REOP_FLAT1i, "flat1i")
78
+ /* single Unicode char */
79
+ REOP_DEF(REOP_UCFLAT1, "ucflat1")
80
+ /* case-independent REOP_UCFLAT1 */
81
+ REOP_DEF(REOP_UCFLAT1i, "ucflat1i")
82
+ /* flat Unicode string; len immediate counts chars */
83
+ REOP_DEF(REOP_UCFLAT, "ucflat")
84
+ /* case-independent REOP_UCFLAT */
85
+ REOP_DEF(REOP_UCFLATi, "ucflati")
86
+ /* character class with index */
87
+ REOP_DEF(REOP_CLASS, "class")
88
+ /* negated character class with index */
89
+ REOP_DEF(REOP_NCLASS, "nclass")
90
+
91
+ /* NCLASS is considered to be the last "simple" op-code */
92
+
93
+
94
+ /* alternative subexpressions in kid and next */
95
+ REOP_DEF(REOP_ALT, "alt")
96
+ /* quantified atom: atom{1,2} */
97
+ REOP_DEF(REOP_QUANT, "quant")
98
+ /* zero or more occurrences of kid */
99
+ REOP_DEF(REOP_STAR, "star")
100
+ /* one or more occurrences of kid */
101
+ REOP_DEF(REOP_PLUS, "plus")
102
+ /* optional subexpression in kid */
103
+ REOP_DEF(REOP_OPT, "opt")
104
+ /* left paren bytecode: kid is u.num'th sub-regexp */
105
+ REOP_DEF(REOP_LPAREN, "lparen")
106
+ /* right paren bytecode */
107
+ REOP_DEF(REOP_RPAREN, "rparen")
108
+ /* for deoptimized closure loops */
109
+ REOP_DEF(REOP_JUMP, "jump")
110
+ /* optimize .* to use a single opcode */
111
+ REOP_DEF(REOP_DOTSTAR, "dotstar")
112
+ /* non-capturing version of REOP_LPAREN */
113
+ REOP_DEF(REOP_LPARENNON, "lparennon")
114
+ /* zero width positive lookahead assertion */
115
+ REOP_DEF(REOP_ASSERT, "assert")
116
+ /* zero width negative lookahead assertion */
117
+ REOP_DEF(REOP_ASSERT_NOT, "assert_not")
118
+ /* sentinel at end of assertion child */
119
+ REOP_DEF(REOP_ASSERTTEST, "asserttest")
120
+ /* sentinel at end of !assertion child */
121
+ REOP_DEF(REOP_ASSERTNOTTEST, "assertnottest")
122
+ /* non-greedy version of * */
123
+ REOP_DEF(REOP_MINIMALSTAR, "minimalstar")
124
+ /* non-greedy version of + */
125
+ REOP_DEF(REOP_MINIMALPLUS, "minimalplus")
126
+ /* non-greedy version of ? */
127
+ REOP_DEF(REOP_MINIMALOPT, "minimalopt")
128
+ /* non-greedy version of {} */
129
+ REOP_DEF(REOP_MINIMALQUANT, "minimalquant")
130
+ /* sentinel at end of quantifier child */
131
+ REOP_DEF(REOP_ENDCHILD, "endchild")
132
+ /* directs execution of greedy quantifier */
133
+ REOP_DEF(REOP_REPEAT, "repeat")
134
+ /* directs execution of non-greedy quantifier */
135
+ REOP_DEF(REOP_MINIMALREPEAT, "minimalrepeat")
136
+ /* prerequisite for ALT, either of two chars */
137
+ REOP_DEF(REOP_ALTPREREQ, "altprereq")
138
+ /* prerequisite for ALT, a char or a class */
139
+ REOP_DEF(REOP_ALTPREREQ2, "altprereq2")
140
+ /* end of final alternate */
141
+ REOP_DEF(REOP_ENDALT, "endalt")
142
+ /* concatenation of terms (parse time only) */
143
+ REOP_DEF(REOP_CONCAT, "concat")
144
+ /* end of expression */
145
+ REOP_DEF(REOP_END, "end")
@@ -0,0 +1,2003 @@
1
+ /* -*- Mode: C; tab-width: 8; indent-tabs-mode: nil; c-basic-offset: 4 -*-
2
+ * vim: set sw=4 ts=8 et tw=78:
3
+ *
4
+ * ***** BEGIN LICENSE BLOCK *****
5
+ * Version: MPL 1.1/GPL 2.0/LGPL 2.1
6
+ *
7
+ * The contents of this file are subject to the Mozilla Public License Version
8
+ * 1.1 (the "License"); you may not use this file except in compliance with
9
+ * the License. You may obtain a copy of the License at
10
+ * http://www.mozilla.org/MPL/
11
+ *
12
+ * Software distributed under the License is distributed on an "AS IS" basis,
13
+ * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
14
+ * for the specific language governing rights and limitations under the
15
+ * License.
16
+ *
17
+ * The Original Code is Mozilla Communicator client code, released
18
+ * March 31, 1998.
19
+ *
20
+ * The Initial Developer of the Original Code is
21
+ * Netscape Communications Corporation.
22
+ * Portions created by the Initial Developer are Copyright (C) 1998
23
+ * the Initial Developer. All Rights Reserved.
24
+ *
25
+ * Contributor(s):
26
+ *
27
+ * Alternatively, the contents of this file may be used under the terms of
28
+ * either of the GNU General Public License Version 2 or later (the "GPL"),
29
+ * or the GNU Lesser General Public License Version 2.1 or later (the "LGPL"),
30
+ * in which case the provisions of the GPL or the LGPL are applicable instead
31
+ * of those above. If you wish to allow use of your version of this file only
32
+ * under the terms of either the GPL or the LGPL, and not to allow others to
33
+ * use your version of this file under the terms of the MPL, indicate your
34
+ * decision by deleting the provisions above and replace them with the notice
35
+ * and other provisions required by the GPL or the LGPL. If you do not delete
36
+ * the provisions above, a recipient may use your version of this file under
37
+ * the terms of any one of the MPL, the GPL or the LGPL.
38
+ *
39
+ * ***** END LICENSE BLOCK ***** */
40
+
41
+ /*
42
+ * JS lexical scanner.
43
+ */
44
+ #include "jsstddef.h"
45
+ #include <stdio.h> /* first to avoid trouble on some systems */
46
+ #include <errno.h>
47
+ #include <limits.h>
48
+ #include <math.h>
49
+ #ifdef HAVE_MEMORY_H
50
+ #include <memory.h>
51
+ #endif
52
+ #include <stdarg.h>
53
+ #include <stdlib.h>
54
+ #include <string.h>
55
+ #include "jstypes.h"
56
+ #include "jsarena.h" /* Added by JSIFY */
57
+ #include "jsutil.h" /* Added by JSIFY */
58
+ #include "jsdtoa.h"
59
+ #include "jsprf.h"
60
+ #include "jsapi.h"
61
+ #include "jsatom.h"
62
+ #include "jscntxt.h"
63
+ #include "jsconfig.h"
64
+ #include "jsemit.h"
65
+ #include "jsexn.h"
66
+ #include "jsnum.h"
67
+ #include "jsopcode.h"
68
+ #include "jsparse.h"
69
+ #include "jsregexp.h"
70
+ #include "jsscan.h"
71
+ #include "jsscript.h"
72
+
73
+ #if JS_HAS_XML_SUPPORT
74
+ #include "jsxml.h"
75
+ #endif
76
+
77
+ #define JS_KEYWORD(keyword, type, op, version) \
78
+ const char js_##keyword##_str[] = #keyword;
79
+ #include "jskeyword.tbl"
80
+ #undef JS_KEYWORD
81
+
82
+ struct keyword {
83
+ const char *chars; /* C string with keyword text */
84
+ JSTokenType tokentype; /* JSTokenType */
85
+ JSOp op; /* JSOp */
86
+ JSVersion version; /* JSVersion */
87
+ };
88
+
89
+ static const struct keyword keyword_defs[] = {
90
+ #define JS_KEYWORD(keyword, type, op, version) \
91
+ {js_##keyword##_str, type, op, version},
92
+ #include "jskeyword.tbl"
93
+ #undef JS_KEYWORD
94
+ };
95
+
96
+ #define KEYWORD_COUNT JS_ARRAY_LENGTH(keyword_defs)
97
+
98
+ static const struct keyword *
99
+ FindKeyword(const jschar *s, size_t length)
100
+ {
101
+ register size_t i;
102
+ const struct keyword *kw;
103
+ const char *chars;
104
+
105
+ JS_ASSERT(length != 0);
106
+
107
+ #define JSKW_LENGTH() length
108
+ #define JSKW_AT(column) s[column]
109
+ #define JSKW_GOT_MATCH(index) i = (index); goto got_match;
110
+ #define JSKW_TEST_GUESS(index) i = (index); goto test_guess;
111
+ #define JSKW_NO_MATCH() goto no_match;
112
+ #include "jsautokw.h"
113
+ #undef JSKW_NO_MATCH
114
+ #undef JSKW_TEST_GUESS
115
+ #undef JSKW_GOT_MATCH
116
+ #undef JSKW_AT
117
+ #undef JSKW_LENGTH
118
+
119
+ got_match:
120
+ return &keyword_defs[i];
121
+
122
+ test_guess:
123
+ kw = &keyword_defs[i];
124
+ chars = kw->chars;
125
+ do {
126
+ if (*s++ != (unsigned char)(*chars++))
127
+ goto no_match;
128
+ } while (--length != 0);
129
+ return kw;
130
+
131
+ no_match:
132
+ return NULL;
133
+ }
134
+
135
+ JSTokenType
136
+ js_CheckKeyword(const jschar *str, size_t length)
137
+ {
138
+ const struct keyword *kw;
139
+
140
+ JS_ASSERT(length != 0);
141
+ kw = FindKeyword(str, length);
142
+ return kw ? kw->tokentype : TOK_EOF;
143
+ }
144
+
145
+ JS_FRIEND_API(void)
146
+ js_MapKeywords(void (*mapfun)(const char *))
147
+ {
148
+ size_t i;
149
+
150
+ for (i = 0; i != KEYWORD_COUNT; ++i)
151
+ mapfun(keyword_defs[i].chars);
152
+ }
153
+
154
+ JSBool
155
+ js_IsIdentifier(JSString *str)
156
+ {
157
+ size_t length;
158
+ jschar c, *chars, *end;
159
+
160
+ JSSTRING_CHARS_AND_LENGTH(str, chars, length);
161
+ if (length == 0)
162
+ return JS_FALSE;
163
+ c = *chars;
164
+ if (!JS_ISIDSTART(c))
165
+ return JS_FALSE;
166
+ end = chars + length;
167
+ while (++chars != end) {
168
+ c = *chars;
169
+ if (!JS_ISIDENT(c))
170
+ return JS_FALSE;
171
+ }
172
+ return JS_TRUE;
173
+ }
174
+
175
+ #define TBMIN 64
176
+
177
+ static JSBool
178
+ GrowTokenBuf(JSStringBuffer *sb, size_t newlength)
179
+ {
180
+ JSContext *cx;
181
+ jschar *base;
182
+ ptrdiff_t offset, length;
183
+ size_t tbsize;
184
+ JSArenaPool *pool;
185
+
186
+ cx = (JSContext*) sb->data;
187
+ base = sb->base;
188
+ offset = PTRDIFF(sb->ptr, base, jschar);
189
+ pool = &cx->tempPool;
190
+ if (!base) {
191
+ tbsize = TBMIN * sizeof(jschar);
192
+ length = TBMIN - 1;
193
+ JS_ARENA_ALLOCATE_CAST(base, jschar *, pool, tbsize);
194
+ } else {
195
+ length = PTRDIFF(sb->limit, base, jschar);
196
+ if ((size_t)length >= ~(size_t)0 / sizeof(jschar)) {
197
+ base = NULL;
198
+ } else {
199
+ tbsize = (length + 1) * sizeof(jschar);
200
+ length += length + 1;
201
+ JS_ARENA_GROW_CAST(base, jschar *, pool, tbsize, tbsize);
202
+ }
203
+ }
204
+ if (!base) {
205
+ js_ReportOutOfScriptQuota(cx);
206
+ sb->base = STRING_BUFFER_ERROR_BASE;
207
+ return JS_FALSE;
208
+ }
209
+ sb->base = base;
210
+ sb->limit = base + length;
211
+ sb->ptr = base + offset;
212
+ return JS_TRUE;
213
+ }
214
+
215
+ JSBool
216
+ js_InitTokenStream(JSContext *cx, JSTokenStream *ts,
217
+ const jschar *base, size_t length,
218
+ FILE *fp, const char *filename, uintN lineno)
219
+ {
220
+ jschar *buf;
221
+ size_t nb;
222
+
223
+ JS_ASSERT_IF(fp, !base);
224
+ JS_ASSERT_IF(!base, length == 0);
225
+ nb = fp
226
+ ? 2 * JS_LINE_LIMIT * sizeof(jschar)
227
+ : JS_LINE_LIMIT * sizeof(jschar);
228
+ JS_ARENA_ALLOCATE_CAST(buf, jschar *, &cx->tempPool, nb);
229
+ if (!buf) {
230
+ js_ReportOutOfScriptQuota(cx);
231
+ return JS_FALSE;
232
+ }
233
+ memset(buf, 0, nb);
234
+ memset(ts, 0, sizeof(*ts));
235
+ ts->filename = filename;
236
+ ts->lineno = lineno;
237
+ ts->linebuf.base = ts->linebuf.limit = ts->linebuf.ptr = buf;
238
+ if (fp) {
239
+ ts->file = fp;
240
+ ts->userbuf.base = buf + JS_LINE_LIMIT;
241
+ ts->userbuf.ptr = ts->userbuf.limit = ts->userbuf.base + JS_LINE_LIMIT;
242
+ } else {
243
+ ts->userbuf.base = (jschar *)base;
244
+ ts->userbuf.limit = (jschar *)base + length;
245
+ ts->userbuf.ptr = (jschar *)base;
246
+ }
247
+ ts->tokenbuf.grow = GrowTokenBuf;
248
+ ts->tokenbuf.data = cx;
249
+ ts->listener = cx->debugHooks->sourceHandler;
250
+ ts->listenerData = cx->debugHooks->sourceHandlerData;
251
+ return JS_TRUE;
252
+ }
253
+
254
+ void
255
+ js_CloseTokenStream(JSContext *cx, JSTokenStream *ts)
256
+ {
257
+ if (ts->flags & TSF_OWNFILENAME)
258
+ JS_free(cx, (void *) ts->filename);
259
+ }
260
+
261
+ JS_FRIEND_API(int)
262
+ js_fgets(char *buf, int size, FILE *file)
263
+ {
264
+ int n, i, c;
265
+ JSBool crflag;
266
+
267
+ n = size - 1;
268
+ if (n < 0)
269
+ return -1;
270
+
271
+ crflag = JS_FALSE;
272
+ for (i = 0; i < n && (c = getc(file)) != EOF; i++) {
273
+ buf[i] = c;
274
+ if (c == '\n') { /* any \n ends a line */
275
+ i++; /* keep the \n; we know there is room for \0 */
276
+ break;
277
+ }
278
+ if (crflag) { /* \r not followed by \n ends line at the \r */
279
+ ungetc(c, file);
280
+ break; /* and overwrite c in buf with \0 */
281
+ }
282
+ crflag = (c == '\r');
283
+ }
284
+
285
+ buf[i] = '\0';
286
+ return i;
287
+ }
288
+
289
+ static int32
290
+ GetChar(JSTokenStream *ts)
291
+ {
292
+ int32 c;
293
+ ptrdiff_t i, j, len, olen;
294
+ JSBool crflag;
295
+ char cbuf[JS_LINE_LIMIT];
296
+ jschar *ubuf, *nl;
297
+
298
+ if (ts->ungetpos != 0) {
299
+ c = ts->ungetbuf[--ts->ungetpos];
300
+ } else {
301
+ do {
302
+ if (ts->linebuf.ptr == ts->linebuf.limit) {
303
+ len = PTRDIFF(ts->userbuf.limit, ts->userbuf.ptr, jschar);
304
+ if (len <= 0) {
305
+ if (!ts->file) {
306
+ ts->flags |= TSF_EOF;
307
+ return EOF;
308
+ }
309
+
310
+ /* Fill ts->userbuf so that \r and \r\n convert to \n. */
311
+ crflag = (ts->flags & TSF_CRFLAG) != 0;
312
+ len = js_fgets(cbuf, JS_LINE_LIMIT - crflag, ts->file);
313
+ if (len <= 0) {
314
+ ts->flags |= TSF_EOF;
315
+ return EOF;
316
+ }
317
+ olen = len;
318
+ ubuf = ts->userbuf.base;
319
+ i = 0;
320
+ if (crflag) {
321
+ ts->flags &= ~TSF_CRFLAG;
322
+ if (cbuf[0] != '\n') {
323
+ ubuf[i++] = '\n';
324
+ len++;
325
+ ts->linepos--;
326
+ }
327
+ }
328
+ for (j = 0; i < len; i++, j++)
329
+ ubuf[i] = (jschar) (unsigned char) cbuf[j];
330
+ ts->userbuf.limit = ubuf + len;
331
+ ts->userbuf.ptr = ubuf;
332
+ }
333
+ if (ts->listener) {
334
+ ts->listener(ts->filename, ts->lineno, ts->userbuf.ptr, len,
335
+ &ts->listenerTSData, ts->listenerData);
336
+ }
337
+
338
+ nl = ts->saveEOL;
339
+ if (!nl) {
340
+ /*
341
+ * Any one of \n, \r, or \r\n ends a line (the longest
342
+ * match wins). Also allow the Unicode line and paragraph
343
+ * separators.
344
+ */
345
+ for (nl = ts->userbuf.ptr; nl < ts->userbuf.limit; nl++) {
346
+ /*
347
+ * Try to prevent value-testing on most characters by
348
+ * filtering out characters that aren't 000x or 202x.
349
+ */
350
+ if ((*nl & 0xDFD0) == 0) {
351
+ if (*nl == '\n')
352
+ break;
353
+ if (*nl == '\r') {
354
+ if (nl + 1 < ts->userbuf.limit && nl[1] == '\n')
355
+ nl++;
356
+ break;
357
+ }
358
+ if (*nl == LINE_SEPARATOR || *nl == PARA_SEPARATOR)
359
+ break;
360
+ }
361
+ }
362
+ }
363
+
364
+ /*
365
+ * If there was a line terminator, copy thru it into linebuf.
366
+ * Else copy JS_LINE_LIMIT-1 bytes into linebuf.
367
+ */
368
+ if (nl < ts->userbuf.limit)
369
+ len = PTRDIFF(nl, ts->userbuf.ptr, jschar) + 1;
370
+ if (len >= JS_LINE_LIMIT) {
371
+ len = JS_LINE_LIMIT - 1;
372
+ ts->saveEOL = nl;
373
+ } else {
374
+ ts->saveEOL = NULL;
375
+ }
376
+ js_strncpy(ts->linebuf.base, ts->userbuf.ptr, len);
377
+ ts->userbuf.ptr += len;
378
+ olen = len;
379
+
380
+ /*
381
+ * Make sure linebuf contains \n for EOL (don't do this in
382
+ * userbuf because the user's string might be readonly).
383
+ */
384
+ if (nl < ts->userbuf.limit) {
385
+ if (*nl == '\r') {
386
+ if (ts->linebuf.base[len-1] == '\r') {
387
+ /*
388
+ * Does the line segment end in \r? We must check
389
+ * for a \n at the front of the next segment before
390
+ * storing a \n into linebuf. This case matters
391
+ * only when we're reading from a file.
392
+ */
393
+ if (nl + 1 == ts->userbuf.limit && ts->file) {
394
+ len--;
395
+ ts->flags |= TSF_CRFLAG; /* clear NLFLAG? */
396
+ if (len == 0) {
397
+ /*
398
+ * This can happen when a segment ends in
399
+ * \r\r. Start over. ptr == limit in this
400
+ * case, so we'll fall into buffer-filling
401
+ * code.
402
+ */
403
+ return GetChar(ts);
404
+ }
405
+ } else {
406
+ ts->linebuf.base[len-1] = '\n';
407
+ }
408
+ }
409
+ } else if (*nl == '\n') {
410
+ if (nl > ts->userbuf.base &&
411
+ nl[-1] == '\r' &&
412
+ ts->linebuf.base[len-2] == '\r') {
413
+ len--;
414
+ JS_ASSERT(ts->linebuf.base[len] == '\n');
415
+ ts->linebuf.base[len-1] = '\n';
416
+ }
417
+ } else if (*nl == LINE_SEPARATOR || *nl == PARA_SEPARATOR) {
418
+ ts->linebuf.base[len-1] = '\n';
419
+ }
420
+ }
421
+
422
+ /* Reset linebuf based on adjusted segment length. */
423
+ ts->linebuf.limit = ts->linebuf.base + len;
424
+ ts->linebuf.ptr = ts->linebuf.base;
425
+
426
+ /* Update position of linebuf within physical userbuf line. */
427
+ if (!(ts->flags & TSF_NLFLAG))
428
+ ts->linepos += ts->linelen;
429
+ else
430
+ ts->linepos = 0;
431
+ if (ts->linebuf.limit[-1] == '\n')
432
+ ts->flags |= TSF_NLFLAG;
433
+ else
434
+ ts->flags &= ~TSF_NLFLAG;
435
+
436
+ /* Update linelen from original segment length. */
437
+ ts->linelen = olen;
438
+ }
439
+ c = *ts->linebuf.ptr++;
440
+ /*
441
+ * In the hopes of being liberal in what we accept, we toss out little-
442
+ * and big-endian byte order markers here, see bug 368516.
443
+ */
444
+ } while (c == 0xfffe || c == 0xfeff);
445
+ }
446
+ if (c == '\n')
447
+ ts->lineno++;
448
+ return c;
449
+ }
450
+
451
+ static void
452
+ UngetChar(JSTokenStream *ts, int32 c)
453
+ {
454
+ if (c == EOF)
455
+ return;
456
+ JS_ASSERT(ts->ungetpos < JS_ARRAY_LENGTH(ts->ungetbuf));
457
+ if (c == '\n')
458
+ ts->lineno--;
459
+ ts->ungetbuf[ts->ungetpos++] = (jschar)c;
460
+ }
461
+
462
+ static int32
463
+ PeekChar(JSTokenStream *ts)
464
+ {
465
+ int32 c;
466
+
467
+ c = GetChar(ts);
468
+ UngetChar(ts, c);
469
+ return c;
470
+ }
471
+
472
+ /*
473
+ * Peek n chars ahead into ts. Return true if n chars were read, false if
474
+ * there weren't enough characters in the input stream. This function cannot
475
+ * be used to peek into or past a newline.
476
+ */
477
+ static JSBool
478
+ PeekChars(JSTokenStream *ts, intN n, jschar *cp)
479
+ {
480
+ intN i, j;
481
+ int32 c;
482
+
483
+ for (i = 0; i < n; i++) {
484
+ c = GetChar(ts);
485
+ if (c == EOF)
486
+ break;
487
+ if (c == '\n') {
488
+ UngetChar(ts, c);
489
+ break;
490
+ }
491
+ cp[i] = (jschar)c;
492
+ }
493
+ for (j = i - 1; j >= 0; j--)
494
+ UngetChar(ts, cp[j]);
495
+ return i == n;
496
+ }
497
+
498
+ static void
499
+ SkipChars(JSTokenStream *ts, intN n)
500
+ {
501
+ while (--n >= 0)
502
+ GetChar(ts);
503
+ }
504
+
505
+ static JSBool
506
+ MatchChar(JSTokenStream *ts, int32 expect)
507
+ {
508
+ int32 c;
509
+
510
+ c = GetChar(ts);
511
+ if (c == expect)
512
+ return JS_TRUE;
513
+ UngetChar(ts, c);
514
+ return JS_FALSE;
515
+ }
516
+
517
+ JSBool
518
+ js_ReportCompileErrorNumber(JSContext *cx, JSTokenStream *ts, JSParseNode *pn,
519
+ uintN flags, uintN errorNumber, ...)
520
+ {
521
+ JSErrorReport report;
522
+ char *message;
523
+ size_t linelength;
524
+ jschar *linechars;
525
+ char *linebytes;
526
+ va_list ap;
527
+ JSBool warning, ok;
528
+ JSTokenPos *tp;
529
+ uintN index, i;
530
+ JSErrorReporter onError;
531
+
532
+ JS_ASSERT(ts->linebuf.limit < ts->linebuf.base + JS_LINE_LIMIT);
533
+
534
+ if ((flags & JSREPORT_STRICT) && !JS_HAS_STRICT_OPTION(cx))
535
+ return JS_TRUE;
536
+
537
+ memset(&report, 0, sizeof report);
538
+ report.flags = flags;
539
+ report.errorNumber = errorNumber;
540
+ message = NULL;
541
+ linechars = NULL;
542
+ linebytes = NULL;
543
+
544
+ /* From this point the control must flow through the label out.*/
545
+ va_start(ap, errorNumber);
546
+ ok = js_ExpandErrorArguments(cx, js_GetErrorMessage, NULL,
547
+ errorNumber, &message, &report, &warning,
548
+ !(flags & JSREPORT_UC), ap);
549
+ va_end(ap);
550
+ if (!ok) {
551
+ warning = JS_FALSE;
552
+ goto out;
553
+ }
554
+
555
+ report.filename = ts->filename;
556
+
557
+ if (pn) {
558
+ report.lineno = pn->pn_pos.begin.lineno;
559
+ if (report.lineno != ts->lineno)
560
+ goto report;
561
+ tp = &pn->pn_pos;
562
+ } else {
563
+ /* Point to the current token, not the next one to get. */
564
+ tp = &ts->tokens[ts->cursor].pos;
565
+ }
566
+ report.lineno = ts->lineno;
567
+ linelength = PTRDIFF(ts->linebuf.limit, ts->linebuf.base, jschar);
568
+ linechars = (jschar *)JS_malloc(cx, (linelength + 1) * sizeof(jschar));
569
+ if (!linechars) {
570
+ warning = JS_FALSE;
571
+ goto out;
572
+ }
573
+ memcpy(linechars, ts->linebuf.base, linelength * sizeof(jschar));
574
+ linechars[linelength] = 0;
575
+ linebytes = js_DeflateString(cx, linechars, linelength);
576
+ if (!linebytes) {
577
+ warning = JS_FALSE;
578
+ goto out;
579
+ }
580
+ report.linebuf = linebytes;
581
+
582
+ /*
583
+ * FIXME: What should instead happen here is that we should
584
+ * find error-tokens in userbuf, if !ts->file. That will
585
+ * allow us to deliver a more helpful error message, which
586
+ * includes all or part of the bad string or bad token. The
587
+ * code here yields something that looks truncated.
588
+ * See https://bugzilla.mozilla.org/show_bug.cgi?id=352970
589
+ */
590
+ index = 0;
591
+ if (tp->begin.lineno == tp->end.lineno) {
592
+ if (tp->begin.index < ts->linepos)
593
+ goto report;
594
+
595
+ index = tp->begin.index - ts->linepos;
596
+ }
597
+
598
+ report.tokenptr = report.linebuf + index;
599
+ report.uclinebuf = linechars;
600
+ report.uctokenptr = report.uclinebuf + index;
601
+
602
+ /*
603
+ * If there's a runtime exception type associated with this error
604
+ * number, set that as the pending exception. For errors occuring at
605
+ * compile time, this is very likely to be a JSEXN_SYNTAXERR.
606
+ *
607
+ * If an exception is thrown but not caught, the JSREPORT_EXCEPTION
608
+ * flag will be set in report.flags. Proper behavior for an error
609
+ * reporter is to ignore a report with this flag for all but top-level
610
+ * compilation errors. The exception will remain pending, and so long
611
+ * as the non-top-level "load", "eval", or "compile" native function
612
+ * returns false, the top-level reporter will eventually receive the
613
+ * uncaught exception report.
614
+ *
615
+ * XXX it'd probably be best if there was only one call to this
616
+ * function, but there seem to be two error reporter call points.
617
+ */
618
+ report:
619
+ onError = cx->errorReporter;
620
+
621
+ /*
622
+ * Try to raise an exception only if there isn't one already set --
623
+ * otherwise the exception will describe the last compile-time error,
624
+ * which is likely spurious.
625
+ */
626
+ if (!(ts->flags & TSF_ERROR)) {
627
+ if (js_ErrorToException(cx, message, &report))
628
+ onError = NULL;
629
+ }
630
+
631
+ /*
632
+ * Suppress any compile-time errors that don't occur at the top level.
633
+ * This may still fail, as interplevel may be zero in contexts where we
634
+ * don't really want to call the error reporter, as when js is called
635
+ * by other code which could catch the error.
636
+ */
637
+ if (cx->interpLevel != 0 && !JSREPORT_IS_WARNING(flags))
638
+ onError = NULL;
639
+
640
+ if (onError) {
641
+ JSDebugErrorHook hook = cx->debugHooks->debugErrorHook;
642
+
643
+ /*
644
+ * If debugErrorHook is present then we give it a chance to veto
645
+ * sending the error on to the regular error reporter.
646
+ */
647
+ if (hook && !hook(cx, message, &report,
648
+ cx->debugHooks->debugErrorHookData)) {
649
+ onError = NULL;
650
+ }
651
+ }
652
+ if (onError)
653
+ (*onError)(cx, message, &report);
654
+
655
+ out:
656
+ if (linebytes)
657
+ JS_free(cx, linebytes);
658
+ if (linechars)
659
+ JS_free(cx, linechars);
660
+ if (message)
661
+ JS_free(cx, message);
662
+ if (report.ucmessage)
663
+ JS_free(cx, (void *)report.ucmessage);
664
+
665
+ if (report.messageArgs) {
666
+ if (!(flags & JSREPORT_UC)) {
667
+ i = 0;
668
+ while (report.messageArgs[i])
669
+ JS_free(cx, (void *)report.messageArgs[i++]);
670
+ }
671
+ JS_free(cx, (void *)report.messageArgs);
672
+ }
673
+
674
+ if (!JSREPORT_IS_WARNING(flags)) {
675
+ /* Set the error flag to suppress spurious reports. */
676
+ ts->flags |= TSF_ERROR;
677
+ }
678
+
679
+ return warning;
680
+ }
681
+
682
+ static JSBool
683
+ GrowStringBuffer(JSStringBuffer *sb, size_t newlength)
684
+ {
685
+ ptrdiff_t offset;
686
+ jschar *bp;
687
+
688
+ offset = PTRDIFF(sb->ptr, sb->base, jschar);
689
+ JS_ASSERT(offset >= 0);
690
+ newlength += offset + 1;
691
+ if ((size_t)offset < newlength && newlength < ~(size_t)0 / sizeof(jschar))
692
+ bp = (jschar *) realloc(sb->base, newlength * sizeof(jschar));
693
+ else
694
+ bp = NULL;
695
+ if (!bp) {
696
+ free(sb->base);
697
+ sb->base = STRING_BUFFER_ERROR_BASE;
698
+ return JS_FALSE;
699
+ }
700
+ sb->base = bp;
701
+ sb->ptr = bp + offset;
702
+ sb->limit = bp + newlength - 1;
703
+ return JS_TRUE;
704
+ }
705
+
706
+ static void
707
+ FreeStringBuffer(JSStringBuffer *sb)
708
+ {
709
+ JS_ASSERT(STRING_BUFFER_OK(sb));
710
+ if (sb->base)
711
+ free(sb->base);
712
+ }
713
+
714
+ void
715
+ js_InitStringBuffer(JSStringBuffer *sb)
716
+ {
717
+ sb->base = sb->limit = sb->ptr = NULL;
718
+ sb->data = NULL;
719
+ sb->grow = GrowStringBuffer;
720
+ sb->free = FreeStringBuffer;
721
+ }
722
+
723
+ void
724
+ js_FinishStringBuffer(JSStringBuffer *sb)
725
+ {
726
+ sb->free(sb);
727
+ }
728
+
729
+ #define ENSURE_STRING_BUFFER(sb,n) \
730
+ ((sb)->ptr + (n) <= (sb)->limit || sb->grow(sb, n))
731
+
732
+ static void
733
+ FastAppendChar(JSStringBuffer *sb, jschar c)
734
+ {
735
+ if (!STRING_BUFFER_OK(sb))
736
+ return;
737
+ if (!ENSURE_STRING_BUFFER(sb, 1))
738
+ return;
739
+ *sb->ptr++ = c;
740
+ }
741
+
742
+ void
743
+ js_AppendChar(JSStringBuffer *sb, jschar c)
744
+ {
745
+ jschar *bp;
746
+
747
+ if (!STRING_BUFFER_OK(sb))
748
+ return;
749
+ if (!ENSURE_STRING_BUFFER(sb, 1))
750
+ return;
751
+ bp = sb->ptr;
752
+ *bp++ = c;
753
+ *bp = 0;
754
+ sb->ptr = bp;
755
+ }
756
+
757
+ #if JS_HAS_XML_SUPPORT
758
+
759
+ void
760
+ js_RepeatChar(JSStringBuffer *sb, jschar c, uintN count)
761
+ {
762
+ jschar *bp;
763
+
764
+ if (!STRING_BUFFER_OK(sb) || count == 0)
765
+ return;
766
+ if (!ENSURE_STRING_BUFFER(sb, count))
767
+ return;
768
+ for (bp = sb->ptr; count; --count)
769
+ *bp++ = c;
770
+ *bp = 0;
771
+ sb->ptr = bp;
772
+ }
773
+
774
+ void
775
+ js_AppendCString(JSStringBuffer *sb, const char *asciiz)
776
+ {
777
+ size_t length;
778
+ jschar *bp;
779
+
780
+ if (!STRING_BUFFER_OK(sb) || *asciiz == '\0')
781
+ return;
782
+ length = strlen(asciiz);
783
+ if (!ENSURE_STRING_BUFFER(sb, length))
784
+ return;
785
+ for (bp = sb->ptr; length; --length)
786
+ *bp++ = (jschar) *asciiz++;
787
+ *bp = 0;
788
+ sb->ptr = bp;
789
+ }
790
+
791
+ void
792
+ js_AppendJSString(JSStringBuffer *sb, JSString *str)
793
+ {
794
+ size_t length;
795
+ jschar *bp;
796
+
797
+ if (!STRING_BUFFER_OK(sb))
798
+ return;
799
+ length = JSSTRING_LENGTH(str);
800
+ if (length == 0 || !ENSURE_STRING_BUFFER(sb, length))
801
+ return;
802
+ bp = sb->ptr;
803
+ js_strncpy(bp, JSSTRING_CHARS(str), length);
804
+ bp += length;
805
+ *bp = 0;
806
+ sb->ptr = bp;
807
+ }
808
+
809
+ static JSBool
810
+ GetXMLEntity(JSContext *cx, JSTokenStream *ts)
811
+ {
812
+ ptrdiff_t offset, length, i;
813
+ int32 c, d;
814
+ JSBool ispair;
815
+ jschar *bp, digit;
816
+ char *bytes;
817
+ JSErrNum msg;
818
+
819
+ /* Put the entity, including the '&' already scanned, in ts->tokenbuf. */
820
+ offset = PTRDIFF(ts->tokenbuf.ptr, ts->tokenbuf.base, jschar);
821
+ FastAppendChar(&ts->tokenbuf, '&');
822
+ while ((c = GetChar(ts)) != ';') {
823
+ if (c == EOF || c == '\n') {
824
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
825
+ JSMSG_END_OF_XML_ENTITY);
826
+ return JS_FALSE;
827
+ }
828
+ FastAppendChar(&ts->tokenbuf, (jschar) c);
829
+ }
830
+
831
+ /* Let length be the number of jschars after the '&', including the ';'. */
832
+ length = PTRDIFF(ts->tokenbuf.ptr, ts->tokenbuf.base, jschar) - offset;
833
+ bp = ts->tokenbuf.base + offset;
834
+ c = d = 0;
835
+ ispair = JS_FALSE;
836
+ if (length > 2 && bp[1] == '#') {
837
+ /* Match a well-formed XML Character Reference. */
838
+ i = 2;
839
+ if (length > 3 && JS_TOLOWER(bp[i]) == 'x') {
840
+ if (length > 9) /* at most 6 hex digits allowed */
841
+ goto badncr;
842
+ while (++i < length) {
843
+ digit = bp[i];
844
+ if (!JS7_ISHEX(digit))
845
+ goto badncr;
846
+ c = (c << 4) + JS7_UNHEX(digit);
847
+ }
848
+ } else {
849
+ while (i < length) {
850
+ digit = bp[i++];
851
+ if (!JS7_ISDEC(digit))
852
+ goto badncr;
853
+ c = (c * 10) + JS7_UNDEC(digit);
854
+ if (c < 0)
855
+ goto badncr;
856
+ }
857
+ }
858
+
859
+ if (0x10000 <= c && c <= 0x10FFFF) {
860
+ /* Form a surrogate pair (c, d) -- c is the high surrogate. */
861
+ d = 0xDC00 + (c & 0x3FF);
862
+ c = 0xD7C0 + (c >> 10);
863
+ ispair = JS_TRUE;
864
+ } else {
865
+ /* Enforce the http://www.w3.org/TR/REC-xml/#wf-Legalchar WFC. */
866
+ if (c != 0x9 && c != 0xA && c != 0xD &&
867
+ !(0x20 <= c && c <= 0xD7FF) &&
868
+ !(0xE000 <= c && c <= 0xFFFD)) {
869
+ goto badncr;
870
+ }
871
+ }
872
+ } else {
873
+ /* Try to match one of the five XML 1.0 predefined entities. */
874
+ switch (length) {
875
+ case 3:
876
+ if (bp[2] == 't') {
877
+ if (bp[1] == 'l')
878
+ c = '<';
879
+ else if (bp[1] == 'g')
880
+ c = '>';
881
+ }
882
+ break;
883
+ case 4:
884
+ if (bp[1] == 'a' && bp[2] == 'm' && bp[3] == 'p')
885
+ c = '&';
886
+ break;
887
+ case 5:
888
+ if (bp[3] == 'o') {
889
+ if (bp[1] == 'a' && bp[2] == 'p' && bp[4] == 's')
890
+ c = '\'';
891
+ else if (bp[1] == 'q' && bp[2] == 'u' && bp[4] == 't')
892
+ c = '"';
893
+ }
894
+ break;
895
+ }
896
+ if (c == 0) {
897
+ msg = JSMSG_UNKNOWN_XML_ENTITY;
898
+ goto bad;
899
+ }
900
+ }
901
+
902
+ /* If we matched, retract ts->tokenbuf and store the entity's value. */
903
+ *bp++ = (jschar) c;
904
+ if (ispair)
905
+ *bp++ = (jschar) d;
906
+ *bp = 0;
907
+ ts->tokenbuf.ptr = bp;
908
+ return JS_TRUE;
909
+
910
+ badncr:
911
+ msg = JSMSG_BAD_XML_NCR;
912
+ bad:
913
+ /* No match: throw a TypeError per ECMA-357 10.3.2.1 step 8(a). */
914
+ bytes = js_DeflateString(cx, bp + 1,
915
+ PTRDIFF(ts->tokenbuf.ptr, bp, jschar) - 1);
916
+ if (bytes) {
917
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
918
+ msg, bytes);
919
+ JS_free(cx, bytes);
920
+ }
921
+ return JS_FALSE;
922
+ }
923
+
924
+ #endif /* JS_HAS_XML_SUPPORT */
925
+
926
+ JSTokenType
927
+ js_PeekToken(JSContext *cx, JSTokenStream *ts)
928
+ {
929
+ JSTokenType tt;
930
+
931
+ if (ts->lookahead != 0) {
932
+ tt = ts->tokens[(ts->cursor + ts->lookahead) & NTOKENS_MASK].type;
933
+ } else {
934
+ tt = js_GetToken(cx, ts);
935
+ js_UngetToken(ts);
936
+ }
937
+ return tt;
938
+ }
939
+
940
+ JSTokenType
941
+ js_PeekTokenSameLine(JSContext *cx, JSTokenStream *ts)
942
+ {
943
+ JSTokenType tt;
944
+
945
+ if (!ON_CURRENT_LINE(ts, CURRENT_TOKEN(ts).pos))
946
+ return TOK_EOL;
947
+ ts->flags |= TSF_NEWLINES;
948
+ tt = js_PeekToken(cx, ts);
949
+ ts->flags &= ~TSF_NEWLINES;
950
+ return tt;
951
+ }
952
+
953
+ /*
954
+ * We have encountered a '\': check for a Unicode escape sequence after it,
955
+ * returning the character code value if we found a Unicode escape sequence.
956
+ * Otherwise, non-destructively return the original '\'.
957
+ */
958
+ static int32
959
+ GetUnicodeEscape(JSTokenStream *ts)
960
+ {
961
+ jschar cp[5];
962
+ int32 c;
963
+
964
+ if (PeekChars(ts, 5, cp) && cp[0] == 'u' &&
965
+ JS7_ISHEX(cp[1]) && JS7_ISHEX(cp[2]) &&
966
+ JS7_ISHEX(cp[3]) && JS7_ISHEX(cp[4]))
967
+ {
968
+ c = (((((JS7_UNHEX(cp[1]) << 4)
969
+ + JS7_UNHEX(cp[2])) << 4)
970
+ + JS7_UNHEX(cp[3])) << 4)
971
+ + JS7_UNHEX(cp[4]);
972
+ SkipChars(ts, 5);
973
+ return c;
974
+ }
975
+ return '\\';
976
+ }
977
+
978
+ static JSToken *
979
+ NewToken(JSTokenStream *ts, ptrdiff_t adjust)
980
+ {
981
+ JSToken *tp;
982
+
983
+ ts->cursor = (ts->cursor + 1) & NTOKENS_MASK;
984
+ tp = &CURRENT_TOKEN(ts);
985
+ tp->ptr = ts->linebuf.ptr + adjust;
986
+ tp->pos.begin.index = ts->linepos +
987
+ PTRDIFF(tp->ptr, ts->linebuf.base, jschar) -
988
+ ts->ungetpos;
989
+ tp->pos.begin.lineno = tp->pos.end.lineno = (uint16)ts->lineno;
990
+ return tp;
991
+ }
992
+
993
+ JSTokenType
994
+ js_GetToken(JSContext *cx, JSTokenStream *ts)
995
+ {
996
+ JSTokenType tt;
997
+ int32 c, qc;
998
+ JSToken *tp;
999
+ JSAtom *atom;
1000
+ JSBool hadUnicodeEscape;
1001
+ const struct keyword *kw;
1002
+ #if JS_HAS_XML_SUPPORT
1003
+ JSBool inTarget;
1004
+ size_t targetLength;
1005
+ ptrdiff_t contentIndex;
1006
+ #endif
1007
+
1008
+ #define INIT_TOKENBUF() (ts->tokenbuf.ptr = ts->tokenbuf.base)
1009
+ #define TOKENBUF_LENGTH() PTRDIFF(ts->tokenbuf.ptr, ts->tokenbuf.base, jschar)
1010
+ #define TOKENBUF_OK() STRING_BUFFER_OK(&ts->tokenbuf)
1011
+ #define TOKENBUF_TO_ATOM() (TOKENBUF_OK() \
1012
+ ? js_AtomizeChars(cx, \
1013
+ TOKENBUF_BASE(), \
1014
+ TOKENBUF_LENGTH(), \
1015
+ 0) \
1016
+ : NULL)
1017
+ #define ADD_TO_TOKENBUF(c) FastAppendChar(&ts->tokenbuf, (jschar) (c))
1018
+
1019
+ /* The following 4 macros should only be used when TOKENBUF_OK() is true. */
1020
+ #define TOKENBUF_BASE() (ts->tokenbuf.base)
1021
+ #define TOKENBUF_END() (ts->tokenbuf.ptr)
1022
+ #define TOKENBUF_CHAR(i) (ts->tokenbuf.base[i])
1023
+ #define TRIM_TOKENBUF(i) (ts->tokenbuf.ptr = ts->tokenbuf.base + i)
1024
+ #define NUL_TERM_TOKENBUF() (*ts->tokenbuf.ptr = 0)
1025
+
1026
+ /* Check for a pushed-back token resulting from mismatching lookahead. */
1027
+ while (ts->lookahead != 0) {
1028
+ JS_ASSERT(!(ts->flags & TSF_XMLTEXTMODE));
1029
+ ts->lookahead--;
1030
+ ts->cursor = (ts->cursor + 1) & NTOKENS_MASK;
1031
+ tt = CURRENT_TOKEN(ts).type;
1032
+ if (tt != TOK_EOL || (ts->flags & TSF_NEWLINES))
1033
+ return tt;
1034
+ }
1035
+
1036
+ /* If there was a fatal error, keep returning TOK_ERROR. */
1037
+ if (ts->flags & TSF_ERROR)
1038
+ return TOK_ERROR;
1039
+
1040
+ #if JS_HAS_XML_SUPPORT
1041
+ if (ts->flags & TSF_XMLTEXTMODE) {
1042
+ tt = TOK_XMLSPACE; /* veto if non-space, return TOK_XMLTEXT */
1043
+ tp = NewToken(ts, 0);
1044
+ INIT_TOKENBUF();
1045
+ qc = (ts->flags & TSF_XMLONLYMODE) ? '<' : '{';
1046
+
1047
+ while ((c = GetChar(ts)) != qc && c != '<' && c != EOF) {
1048
+ if (c == '&' && qc == '<') {
1049
+ if (!GetXMLEntity(cx, ts))
1050
+ goto error;
1051
+ tt = TOK_XMLTEXT;
1052
+ continue;
1053
+ }
1054
+
1055
+ if (!JS_ISXMLSPACE(c))
1056
+ tt = TOK_XMLTEXT;
1057
+ ADD_TO_TOKENBUF(c);
1058
+ }
1059
+ UngetChar(ts, c);
1060
+
1061
+ if (TOKENBUF_LENGTH() == 0) {
1062
+ atom = NULL;
1063
+ } else {
1064
+ atom = TOKENBUF_TO_ATOM();
1065
+ if (!atom)
1066
+ goto error;
1067
+ }
1068
+ tp->pos.end.lineno = (uint16)ts->lineno;
1069
+ tp->t_op = JSOP_STRING;
1070
+ tp->t_atom = atom;
1071
+ goto out;
1072
+ }
1073
+
1074
+ if (ts->flags & TSF_XMLTAGMODE) {
1075
+ tp = NewToken(ts, 0);
1076
+ c = GetChar(ts);
1077
+ if (JS_ISXMLSPACE(c)) {
1078
+ do {
1079
+ c = GetChar(ts);
1080
+ } while (JS_ISXMLSPACE(c));
1081
+ UngetChar(ts, c);
1082
+ tt = TOK_XMLSPACE;
1083
+ goto out;
1084
+ }
1085
+
1086
+ if (c == EOF) {
1087
+ tt = TOK_EOF;
1088
+ goto out;
1089
+ }
1090
+
1091
+ INIT_TOKENBUF();
1092
+ if (JS_ISXMLNSSTART(c)) {
1093
+ JSBool sawColon = JS_FALSE;
1094
+
1095
+ ADD_TO_TOKENBUF(c);
1096
+ while ((c = GetChar(ts)) != EOF && JS_ISXMLNAME(c)) {
1097
+ if (c == ':') {
1098
+ int nextc;
1099
+
1100
+ if (sawColon ||
1101
+ (nextc = PeekChar(ts),
1102
+ ((ts->flags & TSF_XMLONLYMODE) || nextc != '{') &&
1103
+ !JS_ISXMLNAME(nextc))) {
1104
+ js_ReportCompileErrorNumber(cx, ts, NULL,
1105
+ JSREPORT_ERROR,
1106
+ JSMSG_BAD_XML_QNAME);
1107
+ goto error;
1108
+ }
1109
+ sawColon = JS_TRUE;
1110
+ }
1111
+
1112
+ ADD_TO_TOKENBUF(c);
1113
+ }
1114
+
1115
+ UngetChar(ts, c);
1116
+ atom = TOKENBUF_TO_ATOM();
1117
+ if (!atom)
1118
+ goto error;
1119
+ tp->t_op = JSOP_STRING;
1120
+ tp->t_atom = atom;
1121
+ tt = TOK_XMLNAME;
1122
+ goto out;
1123
+ }
1124
+
1125
+ switch (c) {
1126
+ case '{':
1127
+ if (ts->flags & TSF_XMLONLYMODE)
1128
+ goto bad_xml_char;
1129
+ tt = TOK_LC;
1130
+ goto out;
1131
+
1132
+ case '=':
1133
+ tt = TOK_ASSIGN;
1134
+ goto out;
1135
+
1136
+ case '"':
1137
+ case '\'':
1138
+ qc = c;
1139
+ while ((c = GetChar(ts)) != qc) {
1140
+ if (c == EOF) {
1141
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1142
+ JSMSG_UNTERMINATED_STRING);
1143
+ goto error;
1144
+ }
1145
+
1146
+ /*
1147
+ * XML attribute values are double-quoted when pretty-printed,
1148
+ * so escape " if it is expressed directly in a single-quoted
1149
+ * attribute value.
1150
+ */
1151
+ if (c == '"' && !(ts->flags & TSF_XMLONLYMODE)) {
1152
+ JS_ASSERT(qc == '\'');
1153
+ js_AppendCString(&ts->tokenbuf, js_quot_entity_str);
1154
+ continue;
1155
+ }
1156
+
1157
+ if (c == '&' && (ts->flags & TSF_XMLONLYMODE)) {
1158
+ if (!GetXMLEntity(cx, ts))
1159
+ goto error;
1160
+ continue;
1161
+ }
1162
+
1163
+ ADD_TO_TOKENBUF(c);
1164
+ }
1165
+ atom = TOKENBUF_TO_ATOM();
1166
+ if (!atom)
1167
+ goto error;
1168
+ tp->pos.end.lineno = (uint16)ts->lineno;
1169
+ tp->t_op = JSOP_STRING;
1170
+ tp->t_atom = atom;
1171
+ tt = TOK_XMLATTR;
1172
+ goto out;
1173
+
1174
+ case '>':
1175
+ tt = TOK_XMLTAGC;
1176
+ goto out;
1177
+
1178
+ case '/':
1179
+ if (MatchChar(ts, '>')) {
1180
+ tt = TOK_XMLPTAGC;
1181
+ goto out;
1182
+ }
1183
+ /* FALL THROUGH */
1184
+
1185
+ bad_xml_char:
1186
+ default:
1187
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1188
+ JSMSG_BAD_XML_CHARACTER);
1189
+ goto error;
1190
+ }
1191
+ /* NOTREACHED */
1192
+ }
1193
+ #endif /* JS_HAS_XML_SUPPORT */
1194
+
1195
+ retry:
1196
+ do {
1197
+ c = GetChar(ts);
1198
+ if (c == '\n') {
1199
+ ts->flags &= ~TSF_DIRTYLINE;
1200
+ if (ts->flags & TSF_NEWLINES)
1201
+ break;
1202
+ }
1203
+ } while (JS_ISSPACE(c));
1204
+
1205
+ tp = NewToken(ts, -1);
1206
+ if (c == EOF) {
1207
+ tt = TOK_EOF;
1208
+ goto out;
1209
+ }
1210
+
1211
+ hadUnicodeEscape = JS_FALSE;
1212
+ if (JS_ISIDSTART(c) ||
1213
+ (c == '\\' &&
1214
+ (qc = GetUnicodeEscape(ts),
1215
+ hadUnicodeEscape = JS_ISIDSTART(qc)))) {
1216
+ if (hadUnicodeEscape)
1217
+ c = qc;
1218
+ INIT_TOKENBUF();
1219
+ for (;;) {
1220
+ ADD_TO_TOKENBUF(c);
1221
+ c = GetChar(ts);
1222
+ if (c == '\\') {
1223
+ qc = GetUnicodeEscape(ts);
1224
+ if (!JS_ISIDENT(qc))
1225
+ break;
1226
+ c = qc;
1227
+ hadUnicodeEscape = JS_TRUE;
1228
+ } else {
1229
+ if (!JS_ISIDENT(c))
1230
+ break;
1231
+ }
1232
+ }
1233
+ UngetChar(ts, c);
1234
+
1235
+ /*
1236
+ * Check for keywords unless we saw Unicode escape or parser asks
1237
+ * to ignore keywords.
1238
+ */
1239
+ if (!hadUnicodeEscape &&
1240
+ !(ts->flags & TSF_KEYWORD_IS_NAME) &&
1241
+ TOKENBUF_OK() &&
1242
+ (kw = FindKeyword(TOKENBUF_BASE(), TOKENBUF_LENGTH()))) {
1243
+ if (kw->tokentype == TOK_RESERVED) {
1244
+ if (!js_ReportCompileErrorNumber(cx, ts, NULL,
1245
+ JSREPORT_WARNING |
1246
+ JSREPORT_STRICT,
1247
+ JSMSG_RESERVED_ID,
1248
+ kw->chars)) {
1249
+ goto error;
1250
+ }
1251
+ } else if (kw->version <= JSVERSION_NUMBER(cx)) {
1252
+ tt = kw->tokentype;
1253
+ tp->t_op = (JSOp) kw->op;
1254
+ goto out;
1255
+ }
1256
+ }
1257
+
1258
+ atom = TOKENBUF_TO_ATOM();
1259
+ if (!atom)
1260
+ goto error;
1261
+ tp->t_op = JSOP_NAME;
1262
+ tp->t_atom = atom;
1263
+ tt = TOK_NAME;
1264
+ goto out;
1265
+ }
1266
+
1267
+ if (JS7_ISDEC(c) || (c == '.' && JS7_ISDEC(PeekChar(ts)))) {
1268
+ jsint radix;
1269
+ const jschar *endptr;
1270
+ jsdouble dval;
1271
+
1272
+ radix = 10;
1273
+ INIT_TOKENBUF();
1274
+
1275
+ if (c == '0') {
1276
+ ADD_TO_TOKENBUF(c);
1277
+ c = GetChar(ts);
1278
+ if (JS_TOLOWER(c) == 'x') {
1279
+ ADD_TO_TOKENBUF(c);
1280
+ c = GetChar(ts);
1281
+ radix = 16;
1282
+ } else if (JS7_ISDEC(c)) {
1283
+ radix = 8;
1284
+ }
1285
+ }
1286
+
1287
+ while (JS7_ISHEX(c)) {
1288
+ if (radix < 16) {
1289
+ if (JS7_ISLET(c))
1290
+ break;
1291
+
1292
+ /*
1293
+ * We permit 08 and 09 as decimal numbers, which makes our
1294
+ * behaviour a superset of the ECMA numeric grammar. We might
1295
+ * not always be so permissive, so we warn about it.
1296
+ */
1297
+ if (radix == 8 && c >= '8') {
1298
+ if (!js_ReportCompileErrorNumber(cx, ts, NULL,
1299
+ JSREPORT_WARNING,
1300
+ JSMSG_BAD_OCTAL,
1301
+ c == '8' ? "08" : "09")) {
1302
+ goto error;
1303
+ }
1304
+ radix = 10;
1305
+ }
1306
+ }
1307
+ ADD_TO_TOKENBUF(c);
1308
+ c = GetChar(ts);
1309
+ }
1310
+
1311
+ if (radix == 10 && (c == '.' || JS_TOLOWER(c) == 'e')) {
1312
+ if (c == '.') {
1313
+ do {
1314
+ ADD_TO_TOKENBUF(c);
1315
+ c = GetChar(ts);
1316
+ } while (JS7_ISDEC(c));
1317
+ }
1318
+ if (JS_TOLOWER(c) == 'e') {
1319
+ ADD_TO_TOKENBUF(c);
1320
+ c = GetChar(ts);
1321
+ if (c == '+' || c == '-') {
1322
+ ADD_TO_TOKENBUF(c);
1323
+ c = GetChar(ts);
1324
+ }
1325
+ if (!JS7_ISDEC(c)) {
1326
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1327
+ JSMSG_MISSING_EXPONENT);
1328
+ goto error;
1329
+ }
1330
+ do {
1331
+ ADD_TO_TOKENBUF(c);
1332
+ c = GetChar(ts);
1333
+ } while (JS7_ISDEC(c));
1334
+ }
1335
+ }
1336
+
1337
+ /* Put back the next char and NUL-terminate tokenbuf for js_strto*. */
1338
+ UngetChar(ts, c);
1339
+ ADD_TO_TOKENBUF(0);
1340
+
1341
+ if (!TOKENBUF_OK())
1342
+ goto error;
1343
+ if (radix == 10) {
1344
+ if (!js_strtod(cx, TOKENBUF_BASE(), TOKENBUF_END(),
1345
+ &endptr, &dval)) {
1346
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1347
+ JSMSG_OUT_OF_MEMORY);
1348
+ goto error;
1349
+ }
1350
+ } else {
1351
+ if (!js_strtointeger(cx, TOKENBUF_BASE(), TOKENBUF_END(),
1352
+ &endptr, radix, &dval)) {
1353
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1354
+ JSMSG_OUT_OF_MEMORY);
1355
+ goto error;
1356
+ }
1357
+ }
1358
+ tp->t_dval = dval;
1359
+ tt = TOK_NUMBER;
1360
+ goto out;
1361
+ }
1362
+
1363
+ if (c == '"' || c == '\'') {
1364
+ qc = c;
1365
+ INIT_TOKENBUF();
1366
+ while ((c = GetChar(ts)) != qc) {
1367
+ if (c == '\n' || c == EOF) {
1368
+ UngetChar(ts, c);
1369
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1370
+ JSMSG_UNTERMINATED_STRING);
1371
+ goto error;
1372
+ }
1373
+ if (c == '\\') {
1374
+ switch (c = GetChar(ts)) {
1375
+ case 'b': c = '\b'; break;
1376
+ case 'f': c = '\f'; break;
1377
+ case 'n': c = '\n'; break;
1378
+ case 'r': c = '\r'; break;
1379
+ case 't': c = '\t'; break;
1380
+ case 'v': c = '\v'; break;
1381
+
1382
+ default:
1383
+ if ('0' <= c && c < '8') {
1384
+ int32 val = JS7_UNDEC(c);
1385
+
1386
+ c = PeekChar(ts);
1387
+ if ('0' <= c && c < '8') {
1388
+ val = 8 * val + JS7_UNDEC(c);
1389
+ GetChar(ts);
1390
+ c = PeekChar(ts);
1391
+ if ('0' <= c && c < '8') {
1392
+ int32 save = val;
1393
+ val = 8 * val + JS7_UNDEC(c);
1394
+ if (val <= 0377)
1395
+ GetChar(ts);
1396
+ else
1397
+ val = save;
1398
+ }
1399
+ }
1400
+
1401
+ c = (jschar)val;
1402
+ } else if (c == 'u') {
1403
+ jschar cp[4];
1404
+ if (PeekChars(ts, 4, cp) &&
1405
+ JS7_ISHEX(cp[0]) && JS7_ISHEX(cp[1]) &&
1406
+ JS7_ISHEX(cp[2]) && JS7_ISHEX(cp[3])) {
1407
+ c = (((((JS7_UNHEX(cp[0]) << 4)
1408
+ + JS7_UNHEX(cp[1])) << 4)
1409
+ + JS7_UNHEX(cp[2])) << 4)
1410
+ + JS7_UNHEX(cp[3]);
1411
+ SkipChars(ts, 4);
1412
+ }
1413
+ } else if (c == 'x') {
1414
+ jschar cp[2];
1415
+ if (PeekChars(ts, 2, cp) &&
1416
+ JS7_ISHEX(cp[0]) && JS7_ISHEX(cp[1])) {
1417
+ c = (JS7_UNHEX(cp[0]) << 4) + JS7_UNHEX(cp[1]);
1418
+ SkipChars(ts, 2);
1419
+ }
1420
+ } else if (c == '\n') {
1421
+ /* ECMA follows C by removing escaped newlines. */
1422
+ continue;
1423
+ }
1424
+ break;
1425
+ }
1426
+ }
1427
+ ADD_TO_TOKENBUF(c);
1428
+ }
1429
+ atom = TOKENBUF_TO_ATOM();
1430
+ if (!atom)
1431
+ goto error;
1432
+ tp->pos.end.lineno = (uint16)ts->lineno;
1433
+ tp->t_op = JSOP_STRING;
1434
+ tp->t_atom = atom;
1435
+ tt = TOK_STRING;
1436
+ goto out;
1437
+ }
1438
+
1439
+ switch (c) {
1440
+ case '\n': tt = TOK_EOL; goto eol_out;
1441
+ case ';': tt = TOK_SEMI; break;
1442
+ case '[': tt = TOK_LB; break;
1443
+ case ']': tt = TOK_RB; break;
1444
+ case '{': tt = TOK_LC; break;
1445
+ case '}': tt = TOK_RC; break;
1446
+ case '(': tt = TOK_LP; break;
1447
+ case ')': tt = TOK_RP; break;
1448
+ case ',': tt = TOK_COMMA; break;
1449
+ case '?': tt = TOK_HOOK; break;
1450
+
1451
+ case '.':
1452
+ #if JS_HAS_XML_SUPPORT
1453
+ if (MatchChar(ts, c))
1454
+ tt = TOK_DBLDOT;
1455
+ else
1456
+ #endif
1457
+ tt = TOK_DOT;
1458
+ break;
1459
+
1460
+ case ':':
1461
+ #if JS_HAS_XML_SUPPORT
1462
+ if (MatchChar(ts, c)) {
1463
+ tt = TOK_DBLCOLON;
1464
+ break;
1465
+ }
1466
+ #endif
1467
+ /*
1468
+ * Default so compiler can modify to JSOP_GETTER if 'p getter: v' in an
1469
+ * object initializer, likewise for setter.
1470
+ */
1471
+ tp->t_op = JSOP_NOP;
1472
+ tt = TOK_COLON;
1473
+ break;
1474
+
1475
+ case '|':
1476
+ if (MatchChar(ts, c)) {
1477
+ tt = TOK_OR;
1478
+ } else if (MatchChar(ts, '=')) {
1479
+ tp->t_op = JSOP_BITOR;
1480
+ tt = TOK_ASSIGN;
1481
+ } else {
1482
+ tt = TOK_BITOR;
1483
+ }
1484
+ break;
1485
+
1486
+ case '^':
1487
+ if (MatchChar(ts, '=')) {
1488
+ tp->t_op = JSOP_BITXOR;
1489
+ tt = TOK_ASSIGN;
1490
+ } else {
1491
+ tt = TOK_BITXOR;
1492
+ }
1493
+ break;
1494
+
1495
+ case '&':
1496
+ if (MatchChar(ts, c)) {
1497
+ tt = TOK_AND;
1498
+ } else if (MatchChar(ts, '=')) {
1499
+ tp->t_op = JSOP_BITAND;
1500
+ tt = TOK_ASSIGN;
1501
+ } else {
1502
+ tt = TOK_BITAND;
1503
+ }
1504
+ break;
1505
+
1506
+ case '=':
1507
+ if (MatchChar(ts, c)) {
1508
+ tp->t_op = MatchChar(ts, c) ? JSOP_STRICTEQ : JSOP_EQ;
1509
+ tt = TOK_EQOP;
1510
+ } else {
1511
+ tp->t_op = JSOP_NOP;
1512
+ tt = TOK_ASSIGN;
1513
+ }
1514
+ break;
1515
+
1516
+ case '!':
1517
+ if (MatchChar(ts, '=')) {
1518
+ tp->t_op = MatchChar(ts, '=') ? JSOP_STRICTNE : JSOP_NE;
1519
+ tt = TOK_EQOP;
1520
+ } else {
1521
+ tp->t_op = JSOP_NOT;
1522
+ tt = TOK_UNARYOP;
1523
+ }
1524
+ break;
1525
+
1526
+ #if JS_HAS_XML_SUPPORT
1527
+ case '@':
1528
+ tt = TOK_AT;
1529
+ break;
1530
+ #endif
1531
+
1532
+ case '<':
1533
+ #if JS_HAS_XML_SUPPORT
1534
+ /*
1535
+ * After much testing, it's clear that Postel's advice to protocol
1536
+ * designers ("be liberal in what you accept, and conservative in what
1537
+ * you send") invites a natural-law repercussion for JS as "protocol":
1538
+ *
1539
+ * "If you are liberal in what you accept, others will utterly fail to
1540
+ * be conservative in what they send."
1541
+ *
1542
+ * Which means you will get <!-- comments to end of line in the middle
1543
+ * of .js files, and after if conditions whose then statements are on
1544
+ * the next line, and other wonders. See at least the following bugs:
1545
+ * https://bugzilla.mozilla.org/show_bug.cgi?id=309242
1546
+ * https://bugzilla.mozilla.org/show_bug.cgi?id=309712
1547
+ * https://bugzilla.mozilla.org/show_bug.cgi?id=310993
1548
+ *
1549
+ * So without JSOPTION_XML, we never scan an XML comment or CDATA
1550
+ * literal. We always scan <! as the start of an HTML comment hack
1551
+ * to end of line, used since Netscape 2 to hide script tag content
1552
+ * from script-unaware browsers.
1553
+ */
1554
+ if ((ts->flags & TSF_OPERAND) &&
1555
+ (JS_HAS_XML_OPTION(cx) || PeekChar(ts) != '!')) {
1556
+ /* Check for XML comment or CDATA section. */
1557
+ if (MatchChar(ts, '!')) {
1558
+ INIT_TOKENBUF();
1559
+
1560
+ /* Scan XML comment. */
1561
+ if (MatchChar(ts, '-')) {
1562
+ if (!MatchChar(ts, '-'))
1563
+ goto bad_xml_markup;
1564
+ while ((c = GetChar(ts)) != '-' || !MatchChar(ts, '-')) {
1565
+ if (c == EOF)
1566
+ goto bad_xml_markup;
1567
+ ADD_TO_TOKENBUF(c);
1568
+ }
1569
+ tt = TOK_XMLCOMMENT;
1570
+ tp->t_op = JSOP_XMLCOMMENT;
1571
+ goto finish_xml_markup;
1572
+ }
1573
+
1574
+ /* Scan CDATA section. */
1575
+ if (MatchChar(ts, '[')) {
1576
+ jschar cp[6];
1577
+ if (PeekChars(ts, 6, cp) &&
1578
+ cp[0] == 'C' &&
1579
+ cp[1] == 'D' &&
1580
+ cp[2] == 'A' &&
1581
+ cp[3] == 'T' &&
1582
+ cp[4] == 'A' &&
1583
+ cp[5] == '[') {
1584
+ SkipChars(ts, 6);
1585
+ while ((c = GetChar(ts)) != ']' ||
1586
+ !PeekChars(ts, 2, cp) ||
1587
+ cp[0] != ']' ||
1588
+ cp[1] != '>') {
1589
+ if (c == EOF)
1590
+ goto bad_xml_markup;
1591
+ ADD_TO_TOKENBUF(c);
1592
+ }
1593
+ GetChar(ts); /* discard ] but not > */
1594
+ tt = TOK_XMLCDATA;
1595
+ tp->t_op = JSOP_XMLCDATA;
1596
+ goto finish_xml_markup;
1597
+ }
1598
+ goto bad_xml_markup;
1599
+ }
1600
+ }
1601
+
1602
+ /* Check for processing instruction. */
1603
+ if (MatchChar(ts, '?')) {
1604
+ inTarget = JS_TRUE;
1605
+ targetLength = 0;
1606
+ contentIndex = -1;
1607
+
1608
+ INIT_TOKENBUF();
1609
+ while ((c = GetChar(ts)) != '?' || PeekChar(ts) != '>') {
1610
+ if (c == EOF)
1611
+ goto bad_xml_markup;
1612
+ if (inTarget) {
1613
+ if (JS_ISXMLSPACE(c)) {
1614
+ if (TOKENBUF_LENGTH() == 0)
1615
+ goto bad_xml_markup;
1616
+ inTarget = JS_FALSE;
1617
+ } else {
1618
+ if (!((TOKENBUF_LENGTH() == 0)
1619
+ ? JS_ISXMLNSSTART(c)
1620
+ : JS_ISXMLNS(c))) {
1621
+ goto bad_xml_markup;
1622
+ }
1623
+ ++targetLength;
1624
+ }
1625
+ } else {
1626
+ if (contentIndex < 0 && !JS_ISXMLSPACE(c))
1627
+ contentIndex = TOKENBUF_LENGTH();
1628
+ }
1629
+ ADD_TO_TOKENBUF(c);
1630
+ }
1631
+ if (targetLength == 0)
1632
+ goto bad_xml_markup;
1633
+ if (!TOKENBUF_OK())
1634
+ goto error;
1635
+ if (contentIndex < 0) {
1636
+ atom = cx->runtime->atomState.emptyAtom;
1637
+ } else {
1638
+ atom = js_AtomizeChars(cx,
1639
+ &TOKENBUF_CHAR(contentIndex),
1640
+ TOKENBUF_LENGTH() - contentIndex,
1641
+ 0);
1642
+ if (!atom)
1643
+ goto error;
1644
+ }
1645
+ TRIM_TOKENBUF(targetLength);
1646
+ tp->t_atom2 = atom;
1647
+ tt = TOK_XMLPI;
1648
+
1649
+ finish_xml_markup:
1650
+ if (!MatchChar(ts, '>'))
1651
+ goto bad_xml_markup;
1652
+ atom = TOKENBUF_TO_ATOM();
1653
+ if (!atom)
1654
+ goto error;
1655
+ tp->t_atom = atom;
1656
+ tp->pos.end.lineno = (uint16)ts->lineno;
1657
+ goto out;
1658
+ }
1659
+
1660
+ /* An XML start-of-tag character. */
1661
+ tt = MatchChar(ts, '/') ? TOK_XMLETAGO : TOK_XMLSTAGO;
1662
+ goto out;
1663
+
1664
+ bad_xml_markup:
1665
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1666
+ JSMSG_BAD_XML_MARKUP);
1667
+ goto error;
1668
+ }
1669
+ #endif /* JS_HAS_XML_SUPPORT */
1670
+
1671
+ /* NB: treat HTML begin-comment as comment-till-end-of-line */
1672
+ if (MatchChar(ts, '!')) {
1673
+ if (MatchChar(ts, '-')) {
1674
+ if (MatchChar(ts, '-')) {
1675
+ ts->flags |= TSF_IN_HTML_COMMENT;
1676
+ goto skipline;
1677
+ }
1678
+ UngetChar(ts, '-');
1679
+ }
1680
+ UngetChar(ts, '!');
1681
+ }
1682
+ if (MatchChar(ts, c)) {
1683
+ tp->t_op = JSOP_LSH;
1684
+ tt = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_SHOP;
1685
+ } else {
1686
+ tp->t_op = MatchChar(ts, '=') ? JSOP_LE : JSOP_LT;
1687
+ tt = TOK_RELOP;
1688
+ }
1689
+ break;
1690
+
1691
+ case '>':
1692
+ if (MatchChar(ts, c)) {
1693
+ tp->t_op = MatchChar(ts, c) ? JSOP_URSH : JSOP_RSH;
1694
+ tt = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_SHOP;
1695
+ } else {
1696
+ tp->t_op = MatchChar(ts, '=') ? JSOP_GE : JSOP_GT;
1697
+ tt = TOK_RELOP;
1698
+ }
1699
+ break;
1700
+
1701
+ case '*':
1702
+ tp->t_op = JSOP_MUL;
1703
+ tt = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_STAR;
1704
+ break;
1705
+
1706
+ case '/':
1707
+ if (MatchChar(ts, '/')) {
1708
+ /*
1709
+ * Hack for source filters such as the Mozilla XUL preprocessor:
1710
+ * "//@line 123\n" sets the number of the *next* line after the
1711
+ * comment to 123.
1712
+ */
1713
+ if (JS_HAS_ATLINE_OPTION(cx)) {
1714
+ jschar cp[5];
1715
+ uintN i, line, temp;
1716
+ char filename[1024];
1717
+
1718
+ if (PeekChars(ts, 5, cp) &&
1719
+ cp[0] == '@' &&
1720
+ cp[1] == 'l' &&
1721
+ cp[2] == 'i' &&
1722
+ cp[3] == 'n' &&
1723
+ cp[4] == 'e') {
1724
+ SkipChars(ts, 5);
1725
+ while ((c = GetChar(ts)) != '\n' && JS_ISSPACE(c))
1726
+ continue;
1727
+ if (JS7_ISDEC(c)) {
1728
+ line = JS7_UNDEC(c);
1729
+ while ((c = GetChar(ts)) != EOF && JS7_ISDEC(c)) {
1730
+ temp = 10 * line + JS7_UNDEC(c);
1731
+ if (temp < line) {
1732
+ /* Ignore overlarge line numbers. */
1733
+ goto skipline;
1734
+ }
1735
+ line = temp;
1736
+ }
1737
+ while (c != '\n' && JS_ISSPACE(c))
1738
+ c = GetChar(ts);
1739
+ i = 0;
1740
+ if (c == '"') {
1741
+ while ((c = GetChar(ts)) != EOF && c != '"') {
1742
+ if (c == '\n') {
1743
+ UngetChar(ts, c);
1744
+ goto skipline;
1745
+ }
1746
+ if ((c >> 8) != 0 || i >= sizeof filename - 1)
1747
+ goto skipline;
1748
+ filename[i++] = (char) c;
1749
+ }
1750
+ if (c == '"') {
1751
+ while ((c = GetChar(ts)) != '\n' &&
1752
+ JS_ISSPACE(c)) {
1753
+ continue;
1754
+ }
1755
+ }
1756
+ }
1757
+ filename[i] = '\0';
1758
+ if (c == '\n') {
1759
+ if (i > 0) {
1760
+ if (ts->flags & TSF_OWNFILENAME)
1761
+ JS_free(cx, (void *) ts->filename);
1762
+ ts->filename = JS_strdup(cx, filename);
1763
+ if (!ts->filename)
1764
+ goto error;
1765
+ ts->flags |= TSF_OWNFILENAME;
1766
+ }
1767
+ ts->lineno = line;
1768
+ }
1769
+ }
1770
+ UngetChar(ts, c);
1771
+ }
1772
+ }
1773
+
1774
+ skipline:
1775
+ /* Optimize line skipping if we are not in an HTML comment. */
1776
+ if (ts->flags & TSF_IN_HTML_COMMENT) {
1777
+ while ((c = GetChar(ts)) != EOF && c != '\n') {
1778
+ if (c == '-' && MatchChar(ts, '-') && MatchChar(ts, '>'))
1779
+ ts->flags &= ~TSF_IN_HTML_COMMENT;
1780
+ }
1781
+ } else {
1782
+ while ((c = GetChar(ts)) != EOF && c != '\n')
1783
+ continue;
1784
+ }
1785
+ UngetChar(ts, c);
1786
+ ts->cursor = (ts->cursor - 1) & NTOKENS_MASK;
1787
+ goto retry;
1788
+ }
1789
+
1790
+ if (MatchChar(ts, '*')) {
1791
+ while ((c = GetChar(ts)) != EOF &&
1792
+ !(c == '*' && MatchChar(ts, '/'))) {
1793
+ /* Ignore all characters until comment close. */
1794
+ }
1795
+ if (c == EOF) {
1796
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1797
+ JSMSG_UNTERMINATED_COMMENT);
1798
+ goto error;
1799
+ }
1800
+ ts->cursor = (ts->cursor - 1) & NTOKENS_MASK;
1801
+ goto retry;
1802
+ }
1803
+
1804
+ if (ts->flags & TSF_OPERAND) {
1805
+ uintN flags;
1806
+ JSBool inCharClass = JS_FALSE;
1807
+
1808
+ INIT_TOKENBUF();
1809
+ for (;;) {
1810
+ c = GetChar(ts);
1811
+ if (c == '\n' || c == EOF) {
1812
+ UngetChar(ts, c);
1813
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1814
+ JSMSG_UNTERMINATED_REGEXP);
1815
+ goto error;
1816
+ }
1817
+ if (c == '\\') {
1818
+ ADD_TO_TOKENBUF(c);
1819
+ c = GetChar(ts);
1820
+ } else if (c == '[') {
1821
+ inCharClass = JS_TRUE;
1822
+ } else if (c == ']') {
1823
+ inCharClass = JS_FALSE;
1824
+ } else if (c == '/' && !inCharClass) {
1825
+ /* For compat with IE, allow unescaped / in char classes. */
1826
+ break;
1827
+ }
1828
+ ADD_TO_TOKENBUF(c);
1829
+ }
1830
+ for (flags = 0; ; ) {
1831
+ c = PeekChar(ts);
1832
+ if (c == 'g')
1833
+ flags |= JSREG_GLOB;
1834
+ else if (c == 'i')
1835
+ flags |= JSREG_FOLD;
1836
+ else if (c == 'm')
1837
+ flags |= JSREG_MULTILINE;
1838
+ else if (c == 'y')
1839
+ flags |= JSREG_STICKY;
1840
+ else
1841
+ break;
1842
+ GetChar(ts);
1843
+ }
1844
+ c = PeekChar(ts);
1845
+ if (JS7_ISLET(c)) {
1846
+ tp->ptr = ts->linebuf.ptr - 1;
1847
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1848
+ JSMSG_BAD_REGEXP_FLAG);
1849
+ (void) GetChar(ts);
1850
+ goto error;
1851
+ }
1852
+ /* XXXbe fix jsregexp.c so it doesn't depend on NUL termination */
1853
+ if (!TOKENBUF_OK())
1854
+ goto error;
1855
+ NUL_TERM_TOKENBUF();
1856
+ tp->t_reflags = flags;
1857
+ tt = TOK_REGEXP;
1858
+ break;
1859
+ }
1860
+
1861
+ tp->t_op = JSOP_DIV;
1862
+ tt = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_DIVOP;
1863
+ break;
1864
+
1865
+ case '%':
1866
+ tp->t_op = JSOP_MOD;
1867
+ tt = MatchChar(ts, '=') ? TOK_ASSIGN : TOK_DIVOP;
1868
+ break;
1869
+
1870
+ case '~':
1871
+ tp->t_op = JSOP_BITNOT;
1872
+ tt = TOK_UNARYOP;
1873
+ break;
1874
+
1875
+ case '+':
1876
+ if (MatchChar(ts, '=')) {
1877
+ tp->t_op = JSOP_ADD;
1878
+ tt = TOK_ASSIGN;
1879
+ } else if (MatchChar(ts, c)) {
1880
+ tt = TOK_INC;
1881
+ } else {
1882
+ tp->t_op = JSOP_POS;
1883
+ tt = TOK_PLUS;
1884
+ }
1885
+ break;
1886
+
1887
+ case '-':
1888
+ if (MatchChar(ts, '=')) {
1889
+ tp->t_op = JSOP_SUB;
1890
+ tt = TOK_ASSIGN;
1891
+ } else if (MatchChar(ts, c)) {
1892
+ if (PeekChar(ts) == '>' && !(ts->flags & TSF_DIRTYLINE)) {
1893
+ ts->flags &= ~TSF_IN_HTML_COMMENT;
1894
+ goto skipline;
1895
+ }
1896
+ tt = TOK_DEC;
1897
+ } else {
1898
+ tp->t_op = JSOP_NEG;
1899
+ tt = TOK_MINUS;
1900
+ }
1901
+ break;
1902
+
1903
+ #if JS_HAS_SHARP_VARS
1904
+ case '#':
1905
+ {
1906
+ uint32 n;
1907
+
1908
+ c = GetChar(ts);
1909
+ if (!JS7_ISDEC(c)) {
1910
+ UngetChar(ts, c);
1911
+ goto badchar;
1912
+ }
1913
+ n = (uint32)JS7_UNDEC(c);
1914
+ for (;;) {
1915
+ c = GetChar(ts);
1916
+ if (!JS7_ISDEC(c))
1917
+ break;
1918
+ n = 10 * n + JS7_UNDEC(c);
1919
+ if (n >= UINT16_LIMIT) {
1920
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1921
+ JSMSG_SHARPVAR_TOO_BIG);
1922
+ goto error;
1923
+ }
1924
+ }
1925
+ tp->t_dval = (jsdouble) n;
1926
+ if (JS_HAS_STRICT_OPTION(cx) &&
1927
+ (c == '=' || c == '#')) {
1928
+ char buf[20];
1929
+ JS_snprintf(buf, sizeof buf, "#%u%c", n, c);
1930
+ if (!js_ReportCompileErrorNumber(cx, ts, NULL,
1931
+ JSREPORT_WARNING |
1932
+ JSREPORT_STRICT,
1933
+ JSMSG_DEPRECATED_USAGE,
1934
+ buf)) {
1935
+ goto error;
1936
+ }
1937
+ }
1938
+ if (c == '=')
1939
+ tt = TOK_DEFSHARP;
1940
+ else if (c == '#')
1941
+ tt = TOK_USESHARP;
1942
+ else
1943
+ goto badchar;
1944
+ break;
1945
+ }
1946
+ #endif /* JS_HAS_SHARP_VARS */
1947
+
1948
+ #if JS_HAS_SHARP_VARS || JS_HAS_XML_SUPPORT
1949
+ badchar:
1950
+ #endif
1951
+
1952
+ default:
1953
+ js_ReportCompileErrorNumber(cx, ts, NULL, JSREPORT_ERROR,
1954
+ JSMSG_ILLEGAL_CHARACTER);
1955
+ goto error;
1956
+ }
1957
+
1958
+ out:
1959
+ JS_ASSERT(tt != TOK_EOL);
1960
+ ts->flags |= TSF_DIRTYLINE;
1961
+
1962
+ eol_out:
1963
+ if (!STRING_BUFFER_OK(&ts->tokenbuf))
1964
+ tt = TOK_ERROR;
1965
+ JS_ASSERT(tt < TOK_LIMIT);
1966
+ tp->pos.end.index = ts->linepos +
1967
+ PTRDIFF(ts->linebuf.ptr, ts->linebuf.base, jschar) -
1968
+ ts->ungetpos;
1969
+ tp->type = tt;
1970
+ return tt;
1971
+
1972
+ error:
1973
+ tt = TOK_ERROR;
1974
+ ts->flags |= TSF_ERROR;
1975
+ goto out;
1976
+
1977
+ #undef INIT_TOKENBUF
1978
+ #undef TOKENBUF_LENGTH
1979
+ #undef TOKENBUF_OK
1980
+ #undef TOKENBUF_TO_ATOM
1981
+ #undef ADD_TO_TOKENBUF
1982
+ #undef TOKENBUF_BASE
1983
+ #undef TOKENBUF_CHAR
1984
+ #undef TRIM_TOKENBUF
1985
+ #undef NUL_TERM_TOKENBUF
1986
+ }
1987
+
1988
+ void
1989
+ js_UngetToken(JSTokenStream *ts)
1990
+ {
1991
+ JS_ASSERT(ts->lookahead < NTOKENS_MASK);
1992
+ ts->lookahead++;
1993
+ ts->cursor = (ts->cursor - 1) & NTOKENS_MASK;
1994
+ }
1995
+
1996
+ JSBool
1997
+ js_MatchToken(JSContext *cx, JSTokenStream *ts, JSTokenType tt)
1998
+ {
1999
+ if (js_GetToken(cx, ts) == tt)
2000
+ return JS_TRUE;
2001
+ js_UngetToken(ts);
2002
+ return JS_FALSE;
2003
+ }