gitlab-pygments.rb 0.3.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (399) hide show
  1. data/.gitignore +6 -0
  2. data/Gemfile +2 -0
  3. data/README.md +91 -0
  4. data/Rakefile +78 -0
  5. data/bench.rb +22 -0
  6. data/cache-lexers.rb +8 -0
  7. data/lexers +0 -0
  8. data/lib/pygments/lexer.rb +148 -0
  9. data/lib/pygments/mentos.py +344 -0
  10. data/lib/pygments/popen.rb +389 -0
  11. data/lib/pygments/version.rb +3 -0
  12. data/lib/pygments.rb +8 -0
  13. data/pygments.rb.gemspec +24 -0
  14. data/test/test_data.c +2581 -0
  15. data/test/test_data.py +514 -0
  16. data/test/test_data_generated +2582 -0
  17. data/test/test_pygments.rb +276 -0
  18. data/vendor/custom_formatters/gitlab.py +171 -0
  19. data/vendor/custom_lexers/github.py +362 -0
  20. data/vendor/pygments-main/AUTHORS +115 -0
  21. data/vendor/pygments-main/CHANGES +762 -0
  22. data/vendor/pygments-main/LICENSE +25 -0
  23. data/vendor/pygments-main/MANIFEST.in +6 -0
  24. data/vendor/pygments-main/Makefile +59 -0
  25. data/vendor/pygments-main/REVISION +1 -0
  26. data/vendor/pygments-main/TODO +15 -0
  27. data/vendor/pygments-main/docs/generate.py +472 -0
  28. data/vendor/pygments-main/docs/pygmentize.1 +94 -0
  29. data/vendor/pygments-main/docs/src/api.txt +270 -0
  30. data/vendor/pygments-main/docs/src/authors.txt +5 -0
  31. data/vendor/pygments-main/docs/src/changelog.txt +5 -0
  32. data/vendor/pygments-main/docs/src/cmdline.txt +147 -0
  33. data/vendor/pygments-main/docs/src/filterdevelopment.txt +70 -0
  34. data/vendor/pygments-main/docs/src/filters.txt +42 -0
  35. data/vendor/pygments-main/docs/src/formatterdevelopment.txt +169 -0
  36. data/vendor/pygments-main/docs/src/formatters.txt +48 -0
  37. data/vendor/pygments-main/docs/src/index.txt +69 -0
  38. data/vendor/pygments-main/docs/src/installation.txt +71 -0
  39. data/vendor/pygments-main/docs/src/integrate.txt +43 -0
  40. data/vendor/pygments-main/docs/src/lexerdevelopment.txt +551 -0
  41. data/vendor/pygments-main/docs/src/lexers.txt +67 -0
  42. data/vendor/pygments-main/docs/src/moinmoin.txt +39 -0
  43. data/vendor/pygments-main/docs/src/plugins.txt +93 -0
  44. data/vendor/pygments-main/docs/src/quickstart.txt +202 -0
  45. data/vendor/pygments-main/docs/src/rstdirective.txt +22 -0
  46. data/vendor/pygments-main/docs/src/styles.txt +143 -0
  47. data/vendor/pygments-main/docs/src/tokens.txt +349 -0
  48. data/vendor/pygments-main/docs/src/unicode.txt +49 -0
  49. data/vendor/pygments-main/external/markdown-processor.py +67 -0
  50. data/vendor/pygments-main/external/moin-parser.py +112 -0
  51. data/vendor/pygments-main/external/pygments.bashcomp +38 -0
  52. data/vendor/pygments-main/external/rst-directive-old.py +77 -0
  53. data/vendor/pygments-main/external/rst-directive.py +83 -0
  54. data/vendor/pygments-main/ez_setup.py +276 -0
  55. data/vendor/pygments-main/pygmentize +7 -0
  56. data/vendor/pygments-main/pygments/__init__.py +91 -0
  57. data/vendor/pygments-main/pygments/cmdline.py +433 -0
  58. data/vendor/pygments-main/pygments/console.py +74 -0
  59. data/vendor/pygments-main/pygments/filter.py +74 -0
  60. data/vendor/pygments-main/pygments/filters/__init__.py +357 -0
  61. data/vendor/pygments-main/pygments/formatter.py +92 -0
  62. data/vendor/pygments-main/pygments/formatters/__init__.py +68 -0
  63. data/vendor/pygments-main/pygments/formatters/_mapping.py +94 -0
  64. data/vendor/pygments-main/pygments/formatters/bbcode.py +109 -0
  65. data/vendor/pygments-main/pygments/formatters/gitlab.py +171 -0
  66. data/vendor/pygments-main/pygments/formatters/html.py +750 -0
  67. data/vendor/pygments-main/pygments/formatters/img.py +553 -0
  68. data/vendor/pygments-main/pygments/formatters/latex.py +378 -0
  69. data/vendor/pygments-main/pygments/formatters/other.py +117 -0
  70. data/vendor/pygments-main/pygments/formatters/rtf.py +136 -0
  71. data/vendor/pygments-main/pygments/formatters/svg.py +154 -0
  72. data/vendor/pygments-main/pygments/formatters/terminal.py +112 -0
  73. data/vendor/pygments-main/pygments/formatters/terminal256.py +222 -0
  74. data/vendor/pygments-main/pygments/lexer.py +697 -0
  75. data/vendor/pygments-main/pygments/lexers/__init__.py +229 -0
  76. data/vendor/pygments-main/pygments/lexers/_asybuiltins.py +1645 -0
  77. data/vendor/pygments-main/pygments/lexers/_clbuiltins.py +232 -0
  78. data/vendor/pygments-main/pygments/lexers/_luabuiltins.py +249 -0
  79. data/vendor/pygments-main/pygments/lexers/_mapping.py +298 -0
  80. data/vendor/pygments-main/pygments/lexers/_phpbuiltins.py +3787 -0
  81. data/vendor/pygments-main/pygments/lexers/_postgres_builtins.py +232 -0
  82. data/vendor/pygments-main/pygments/lexers/_scilab_builtins.py +29 -0
  83. data/vendor/pygments-main/pygments/lexers/_vimbuiltins.py +3 -0
  84. data/vendor/pygments-main/pygments/lexers/agile.py +1803 -0
  85. data/vendor/pygments-main/pygments/lexers/asm.py +360 -0
  86. data/vendor/pygments-main/pygments/lexers/compiled.py +2891 -0
  87. data/vendor/pygments-main/pygments/lexers/dotnet.py +636 -0
  88. data/vendor/pygments-main/pygments/lexers/functional.py +1832 -0
  89. data/vendor/pygments-main/pygments/lexers/github.py +362 -0
  90. data/vendor/pygments-main/pygments/lexers/hdl.py +356 -0
  91. data/vendor/pygments-main/pygments/lexers/jvm.py +847 -0
  92. data/vendor/pygments-main/pygments/lexers/math.py +1072 -0
  93. data/vendor/pygments-main/pygments/lexers/other.py +3339 -0
  94. data/vendor/pygments-main/pygments/lexers/parsers.py +695 -0
  95. data/vendor/pygments-main/pygments/lexers/shell.py +361 -0
  96. data/vendor/pygments-main/pygments/lexers/special.py +100 -0
  97. data/vendor/pygments-main/pygments/lexers/sql.py +559 -0
  98. data/vendor/pygments-main/pygments/lexers/templates.py +1631 -0
  99. data/vendor/pygments-main/pygments/lexers/text.py +1753 -0
  100. data/vendor/pygments-main/pygments/lexers/web.py +2864 -0
  101. data/vendor/pygments-main/pygments/plugin.py +74 -0
  102. data/vendor/pygments-main/pygments/scanner.py +104 -0
  103. data/vendor/pygments-main/pygments/style.py +117 -0
  104. data/vendor/pygments-main/pygments/styles/__init__.py +70 -0
  105. data/vendor/pygments-main/pygments/styles/autumn.py +65 -0
  106. data/vendor/pygments-main/pygments/styles/borland.py +51 -0
  107. data/vendor/pygments-main/pygments/styles/bw.py +49 -0
  108. data/vendor/pygments-main/pygments/styles/colorful.py +81 -0
  109. data/vendor/pygments-main/pygments/styles/default.py +73 -0
  110. data/vendor/pygments-main/pygments/styles/emacs.py +72 -0
  111. data/vendor/pygments-main/pygments/styles/friendly.py +72 -0
  112. data/vendor/pygments-main/pygments/styles/fruity.py +42 -0
  113. data/vendor/pygments-main/pygments/styles/manni.py +75 -0
  114. data/vendor/pygments-main/pygments/styles/monokai.py +106 -0
  115. data/vendor/pygments-main/pygments/styles/murphy.py +80 -0
  116. data/vendor/pygments-main/pygments/styles/native.py +65 -0
  117. data/vendor/pygments-main/pygments/styles/pastie.py +75 -0
  118. data/vendor/pygments-main/pygments/styles/perldoc.py +69 -0
  119. data/vendor/pygments-main/pygments/styles/rrt.py +33 -0
  120. data/vendor/pygments-main/pygments/styles/tango.py +141 -0
  121. data/vendor/pygments-main/pygments/styles/trac.py +63 -0
  122. data/vendor/pygments-main/pygments/styles/vim.py +63 -0
  123. data/vendor/pygments-main/pygments/styles/vs.py +38 -0
  124. data/vendor/pygments-main/pygments/token.py +195 -0
  125. data/vendor/pygments-main/pygments/unistring.py +130 -0
  126. data/vendor/pygments-main/pygments/util.py +232 -0
  127. data/vendor/pygments-main/scripts/check_sources.py +242 -0
  128. data/vendor/pygments-main/scripts/detect_missing_analyse_text.py +30 -0
  129. data/vendor/pygments-main/scripts/epydoc.css +280 -0
  130. data/vendor/pygments-main/scripts/find_codetags.py +205 -0
  131. data/vendor/pygments-main/scripts/find_error.py +171 -0
  132. data/vendor/pygments-main/scripts/get_vimkw.py +43 -0
  133. data/vendor/pygments-main/scripts/pylintrc +301 -0
  134. data/vendor/pygments-main/scripts/reindent.py +291 -0
  135. data/vendor/pygments-main/scripts/vim2pygments.py +933 -0
  136. data/vendor/pygments-main/setup.cfg +6 -0
  137. data/vendor/pygments-main/setup.py +88 -0
  138. data/vendor/pygments-main/tests/dtds/HTML4-f.dtd +37 -0
  139. data/vendor/pygments-main/tests/dtds/HTML4-s.dtd +869 -0
  140. data/vendor/pygments-main/tests/dtds/HTML4.dcl +88 -0
  141. data/vendor/pygments-main/tests/dtds/HTML4.dtd +1092 -0
  142. data/vendor/pygments-main/tests/dtds/HTML4.soc +9 -0
  143. data/vendor/pygments-main/tests/dtds/HTMLlat1.ent +195 -0
  144. data/vendor/pygments-main/tests/dtds/HTMLspec.ent +77 -0
  145. data/vendor/pygments-main/tests/dtds/HTMLsym.ent +241 -0
  146. data/vendor/pygments-main/tests/examplefiles/ANTLRv3.g +608 -0
  147. data/vendor/pygments-main/tests/examplefiles/AcidStateAdvanced.hs +209 -0
  148. data/vendor/pygments-main/tests/examplefiles/AlternatingGroup.mu +102 -0
  149. data/vendor/pygments-main/tests/examplefiles/CPDictionary.j +611 -0
  150. data/vendor/pygments-main/tests/examplefiles/Constants.mo +158 -0
  151. data/vendor/pygments-main/tests/examplefiles/DancingSudoku.lhs +411 -0
  152. data/vendor/pygments-main/tests/examplefiles/Errors.scala +18 -0
  153. data/vendor/pygments-main/tests/examplefiles/File.hy +174 -0
  154. data/vendor/pygments-main/tests/examplefiles/Intro.java +1660 -0
  155. data/vendor/pygments-main/tests/examplefiles/Makefile +1131 -0
  156. data/vendor/pygments-main/tests/examplefiles/Object.st +4394 -0
  157. data/vendor/pygments-main/tests/examplefiles/OrderedMap.hx +584 -0
  158. data/vendor/pygments-main/tests/examplefiles/SmallCheck.hs +378 -0
  159. data/vendor/pygments-main/tests/examplefiles/Sorting.mod +470 -0
  160. data/vendor/pygments-main/tests/examplefiles/Sudoku.lhs +382 -0
  161. data/vendor/pygments-main/tests/examplefiles/addressbook.proto +30 -0
  162. data/vendor/pygments-main/tests/examplefiles/antlr_throws +1 -0
  163. data/vendor/pygments-main/tests/examplefiles/apache2.conf +393 -0
  164. data/vendor/pygments-main/tests/examplefiles/as3_test.as +143 -0
  165. data/vendor/pygments-main/tests/examplefiles/as3_test2.as +46 -0
  166. data/vendor/pygments-main/tests/examplefiles/as3_test3.as +3 -0
  167. data/vendor/pygments-main/tests/examplefiles/aspx-cs_example +27 -0
  168. data/vendor/pygments-main/tests/examplefiles/badcase.java +2 -0
  169. data/vendor/pygments-main/tests/examplefiles/batchfile.bat +49 -0
  170. data/vendor/pygments-main/tests/examplefiles/boot-9.scm +1557 -0
  171. data/vendor/pygments-main/tests/examplefiles/cells.ps +515 -0
  172. data/vendor/pygments-main/tests/examplefiles/ceval.c +2604 -0
  173. data/vendor/pygments-main/tests/examplefiles/cheetah_example.html +13 -0
  174. data/vendor/pygments-main/tests/examplefiles/classes.dylan +40 -0
  175. data/vendor/pygments-main/tests/examplefiles/condensed_ruby.rb +10 -0
  176. data/vendor/pygments-main/tests/examplefiles/coq_RelationClasses +447 -0
  177. data/vendor/pygments-main/tests/examplefiles/database.pytb +20 -0
  178. data/vendor/pygments-main/tests/examplefiles/de.MoinMoin.po +2461 -0
  179. data/vendor/pygments-main/tests/examplefiles/demo.ahk +181 -0
  180. data/vendor/pygments-main/tests/examplefiles/demo.cfm +38 -0
  181. data/vendor/pygments-main/tests/examplefiles/django_sample.html+django +68 -0
  182. data/vendor/pygments-main/tests/examplefiles/dwarf.cw +17 -0
  183. data/vendor/pygments-main/tests/examplefiles/erl_session +10 -0
  184. data/vendor/pygments-main/tests/examplefiles/escape_semicolon.clj +1 -0
  185. data/vendor/pygments-main/tests/examplefiles/evil_regex.js +48 -0
  186. data/vendor/pygments-main/tests/examplefiles/example.c +2080 -0
  187. data/vendor/pygments-main/tests/examplefiles/example.cls +15 -0
  188. data/vendor/pygments-main/tests/examplefiles/example.cpp +2363 -0
  189. data/vendor/pygments-main/tests/examplefiles/example.gs +106 -0
  190. data/vendor/pygments-main/tests/examplefiles/example.gst +7 -0
  191. data/vendor/pygments-main/tests/examplefiles/example.kt +47 -0
  192. data/vendor/pygments-main/tests/examplefiles/example.lua +250 -0
  193. data/vendor/pygments-main/tests/examplefiles/example.moo +26 -0
  194. data/vendor/pygments-main/tests/examplefiles/example.moon +629 -0
  195. data/vendor/pygments-main/tests/examplefiles/example.nim +1010 -0
  196. data/vendor/pygments-main/tests/examplefiles/example.ns2 +69 -0
  197. data/vendor/pygments-main/tests/examplefiles/example.p +34 -0
  198. data/vendor/pygments-main/tests/examplefiles/example.pas +2708 -0
  199. data/vendor/pygments-main/tests/examplefiles/example.rb +1852 -0
  200. data/vendor/pygments-main/tests/examplefiles/example.rhtml +561 -0
  201. data/vendor/pygments-main/tests/examplefiles/example.sh-session +19 -0
  202. data/vendor/pygments-main/tests/examplefiles/example.sml +156 -0
  203. data/vendor/pygments-main/tests/examplefiles/example.snobol +15 -0
  204. data/vendor/pygments-main/tests/examplefiles/example.tea +34 -0
  205. data/vendor/pygments-main/tests/examplefiles/example.u +548 -0
  206. data/vendor/pygments-main/tests/examplefiles/example.weechatlog +9 -0
  207. data/vendor/pygments-main/tests/examplefiles/example.xhtml +376 -0
  208. data/vendor/pygments-main/tests/examplefiles/example.yaml +302 -0
  209. data/vendor/pygments-main/tests/examplefiles/example2.aspx +29 -0
  210. data/vendor/pygments-main/tests/examplefiles/example_elixir.ex +363 -0
  211. data/vendor/pygments-main/tests/examplefiles/example_file.fy +128 -0
  212. data/vendor/pygments-main/tests/examplefiles/firefox.mak +586 -0
  213. data/vendor/pygments-main/tests/examplefiles/flipflop.sv +19 -0
  214. data/vendor/pygments-main/tests/examplefiles/foo.sce +6 -0
  215. data/vendor/pygments-main/tests/examplefiles/format.ml +1213 -0
  216. data/vendor/pygments-main/tests/examplefiles/fucked_up.rb +77 -0
  217. data/vendor/pygments-main/tests/examplefiles/function.mu +1 -0
  218. data/vendor/pygments-main/tests/examplefiles/functional.rst +1472 -0
  219. data/vendor/pygments-main/tests/examplefiles/genclass.clj +510 -0
  220. data/vendor/pygments-main/tests/examplefiles/genshi_example.xml+genshi +193 -0
  221. data/vendor/pygments-main/tests/examplefiles/genshitext_example.genshitext +33 -0
  222. data/vendor/pygments-main/tests/examplefiles/glsl.frag +7 -0
  223. data/vendor/pygments-main/tests/examplefiles/glsl.vert +13 -0
  224. data/vendor/pygments-main/tests/examplefiles/html+php_faulty.php +1 -0
  225. data/vendor/pygments-main/tests/examplefiles/http_request_example +14 -0
  226. data/vendor/pygments-main/tests/examplefiles/http_response_example +27 -0
  227. data/vendor/pygments-main/tests/examplefiles/import.hs +4 -0
  228. data/vendor/pygments-main/tests/examplefiles/intro.ik +24 -0
  229. data/vendor/pygments-main/tests/examplefiles/ints.php +10 -0
  230. data/vendor/pygments-main/tests/examplefiles/intsyn.fun +675 -0
  231. data/vendor/pygments-main/tests/examplefiles/intsyn.sig +286 -0
  232. data/vendor/pygments-main/tests/examplefiles/irb_heredoc +8 -0
  233. data/vendor/pygments-main/tests/examplefiles/irc.lsp +214 -0
  234. data/vendor/pygments-main/tests/examplefiles/java.properties +16 -0
  235. data/vendor/pygments-main/tests/examplefiles/jbst_example1.jbst +28 -0
  236. data/vendor/pygments-main/tests/examplefiles/jbst_example2.jbst +45 -0
  237. data/vendor/pygments-main/tests/examplefiles/jinjadesignerdoc.rst +713 -0
  238. data/vendor/pygments-main/tests/examplefiles/lighttpd_config.conf +13 -0
  239. data/vendor/pygments-main/tests/examplefiles/linecontinuation.py +47 -0
  240. data/vendor/pygments-main/tests/examplefiles/ltmain.sh +2849 -0
  241. data/vendor/pygments-main/tests/examplefiles/main.cmake +42 -0
  242. data/vendor/pygments-main/tests/examplefiles/markdown.lsp +679 -0
  243. data/vendor/pygments-main/tests/examplefiles/matlab_noreturn +3 -0
  244. data/vendor/pygments-main/tests/examplefiles/matlab_sample +27 -0
  245. data/vendor/pygments-main/tests/examplefiles/matlabsession_sample.txt +37 -0
  246. data/vendor/pygments-main/tests/examplefiles/minimal.ns2 +4 -0
  247. data/vendor/pygments-main/tests/examplefiles/moin_SyntaxReference.txt +340 -0
  248. data/vendor/pygments-main/tests/examplefiles/multiline_regexes.rb +38 -0
  249. data/vendor/pygments-main/tests/examplefiles/nasm_aoutso.asm +96 -0
  250. data/vendor/pygments-main/tests/examplefiles/nasm_objexe.asm +30 -0
  251. data/vendor/pygments-main/tests/examplefiles/nemerle_sample.n +87 -0
  252. data/vendor/pygments-main/tests/examplefiles/nginx_nginx.conf +118 -0
  253. data/vendor/pygments-main/tests/examplefiles/numbers.c +12 -0
  254. data/vendor/pygments-main/tests/examplefiles/objc_example.m +25 -0
  255. data/vendor/pygments-main/tests/examplefiles/objc_example2.m +24 -0
  256. data/vendor/pygments-main/tests/examplefiles/perl_misc +62 -0
  257. data/vendor/pygments-main/tests/examplefiles/perl_perl5db +998 -0
  258. data/vendor/pygments-main/tests/examplefiles/perl_regex-delims +120 -0
  259. data/vendor/pygments-main/tests/examplefiles/perlfunc.1 +856 -0
  260. data/vendor/pygments-main/tests/examplefiles/phpcomplete.vim +567 -0
  261. data/vendor/pygments-main/tests/examplefiles/pleac.in.rb +1223 -0
  262. data/vendor/pygments-main/tests/examplefiles/postgresql_test.txt +47 -0
  263. data/vendor/pygments-main/tests/examplefiles/pppoe.applescript +10 -0
  264. data/vendor/pygments-main/tests/examplefiles/psql_session.txt +122 -0
  265. data/vendor/pygments-main/tests/examplefiles/py3_test.txt +2 -0
  266. data/vendor/pygments-main/tests/examplefiles/pycon_test.pycon +14 -0
  267. data/vendor/pygments-main/tests/examplefiles/pytb_test2.pytb +2 -0
  268. data/vendor/pygments-main/tests/examplefiles/python25-bsd.mak +234 -0
  269. data/vendor/pygments-main/tests/examplefiles/qsort.prolog +13 -0
  270. data/vendor/pygments-main/tests/examplefiles/r-console-transcript.Rout +38 -0
  271. data/vendor/pygments-main/tests/examplefiles/ragel-cpp_rlscan +280 -0
  272. data/vendor/pygments-main/tests/examplefiles/ragel-cpp_snippet +2 -0
  273. data/vendor/pygments-main/tests/examplefiles/regex.js +22 -0
  274. data/vendor/pygments-main/tests/examplefiles/reversi.lsp +427 -0
  275. data/vendor/pygments-main/tests/examplefiles/ruby_func_def.rb +11 -0
  276. data/vendor/pygments-main/tests/examplefiles/scilab.sci +30 -0
  277. data/vendor/pygments-main/tests/examplefiles/sibling.prolog +19 -0
  278. data/vendor/pygments-main/tests/examplefiles/simple.md +747 -0
  279. data/vendor/pygments-main/tests/examplefiles/smarty_example.html +209 -0
  280. data/vendor/pygments-main/tests/examplefiles/source.lgt +343 -0
  281. data/vendor/pygments-main/tests/examplefiles/sources.list +62 -0
  282. data/vendor/pygments-main/tests/examplefiles/sphere.pov +18 -0
  283. data/vendor/pygments-main/tests/examplefiles/sqlite3.sqlite3-console +27 -0
  284. data/vendor/pygments-main/tests/examplefiles/squid.conf +30 -0
  285. data/vendor/pygments-main/tests/examplefiles/string.jl +1031 -0
  286. data/vendor/pygments-main/tests/examplefiles/string_delimiters.d +21 -0
  287. data/vendor/pygments-main/tests/examplefiles/stripheredoc.sh +3 -0
  288. data/vendor/pygments-main/tests/examplefiles/test.R +119 -0
  289. data/vendor/pygments-main/tests/examplefiles/test.adb +211 -0
  290. data/vendor/pygments-main/tests/examplefiles/test.asy +131 -0
  291. data/vendor/pygments-main/tests/examplefiles/test.awk +121 -0
  292. data/vendor/pygments-main/tests/examplefiles/test.bas +29 -0
  293. data/vendor/pygments-main/tests/examplefiles/test.bmx +145 -0
  294. data/vendor/pygments-main/tests/examplefiles/test.boo +39 -0
  295. data/vendor/pygments-main/tests/examplefiles/test.bro +250 -0
  296. data/vendor/pygments-main/tests/examplefiles/test.cs +374 -0
  297. data/vendor/pygments-main/tests/examplefiles/test.css +54 -0
  298. data/vendor/pygments-main/tests/examplefiles/test.d +135 -0
  299. data/vendor/pygments-main/tests/examplefiles/test.dart +23 -0
  300. data/vendor/pygments-main/tests/examplefiles/test.dtd +89 -0
  301. data/vendor/pygments-main/tests/examplefiles/test.ec +605 -0
  302. data/vendor/pygments-main/tests/examplefiles/test.ecl +58 -0
  303. data/vendor/pygments-main/tests/examplefiles/test.eh +315 -0
  304. data/vendor/pygments-main/tests/examplefiles/test.erl +169 -0
  305. data/vendor/pygments-main/tests/examplefiles/test.evoque +33 -0
  306. data/vendor/pygments-main/tests/examplefiles/test.fan +818 -0
  307. data/vendor/pygments-main/tests/examplefiles/test.flx +57 -0
  308. data/vendor/pygments-main/tests/examplefiles/test.gdc +13 -0
  309. data/vendor/pygments-main/tests/examplefiles/test.groovy +97 -0
  310. data/vendor/pygments-main/tests/examplefiles/test.html +339 -0
  311. data/vendor/pygments-main/tests/examplefiles/test.ini +10 -0
  312. data/vendor/pygments-main/tests/examplefiles/test.java +653 -0
  313. data/vendor/pygments-main/tests/examplefiles/test.jsp +24 -0
  314. data/vendor/pygments-main/tests/examplefiles/test.maql +45 -0
  315. data/vendor/pygments-main/tests/examplefiles/test.mod +374 -0
  316. data/vendor/pygments-main/tests/examplefiles/test.moo +51 -0
  317. data/vendor/pygments-main/tests/examplefiles/test.myt +166 -0
  318. data/vendor/pygments-main/tests/examplefiles/test.nim +93 -0
  319. data/vendor/pygments-main/tests/examplefiles/test.pas +743 -0
  320. data/vendor/pygments-main/tests/examplefiles/test.php +505 -0
  321. data/vendor/pygments-main/tests/examplefiles/test.plot +333 -0
  322. data/vendor/pygments-main/tests/examplefiles/test.ps1 +108 -0
  323. data/vendor/pygments-main/tests/examplefiles/test.pypylog +1839 -0
  324. data/vendor/pygments-main/tests/examplefiles/test.r3 +94 -0
  325. data/vendor/pygments-main/tests/examplefiles/test.rb +177 -0
  326. data/vendor/pygments-main/tests/examplefiles/test.rhtml +43 -0
  327. data/vendor/pygments-main/tests/examplefiles/test.scaml +8 -0
  328. data/vendor/pygments-main/tests/examplefiles/test.ssp +12 -0
  329. data/vendor/pygments-main/tests/examplefiles/test.tcsh +830 -0
  330. data/vendor/pygments-main/tests/examplefiles/test.vb +407 -0
  331. data/vendor/pygments-main/tests/examplefiles/test.vhdl +161 -0
  332. data/vendor/pygments-main/tests/examplefiles/test.xqy +138 -0
  333. data/vendor/pygments-main/tests/examplefiles/test.xsl +23 -0
  334. data/vendor/pygments-main/tests/examplefiles/truncated.pytb +15 -0
  335. data/vendor/pygments-main/tests/examplefiles/type.lisp +1202 -0
  336. data/vendor/pygments-main/tests/examplefiles/underscore.coffee +603 -0
  337. data/vendor/pygments-main/tests/examplefiles/unicode.applescript +5 -0
  338. data/vendor/pygments-main/tests/examplefiles/unicodedoc.py +11 -0
  339. data/vendor/pygments-main/tests/examplefiles/webkit-transition.css +3 -0
  340. data/vendor/pygments-main/tests/examplefiles/while.pov +13 -0
  341. data/vendor/pygments-main/tests/examplefiles/wiki.factor +384 -0
  342. data/vendor/pygments-main/tests/examplefiles/xml_example +1897 -0
  343. data/vendor/pygments-main/tests/examplefiles/zmlrpc.f90 +798 -0
  344. data/vendor/pygments-main/tests/old_run.py +138 -0
  345. data/vendor/pygments-main/tests/run.py +48 -0
  346. data/vendor/pygments-main/tests/support.py +15 -0
  347. data/vendor/pygments-main/tests/test_basic_api.py +294 -0
  348. data/vendor/pygments-main/tests/test_clexer.py +31 -0
  349. data/vendor/pygments-main/tests/test_cmdline.py +105 -0
  350. data/vendor/pygments-main/tests/test_examplefiles.py +97 -0
  351. data/vendor/pygments-main/tests/test_html_formatter.py +162 -0
  352. data/vendor/pygments-main/tests/test_latex_formatter.py +55 -0
  353. data/vendor/pygments-main/tests/test_perllexer.py +137 -0
  354. data/vendor/pygments-main/tests/test_regexlexer.py +47 -0
  355. data/vendor/pygments-main/tests/test_token.py +46 -0
  356. data/vendor/pygments-main/tests/test_using_api.py +40 -0
  357. data/vendor/pygments-main/tests/test_util.py +116 -0
  358. data/vendor/simplejson/.gitignore +10 -0
  359. data/vendor/simplejson/.travis.yml +5 -0
  360. data/vendor/simplejson/CHANGES.txt +291 -0
  361. data/vendor/simplejson/LICENSE.txt +19 -0
  362. data/vendor/simplejson/MANIFEST.in +5 -0
  363. data/vendor/simplejson/README.rst +19 -0
  364. data/vendor/simplejson/conf.py +179 -0
  365. data/vendor/simplejson/index.rst +628 -0
  366. data/vendor/simplejson/scripts/make_docs.py +18 -0
  367. data/vendor/simplejson/setup.py +104 -0
  368. data/vendor/simplejson/simplejson/__init__.py +510 -0
  369. data/vendor/simplejson/simplejson/_speedups.c +2745 -0
  370. data/vendor/simplejson/simplejson/decoder.py +425 -0
  371. data/vendor/simplejson/simplejson/encoder.py +567 -0
  372. data/vendor/simplejson/simplejson/ordered_dict.py +119 -0
  373. data/vendor/simplejson/simplejson/scanner.py +77 -0
  374. data/vendor/simplejson/simplejson/tests/__init__.py +67 -0
  375. data/vendor/simplejson/simplejson/tests/test_bigint_as_string.py +55 -0
  376. data/vendor/simplejson/simplejson/tests/test_check_circular.py +30 -0
  377. data/vendor/simplejson/simplejson/tests/test_decimal.py +66 -0
  378. data/vendor/simplejson/simplejson/tests/test_decode.py +83 -0
  379. data/vendor/simplejson/simplejson/tests/test_default.py +9 -0
  380. data/vendor/simplejson/simplejson/tests/test_dump.py +67 -0
  381. data/vendor/simplejson/simplejson/tests/test_encode_basestring_ascii.py +46 -0
  382. data/vendor/simplejson/simplejson/tests/test_encode_for_html.py +32 -0
  383. data/vendor/simplejson/simplejson/tests/test_errors.py +34 -0
  384. data/vendor/simplejson/simplejson/tests/test_fail.py +91 -0
  385. data/vendor/simplejson/simplejson/tests/test_float.py +19 -0
  386. data/vendor/simplejson/simplejson/tests/test_indent.py +86 -0
  387. data/vendor/simplejson/simplejson/tests/test_item_sort_key.py +20 -0
  388. data/vendor/simplejson/simplejson/tests/test_namedtuple.py +121 -0
  389. data/vendor/simplejson/simplejson/tests/test_pass1.py +76 -0
  390. data/vendor/simplejson/simplejson/tests/test_pass2.py +14 -0
  391. data/vendor/simplejson/simplejson/tests/test_pass3.py +20 -0
  392. data/vendor/simplejson/simplejson/tests/test_recursion.py +67 -0
  393. data/vendor/simplejson/simplejson/tests/test_scanstring.py +117 -0
  394. data/vendor/simplejson/simplejson/tests/test_separators.py +42 -0
  395. data/vendor/simplejson/simplejson/tests/test_speedups.py +20 -0
  396. data/vendor/simplejson/simplejson/tests/test_tuple.py +49 -0
  397. data/vendor/simplejson/simplejson/tests/test_unicode.py +109 -0
  398. data/vendor/simplejson/simplejson/tool.py +39 -0
  399. metadata +492 -0
@@ -0,0 +1,697 @@
1
+ # -*- coding: utf-8 -*-
2
+ """
3
+ pygments.lexer
4
+ ~~~~~~~~~~~~~~
5
+
6
+ Base lexer classes.
7
+
8
+ :copyright: Copyright 2006-2012 by the Pygments team, see AUTHORS.
9
+ :license: BSD, see LICENSE for details.
10
+ """
11
+ import re
12
+
13
+ from pygments.filter import apply_filters, Filter
14
+ from pygments.filters import get_filter_by_name
15
+ from pygments.token import Error, Text, Other, _TokenType
16
+ from pygments.util import get_bool_opt, get_int_opt, get_list_opt, \
17
+ make_analysator
18
+
19
+
20
+ __all__ = ['Lexer', 'RegexLexer', 'ExtendedRegexLexer', 'DelegatingLexer',
21
+ 'LexerContext', 'include', 'bygroups', 'using', 'this']
22
+
23
+
24
+ _encoding_map = [('\xef\xbb\xbf', 'utf-8'),
25
+ ('\xff\xfe\0\0', 'utf-32'),
26
+ ('\0\0\xfe\xff', 'utf-32be'),
27
+ ('\xff\xfe', 'utf-16'),
28
+ ('\xfe\xff', 'utf-16be')]
29
+
30
+ _default_analyse = staticmethod(lambda x: 0.0)
31
+
32
+
33
+ class LexerMeta(type):
34
+ """
35
+ This metaclass automagically converts ``analyse_text`` methods into
36
+ static methods which always return float values.
37
+ """
38
+
39
+ def __new__(cls, name, bases, d):
40
+ if 'analyse_text' in d:
41
+ d['analyse_text'] = make_analysator(d['analyse_text'])
42
+ return type.__new__(cls, name, bases, d)
43
+
44
+
45
+ class Lexer(object):
46
+ """
47
+ Lexer for a specific language.
48
+
49
+ Basic options recognized:
50
+ ``stripnl``
51
+ Strip leading and trailing newlines from the input (default: True).
52
+ ``stripall``
53
+ Strip all leading and trailing whitespace from the input
54
+ (default: False).
55
+ ``ensurenl``
56
+ Make sure that the input ends with a newline (default: True). This
57
+ is required for some lexers that consume input linewise.
58
+ *New in Pygments 1.3.*
59
+ ``tabsize``
60
+ If given and greater than 0, expand tabs in the input (default: 0).
61
+ ``encoding``
62
+ If given, must be an encoding name. This encoding will be used to
63
+ convert the input string to Unicode, if it is not already a Unicode
64
+ string (default: ``'latin1'``).
65
+ Can also be ``'guess'`` to use a simple UTF-8 / Latin1 detection, or
66
+ ``'chardet'`` to use the chardet library, if it is installed.
67
+ """
68
+
69
+ #: Name of the lexer
70
+ name = None
71
+
72
+ #: Shortcuts for the lexer
73
+ aliases = []
74
+
75
+ #: fn match rules
76
+ filenames = []
77
+
78
+ #: fn alias filenames
79
+ alias_filenames = []
80
+
81
+ #: mime types
82
+ mimetypes = []
83
+
84
+ __metaclass__ = LexerMeta
85
+
86
+ def __init__(self, **options):
87
+ self.options = options
88
+ self.stripnl = get_bool_opt(options, 'stripnl', True)
89
+ self.stripall = get_bool_opt(options, 'stripall', False)
90
+ self.ensurenl = get_bool_opt(options, 'ensurenl', True)
91
+ self.tabsize = get_int_opt(options, 'tabsize', 0)
92
+ self.encoding = options.get('encoding', 'latin1')
93
+ # self.encoding = options.get('inencoding', None) or self.encoding
94
+ self.filters = []
95
+ for filter_ in get_list_opt(options, 'filters', ()):
96
+ self.add_filter(filter_)
97
+
98
+ def __repr__(self):
99
+ if self.options:
100
+ return '<pygments.lexers.%s with %r>' % (self.__class__.__name__,
101
+ self.options)
102
+ else:
103
+ return '<pygments.lexers.%s>' % self.__class__.__name__
104
+
105
+ def add_filter(self, filter_, **options):
106
+ """
107
+ Add a new stream filter to this lexer.
108
+ """
109
+ if not isinstance(filter_, Filter):
110
+ filter_ = get_filter_by_name(filter_, **options)
111
+ self.filters.append(filter_)
112
+
113
+ def analyse_text(text):
114
+ """
115
+ Has to return a float between ``0`` and ``1`` that indicates
116
+ if a lexer wants to highlight this text. Used by ``guess_lexer``.
117
+ If this method returns ``0`` it won't highlight it in any case, if
118
+ it returns ``1`` highlighting with this lexer is guaranteed.
119
+
120
+ The `LexerMeta` metaclass automatically wraps this function so
121
+ that it works like a static method (no ``self`` or ``cls``
122
+ parameter) and the return value is automatically converted to
123
+ `float`. If the return value is an object that is boolean `False`
124
+ it's the same as if the return values was ``0.0``.
125
+ """
126
+
127
+ def get_tokens(self, text, unfiltered=False):
128
+ """
129
+ Return an iterable of (tokentype, value) pairs generated from
130
+ `text`. If `unfiltered` is set to `True`, the filtering mechanism
131
+ is bypassed even if filters are defined.
132
+
133
+ Also preprocess the text, i.e. expand tabs and strip it if
134
+ wanted and applies registered filters.
135
+ """
136
+ if not isinstance(text, unicode):
137
+ if self.encoding == 'guess':
138
+ try:
139
+ text = text.decode('utf-8')
140
+ if text.startswith(u'\ufeff'):
141
+ text = text[len(u'\ufeff'):]
142
+ except UnicodeDecodeError:
143
+ text = text.decode('latin1')
144
+ elif self.encoding == 'chardet':
145
+ try:
146
+ import chardet
147
+ except ImportError:
148
+ raise ImportError('To enable chardet encoding guessing, '
149
+ 'please install the chardet library '
150
+ 'from http://chardet.feedparser.org/')
151
+ # check for BOM first
152
+ decoded = None
153
+ for bom, encoding in _encoding_map:
154
+ if text.startswith(bom):
155
+ decoded = unicode(text[len(bom):], encoding,
156
+ errors='replace')
157
+ break
158
+ # no BOM found, so use chardet
159
+ if decoded is None:
160
+ enc = chardet.detect(text[:1024]) # Guess using first 1KB
161
+ decoded = unicode(text, enc.get('encoding') or 'utf-8',
162
+ errors='replace')
163
+ text = decoded
164
+ else:
165
+ text = text.decode(self.encoding)
166
+ # text now *is* a unicode string
167
+ text = text.replace('\r\n', '\n')
168
+ text = text.replace('\r', '\n')
169
+ if self.stripall:
170
+ text = text.strip()
171
+ elif self.stripnl:
172
+ text = text.strip('\n')
173
+ if self.tabsize > 0:
174
+ text = text.expandtabs(self.tabsize)
175
+ if self.ensurenl and not text.endswith('\n'):
176
+ text += '\n'
177
+
178
+ def streamer():
179
+ for i, t, v in self.get_tokens_unprocessed(text):
180
+ yield t, v
181
+ stream = streamer()
182
+ if not unfiltered:
183
+ stream = apply_filters(stream, self.filters, self)
184
+ return stream
185
+
186
+ def get_tokens_unprocessed(self, text):
187
+ """
188
+ Return an iterable of (tokentype, value) pairs.
189
+ In subclasses, implement this method as a generator to
190
+ maximize effectiveness.
191
+ """
192
+ raise NotImplementedError
193
+
194
+
195
+ class DelegatingLexer(Lexer):
196
+ """
197
+ This lexer takes two lexer as arguments. A root lexer and
198
+ a language lexer. First everything is scanned using the language
199
+ lexer, afterwards all ``Other`` tokens are lexed using the root
200
+ lexer.
201
+
202
+ The lexers from the ``template`` lexer package use this base lexer.
203
+ """
204
+
205
+ def __init__(self, _root_lexer, _language_lexer, _needle=Other, **options):
206
+ self.root_lexer = _root_lexer(**options)
207
+ self.language_lexer = _language_lexer(**options)
208
+ self.needle = _needle
209
+ Lexer.__init__(self, **options)
210
+
211
+ def get_tokens_unprocessed(self, text):
212
+ buffered = ''
213
+ insertions = []
214
+ lng_buffer = []
215
+ for i, t, v in self.language_lexer.get_tokens_unprocessed(text):
216
+ if t is self.needle:
217
+ if lng_buffer:
218
+ insertions.append((len(buffered), lng_buffer))
219
+ lng_buffer = []
220
+ buffered += v
221
+ else:
222
+ lng_buffer.append((i, t, v))
223
+ if lng_buffer:
224
+ insertions.append((len(buffered), lng_buffer))
225
+ return do_insertions(insertions,
226
+ self.root_lexer.get_tokens_unprocessed(buffered))
227
+
228
+
229
+ #-------------------------------------------------------------------------------
230
+ # RegexLexer and ExtendedRegexLexer
231
+ #
232
+
233
+
234
+ class include(str):
235
+ """
236
+ Indicates that a state should include rules from another state.
237
+ """
238
+ pass
239
+
240
+
241
+ class combined(tuple):
242
+ """
243
+ Indicates a state combined from multiple states.
244
+ """
245
+
246
+ def __new__(cls, *args):
247
+ return tuple.__new__(cls, args)
248
+
249
+ def __init__(self, *args):
250
+ # tuple.__init__ doesn't do anything
251
+ pass
252
+
253
+
254
+ class _PseudoMatch(object):
255
+ """
256
+ A pseudo match object constructed from a string.
257
+ """
258
+
259
+ def __init__(self, start, text):
260
+ self._text = text
261
+ self._start = start
262
+
263
+ def start(self, arg=None):
264
+ return self._start
265
+
266
+ def end(self, arg=None):
267
+ return self._start + len(self._text)
268
+
269
+ def group(self, arg=None):
270
+ if arg:
271
+ raise IndexError('No such group')
272
+ return self._text
273
+
274
+ def groups(self):
275
+ return (self._text,)
276
+
277
+ def groupdict(self):
278
+ return {}
279
+
280
+
281
+ def bygroups(*args):
282
+ """
283
+ Callback that yields multiple actions for each group in the match.
284
+ """
285
+ def callback(lexer, match, ctx=None):
286
+ for i, action in enumerate(args):
287
+ if action is None:
288
+ continue
289
+ elif type(action) is _TokenType:
290
+ data = match.group(i + 1)
291
+ if data:
292
+ yield match.start(i + 1), action, data
293
+ else:
294
+ data = match.group(i + 1)
295
+ if data is not None:
296
+ if ctx:
297
+ ctx.pos = match.start(i + 1)
298
+ for item in action(lexer, _PseudoMatch(match.start(i + 1),
299
+ data), ctx):
300
+ if item:
301
+ yield item
302
+ if ctx:
303
+ ctx.pos = match.end()
304
+ return callback
305
+
306
+
307
+ class _This(object):
308
+ """
309
+ Special singleton used for indicating the caller class.
310
+ Used by ``using``.
311
+ """
312
+ this = _This()
313
+
314
+
315
+ def using(_other, **kwargs):
316
+ """
317
+ Callback that processes the match with a different lexer.
318
+
319
+ The keyword arguments are forwarded to the lexer, except `state` which
320
+ is handled separately.
321
+
322
+ `state` specifies the state that the new lexer will start in, and can
323
+ be an enumerable such as ('root', 'inline', 'string') or a simple
324
+ string which is assumed to be on top of the root state.
325
+
326
+ Note: For that to work, `_other` must not be an `ExtendedRegexLexer`.
327
+ """
328
+ gt_kwargs = {}
329
+ if 'state' in kwargs:
330
+ s = kwargs.pop('state')
331
+ if isinstance(s, (list, tuple)):
332
+ gt_kwargs['stack'] = s
333
+ else:
334
+ gt_kwargs['stack'] = ('root', s)
335
+
336
+ if _other is this:
337
+ def callback(lexer, match, ctx=None):
338
+ # if keyword arguments are given the callback
339
+ # function has to create a new lexer instance
340
+ if kwargs:
341
+ # XXX: cache that somehow
342
+ kwargs.update(lexer.options)
343
+ lx = lexer.__class__(**kwargs)
344
+ else:
345
+ lx = lexer
346
+ s = match.start()
347
+ for i, t, v in lx.get_tokens_unprocessed(match.group(), **gt_kwargs):
348
+ yield i + s, t, v
349
+ if ctx:
350
+ ctx.pos = match.end()
351
+ else:
352
+ def callback(lexer, match, ctx=None):
353
+ # XXX: cache that somehow
354
+ kwargs.update(lexer.options)
355
+ lx = _other(**kwargs)
356
+
357
+ s = match.start()
358
+ for i, t, v in lx.get_tokens_unprocessed(match.group(), **gt_kwargs):
359
+ yield i + s, t, v
360
+ if ctx:
361
+ ctx.pos = match.end()
362
+ return callback
363
+
364
+
365
+ class RegexLexerMeta(LexerMeta):
366
+ """
367
+ Metaclass for RegexLexer, creates the self._tokens attribute from
368
+ self.tokens on the first instantiation.
369
+ """
370
+
371
+ def _process_regex(cls, regex, rflags):
372
+ """Preprocess the regular expression component of a token definition."""
373
+ return re.compile(regex, rflags).match
374
+
375
+ def _process_token(cls, token):
376
+ """Preprocess the token component of a token definition."""
377
+ assert type(token) is _TokenType or callable(token), \
378
+ 'token type must be simple type or callable, not %r' % (token,)
379
+ return token
380
+
381
+ def _process_new_state(cls, new_state, unprocessed, processed):
382
+ """Preprocess the state transition action of a token definition."""
383
+ if isinstance(new_state, str):
384
+ # an existing state
385
+ if new_state == '#pop':
386
+ return -1
387
+ elif new_state in unprocessed:
388
+ return (new_state,)
389
+ elif new_state == '#push':
390
+ return new_state
391
+ elif new_state[:5] == '#pop:':
392
+ return -int(new_state[5:])
393
+ else:
394
+ assert False, 'unknown new state %r' % new_state
395
+ elif isinstance(new_state, combined):
396
+ # combine a new state from existing ones
397
+ tmp_state = '_tmp_%d' % cls._tmpname
398
+ cls._tmpname += 1
399
+ itokens = []
400
+ for istate in new_state:
401
+ assert istate != new_state, 'circular state ref %r' % istate
402
+ itokens.extend(cls._process_state(unprocessed,
403
+ processed, istate))
404
+ processed[tmp_state] = itokens
405
+ return (tmp_state,)
406
+ elif isinstance(new_state, tuple):
407
+ # push more than one state
408
+ for istate in new_state:
409
+ assert (istate in unprocessed or
410
+ istate in ('#pop', '#push')), \
411
+ 'unknown new state ' + istate
412
+ return new_state
413
+ else:
414
+ assert False, 'unknown new state def %r' % new_state
415
+
416
+ def _process_state(cls, unprocessed, processed, state):
417
+ """Preprocess a single state definition."""
418
+ assert type(state) is str, "wrong state name %r" % state
419
+ assert state[0] != '#', "invalid state name %r" % state
420
+ if state in processed:
421
+ return processed[state]
422
+ tokens = processed[state] = []
423
+ rflags = cls.flags
424
+ for tdef in unprocessed[state]:
425
+ if isinstance(tdef, include):
426
+ # it's a state reference
427
+ assert tdef != state, "circular state reference %r" % state
428
+ tokens.extend(cls._process_state(unprocessed, processed,
429
+ str(tdef)))
430
+ continue
431
+
432
+ assert type(tdef) is tuple, "wrong rule def %r" % tdef
433
+
434
+ try:
435
+ rex = cls._process_regex(tdef[0], rflags)
436
+ except Exception, err:
437
+ raise ValueError("uncompilable regex %r in state %r of %r: %s" %
438
+ (tdef[0], state, cls, err))
439
+
440
+ token = cls._process_token(tdef[1])
441
+
442
+ if len(tdef) == 2:
443
+ new_state = None
444
+ else:
445
+ new_state = cls._process_new_state(tdef[2],
446
+ unprocessed, processed)
447
+
448
+ tokens.append((rex, token, new_state))
449
+ return tokens
450
+
451
+ def process_tokendef(cls, name, tokendefs=None):
452
+ """Preprocess a dictionary of token definitions."""
453
+ processed = cls._all_tokens[name] = {}
454
+ tokendefs = tokendefs or cls.tokens[name]
455
+ for state in tokendefs.keys():
456
+ cls._process_state(tokendefs, processed, state)
457
+ return processed
458
+
459
+ def __call__(cls, *args, **kwds):
460
+ """Instantiate cls after preprocessing its token definitions."""
461
+ if '_tokens' not in cls.__dict__:
462
+ cls._all_tokens = {}
463
+ cls._tmpname = 0
464
+ if hasattr(cls, 'token_variants') and cls.token_variants:
465
+ # don't process yet
466
+ pass
467
+ else:
468
+ cls._tokens = cls.process_tokendef('', cls.tokens)
469
+
470
+ return type.__call__(cls, *args, **kwds)
471
+
472
+
473
+ class RegexLexer(Lexer):
474
+ """
475
+ Base for simple stateful regular expression-based lexers.
476
+ Simplifies the lexing process so that you need only
477
+ provide a list of states and regular expressions.
478
+ """
479
+ __metaclass__ = RegexLexerMeta
480
+
481
+ #: Flags for compiling the regular expressions.
482
+ #: Defaults to MULTILINE.
483
+ flags = re.MULTILINE
484
+
485
+ #: Dict of ``{'state': [(regex, tokentype, new_state), ...], ...}``
486
+ #:
487
+ #: The initial state is 'root'.
488
+ #: ``new_state`` can be omitted to signify no state transition.
489
+ #: If it is a string, the state is pushed on the stack and changed.
490
+ #: If it is a tuple of strings, all states are pushed on the stack and
491
+ #: the current state will be the topmost.
492
+ #: It can also be ``combined('state1', 'state2', ...)``
493
+ #: to signify a new, anonymous state combined from the rules of two
494
+ #: or more existing ones.
495
+ #: Furthermore, it can be '#pop' to signify going back one step in
496
+ #: the state stack, or '#push' to push the current state on the stack
497
+ #: again.
498
+ #:
499
+ #: The tuple can also be replaced with ``include('state')``, in which
500
+ #: case the rules from the state named by the string are included in the
501
+ #: current one.
502
+ tokens = {}
503
+
504
+ def get_tokens_unprocessed(self, text, stack=('root',)):
505
+ """
506
+ Split ``text`` into (tokentype, text) pairs.
507
+
508
+ ``stack`` is the inital stack (default: ``['root']``)
509
+ """
510
+ pos = 0
511
+ tokendefs = self._tokens
512
+ statestack = list(stack)
513
+ statetokens = tokendefs[statestack[-1]]
514
+ while 1:
515
+ for rexmatch, action, new_state in statetokens:
516
+ m = rexmatch(text, pos)
517
+ if m:
518
+ if type(action) is _TokenType:
519
+ yield pos, action, m.group()
520
+ else:
521
+ for item in action(self, m):
522
+ yield item
523
+ pos = m.end()
524
+ if new_state is not None:
525
+ # state transition
526
+ if isinstance(new_state, tuple):
527
+ for state in new_state:
528
+ if state == '#pop':
529
+ statestack.pop()
530
+ elif state == '#push':
531
+ statestack.append(statestack[-1])
532
+ else:
533
+ statestack.append(state)
534
+ elif isinstance(new_state, int):
535
+ # pop
536
+ del statestack[new_state:]
537
+ elif new_state == '#push':
538
+ statestack.append(statestack[-1])
539
+ else:
540
+ assert False, "wrong state def: %r" % new_state
541
+ statetokens = tokendefs[statestack[-1]]
542
+ break
543
+ else:
544
+ try:
545
+ if text[pos] == '\n':
546
+ # at EOL, reset state to "root"
547
+ statestack = ['root']
548
+ statetokens = tokendefs['root']
549
+ yield pos, Text, u'\n'
550
+ pos += 1
551
+ continue
552
+ yield pos, Error, text[pos]
553
+ pos += 1
554
+ except IndexError:
555
+ break
556
+
557
+
558
+ class LexerContext(object):
559
+ """
560
+ A helper object that holds lexer position data.
561
+ """
562
+
563
+ def __init__(self, text, pos, stack=None, end=None):
564
+ self.text = text
565
+ self.pos = pos
566
+ self.end = end or len(text) # end=0 not supported ;-)
567
+ self.stack = stack or ['root']
568
+
569
+ def __repr__(self):
570
+ return 'LexerContext(%r, %r, %r)' % (
571
+ self.text, self.pos, self.stack)
572
+
573
+
574
+ class ExtendedRegexLexer(RegexLexer):
575
+ """
576
+ A RegexLexer that uses a context object to store its state.
577
+ """
578
+
579
+ def get_tokens_unprocessed(self, text=None, context=None):
580
+ """
581
+ Split ``text`` into (tokentype, text) pairs.
582
+ If ``context`` is given, use this lexer context instead.
583
+ """
584
+ tokendefs = self._tokens
585
+ if not context:
586
+ ctx = LexerContext(text, 0)
587
+ statetokens = tokendefs['root']
588
+ else:
589
+ ctx = context
590
+ statetokens = tokendefs[ctx.stack[-1]]
591
+ text = ctx.text
592
+ while 1:
593
+ for rexmatch, action, new_state in statetokens:
594
+ m = rexmatch(text, ctx.pos, ctx.end)
595
+ if m:
596
+ if type(action) is _TokenType:
597
+ yield ctx.pos, action, m.group()
598
+ ctx.pos = m.end()
599
+ else:
600
+ for item in action(self, m, ctx):
601
+ yield item
602
+ if not new_state:
603
+ # altered the state stack?
604
+ statetokens = tokendefs[ctx.stack[-1]]
605
+ # CAUTION: callback must set ctx.pos!
606
+ if new_state is not None:
607
+ # state transition
608
+ if isinstance(new_state, tuple):
609
+ ctx.stack.extend(new_state)
610
+ elif isinstance(new_state, int):
611
+ # pop
612
+ del ctx.stack[new_state:]
613
+ elif new_state == '#push':
614
+ ctx.stack.append(ctx.stack[-1])
615
+ else:
616
+ assert False, "wrong state def: %r" % new_state
617
+ statetokens = tokendefs[ctx.stack[-1]]
618
+ break
619
+ else:
620
+ try:
621
+ if ctx.pos >= ctx.end:
622
+ break
623
+ if text[ctx.pos] == '\n':
624
+ # at EOL, reset state to "root"
625
+ ctx.pos += 1
626
+ ctx.stack = ['root']
627
+ statetokens = tokendefs['root']
628
+ yield ctx.pos, Text, u'\n'
629
+ continue
630
+ yield ctx.pos, Error, text[ctx.pos]
631
+ ctx.pos += 1
632
+ except IndexError:
633
+ break
634
+
635
+
636
+ def do_insertions(insertions, tokens):
637
+ """
638
+ Helper for lexers which must combine the results of several
639
+ sublexers.
640
+
641
+ ``insertions`` is a list of ``(index, itokens)`` pairs.
642
+ Each ``itokens`` iterable should be inserted at position
643
+ ``index`` into the token stream given by the ``tokens``
644
+ argument.
645
+
646
+ The result is a combined token stream.
647
+
648
+ TODO: clean up the code here.
649
+ """
650
+ insertions = iter(insertions)
651
+ try:
652
+ index, itokens = insertions.next()
653
+ except StopIteration:
654
+ # no insertions
655
+ for item in tokens:
656
+ yield item
657
+ return
658
+
659
+ realpos = None
660
+ insleft = True
661
+
662
+ # iterate over the token stream where we want to insert
663
+ # the tokens from the insertion list.
664
+ for i, t, v in tokens:
665
+ # first iteration. store the postition of first item
666
+ if realpos is None:
667
+ realpos = i
668
+ oldi = 0
669
+ while insleft and i + len(v) >= index:
670
+ tmpval = v[oldi:index - i]
671
+ yield realpos, t, tmpval
672
+ realpos += len(tmpval)
673
+ for it_index, it_token, it_value in itokens:
674
+ yield realpos, it_token, it_value
675
+ realpos += len(it_value)
676
+ oldi = index - i
677
+ try:
678
+ index, itokens = insertions.next()
679
+ except StopIteration:
680
+ insleft = False
681
+ break # not strictly necessary
682
+ yield realpos, t, v[oldi:]
683
+ realpos += len(v) - oldi
684
+
685
+ # leftover tokens
686
+ while insleft:
687
+ # no normal tokens, set realpos to zero
688
+ realpos = realpos or 0
689
+ for p, t, v in itokens:
690
+ yield realpos, t, v
691
+ realpos += len(v)
692
+ try:
693
+ index, itokens = insertions.next()
694
+ except StopIteration:
695
+ insleft = False
696
+ break # not strictly necessary
697
+