redsnow 0.0.8

Sign up to get free protection for your applications and to get access to all the features.
Files changed (174) hide show
  1. checksums.yaml +7 -0
  2. data/.gitignore +34 -0
  3. data/.gitmodules +3 -0
  4. data/.travis.yml +20 -0
  5. data/CHANGELOG.md +4 -0
  6. data/Gemfile +4 -0
  7. data/LICENSE +21 -0
  8. data/README.md +62 -0
  9. data/Rakefile +36 -0
  10. data/Vagrantfile +20 -0
  11. data/ext/snowcrash/Makefile +64 -0
  12. data/ext/snowcrash/Vagrantfile +20 -0
  13. data/ext/snowcrash/bin/snowcrash +0 -0
  14. data/ext/snowcrash/common.gypi +163 -0
  15. data/ext/snowcrash/config.gypi +10 -0
  16. data/ext/snowcrash/config.mk +5 -0
  17. data/ext/snowcrash/configure +213 -0
  18. data/ext/snowcrash/provisioning.sh +15 -0
  19. data/ext/snowcrash/snowcrash.gyp +141 -0
  20. data/ext/snowcrash/src/ActionParser.h +503 -0
  21. data/ext/snowcrash/src/AssetParser.h +215 -0
  22. data/ext/snowcrash/src/BlockUtility.h +186 -0
  23. data/ext/snowcrash/src/Blueprint.h +283 -0
  24. data/ext/snowcrash/src/BlueprintParser.h +347 -0
  25. data/ext/snowcrash/src/BlueprintParserCore.h +190 -0
  26. data/ext/snowcrash/src/BlueprintSection.h +140 -0
  27. data/ext/snowcrash/src/BlueprintUtility.h +126 -0
  28. data/ext/snowcrash/src/CBlueprint.cc +600 -0
  29. data/ext/snowcrash/src/CBlueprint.h +354 -0
  30. data/ext/snowcrash/src/CSourceAnnotation.cc +140 -0
  31. data/ext/snowcrash/src/CSourceAnnotation.h +106 -0
  32. data/ext/snowcrash/src/CodeBlockUtility.h +189 -0
  33. data/ext/snowcrash/src/DescriptionSectionUtility.h +156 -0
  34. data/ext/snowcrash/src/HTTP.cc +46 -0
  35. data/ext/snowcrash/src/HTTP.h +105 -0
  36. data/ext/snowcrash/src/HeaderParser.h +289 -0
  37. data/ext/snowcrash/src/ListBlockUtility.h +273 -0
  38. data/ext/snowcrash/src/ListUtility.h +95 -0
  39. data/ext/snowcrash/src/MarkdownBlock.cc +176 -0
  40. data/ext/snowcrash/src/MarkdownBlock.h +93 -0
  41. data/ext/snowcrash/src/MarkdownParser.cc +266 -0
  42. data/ext/snowcrash/src/MarkdownParser.h +88 -0
  43. data/ext/snowcrash/src/ParameterDefinitonParser.h +570 -0
  44. data/ext/snowcrash/src/ParametersParser.h +252 -0
  45. data/ext/snowcrash/src/Parser.cc +71 -0
  46. data/ext/snowcrash/src/Parser.h +29 -0
  47. data/ext/snowcrash/src/ParserCore.cc +120 -0
  48. data/ext/snowcrash/src/ParserCore.h +82 -0
  49. data/ext/snowcrash/src/PayloadParser.h +672 -0
  50. data/ext/snowcrash/src/Platform.h +54 -0
  51. data/ext/snowcrash/src/RegexMatch.h +32 -0
  52. data/ext/snowcrash/src/ResourceGroupParser.h +195 -0
  53. data/ext/snowcrash/src/ResourceParser.h +584 -0
  54. data/ext/snowcrash/src/SectionUtility.h +142 -0
  55. data/ext/snowcrash/src/Serialize.cc +52 -0
  56. data/ext/snowcrash/src/Serialize.h +69 -0
  57. data/ext/snowcrash/src/SerializeJSON.cc +601 -0
  58. data/ext/snowcrash/src/SerializeJSON.h +21 -0
  59. data/ext/snowcrash/src/SerializeYAML.cc +336 -0
  60. data/ext/snowcrash/src/SerializeYAML.h +21 -0
  61. data/ext/snowcrash/src/SourceAnnotation.h +177 -0
  62. data/ext/snowcrash/src/StringUtility.h +109 -0
  63. data/ext/snowcrash/src/SymbolTable.h +83 -0
  64. data/ext/snowcrash/src/UriTemplateParser.cc +195 -0
  65. data/ext/snowcrash/src/UriTemplateParser.h +243 -0
  66. data/ext/snowcrash/src/Version.h +39 -0
  67. data/ext/snowcrash/src/csnowcrash.cc +23 -0
  68. data/ext/snowcrash/src/csnowcrash.h +38 -0
  69. data/ext/snowcrash/src/posix/RegexMatch.cc +99 -0
  70. data/ext/snowcrash/src/snowcrash.cc +18 -0
  71. data/ext/snowcrash/src/snowcrash.h +41 -0
  72. data/ext/snowcrash/src/snowcrash/snowcrash.cc +170 -0
  73. data/ext/snowcrash/src/win/RegexMatch.cc +78 -0
  74. data/ext/snowcrash/sundown/CONTRIBUTING.md +10 -0
  75. data/ext/snowcrash/sundown/Makefile +83 -0
  76. data/ext/snowcrash/sundown/Makefile.win +33 -0
  77. data/ext/snowcrash/sundown/examples/smartypants.c +72 -0
  78. data/ext/snowcrash/sundown/examples/sundown.c +80 -0
  79. data/ext/snowcrash/sundown/html/houdini.h +37 -0
  80. data/ext/snowcrash/sundown/html/houdini_href_e.c +108 -0
  81. data/ext/snowcrash/sundown/html/houdini_html_e.c +84 -0
  82. data/ext/snowcrash/sundown/html/html.c +647 -0
  83. data/ext/snowcrash/sundown/html/html.h +77 -0
  84. data/ext/snowcrash/sundown/html/html_smartypants.c +389 -0
  85. data/ext/snowcrash/sundown/html_block_names.txt +25 -0
  86. data/ext/snowcrash/sundown/src/autolink.c +297 -0
  87. data/ext/snowcrash/sundown/src/autolink.h +51 -0
  88. data/ext/snowcrash/sundown/src/buffer.c +225 -0
  89. data/ext/snowcrash/sundown/src/buffer.h +96 -0
  90. data/ext/snowcrash/sundown/src/html_blocks.h +206 -0
  91. data/ext/snowcrash/sundown/src/markdown.c +2701 -0
  92. data/ext/snowcrash/sundown/src/markdown.h +147 -0
  93. data/ext/snowcrash/sundown/src/src_map.c +200 -0
  94. data/ext/snowcrash/sundown/src/src_map.h +58 -0
  95. data/ext/snowcrash/sundown/src/stack.c +81 -0
  96. data/ext/snowcrash/sundown/src/stack.h +29 -0
  97. data/ext/snowcrash/sundown/sundown.def +20 -0
  98. data/ext/snowcrash/tools/gyp/AUTHORS +11 -0
  99. data/ext/snowcrash/tools/gyp/DEPS +24 -0
  100. data/ext/snowcrash/tools/gyp/OWNERS +1 -0
  101. data/ext/snowcrash/tools/gyp/PRESUBMIT.py +120 -0
  102. data/ext/snowcrash/tools/gyp/buildbot/buildbot_run.py +190 -0
  103. data/ext/snowcrash/tools/gyp/codereview.settings +10 -0
  104. data/ext/snowcrash/tools/gyp/data/win/large-pdb-shim.cc +12 -0
  105. data/ext/snowcrash/tools/gyp/gyp +8 -0
  106. data/ext/snowcrash/tools/gyp/gyp.bat +5 -0
  107. data/ext/snowcrash/tools/gyp/gyp_main.py +18 -0
  108. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSNew.py +340 -0
  109. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSProject.py +208 -0
  110. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSSettings.py +1063 -0
  111. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSToolFile.py +58 -0
  112. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSUserFile.py +147 -0
  113. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSUtil.py +267 -0
  114. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSVersion.py +409 -0
  115. data/ext/snowcrash/tools/gyp/pylib/gyp/__init__.py +537 -0
  116. data/ext/snowcrash/tools/gyp/pylib/gyp/__init__.pyc +0 -0
  117. data/ext/snowcrash/tools/gyp/pylib/gyp/common.py +521 -0
  118. data/ext/snowcrash/tools/gyp/pylib/gyp/common.pyc +0 -0
  119. data/ext/snowcrash/tools/gyp/pylib/gyp/easy_xml.py +157 -0
  120. data/ext/snowcrash/tools/gyp/pylib/gyp/flock_tool.py +49 -0
  121. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/__init__.py +0 -0
  122. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/__init__.pyc +0 -0
  123. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/android.py +1069 -0
  124. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/cmake.py +1143 -0
  125. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/dump_dependency_json.py +81 -0
  126. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/eclipse.py +335 -0
  127. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/gypd.py +87 -0
  128. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/gypsh.py +56 -0
  129. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/make.py +2181 -0
  130. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/make.pyc +0 -0
  131. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/msvs.py +3335 -0
  132. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/ninja.py +2156 -0
  133. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/xcode.py +1224 -0
  134. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/xcode.pyc +0 -0
  135. data/ext/snowcrash/tools/gyp/pylib/gyp/input.py +2809 -0
  136. data/ext/snowcrash/tools/gyp/pylib/gyp/input.pyc +0 -0
  137. data/ext/snowcrash/tools/gyp/pylib/gyp/mac_tool.py +510 -0
  138. data/ext/snowcrash/tools/gyp/pylib/gyp/msvs_emulation.py +972 -0
  139. data/ext/snowcrash/tools/gyp/pylib/gyp/ninja_syntax.py +160 -0
  140. data/ext/snowcrash/tools/gyp/pylib/gyp/ordered_dict.py +289 -0
  141. data/ext/snowcrash/tools/gyp/pylib/gyp/win_tool.py +292 -0
  142. data/ext/snowcrash/tools/gyp/pylib/gyp/xcode_emulation.py +1440 -0
  143. data/ext/snowcrash/tools/gyp/pylib/gyp/xcode_emulation.pyc +0 -0
  144. data/ext/snowcrash/tools/gyp/pylib/gyp/xcodeproj_file.py +2889 -0
  145. data/ext/snowcrash/tools/gyp/pylib/gyp/xcodeproj_file.pyc +0 -0
  146. data/ext/snowcrash/tools/gyp/pylib/gyp/xml_fix.py +69 -0
  147. data/ext/snowcrash/tools/gyp/pylintrc +307 -0
  148. data/ext/snowcrash/tools/gyp/samples/samples +81 -0
  149. data/ext/snowcrash/tools/gyp/samples/samples.bat +5 -0
  150. data/ext/snowcrash/tools/gyp/setup.py +19 -0
  151. data/ext/snowcrash/tools/gyp/tools/Xcode/Specifications/gyp.pbfilespec +27 -0
  152. data/ext/snowcrash/tools/gyp/tools/Xcode/Specifications/gyp.xclangspec +226 -0
  153. data/ext/snowcrash/tools/gyp/tools/emacs/gyp.el +252 -0
  154. data/ext/snowcrash/tools/gyp/tools/graphviz.py +100 -0
  155. data/ext/snowcrash/tools/gyp/tools/pretty_gyp.py +155 -0
  156. data/ext/snowcrash/tools/gyp/tools/pretty_sln.py +168 -0
  157. data/ext/snowcrash/tools/gyp/tools/pretty_vcproj.py +329 -0
  158. data/ext/snowcrash/tools/homebrew/snowcrash.rb +11 -0
  159. data/ext/snowcrash/vcbuild.bat +184 -0
  160. data/lib/redsnow.rb +31 -0
  161. data/lib/redsnow/binding.rb +132 -0
  162. data/lib/redsnow/blueprint.rb +365 -0
  163. data/lib/redsnow/object.rb +18 -0
  164. data/lib/redsnow/parseresult.rb +107 -0
  165. data/lib/redsnow/version.rb +4 -0
  166. data/provisioning.sh +20 -0
  167. data/redsnow.gemspec +35 -0
  168. data/test/_helper.rb +15 -0
  169. data/test/fixtures/sample-api-ast.json +97 -0
  170. data/test/fixtures/sample-api.apib +20 -0
  171. data/test/redsnow_binding_test.rb +35 -0
  172. data/test/redsnow_parseresult_test.rb +50 -0
  173. data/test/redsnow_test.rb +285 -0
  174. metadata +358 -0
@@ -0,0 +1,96 @@
1
+ /*
2
+ * Copyright (c) 2008, Natacha Porté
3
+ * Copyright (c) 2011, Vicent Martí
4
+ *
5
+ * Permission to use, copy, modify, and distribute this software for any
6
+ * purpose with or without fee is hereby granted, provided that the above
7
+ * copyright notice and this permission notice appear in all copies.
8
+ *
9
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
16
+ */
17
+
18
+ #ifndef BUFFER_H__
19
+ #define BUFFER_H__
20
+
21
+ #include <stddef.h>
22
+ #include <stdarg.h>
23
+ #include <stdint.h>
24
+
25
+ #ifdef __cplusplus
26
+ extern "C" {
27
+ #endif
28
+
29
+ #if defined(_MSC_VER)
30
+ #define __attribute__(x)
31
+ #define inline
32
+ #endif
33
+
34
+ typedef enum {
35
+ BUF_OK = 0,
36
+ BUF_ENOMEM = -1
37
+ } buferror_t;
38
+
39
+ /* struct buf: character array buffer */
40
+ struct buf {
41
+ uint8_t *data; /* actual character data */
42
+ size_t size; /* size of the string */
43
+ size_t asize; /* allocated size (0 = volatile buffer) */
44
+ size_t unit; /* reallocation unit size (0 = read-only buffer) */
45
+ };
46
+
47
+ /* CONST_BUF: global buffer from a string litteral */
48
+ #define BUF_STATIC(string) \
49
+ { (uint8_t *)string, sizeof string -1, sizeof string, 0, 0 }
50
+
51
+ /* VOLATILE_BUF: macro for creating a volatile buffer on the stack */
52
+ #define BUF_VOLATILE(strname) \
53
+ { (uint8_t *)strname, strlen(strname), 0, 0, 0 }
54
+
55
+ /* BUFPUTSL: optimized bufputs of a string litteral */
56
+ #define BUFPUTSL(output, literal) \
57
+ bufput(output, literal, sizeof literal - 1)
58
+
59
+ /* bufgrow: increasing the allocated size to the given value */
60
+ int bufgrow(struct buf *, size_t);
61
+
62
+ /* bufnew: allocation of a new buffer */
63
+ struct buf *bufnew(size_t) __attribute__ ((malloc));
64
+
65
+ /* bufnullterm: NUL-termination of the string array (making a C-string) */
66
+ const char *bufcstr(struct buf *);
67
+
68
+ /* bufprefix: compare the beginning of a buffer with a string */
69
+ int bufprefix(const struct buf *buf, const char *prefix);
70
+
71
+ /* bufput: appends raw data to a buffer */
72
+ void bufput(struct buf *, const void *, size_t);
73
+
74
+ /* bufputs: appends a NUL-terminated string to a buffer */
75
+ void bufputs(struct buf *, const char *);
76
+
77
+ /* bufputc: appends a single char to a buffer */
78
+ void bufputc(struct buf *, int);
79
+
80
+ /* bufrelease: decrease the reference count and free the buffer if needed */
81
+ void bufrelease(struct buf *);
82
+
83
+ /* bufreset: frees internal data of the buffer */
84
+ void bufreset(struct buf *);
85
+
86
+ /* bufslurp: removes a given number of bytes from the head of the array */
87
+ void bufslurp(struct buf *, size_t);
88
+
89
+ /* bufprintf: formatted printing to a buffer */
90
+ void bufprintf(struct buf *, const char *, ...) __attribute__ ((format (printf, 2, 3)));
91
+
92
+ #ifdef __cplusplus
93
+ }
94
+ #endif
95
+
96
+ #endif
@@ -0,0 +1,206 @@
1
+ /* C code produced by gperf version 3.0.3 */
2
+ /* Command-line: gperf -N find_block_tag -H hash_block_tag -C -c -E --ignore-case html_block_names.txt */
3
+ /* Computed positions: -k'1-2' */
4
+
5
+ #if !((' ' == 32) && ('!' == 33) && ('"' == 34) && ('#' == 35) \
6
+ && ('%' == 37) && ('&' == 38) && ('\'' == 39) && ('(' == 40) \
7
+ && (')' == 41) && ('*' == 42) && ('+' == 43) && (',' == 44) \
8
+ && ('-' == 45) && ('.' == 46) && ('/' == 47) && ('0' == 48) \
9
+ && ('1' == 49) && ('2' == 50) && ('3' == 51) && ('4' == 52) \
10
+ && ('5' == 53) && ('6' == 54) && ('7' == 55) && ('8' == 56) \
11
+ && ('9' == 57) && (':' == 58) && (';' == 59) && ('<' == 60) \
12
+ && ('=' == 61) && ('>' == 62) && ('?' == 63) && ('A' == 65) \
13
+ && ('B' == 66) && ('C' == 67) && ('D' == 68) && ('E' == 69) \
14
+ && ('F' == 70) && ('G' == 71) && ('H' == 72) && ('I' == 73) \
15
+ && ('J' == 74) && ('K' == 75) && ('L' == 76) && ('M' == 77) \
16
+ && ('N' == 78) && ('O' == 79) && ('P' == 80) && ('Q' == 81) \
17
+ && ('R' == 82) && ('S' == 83) && ('T' == 84) && ('U' == 85) \
18
+ && ('V' == 86) && ('W' == 87) && ('X' == 88) && ('Y' == 89) \
19
+ && ('Z' == 90) && ('[' == 91) && ('\\' == 92) && (']' == 93) \
20
+ && ('^' == 94) && ('_' == 95) && ('a' == 97) && ('b' == 98) \
21
+ && ('c' == 99) && ('d' == 100) && ('e' == 101) && ('f' == 102) \
22
+ && ('g' == 103) && ('h' == 104) && ('i' == 105) && ('j' == 106) \
23
+ && ('k' == 107) && ('l' == 108) && ('m' == 109) && ('n' == 110) \
24
+ && ('o' == 111) && ('p' == 112) && ('q' == 113) && ('r' == 114) \
25
+ && ('s' == 115) && ('t' == 116) && ('u' == 117) && ('v' == 118) \
26
+ && ('w' == 119) && ('x' == 120) && ('y' == 121) && ('z' == 122) \
27
+ && ('{' == 123) && ('|' == 124) && ('}' == 125) && ('~' == 126))
28
+ /* The character set is not based on ISO-646. */
29
+ error "gperf generated tables don't work with this execution character set. Please report a bug to <bug-gnu-gperf@gnu.org>."
30
+ #endif
31
+
32
+ /* maximum key range = 37, duplicates = 0 */
33
+
34
+ #ifndef GPERF_DOWNCASE
35
+ #define GPERF_DOWNCASE 1
36
+ static unsigned char gperf_downcase[256] =
37
+ {
38
+ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14,
39
+ 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
40
+ 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44,
41
+ 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59,
42
+ 60, 61, 62, 63, 64, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106,
43
+ 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121,
44
+ 122, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104,
45
+ 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119,
46
+ 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134,
47
+ 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149,
48
+ 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164,
49
+ 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179,
50
+ 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194,
51
+ 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209,
52
+ 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224,
53
+ 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239,
54
+ 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254,
55
+ 255
56
+ };
57
+ #endif
58
+
59
+ #ifndef GPERF_CASE_STRNCMP
60
+ #define GPERF_CASE_STRNCMP 1
61
+ static int
62
+ gperf_case_strncmp (s1, s2, n)
63
+ register const char *s1;
64
+ register const char *s2;
65
+ register unsigned int n;
66
+ {
67
+ for (; n > 0;)
68
+ {
69
+ unsigned char c1 = gperf_downcase[(unsigned char)*s1++];
70
+ unsigned char c2 = gperf_downcase[(unsigned char)*s2++];
71
+ if (c1 != 0 && c1 == c2)
72
+ {
73
+ n--;
74
+ continue;
75
+ }
76
+ return (int)c1 - (int)c2;
77
+ }
78
+ return 0;
79
+ }
80
+ #endif
81
+
82
+ #ifdef __GNUC__
83
+ __inline
84
+ #else
85
+ #ifdef __cplusplus
86
+ inline
87
+ #endif
88
+ #endif
89
+ static unsigned int
90
+ hash_block_tag (str, len)
91
+ register const char *str;
92
+ register unsigned int len;
93
+ {
94
+ static const unsigned char asso_values[] =
95
+ {
96
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
97
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
98
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
99
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
100
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
101
+ 8, 30, 25, 20, 15, 10, 38, 38, 38, 38,
102
+ 38, 38, 38, 38, 38, 38, 0, 38, 0, 38,
103
+ 5, 5, 5, 15, 0, 38, 38, 0, 15, 10,
104
+ 0, 38, 38, 15, 0, 5, 38, 38, 38, 38,
105
+ 38, 38, 38, 38, 38, 38, 38, 38, 0, 38,
106
+ 0, 38, 5, 5, 5, 15, 0, 38, 38, 0,
107
+ 15, 10, 0, 38, 38, 15, 0, 5, 38, 38,
108
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
109
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
110
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
111
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
112
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
113
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
114
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
115
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
116
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
117
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
118
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
119
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
120
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
121
+ 38, 38, 38, 38, 38, 38, 38
122
+ };
123
+ register int hval = len;
124
+
125
+ switch (hval)
126
+ {
127
+ default:
128
+ hval += asso_values[(unsigned char)str[1]+1];
129
+ /*FALLTHROUGH*/
130
+ case 1:
131
+ hval += asso_values[(unsigned char)str[0]];
132
+ break;
133
+ }
134
+ return hval;
135
+ }
136
+
137
+ #ifdef __GNUC__
138
+ __inline
139
+ #ifdef __GNUC_STDC_INLINE__
140
+ __attribute__ ((__gnu_inline__))
141
+ #endif
142
+ #endif
143
+ const char *
144
+ find_block_tag (str, len)
145
+ register const char *str;
146
+ register unsigned int len;
147
+ {
148
+ enum
149
+ {
150
+ TOTAL_KEYWORDS = 24,
151
+ MIN_WORD_LENGTH = 1,
152
+ MAX_WORD_LENGTH = 10,
153
+ MIN_HASH_VALUE = 1,
154
+ MAX_HASH_VALUE = 37
155
+ };
156
+
157
+ static const char * const wordlist[] =
158
+ {
159
+ "",
160
+ "p",
161
+ "dl",
162
+ "div",
163
+ "math",
164
+ "table",
165
+ "",
166
+ "ul",
167
+ "del",
168
+ "form",
169
+ "blockquote",
170
+ "figure",
171
+ "ol",
172
+ "fieldset",
173
+ "",
174
+ "h1",
175
+ "",
176
+ "h6",
177
+ "pre",
178
+ "", "",
179
+ "script",
180
+ "h5",
181
+ "noscript",
182
+ "",
183
+ "style",
184
+ "iframe",
185
+ "h4",
186
+ "ins",
187
+ "", "", "",
188
+ "h3",
189
+ "", "", "", "",
190
+ "h2"
191
+ };
192
+
193
+ if (len <= MAX_WORD_LENGTH && len >= MIN_WORD_LENGTH)
194
+ {
195
+ register int key = hash_block_tag (str, len);
196
+
197
+ if (key <= MAX_HASH_VALUE && key >= 0)
198
+ {
199
+ register const char *s = wordlist[key];
200
+
201
+ if ((((unsigned char)*str ^ (unsigned char)*s) & ~32) == 0 && !gperf_case_strncmp (str, s, len) && s[len] == '\0')
202
+ return s;
203
+ }
204
+ }
205
+ return 0;
206
+ }
@@ -0,0 +1,2701 @@
1
+ /* markdown.c - generic markdown parser */
2
+
3
+ /*
4
+ * Copyright (c) 2009, Natacha Porté
5
+ * Copyright (c) 2011, Vicent Marti
6
+ *
7
+ * Permission to use, copy, modify, and distribute this software for any
8
+ * purpose with or without fee is hereby granted, provided that the above
9
+ * copyright notice and this permission notice appear in all copies.
10
+ *
11
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
12
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
13
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
14
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
17
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18
+ */
19
+
20
+ #include "markdown.h"
21
+ #include "stack.h"
22
+ #include "src_map.h"
23
+
24
+ #include <assert.h>
25
+ #include <string.h>
26
+ #include <ctype.h>
27
+ #include <stdio.h>
28
+
29
+ #if defined(_WIN32)
30
+ #define strncasecmp _strnicmp
31
+ #endif
32
+
33
+ #define REF_TABLE_SIZE 8
34
+
35
+ #define BUFFER_BLOCK 0
36
+ #define BUFFER_SPAN 1
37
+
38
+ #define MKD_LI_END 8 /* internal list flag */
39
+
40
+ #define gperf_case_strncmp(s1, s2, n) strncasecmp(s1, s2, n)
41
+ #define GPERF_DOWNCASE 1
42
+ #define GPERF_CASE_STRNCMP 1
43
+ #include "html_blocks.h"
44
+
45
+ /***************
46
+ * LOCAL TYPES *
47
+ ***************/
48
+
49
+ /* link_ref: reference to a link */
50
+ struct link_ref {
51
+ unsigned int id;
52
+
53
+ struct buf *link;
54
+ struct buf *title;
55
+
56
+ struct link_ref *next;
57
+ };
58
+
59
+ /* char_trigger: function pointer to render active chars */
60
+ /* returns the number of chars taken care of */
61
+ /* data is the pointer of the beginning of the span */
62
+ /* offset is the number of valid chars before data */
63
+ struct sd_markdown;
64
+ typedef size_t
65
+ (*char_trigger)(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
66
+
67
+ static size_t char_emphasis(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
68
+ static size_t char_linebreak(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
69
+ static size_t char_codespan(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
70
+ static size_t char_escape(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
71
+ static size_t char_entity(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
72
+ static size_t char_langle_tag(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
73
+ static size_t char_autolink_url(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
74
+ static size_t char_autolink_email(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
75
+ static size_t char_autolink_www(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
76
+ static size_t char_link(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
77
+ static size_t char_superscript(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
78
+
79
+ enum markdown_char_t {
80
+ MD_CHAR_NONE = 0,
81
+ MD_CHAR_EMPHASIS,
82
+ MD_CHAR_CODESPAN,
83
+ MD_CHAR_LINEBREAK,
84
+ MD_CHAR_LINK,
85
+ MD_CHAR_LANGLE,
86
+ MD_CHAR_ESCAPE,
87
+ MD_CHAR_ENTITITY,
88
+ MD_CHAR_AUTOLINK_URL,
89
+ MD_CHAR_AUTOLINK_EMAIL,
90
+ MD_CHAR_AUTOLINK_WWW,
91
+ MD_CHAR_SUPERSCRIPT,
92
+ };
93
+
94
+ static char_trigger markdown_char_ptrs[] = {
95
+ NULL,
96
+ &char_emphasis,
97
+ &char_codespan,
98
+ &char_linebreak,
99
+ &char_link,
100
+ &char_langle_tag,
101
+ &char_escape,
102
+ &char_entity,
103
+ &char_autolink_url,
104
+ &char_autolink_email,
105
+ &char_autolink_www,
106
+ &char_superscript,
107
+ };
108
+
109
+ /* render • structure containing one particular render */
110
+ struct sd_markdown {
111
+ struct sd_callbacks cb;
112
+ void *opaque;
113
+
114
+ struct link_ref *refs[REF_TABLE_SIZE];
115
+ uint8_t active_char[256];
116
+ struct stack work_bufs[2];
117
+ unsigned int ext_flags;
118
+ size_t max_nesting;
119
+ int in_link_body;
120
+ };
121
+
122
+ /***************************
123
+ * HELPER FUNCTIONS *
124
+ ***************************/
125
+
126
+ static inline struct buf *
127
+ rndr_newbuf(struct sd_markdown *rndr, int type)
128
+ {
129
+ static const size_t buf_size[2] = {256, 64};
130
+ struct buf *work = NULL;
131
+ struct stack *pool = &rndr->work_bufs[type];
132
+
133
+ if (pool->size < pool->asize &&
134
+ pool->item[pool->size] != NULL) {
135
+ work = pool->item[pool->size++];
136
+ work->size = 0;
137
+ } else {
138
+ work = bufnew(buf_size[type]);
139
+ stack_push(pool, work);
140
+ }
141
+
142
+ return work;
143
+ }
144
+
145
+ static inline void
146
+ rndr_popbuf(struct sd_markdown *rndr, int type)
147
+ {
148
+ rndr->work_bufs[type].size--;
149
+ }
150
+
151
+ static void
152
+ unscape_text(struct buf *ob, struct buf *src)
153
+ {
154
+ size_t i = 0, org;
155
+ while (i < src->size) {
156
+ org = i;
157
+ while (i < src->size && src->data[i] != '\\')
158
+ i++;
159
+
160
+ if (i > org)
161
+ bufput(ob, src->data + org, i - org);
162
+
163
+ if (i + 1 >= src->size)
164
+ break;
165
+
166
+ bufputc(ob, src->data[i + 1]);
167
+ i += 2;
168
+ }
169
+ }
170
+
171
+ static unsigned int
172
+ hash_link_ref(const uint8_t *link_ref, size_t length)
173
+ {
174
+ size_t i;
175
+ unsigned int hash = 0;
176
+
177
+ for (i = 0; i < length; ++i)
178
+ hash = tolower(link_ref[i]) + (hash << 6) + (hash << 16) - hash;
179
+
180
+ return hash;
181
+ }
182
+
183
+ static struct link_ref *
184
+ add_link_ref(
185
+ struct link_ref **references,
186
+ const uint8_t *name, size_t name_size)
187
+ {
188
+ struct link_ref *ref = calloc(1, sizeof(struct link_ref));
189
+
190
+ if (!ref)
191
+ return NULL;
192
+
193
+ ref->id = hash_link_ref(name, name_size);
194
+ ref->next = references[ref->id % REF_TABLE_SIZE];
195
+
196
+ references[ref->id % REF_TABLE_SIZE] = ref;
197
+ return ref;
198
+ }
199
+
200
+ static struct link_ref *
201
+ find_link_ref(struct link_ref **references, uint8_t *name, size_t length)
202
+ {
203
+ unsigned int hash = hash_link_ref(name, length);
204
+ struct link_ref *ref = NULL;
205
+
206
+ ref = references[hash % REF_TABLE_SIZE];
207
+
208
+ while (ref != NULL) {
209
+ if (ref->id == hash)
210
+ return ref;
211
+
212
+ ref = ref->next;
213
+ }
214
+
215
+ return NULL;
216
+ }
217
+
218
+ static void
219
+ free_link_refs(struct link_ref **references)
220
+ {
221
+ size_t i;
222
+
223
+ for (i = 0; i < REF_TABLE_SIZE; ++i) {
224
+ struct link_ref *r = references[i];
225
+ struct link_ref *next;
226
+
227
+ while (r) {
228
+ next = r->next;
229
+ bufrelease(r->link);
230
+ bufrelease(r->title);
231
+ free(r);
232
+ r = next;
233
+ }
234
+ }
235
+ }
236
+
237
+ /*
238
+ * Check whether a char is a Markdown space.
239
+
240
+ * Right now we only consider spaces the actual
241
+ * space and a newline: tabs and carriage returns
242
+ * are filtered out during the preprocessing phase.
243
+ *
244
+ * If we wanted to actually be UTF-8 compliant, we
245
+ * should instead extract an Unicode codepoint from
246
+ * this character and check for space properties.
247
+ */
248
+ static inline int
249
+ _isspace(int c)
250
+ {
251
+ return c == ' ' || c == '\n';
252
+ }
253
+
254
+ /****************************
255
+ * INLINE PARSING FUNCTIONS *
256
+ ****************************/
257
+
258
+ /* is_mail_autolink • looks for the address part of a mail autolink and '>' */
259
+ /* this is less strict than the original markdown e-mail address matching */
260
+ static size_t
261
+ is_mail_autolink(uint8_t *data, size_t size)
262
+ {
263
+ size_t i = 0, nb = 0;
264
+
265
+ /* address is assumed to be: [-@._a-zA-Z0-9]+ with exactly one '@' */
266
+ for (i = 0; i < size; ++i) {
267
+ if (isalnum(data[i]))
268
+ continue;
269
+
270
+ switch (data[i]) {
271
+ case '@':
272
+ nb++;
273
+
274
+ case '-':
275
+ case '.':
276
+ case '_':
277
+ break;
278
+
279
+ case '>':
280
+ return (nb == 1) ? i + 1 : 0;
281
+
282
+ default:
283
+ return 0;
284
+ }
285
+ }
286
+
287
+ return 0;
288
+ }
289
+
290
+ /* tag_length • returns the length of the given tag, or 0 is it's not valid */
291
+ static size_t
292
+ tag_length(uint8_t *data, size_t size, enum mkd_autolink *autolink)
293
+ {
294
+ size_t i, j;
295
+
296
+ /* a valid tag can't be shorter than 3 chars */
297
+ if (size < 3) return 0;
298
+
299
+ /* begins with a '<' optionally followed by '/', followed by letter or number */
300
+ if (data[0] != '<') return 0;
301
+ i = (data[1] == '/') ? 2 : 1;
302
+
303
+ if (!isalnum(data[i]))
304
+ return 0;
305
+
306
+ /* scheme test */
307
+ *autolink = MKDA_NOT_AUTOLINK;
308
+
309
+ /* try to find the beginning of an URI */
310
+ while (i < size && (isalnum(data[i]) || data[i] == '.' || data[i] == '+' || data[i] == '-'))
311
+ i++;
312
+
313
+ if (i > 1 && data[i] == '@') {
314
+ if ((j = is_mail_autolink(data + i, size - i)) != 0) {
315
+ *autolink = MKDA_EMAIL;
316
+ return i + j;
317
+ }
318
+ }
319
+
320
+ if (i > 2 && data[i] == ':') {
321
+ *autolink = MKDA_NORMAL;
322
+ i++;
323
+ }
324
+
325
+ /* completing autolink test: no whitespace or ' or " */
326
+ if (i >= size)
327
+ *autolink = MKDA_NOT_AUTOLINK;
328
+
329
+ else if (*autolink) {
330
+ j = i;
331
+
332
+ while (i < size) {
333
+ if (data[i] == '\\') i += 2;
334
+ else if (data[i] == '>' || data[i] == '\'' ||
335
+ data[i] == '"' || data[i] == ' ' || data[i] == '\n')
336
+ break;
337
+ else i++;
338
+ }
339
+
340
+ if (i >= size) return 0;
341
+ if (i > j && data[i] == '>') return i + 1;
342
+ /* one of the forbidden chars has been found */
343
+ *autolink = MKDA_NOT_AUTOLINK;
344
+ }
345
+
346
+ /* looking for sometinhg looking like a tag end */
347
+ while (i < size && data[i] != '>') i++;
348
+ if (i >= size) return 0;
349
+ return i + 1;
350
+ }
351
+
352
+ /* parse_inline • parses inline markdown elements */
353
+ static void
354
+ parse_inline(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
355
+ {
356
+ size_t i = 0, end = 0;
357
+ uint8_t action = 0;
358
+ struct buf work = { 0, 0, 0, 0 };
359
+
360
+ if (rndr->work_bufs[BUFFER_SPAN].size +
361
+ rndr->work_bufs[BUFFER_BLOCK].size > rndr->max_nesting)
362
+ return;
363
+
364
+ while (i < size) {
365
+ /* copying inactive chars into the output */
366
+ while (end < size && (action = rndr->active_char[data[end]]) == 0) {
367
+ end++;
368
+ }
369
+
370
+ if (rndr->cb.normal_text) {
371
+ work.data = data + i;
372
+ work.size = end - i;
373
+ rndr->cb.normal_text(ob, &work, rndr->opaque);
374
+ }
375
+ else
376
+ bufput(ob, data + i, end - i);
377
+
378
+ if (end >= size) break;
379
+ i = end;
380
+
381
+ end = markdown_char_ptrs[(int)action](ob, rndr, data + i, i, size - i);
382
+ if (!end) /* no action from the callback */
383
+ end = i + 1;
384
+ else {
385
+ i += end;
386
+ end = i;
387
+ }
388
+ }
389
+ }
390
+
391
+ /* find_emph_char • looks for the next emph uint8_t, skipping other constructs */
392
+ static size_t
393
+ find_emph_char(uint8_t *data, size_t size, uint8_t c)
394
+ {
395
+ size_t i = 1;
396
+
397
+ while (i < size) {
398
+ while (i < size && data[i] != c && data[i] != '`' && data[i] != '[')
399
+ i++;
400
+
401
+ if (i == size)
402
+ return 0;
403
+
404
+ if (data[i] == c)
405
+ return i;
406
+
407
+ /* not counting escaped chars */
408
+ if (i && data[i - 1] == '\\') {
409
+ i++; continue;
410
+ }
411
+
412
+ if (data[i] == '`') {
413
+ size_t span_nb = 0, bt;
414
+ size_t tmp_i = 0;
415
+
416
+ /* counting the number of opening backticks */
417
+ while (i < size && data[i] == '`') {
418
+ i++; span_nb++;
419
+ }
420
+
421
+ if (i >= size) return 0;
422
+
423
+ /* finding the matching closing sequence */
424
+ bt = 0;
425
+ while (i < size && bt < span_nb) {
426
+ if (!tmp_i && data[i] == c) tmp_i = i;
427
+ if (data[i] == '`') bt++;
428
+ else bt = 0;
429
+ i++;
430
+ }
431
+
432
+ if (i >= size) return tmp_i;
433
+ }
434
+ /* skipping a link */
435
+ else if (data[i] == '[') {
436
+ size_t tmp_i = 0;
437
+ uint8_t cc;
438
+
439
+ i++;
440
+ while (i < size && data[i] != ']') {
441
+ if (!tmp_i && data[i] == c) tmp_i = i;
442
+ i++;
443
+ }
444
+
445
+ i++;
446
+ while (i < size && (data[i] == ' ' || data[i] == '\n'))
447
+ i++;
448
+
449
+ if (i >= size)
450
+ return tmp_i;
451
+
452
+ switch (data[i]) {
453
+ case '[':
454
+ cc = ']'; break;
455
+
456
+ case '(':
457
+ cc = ')'; break;
458
+
459
+ default:
460
+ if (tmp_i)
461
+ return tmp_i;
462
+ else
463
+ continue;
464
+ }
465
+
466
+ i++;
467
+ while (i < size && data[i] != cc) {
468
+ if (!tmp_i && data[i] == c) tmp_i = i;
469
+ i++;
470
+ }
471
+
472
+ if (i >= size)
473
+ return tmp_i;
474
+
475
+ i++;
476
+ }
477
+ }
478
+
479
+ return 0;
480
+ }
481
+
482
+ /* parse_emph1 • parsing single emphase */
483
+ /* closed by a symbol not preceded by whitespace and not followed by symbol */
484
+ static size_t
485
+ parse_emph1(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, uint8_t c)
486
+ {
487
+ size_t i = 0, len;
488
+ struct buf *work = 0;
489
+ int r;
490
+
491
+ if (!rndr->cb.emphasis) return 0;
492
+
493
+ /* skipping one symbol if coming from emph3 */
494
+ if (size > 1 && data[0] == c && data[1] == c) i = 1;
495
+
496
+ while (i < size) {
497
+ len = find_emph_char(data + i, size - i, c);
498
+ if (!len) return 0;
499
+ i += len;
500
+ if (i >= size) return 0;
501
+
502
+ if (data[i] == c && !_isspace(data[i - 1])) {
503
+
504
+ if (rndr->ext_flags & MKDEXT_NO_INTRA_EMPHASIS) {
505
+ if (i + 1 < size && isalnum(data[i + 1]))
506
+ continue;
507
+ }
508
+
509
+ work = rndr_newbuf(rndr, BUFFER_SPAN);
510
+ parse_inline(work, rndr, data, i);
511
+ r = rndr->cb.emphasis(ob, work, rndr->opaque);
512
+ rndr_popbuf(rndr, BUFFER_SPAN);
513
+ return r ? i + 1 : 0;
514
+ }
515
+ }
516
+
517
+ return 0;
518
+ }
519
+
520
+ /* parse_emph2 • parsing single emphase */
521
+ static size_t
522
+ parse_emph2(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, uint8_t c)
523
+ {
524
+ int (*render_method)(struct buf *ob, const struct buf *text, void *opaque);
525
+ size_t i = 0, len;
526
+ struct buf *work = 0;
527
+ int r;
528
+
529
+ render_method = (c == '~') ? rndr->cb.strikethrough : rndr->cb.double_emphasis;
530
+
531
+ if (!render_method)
532
+ return 0;
533
+
534
+ while (i < size) {
535
+ len = find_emph_char(data + i, size - i, c);
536
+ if (!len) return 0;
537
+ i += len;
538
+
539
+ if (i + 1 < size && data[i] == c && data[i + 1] == c && i && !_isspace(data[i - 1])) {
540
+ work = rndr_newbuf(rndr, BUFFER_SPAN);
541
+ parse_inline(work, rndr, data, i);
542
+ r = render_method(ob, work, rndr->opaque);
543
+ rndr_popbuf(rndr, BUFFER_SPAN);
544
+ return r ? i + 2 : 0;
545
+ }
546
+ i++;
547
+ }
548
+ return 0;
549
+ }
550
+
551
+ /* parse_emph3 • parsing single emphase */
552
+ /* finds the first closing tag, and delegates to the other emph */
553
+ static size_t
554
+ parse_emph3(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, uint8_t c)
555
+ {
556
+ size_t i = 0, len;
557
+ int r;
558
+
559
+ while (i < size) {
560
+ len = find_emph_char(data + i, size - i, c);
561
+ if (!len) return 0;
562
+ i += len;
563
+
564
+ /* skip whitespace preceded symbols */
565
+ if (data[i] != c || _isspace(data[i - 1]))
566
+ continue;
567
+
568
+ if (i + 2 < size && data[i + 1] == c && data[i + 2] == c && rndr->cb.triple_emphasis) {
569
+ /* triple symbol found */
570
+ struct buf *work = rndr_newbuf(rndr, BUFFER_SPAN);
571
+
572
+ parse_inline(work, rndr, data, i);
573
+ r = rndr->cb.triple_emphasis(ob, work, rndr->opaque);
574
+ rndr_popbuf(rndr, BUFFER_SPAN);
575
+ return r ? i + 3 : 0;
576
+
577
+ } else if (i + 1 < size && data[i + 1] == c) {
578
+ /* double symbol found, handing over to emph1 */
579
+ len = parse_emph1(ob, rndr, data - 2, size + 2, c);
580
+ if (!len) return 0;
581
+ else return len - 2;
582
+
583
+ } else {
584
+ /* single symbol found, handing over to emph2 */
585
+ len = parse_emph2(ob, rndr, data - 1, size + 1, c);
586
+ if (!len) return 0;
587
+ else return len - 1;
588
+ }
589
+ }
590
+ return 0;
591
+ }
592
+
593
+ /* char_emphasis • single and double emphasis parsing */
594
+ static size_t
595
+ char_emphasis(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
596
+ {
597
+ uint8_t c = data[0];
598
+ size_t ret;
599
+
600
+ if (rndr->ext_flags & MKDEXT_NO_INTRA_EMPHASIS) {
601
+ if (offset > 0 && !_isspace(data[-1]) && data[-1] != '>')
602
+ return 0;
603
+ }
604
+
605
+ if (size > 2 && data[1] != c) {
606
+ /* whitespace cannot follow an opening emphasis;
607
+ * strikethrough only takes two characters '~~' */
608
+ if (c == '~' || _isspace(data[1]) || (ret = parse_emph1(ob, rndr, data + 1, size - 1, c)) == 0)
609
+ return 0;
610
+
611
+ return ret + 1;
612
+ }
613
+
614
+ if (size > 3 && data[1] == c && data[2] != c) {
615
+ if (_isspace(data[2]) || (ret = parse_emph2(ob, rndr, data + 2, size - 2, c)) == 0)
616
+ return 0;
617
+
618
+ return ret + 2;
619
+ }
620
+
621
+ if (size > 4 && data[1] == c && data[2] == c && data[3] != c) {
622
+ if (c == '~' || _isspace(data[3]) || (ret = parse_emph3(ob, rndr, data + 3, size - 3, c)) == 0)
623
+ return 0;
624
+
625
+ return ret + 3;
626
+ }
627
+
628
+ return 0;
629
+ }
630
+
631
+
632
+ /* char_linebreak • '\n' preceded by two spaces (assuming linebreak != 0) */
633
+ static size_t
634
+ char_linebreak(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
635
+ {
636
+ if (offset < 2 || data[-1] != ' ' || data[-2] != ' ')
637
+ return 0;
638
+
639
+ /* removing the last space from ob and rendering */
640
+ while (ob->size && ob->data[ob->size - 1] == ' ')
641
+ ob->size--;
642
+
643
+ return rndr->cb.linebreak(ob, rndr->opaque) ? 1 : 0;
644
+ }
645
+
646
+
647
+ /* char_codespan • '`' parsing a code span (assuming codespan != 0) */
648
+ static size_t
649
+ char_codespan(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
650
+ {
651
+ size_t end, nb = 0, i, f_begin, f_end;
652
+
653
+ /* counting the number of backticks in the delimiter */
654
+ while (nb < size && data[nb] == '`')
655
+ nb++;
656
+
657
+ /* finding the next delimiter */
658
+ i = 0;
659
+ for (end = nb; end < size && i < nb; end++) {
660
+ if (data[end] == '`') i++;
661
+ else i = 0;
662
+ }
663
+
664
+ if (i < nb && end >= size)
665
+ return 0; /* no matching delimiter */
666
+
667
+ /* trimming outside whitespaces */
668
+ f_begin = nb;
669
+ while (f_begin < end && data[f_begin] == ' ')
670
+ f_begin++;
671
+
672
+ f_end = end - nb;
673
+ while (f_end > nb && data[f_end-1] == ' ')
674
+ f_end--;
675
+
676
+ /* real code span */
677
+ if (f_begin < f_end) {
678
+ struct buf work = { data + f_begin, f_end - f_begin, 0, 0 };
679
+ if (!rndr->cb.codespan(ob, &work, rndr->opaque))
680
+ end = 0;
681
+ } else {
682
+ if (!rndr->cb.codespan(ob, 0, rndr->opaque))
683
+ end = 0;
684
+ }
685
+
686
+ return end;
687
+ }
688
+
689
+
690
+ /* char_escape • '\\' backslash escape */
691
+ static size_t
692
+ char_escape(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
693
+ {
694
+ static const char *escape_chars = "\\`*_{}[]()#+-.!:|&<>^~";
695
+ struct buf work = { 0, 0, 0, 0 };
696
+
697
+ if (size > 1) {
698
+ if (strchr(escape_chars, data[1]) == NULL)
699
+ return 0;
700
+
701
+ if (rndr->cb.normal_text) {
702
+ work.data = data + 1;
703
+ work.size = 1;
704
+ rndr->cb.normal_text(ob, &work, rndr->opaque);
705
+ }
706
+ else bufputc(ob, data[1]);
707
+ } else if (size == 1) {
708
+ bufputc(ob, data[0]);
709
+ }
710
+
711
+ return 2;
712
+ }
713
+
714
+ /* char_entity • '&' escaped when it doesn't belong to an entity */
715
+ /* valid entities are assumed to be anything matching &#?[A-Za-z0-9]+; */
716
+ static size_t
717
+ char_entity(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
718
+ {
719
+ size_t end = 1;
720
+ struct buf work = { 0, 0, 0, 0 };
721
+
722
+ if (end < size && data[end] == '#')
723
+ end++;
724
+
725
+ while (end < size && isalnum(data[end]))
726
+ end++;
727
+
728
+ if (end < size && data[end] == ';')
729
+ end++; /* real entity */
730
+ else
731
+ return 0; /* lone '&' */
732
+
733
+ if (rndr->cb.entity) {
734
+ work.data = data;
735
+ work.size = end;
736
+ rndr->cb.entity(ob, &work, rndr->opaque);
737
+ }
738
+ else bufput(ob, data, end);
739
+
740
+ return end;
741
+ }
742
+
743
+ /* char_langle_tag • '<' when tags or autolinks are allowed */
744
+ static size_t
745
+ char_langle_tag(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
746
+ {
747
+ enum mkd_autolink altype = MKDA_NOT_AUTOLINK;
748
+ size_t end = tag_length(data, size, &altype);
749
+ struct buf work = { data, end, 0, 0 };
750
+ int ret = 0;
751
+
752
+ if (end > 2) {
753
+ if (rndr->cb.autolink && altype != MKDA_NOT_AUTOLINK) {
754
+ struct buf *u_link = rndr_newbuf(rndr, BUFFER_SPAN);
755
+ work.data = data + 1;
756
+ work.size = end - 2;
757
+ unscape_text(u_link, &work);
758
+ ret = rndr->cb.autolink(ob, u_link, altype, rndr->opaque);
759
+ rndr_popbuf(rndr, BUFFER_SPAN);
760
+ }
761
+ else if (rndr->cb.raw_html_tag)
762
+ ret = rndr->cb.raw_html_tag(ob, &work, rndr->opaque);
763
+ }
764
+
765
+ if (!ret) return 0;
766
+ else return end;
767
+ }
768
+
769
+ static size_t
770
+ char_autolink_www(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
771
+ {
772
+ struct buf *link, *link_url, *link_text;
773
+ size_t link_len, rewind;
774
+
775
+ if (!rndr->cb.link || rndr->in_link_body)
776
+ return 0;
777
+
778
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
779
+
780
+ if ((link_len = sd_autolink__www(&rewind, link, data, offset, size, 0)) > 0) {
781
+ link_url = rndr_newbuf(rndr, BUFFER_SPAN);
782
+ BUFPUTSL(link_url, "http://");
783
+ bufput(link_url, link->data, link->size);
784
+
785
+ ob->size -= rewind;
786
+ if (rndr->cb.normal_text) {
787
+ link_text = rndr_newbuf(rndr, BUFFER_SPAN);
788
+ rndr->cb.normal_text(link_text, link, rndr->opaque);
789
+ rndr->cb.link(ob, link_url, NULL, link_text, rndr->opaque);
790
+ rndr_popbuf(rndr, BUFFER_SPAN);
791
+ } else {
792
+ rndr->cb.link(ob, link_url, NULL, link, rndr->opaque);
793
+ }
794
+ rndr_popbuf(rndr, BUFFER_SPAN);
795
+ }
796
+
797
+ rndr_popbuf(rndr, BUFFER_SPAN);
798
+ return link_len;
799
+ }
800
+
801
+ static size_t
802
+ char_autolink_email(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
803
+ {
804
+ struct buf *link;
805
+ size_t link_len, rewind;
806
+
807
+ if (!rndr->cb.autolink || rndr->in_link_body)
808
+ return 0;
809
+
810
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
811
+
812
+ if ((link_len = sd_autolink__email(&rewind, link, data, offset, size, 0)) > 0) {
813
+ ob->size -= rewind;
814
+ rndr->cb.autolink(ob, link, MKDA_EMAIL, rndr->opaque);
815
+ }
816
+
817
+ rndr_popbuf(rndr, BUFFER_SPAN);
818
+ return link_len;
819
+ }
820
+
821
+ static size_t
822
+ char_autolink_url(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
823
+ {
824
+ struct buf *link;
825
+ size_t link_len, rewind;
826
+
827
+ if (!rndr->cb.autolink || rndr->in_link_body)
828
+ return 0;
829
+
830
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
831
+
832
+ if ((link_len = sd_autolink__url(&rewind, link, data, offset, size, 0)) > 0) {
833
+ ob->size -= rewind;
834
+ rndr->cb.autolink(ob, link, MKDA_NORMAL, rndr->opaque);
835
+ }
836
+
837
+ rndr_popbuf(rndr, BUFFER_SPAN);
838
+ return link_len;
839
+ }
840
+
841
+ /* char_link • '[': parsing a link or an image */
842
+ static size_t
843
+ char_link(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
844
+ {
845
+ int is_img = (offset && data[-1] == '!'), level;
846
+ size_t i = 1, txt_e, link_b = 0, link_e = 0, title_b = 0, title_e = 0;
847
+ struct buf *content = 0;
848
+ struct buf *link = 0;
849
+ struct buf *title = 0;
850
+ struct buf *u_link = 0;
851
+ size_t org_work_size = rndr->work_bufs[BUFFER_SPAN].size;
852
+ int text_has_nl = 0, ret = 0;
853
+ int in_title = 0, qtype = 0;
854
+
855
+ /* checking whether the correct renderer exists */
856
+ if ((is_img && !rndr->cb.image) || (!is_img && !rndr->cb.link))
857
+ goto cleanup;
858
+
859
+ /* looking for the matching closing bracket */
860
+ for (level = 1; i < size; i++) {
861
+ if (data[i] == '\n')
862
+ text_has_nl = 1;
863
+
864
+ else if (data[i - 1] == '\\')
865
+ continue;
866
+
867
+ else if (data[i] == '[')
868
+ level++;
869
+
870
+ else if (data[i] == ']') {
871
+ level--;
872
+ if (level <= 0)
873
+ break;
874
+ }
875
+ }
876
+
877
+ if (i >= size)
878
+ goto cleanup;
879
+
880
+ txt_e = i;
881
+ i++;
882
+
883
+ /* skip any amount of whitespace or newline */
884
+ /* (this is much more laxist than original markdown syntax) */
885
+ while (i < size && _isspace(data[i]))
886
+ i++;
887
+
888
+ /* inline style link */
889
+ if (i < size && data[i] == '(') {
890
+ /* skipping initial whitespace */
891
+ i++;
892
+
893
+ while (i < size && _isspace(data[i]))
894
+ i++;
895
+
896
+ link_b = i;
897
+
898
+ /* looking for link end: ' " ) */
899
+ while (i < size) {
900
+ if (data[i] == '\\') i += 2;
901
+ else if (data[i] == ')') break;
902
+ else if (i >= 1 && _isspace(data[i-1]) && (data[i] == '\'' || data[i] == '"')) break;
903
+ else i++;
904
+ }
905
+
906
+ if (i >= size) goto cleanup;
907
+ link_e = i;
908
+
909
+ /* looking for title end if present */
910
+ if (data[i] == '\'' || data[i] == '"') {
911
+ qtype = data[i];
912
+ in_title = 1;
913
+ i++;
914
+ title_b = i;
915
+
916
+ while (i < size) {
917
+ if (data[i] == '\\') i += 2;
918
+ else if (data[i] == qtype) {in_title = 0; i++;}
919
+ else if ((data[i] == ')') && !in_title) break;
920
+ else i++;
921
+ }
922
+
923
+ if (i >= size) goto cleanup;
924
+
925
+ /* skipping whitespaces after title */
926
+ title_e = i - 1;
927
+ while (title_e > title_b && _isspace(data[title_e]))
928
+ title_e--;
929
+
930
+ /* checking for closing quote presence */
931
+ if (data[title_e] != '\'' && data[title_e] != '"') {
932
+ title_b = title_e = 0;
933
+ link_e = i;
934
+ }
935
+ }
936
+
937
+ /* remove whitespace at the end of the link */
938
+ while (link_e > link_b && _isspace(data[link_e - 1]))
939
+ link_e--;
940
+
941
+ /* remove optional angle brackets around the link */
942
+ if (data[link_b] == '<') link_b++;
943
+ if (data[link_e - 1] == '>') link_e--;
944
+
945
+ /* building escaped link and title */
946
+ if (link_e > link_b) {
947
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
948
+ bufput(link, data + link_b, link_e - link_b);
949
+ }
950
+
951
+ if (title_e > title_b) {
952
+ title = rndr_newbuf(rndr, BUFFER_SPAN);
953
+ bufput(title, data + title_b, title_e - title_b);
954
+ }
955
+
956
+ i++;
957
+ }
958
+
959
+ /* reference style link */
960
+ else if (i < size && data[i] == '[') {
961
+ struct buf id = { 0, 0, 0, 0 };
962
+ struct link_ref *lr;
963
+
964
+ /* looking for the id */
965
+ i++;
966
+ link_b = i;
967
+ while (i < size && data[i] != ']') i++;
968
+ if (i >= size) goto cleanup;
969
+ link_e = i;
970
+
971
+ /* finding the link_ref */
972
+ if (link_b == link_e) {
973
+ if (text_has_nl) {
974
+ struct buf *b = rndr_newbuf(rndr, BUFFER_SPAN);
975
+ size_t j;
976
+
977
+ for (j = 1; j < txt_e; j++) {
978
+ if (data[j] != '\n')
979
+ bufputc(b, data[j]);
980
+ else if (data[j - 1] != ' ')
981
+ bufputc(b, ' ');
982
+ }
983
+
984
+ id.data = b->data;
985
+ id.size = b->size;
986
+ } else {
987
+ id.data = data + 1;
988
+ id.size = txt_e - 1;
989
+ }
990
+ } else {
991
+ id.data = data + link_b;
992
+ id.size = link_e - link_b;
993
+ }
994
+
995
+ lr = find_link_ref(rndr->refs, id.data, id.size);
996
+ if (!lr)
997
+ goto cleanup;
998
+
999
+ /* keeping link and title from link_ref */
1000
+ link = lr->link;
1001
+ title = lr->title;
1002
+ i++;
1003
+ }
1004
+
1005
+ /* shortcut reference style link */
1006
+ else {
1007
+ struct buf id = { 0, 0, 0, 0 };
1008
+ struct link_ref *lr;
1009
+
1010
+ /* crafting the id */
1011
+ if (text_has_nl) {
1012
+ struct buf *b = rndr_newbuf(rndr, BUFFER_SPAN);
1013
+ size_t j;
1014
+
1015
+ for (j = 1; j < txt_e; j++) {
1016
+ if (data[j] != '\n')
1017
+ bufputc(b, data[j]);
1018
+ else if (data[j - 1] != ' ')
1019
+ bufputc(b, ' ');
1020
+ }
1021
+
1022
+ id.data = b->data;
1023
+ id.size = b->size;
1024
+ } else {
1025
+ id.data = data + 1;
1026
+ id.size = txt_e - 1;
1027
+ }
1028
+
1029
+ /* finding the link_ref */
1030
+ lr = find_link_ref(rndr->refs, id.data, id.size);
1031
+ if (!lr)
1032
+ goto cleanup;
1033
+
1034
+ /* keeping link and title from link_ref */
1035
+ link = lr->link;
1036
+ title = lr->title;
1037
+
1038
+ /* rewinding the whitespace */
1039
+ i = txt_e + 1;
1040
+ }
1041
+
1042
+ /* building content: img alt is escaped, link content is parsed */
1043
+ if (txt_e > 1) {
1044
+ content = rndr_newbuf(rndr, BUFFER_SPAN);
1045
+ if (is_img) {
1046
+ bufput(content, data + 1, txt_e - 1);
1047
+ } else {
1048
+ /* disable autolinking when parsing inline the
1049
+ * content of a link */
1050
+ rndr->in_link_body = 1;
1051
+ parse_inline(content, rndr, data + 1, txt_e - 1);
1052
+ rndr->in_link_body = 0;
1053
+ }
1054
+ }
1055
+
1056
+ if (link) {
1057
+ u_link = rndr_newbuf(rndr, BUFFER_SPAN);
1058
+ unscape_text(u_link, link);
1059
+ }
1060
+
1061
+ /* calling the relevant rendering function */
1062
+ if (is_img) {
1063
+ if (ob->size && ob->data[ob->size - 1] == '!')
1064
+ ob->size -= 1;
1065
+
1066
+ ret = rndr->cb.image(ob, u_link, title, content, rndr->opaque);
1067
+ } else {
1068
+ ret = rndr->cb.link(ob, u_link, title, content, rndr->opaque);
1069
+ }
1070
+
1071
+ /* cleanup */
1072
+ cleanup:
1073
+ rndr->work_bufs[BUFFER_SPAN].size = (int)org_work_size;
1074
+ return ret ? i : 0;
1075
+ }
1076
+
1077
+ static size_t
1078
+ char_superscript(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
1079
+ {
1080
+ size_t sup_start, sup_len;
1081
+ struct buf *sup;
1082
+
1083
+ if (!rndr->cb.superscript)
1084
+ return 0;
1085
+
1086
+ if (size < 2)
1087
+ return 0;
1088
+
1089
+ if (data[1] == '(') {
1090
+ sup_start = sup_len = 2;
1091
+
1092
+ while (sup_len < size && data[sup_len] != ')' && data[sup_len - 1] != '\\')
1093
+ sup_len++;
1094
+
1095
+ if (sup_len == size)
1096
+ return 0;
1097
+ } else {
1098
+ sup_start = sup_len = 1;
1099
+
1100
+ while (sup_len < size && !_isspace(data[sup_len]))
1101
+ sup_len++;
1102
+ }
1103
+
1104
+ if (sup_len - sup_start == 0)
1105
+ return (sup_start == 2) ? 3 : 0;
1106
+
1107
+ sup = rndr_newbuf(rndr, BUFFER_SPAN);
1108
+ parse_inline(sup, rndr, data + sup_start, sup_len - sup_start);
1109
+ rndr->cb.superscript(ob, sup, rndr->opaque);
1110
+ rndr_popbuf(rndr, BUFFER_SPAN);
1111
+
1112
+ return (sup_start == 2) ? sup_len + 1 : sup_len;
1113
+ }
1114
+
1115
+ /*********************************
1116
+ * BLOCK-LEVEL PARSING FUNCTIONS *
1117
+ *********************************/
1118
+
1119
+ /* is_empty • returns the line length when it is empty, 0 otherwise */
1120
+ static size_t
1121
+ is_empty(uint8_t *data, size_t size)
1122
+ {
1123
+ size_t i;
1124
+
1125
+ for (i = 0; i < size && data[i] != '\n'; i++)
1126
+ if (data[i] != ' ')
1127
+ return 0;
1128
+
1129
+ return i + 1;
1130
+ }
1131
+
1132
+ /* is_hrule • returns whether a line is a horizontal rule */
1133
+ static int
1134
+ is_hrule(uint8_t *data, size_t size)
1135
+ {
1136
+ size_t i = 0, n = 0;
1137
+ uint8_t c;
1138
+
1139
+ /* skipping initial spaces */
1140
+ if (size < 3) return 0;
1141
+ if (data[0] == ' ') { i++;
1142
+ if (data[1] == ' ') { i++;
1143
+ if (data[2] == ' ') { i++; } } }
1144
+
1145
+ /* looking at the hrule uint8_t */
1146
+ if (i + 2 >= size
1147
+ || (data[i] != '*' && data[i] != '-' && data[i] != '_'))
1148
+ return 0;
1149
+ c = data[i];
1150
+
1151
+ /* the whole line must be the char or whitespace */
1152
+ while (i < size && data[i] != '\n') {
1153
+ if (data[i] == c) n++;
1154
+ else if (data[i] != ' ')
1155
+ return 0;
1156
+
1157
+ i++;
1158
+ }
1159
+
1160
+ return n >= 3;
1161
+ }
1162
+
1163
+ /* check if a line begins with a code fence; return the
1164
+ * width of the code fence */
1165
+ static size_t
1166
+ prefix_codefence(uint8_t *data, size_t size)
1167
+ {
1168
+ size_t i = 0, n = 0;
1169
+ uint8_t c;
1170
+
1171
+ /* skipping initial spaces */
1172
+ if (size < 3) return 0;
1173
+ if (data[0] == ' ') { i++;
1174
+ if (data[1] == ' ') { i++;
1175
+ if (data[2] == ' ') { i++; } } }
1176
+
1177
+ /* looking at the hrule uint8_t */
1178
+ if (i + 2 >= size || !(data[i] == '~' || data[i] == '`'))
1179
+ return 0;
1180
+
1181
+ c = data[i];
1182
+
1183
+ /* the whole line must be the uint8_t or whitespace */
1184
+ while (i < size && data[i] == c) {
1185
+ n++; i++;
1186
+ }
1187
+
1188
+ if (n < 3)
1189
+ return 0;
1190
+
1191
+ return i;
1192
+ }
1193
+
1194
+ /* check if a line is a code fence; return its size if it is */
1195
+ static size_t
1196
+ is_codefence(uint8_t *data, size_t size, struct buf *syntax)
1197
+ {
1198
+ size_t i = 0, syn_len = 0;
1199
+ uint8_t *syn_start;
1200
+
1201
+ i = prefix_codefence(data, size);
1202
+ if (i == 0)
1203
+ return 0;
1204
+
1205
+ while (i < size && data[i] == ' ')
1206
+ i++;
1207
+
1208
+ syn_start = data + i;
1209
+
1210
+ if (i < size && data[i] == '{') {
1211
+ i++; syn_start++;
1212
+
1213
+ while (i < size && data[i] != '}' && data[i] != '\n') {
1214
+ syn_len++; i++;
1215
+ }
1216
+
1217
+ if (i == size || data[i] != '}')
1218
+ return 0;
1219
+
1220
+ /* strip all whitespace at the beginning and the end
1221
+ * of the {} block */
1222
+ while (syn_len > 0 && _isspace(syn_start[0])) {
1223
+ syn_start++; syn_len--;
1224
+ }
1225
+
1226
+ while (syn_len > 0 && _isspace(syn_start[syn_len - 1]))
1227
+ syn_len--;
1228
+
1229
+ i++;
1230
+ } else {
1231
+ while (i < size && !_isspace(data[i])) {
1232
+ syn_len++; i++;
1233
+ }
1234
+ }
1235
+
1236
+ if (syntax) {
1237
+ syntax->data = syn_start;
1238
+ syntax->size = syn_len;
1239
+ }
1240
+
1241
+ while (i < size && data[i] != '\n') {
1242
+ if (!_isspace(data[i]))
1243
+ return 0;
1244
+
1245
+ i++;
1246
+ }
1247
+
1248
+ return i + 1;
1249
+ }
1250
+
1251
+ /* is_atxheader • returns whether the line is a hash-prefixed header */
1252
+ static int
1253
+ is_atxheader(struct sd_markdown *rndr, uint8_t *data, size_t size)
1254
+ {
1255
+ if (data[0] != '#')
1256
+ return 0;
1257
+
1258
+ if (rndr->ext_flags & MKDEXT_SPACE_HEADERS) {
1259
+ size_t level = 0;
1260
+
1261
+ while (level < size && level < 6 && data[level] == '#')
1262
+ level++;
1263
+
1264
+ if (level < size && data[level] != ' ')
1265
+ return 0;
1266
+ }
1267
+
1268
+ return 1;
1269
+ }
1270
+
1271
+ /* is_headerline • returns whether the line is a setext-style hdr underline */
1272
+ static int
1273
+ is_headerline(uint8_t *data, size_t size)
1274
+ {
1275
+ size_t i = 0;
1276
+
1277
+ /* test of level 1 header */
1278
+ if (data[i] == '=') {
1279
+ for (i = 1; i < size && data[i] == '='; i++);
1280
+ while (i < size && data[i] == ' ') i++;
1281
+ return (i >= size || data[i] == '\n') ? 1 : 0; }
1282
+
1283
+ /* test of level 2 header */
1284
+ if (data[i] == '-') {
1285
+ for (i = 1; i < size && data[i] == '-'; i++);
1286
+ while (i < size && data[i] == ' ') i++;
1287
+ return (i >= size || data[i] == '\n') ? 2 : 0; }
1288
+
1289
+ return 0;
1290
+ }
1291
+
1292
+ static int
1293
+ is_next_headerline(uint8_t *data, size_t size)
1294
+ {
1295
+ size_t i = 0;
1296
+
1297
+ while (i < size && data[i] != '\n')
1298
+ i++;
1299
+
1300
+ if (++i >= size)
1301
+ return 0;
1302
+
1303
+ return is_headerline(data + i, size - i);
1304
+ }
1305
+
1306
+ /* prefix_quote • returns blockquote prefix length */
1307
+ static size_t
1308
+ prefix_quote(uint8_t *data, size_t size)
1309
+ {
1310
+ size_t i = 0;
1311
+ if (i < size && data[i] == ' ') i++;
1312
+ if (i < size && data[i] == ' ') i++;
1313
+ if (i < size && data[i] == ' ') i++;
1314
+
1315
+ if (i < size && data[i] == '>') {
1316
+ if (i + 1 < size && data[i + 1] == ' ')
1317
+ return i + 2;
1318
+
1319
+ return i + 1;
1320
+ }
1321
+
1322
+ return 0;
1323
+ }
1324
+
1325
+ /* prefix_code • returns prefix length for block code*/
1326
+ static size_t
1327
+ prefix_code(uint8_t *data, size_t size)
1328
+ {
1329
+ if (size > 3 && data[0] == ' ' && data[1] == ' '
1330
+ && data[2] == ' ' && data[3] == ' ') return 4;
1331
+
1332
+ return 0;
1333
+ }
1334
+
1335
+ /* prefix_oli • returns ordered list item prefix */
1336
+ static size_t
1337
+ prefix_oli(uint8_t *data, size_t size)
1338
+ {
1339
+ size_t i = 0;
1340
+
1341
+ if (i < size && data[i] == ' ') i++;
1342
+ if (i < size && data[i] == ' ') i++;
1343
+ if (i < size && data[i] == ' ') i++;
1344
+
1345
+ if (i >= size || data[i] < '0' || data[i] > '9')
1346
+ return 0;
1347
+
1348
+ while (i < size && data[i] >= '0' && data[i] <= '9')
1349
+ i++;
1350
+
1351
+ if (i + 1 >= size || data[i] != '.' || data[i + 1] != ' ')
1352
+ return 0;
1353
+
1354
+ if (is_next_headerline(data + i, size - i))
1355
+ return 0;
1356
+
1357
+ return i + 2;
1358
+ }
1359
+
1360
+ /* prefix_uli • returns ordered list item prefix */
1361
+ static size_t
1362
+ prefix_uli(uint8_t *data, size_t size)
1363
+ {
1364
+ size_t i = 0;
1365
+
1366
+ if (i < size && data[i] == ' ') i++;
1367
+ if (i < size && data[i] == ' ') i++;
1368
+ if (i < size && data[i] == ' ') i++;
1369
+
1370
+ if (i + 1 >= size ||
1371
+ (data[i] != '*' && data[i] != '+' && data[i] != '-') ||
1372
+ data[i + 1] != ' ')
1373
+ return 0;
1374
+
1375
+ if (is_next_headerline(data + i, size - i))
1376
+ return 0;
1377
+
1378
+ return i + 2;
1379
+ }
1380
+
1381
+
1382
+ /* parse_block • parsing of one block, returning next uint8_t to parse */
1383
+ static void parse_block(struct buf *ob, struct sd_markdown *rndr,
1384
+ uint8_t *data, size_t size, const src_map *map);
1385
+
1386
+
1387
+ /* parse_blockquote • handles parsing of a blockquote fragment */
1388
+ static size_t
1389
+ parse_blockquote(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, const src_map *map)
1390
+ {
1391
+ size_t beg, end = 0, pre, work_size = 0;
1392
+ uint8_t *work_data = 0;
1393
+ struct buf *out = 0;
1394
+
1395
+ /* source map */
1396
+ src_map *block_map = NULL;
1397
+
1398
+ /* AST construction */
1399
+ if (rndr->cb.blockquote_begin)
1400
+ rndr->cb.blockquote_begin(rndr->opaque);
1401
+
1402
+ out = rndr_newbuf(rndr, BUFFER_BLOCK);
1403
+
1404
+ beg = 0;
1405
+ while (beg < size) {
1406
+ for (end = beg + 1; end < size && data[end - 1] != '\n'; end++);
1407
+
1408
+ pre = prefix_quote(data + beg, end - beg);
1409
+
1410
+ if (pre)
1411
+ beg += pre; /* skipping prefix */
1412
+
1413
+ /* empty line followed by non-quote line */
1414
+ else if (is_empty(data + beg, end - beg) &&
1415
+ (end >= size || (prefix_quote(data + end, size - end) == 0 &&
1416
+ !is_empty(data + end, size - end))))
1417
+ break;
1418
+
1419
+ if (beg < end) { /* copy into the in-place working buffer */
1420
+ /* bufput(work, data + beg, end - beg); */
1421
+ if (!work_data)
1422
+ work_data = data + beg;
1423
+ else if (data + beg != work_data + work_size)
1424
+ memmove(work_data + work_size, data + beg, end - beg);
1425
+
1426
+ /* source map */
1427
+ if (map) {
1428
+ size_t cur = src_map_location(map, beg);
1429
+ range actual_range = { cur, end - beg };
1430
+ if (!block_map) {
1431
+ block_map = src_map_new_submap(map, &actual_range);
1432
+ }
1433
+ else {
1434
+ src_map_append(block_map, &actual_range);
1435
+ }
1436
+ }
1437
+
1438
+ work_size += end - beg;
1439
+ }
1440
+ beg = end;
1441
+ }
1442
+
1443
+ parse_block(out, rndr, work_data, work_size, block_map);
1444
+
1445
+ /* source map */
1446
+ if (block_map)
1447
+ src_map_release(block_map);
1448
+
1449
+ if (rndr->cb.blockquote)
1450
+ rndr->cb.blockquote(ob, out, rndr->opaque);
1451
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1452
+ return end;
1453
+ }
1454
+
1455
+ static size_t
1456
+ parse_htmlblock(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int do_render);
1457
+
1458
+ /* parse_blockquote • handles parsing of a regular paragraph */
1459
+ static size_t
1460
+ parse_paragraph(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1461
+ {
1462
+ size_t i = 0, end = 0;
1463
+ int level = 0;
1464
+ struct buf work = { data, 0, 0, 0 };
1465
+
1466
+ while (i < size) {
1467
+ for (end = i + 1; end < size && data[end - 1] != '\n'; end++) /* empty */;
1468
+
1469
+ if (is_empty(data + i, size - i))
1470
+ break;
1471
+
1472
+ if ((level = is_headerline(data + i, size - i)) != 0)
1473
+ break;
1474
+
1475
+ if (is_atxheader(rndr, data + i, size - i) ||
1476
+ is_hrule(data + i, size - i) ||
1477
+ prefix_quote(data + i, size - i)) {
1478
+ end = i;
1479
+ break;
1480
+ }
1481
+
1482
+ /*
1483
+ * Early termination of a paragraph with the same logic
1484
+ * as Markdown 1.0.0. If this logic is applied, the
1485
+ * Markdown 1.0.3 test suite won't pass cleanly
1486
+ *
1487
+ * :: If the first character in a new line is not a letter,
1488
+ * let's check to see if there's some kind of block starting
1489
+ * here
1490
+ */
1491
+ if ((rndr->ext_flags & MKDEXT_LAX_SPACING) && !isalnum(data[i])) {
1492
+ if (prefix_oli(data + i, size - i) ||
1493
+ prefix_uli(data + i, size - i)) {
1494
+ end = i;
1495
+ break;
1496
+ }
1497
+
1498
+ /* see if an html block starts here */
1499
+ if (data[i] == '<' && rndr->cb.blockhtml &&
1500
+ parse_htmlblock(ob, rndr, data + i, size - i, 0)) {
1501
+ end = i;
1502
+ break;
1503
+ }
1504
+
1505
+ /* see if a code fence starts here */
1506
+ if ((rndr->ext_flags & MKDEXT_FENCED_CODE) != 0 &&
1507
+ is_codefence(data + i, size - i, NULL) != 0) {
1508
+ end = i;
1509
+ break;
1510
+ }
1511
+ }
1512
+
1513
+ i = end;
1514
+ }
1515
+
1516
+ work.size = i;
1517
+ while (work.size && data[work.size - 1] == '\n')
1518
+ work.size--;
1519
+
1520
+ if (!level) {
1521
+ struct buf *tmp = rndr_newbuf(rndr, BUFFER_BLOCK);
1522
+ parse_inline(tmp, rndr, work.data, work.size);
1523
+ if (rndr->cb.paragraph)
1524
+ rndr->cb.paragraph(ob, tmp, rndr->opaque);
1525
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1526
+ } else {
1527
+ struct buf *header_work;
1528
+
1529
+ if (work.size) {
1530
+ size_t beg;
1531
+ i = work.size;
1532
+ work.size -= 1;
1533
+
1534
+ while (work.size && data[work.size] != '\n')
1535
+ work.size -= 1;
1536
+
1537
+ beg = work.size + 1;
1538
+ while (work.size && data[work.size - 1] == '\n')
1539
+ work.size -= 1;
1540
+
1541
+ if (work.size > 0) {
1542
+ struct buf *tmp = rndr_newbuf(rndr, BUFFER_BLOCK);
1543
+ parse_inline(tmp, rndr, work.data, work.size);
1544
+
1545
+ if (rndr->cb.paragraph)
1546
+ rndr->cb.paragraph(ob, tmp, rndr->opaque);
1547
+
1548
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1549
+ work.data += beg;
1550
+ work.size = i - beg;
1551
+ }
1552
+ else work.size = i;
1553
+ }
1554
+
1555
+ header_work = rndr_newbuf(rndr, BUFFER_SPAN);
1556
+ parse_inline(header_work, rndr, work.data, work.size);
1557
+
1558
+ if (rndr->cb.header)
1559
+ rndr->cb.header(ob, header_work, (int)level, rndr->opaque);
1560
+
1561
+ rndr_popbuf(rndr, BUFFER_SPAN);
1562
+ }
1563
+
1564
+ return end;
1565
+ }
1566
+
1567
+ /* parse_fencedcode • handles parsing of a block-level code fragment */
1568
+ static size_t
1569
+ parse_fencedcode(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1570
+ {
1571
+ size_t beg, end;
1572
+ struct buf *work = 0;
1573
+ struct buf lang = { 0, 0, 0, 0 };
1574
+
1575
+ beg = is_codefence(data, size, &lang);
1576
+ if (beg == 0) return 0;
1577
+
1578
+ work = rndr_newbuf(rndr, BUFFER_BLOCK);
1579
+
1580
+ while (beg < size) {
1581
+ size_t fence_end;
1582
+ struct buf fence_trail = { 0, 0, 0, 0 };
1583
+
1584
+ fence_end = is_codefence(data + beg, size - beg, &fence_trail);
1585
+ if (fence_end != 0 && fence_trail.size == 0) {
1586
+ beg += fence_end;
1587
+ break;
1588
+ }
1589
+
1590
+ for (end = beg + 1; end < size && data[end - 1] != '\n'; end++);
1591
+
1592
+ if (beg < end) {
1593
+ /* verbatim copy to the working buffer,
1594
+ escaping entities */
1595
+ if (is_empty(data + beg, end - beg))
1596
+ bufputc(work, '\n');
1597
+ else bufput(work, data + beg, end - beg);
1598
+ }
1599
+ beg = end;
1600
+ }
1601
+
1602
+ if (work->size && work->data[work->size - 1] != '\n')
1603
+ bufputc(work, '\n');
1604
+
1605
+ if (rndr->cb.blockcode)
1606
+ rndr->cb.blockcode(ob, work, lang.size ? &lang : NULL, rndr->opaque);
1607
+
1608
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1609
+ return beg;
1610
+ }
1611
+
1612
+ static size_t
1613
+ parse_blockcode(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1614
+ {
1615
+ size_t beg, end, pre;
1616
+ struct buf *work = 0;
1617
+
1618
+ work = rndr_newbuf(rndr, BUFFER_BLOCK);
1619
+
1620
+ beg = 0;
1621
+ while (beg < size) {
1622
+ for (end = beg + 1; end < size && data[end - 1] != '\n'; end++) {};
1623
+ pre = prefix_code(data + beg, end - beg);
1624
+
1625
+ if (pre)
1626
+ beg += pre; /* skipping prefix */
1627
+ else if (!is_empty(data + beg, end - beg))
1628
+ /* non-empty non-prefixed line breaks the pre */
1629
+ break;
1630
+
1631
+ if (beg < end) {
1632
+ /* verbatim copy to the working buffer,
1633
+ escaping entities */
1634
+ if (is_empty(data + beg, end - beg))
1635
+ bufputc(work, '\n');
1636
+ else bufput(work, data + beg, end - beg);
1637
+ }
1638
+ beg = end;
1639
+ }
1640
+
1641
+ while (work->size && work->data[work->size - 1] == '\n')
1642
+ work->size -= 1;
1643
+
1644
+ bufputc(work, '\n');
1645
+
1646
+ if (rndr->cb.blockcode)
1647
+ rndr->cb.blockcode(ob, work, NULL, rndr->opaque);
1648
+
1649
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1650
+ return beg;
1651
+ }
1652
+
1653
+ /* parse_listitem • parsing of a single list item */
1654
+ /* assuming initial prefix is already removed */
1655
+ static size_t
1656
+ parse_listitem(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int *flags, const src_map *map)
1657
+ {
1658
+ struct buf *work = 0, *inter = 0;
1659
+ size_t beg = 0, end, pre, sublist = 0, orgpre = 0, i = 0;
1660
+ int in_empty = 0, has_inside_empty = 0, in_fence = 0;
1661
+ src_map *item_map = NULL;
1662
+
1663
+ /* keeping track of the first indentation prefix */
1664
+ while (orgpre < 3 && orgpre < size && data[orgpre] == ' ')
1665
+ orgpre++;
1666
+
1667
+ beg = prefix_uli(data, size);
1668
+ if (!beg)
1669
+ beg = prefix_oli(data, size);
1670
+
1671
+ if (!beg)
1672
+ return 0;
1673
+
1674
+ /* AST construction */
1675
+ if (rndr->cb.listitem_begin)
1676
+ rndr->cb.listitem_begin(*flags, rndr->opaque);
1677
+
1678
+ /* skipping to the beginning of the following line */
1679
+ end = beg;
1680
+ while (end < size && data[end - 1] != '\n')
1681
+ end++;
1682
+
1683
+ /* getting working buffers */
1684
+ work = rndr_newbuf(rndr, BUFFER_SPAN);
1685
+ inter = rndr_newbuf(rndr, BUFFER_SPAN);
1686
+
1687
+ /* source map */
1688
+ if (map) {
1689
+ size_t cur = src_map_location(map, beg);
1690
+ range item_range = { cur, end - beg };
1691
+ item_map = src_map_new_submap(map, &item_range);
1692
+ }
1693
+
1694
+ /* putting the first line into the working buffer */
1695
+ bufput(work, data + beg, end - beg);
1696
+ beg = end;
1697
+
1698
+ /* process the following lines */
1699
+ while (beg < size) {
1700
+ size_t has_next_uli = 0, has_next_oli = 0;
1701
+
1702
+ end++;
1703
+
1704
+ while (end < size && data[end - 1] != '\n')
1705
+ end++;
1706
+
1707
+ /* process an empty line */
1708
+ if (is_empty(data + beg, end - beg)) {
1709
+ in_empty = 1;
1710
+ beg = end;
1711
+ continue;
1712
+ }
1713
+
1714
+ /* calculating the indentation */
1715
+ i = 0;
1716
+ while (i < 4 && beg + i < end && data[beg + i] == ' ')
1717
+ i++;
1718
+
1719
+ pre = i;
1720
+
1721
+ if (rndr->ext_flags & MKDEXT_FENCED_CODE) {
1722
+ if (is_codefence(data + beg + i, end - beg - i, NULL) != 0)
1723
+ in_fence = !in_fence;
1724
+ }
1725
+
1726
+ /* Only check for new list items if we are **not** inside
1727
+ * a fenced code block */
1728
+ if (!in_fence) {
1729
+ has_next_uli = prefix_uli(data + beg + i, end - beg - i);
1730
+ has_next_oli = prefix_oli(data + beg + i, end - beg - i);
1731
+ }
1732
+
1733
+ /* checking for ul/ol switch */
1734
+ if (in_empty && (
1735
+ ((*flags & MKD_LIST_ORDERED) && has_next_uli) ||
1736
+ (!(*flags & MKD_LIST_ORDERED) && has_next_oli))){
1737
+ *flags |= MKD_LI_END;
1738
+ break; /* the following item must have same list type */
1739
+ }
1740
+
1741
+ /* checking for a new item */
1742
+ if ((has_next_uli && !is_hrule(data + beg + i, end - beg - i)) || has_next_oli) {
1743
+ if (in_empty)
1744
+ has_inside_empty = 1;
1745
+
1746
+ if (pre == orgpre) /* the following item must have */
1747
+ break; /* the same indentation */
1748
+
1749
+ if (!sublist)
1750
+ sublist = work->size;
1751
+ }
1752
+ /* joining only indented stuff after empty lines;
1753
+ * note that now we only require 1 space of indentation
1754
+ * to continue a list */
1755
+ else if (in_empty && pre == 0) {
1756
+ *flags |= MKD_LI_END;
1757
+ break;
1758
+ }
1759
+ else if (in_empty) {
1760
+ /* source map */
1761
+ if (item_map && item_map->size) {
1762
+ ((range *)item_map->item[item_map->size - 1])->len += 1;
1763
+ }
1764
+
1765
+ bufputc(work, '\n');
1766
+ has_inside_empty = 1;
1767
+ }
1768
+
1769
+ in_empty = 0;
1770
+
1771
+ /* source map */
1772
+ if (map) {
1773
+ size_t line_cur = src_map_location(map, beg + i);
1774
+ range line_range = { line_cur, end - beg - i };
1775
+ src_map_append(item_map, &line_range);
1776
+ }
1777
+
1778
+ /* adding the line without prefix into the working buffer */
1779
+ bufput(work, data + beg + i, end - beg - i);
1780
+ beg = end;
1781
+ }
1782
+
1783
+ /* render of li contents */
1784
+ if (has_inside_empty)
1785
+ *flags |= MKD_LI_BLOCK;
1786
+
1787
+ if (*flags & MKD_LI_BLOCK) {
1788
+ /* intermediate render of block li */
1789
+ if (sublist && sublist < work->size) {
1790
+ src_map *sublist_map = NULL;
1791
+
1792
+ parse_block(inter, rndr, work->data, sublist, item_map);
1793
+
1794
+ /* source map */
1795
+ if (item_map)
1796
+ sublist_map = src_map_new_tail(item_map, sublist);
1797
+
1798
+ parse_block(inter, rndr, work->data + sublist, work->size - sublist, sublist_map);
1799
+
1800
+ if (sublist_map)
1801
+ src_map_release(sublist_map);
1802
+ }
1803
+ else
1804
+ parse_block(inter, rndr, work->data, work->size, item_map);
1805
+ } else {
1806
+ /* intermediate render of inline li */
1807
+ if (sublist && sublist < work->size) {
1808
+ src_map *sublist_map = NULL;
1809
+
1810
+ parse_inline(inter, rndr, work->data, sublist);
1811
+
1812
+ /* source map */
1813
+ if (item_map)
1814
+ sublist_map = src_map_new_tail(item_map, sublist);
1815
+
1816
+ parse_block(inter, rndr, work->data + sublist, work->size - sublist, sublist_map);
1817
+
1818
+ if (sublist_map)
1819
+ src_map_release(sublist_map);
1820
+ }
1821
+ else
1822
+ parse_inline(inter, rndr, work->data, work->size);
1823
+ }
1824
+
1825
+ /* render of li itself */
1826
+ if (rndr->cb.listitem)
1827
+ rndr->cb.listitem(ob, inter, *flags, rndr->opaque);
1828
+
1829
+ /* source map */
1830
+ if (item_map) {
1831
+ if (rndr->cb.block_did_parse)
1832
+ rndr->cb.block_did_parse(item_map, data + i, size - i, rndr->opaque);
1833
+
1834
+ src_map_release(item_map);
1835
+ }
1836
+
1837
+ rndr_popbuf(rndr, BUFFER_SPAN);
1838
+ rndr_popbuf(rndr, BUFFER_SPAN);
1839
+ return beg;
1840
+ }
1841
+
1842
+
1843
+ /* parse_list • parsing ordered or unordered list block */
1844
+ static size_t
1845
+ parse_list(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int flags, const src_map *map)
1846
+ {
1847
+ struct buf *work = 0;
1848
+ size_t i = 0, j;
1849
+
1850
+ /* AST construction */
1851
+ if (rndr->cb.list_begin)
1852
+ rndr->cb.list_begin(flags, rndr->opaque);
1853
+
1854
+ work = rndr_newbuf(rndr, BUFFER_BLOCK);
1855
+
1856
+ while (i < size) {
1857
+
1858
+ /* source map */
1859
+ src_map *block_map = NULL;
1860
+
1861
+ if (map) {
1862
+ size_t cur = src_map_location(map, i);
1863
+ range actual_range = { cur, size - i };
1864
+ block_map = src_map_new_submap(map, &actual_range);
1865
+ }
1866
+
1867
+ j = parse_listitem(work, rndr, data + i, size - i, &flags, block_map);
1868
+
1869
+ /* source map */
1870
+ if (block_map) {
1871
+ src_map_release(block_map);
1872
+ }
1873
+
1874
+ i += j;
1875
+ if (!j || (flags & MKD_LI_END))
1876
+ break;
1877
+ }
1878
+
1879
+ if (rndr->cb.list)
1880
+ rndr->cb.list(ob, work, flags, rndr->opaque);
1881
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1882
+ return i;
1883
+ }
1884
+
1885
+ /* parse_atxheader • parsing of atx-style headers */
1886
+ static size_t
1887
+ parse_atxheader(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1888
+ {
1889
+ size_t level = 0;
1890
+ size_t i, end, skip;
1891
+
1892
+ while (level < size && level < 6 && data[level] == '#')
1893
+ level++;
1894
+
1895
+ for (i = level; i < size && data[i] == ' '; i++);
1896
+
1897
+ for (end = i; end < size && data[end] != '\n'; end++);
1898
+ skip = end;
1899
+
1900
+ while (end && data[end - 1] == '#')
1901
+ end--;
1902
+
1903
+ while (end && data[end - 1] == ' ')
1904
+ end--;
1905
+
1906
+ if (end > i) {
1907
+ struct buf *work = rndr_newbuf(rndr, BUFFER_SPAN);
1908
+
1909
+ parse_inline(work, rndr, data + i, end - i);
1910
+
1911
+ if (rndr->cb.header)
1912
+ rndr->cb.header(ob, work, (int)level, rndr->opaque);
1913
+
1914
+ rndr_popbuf(rndr, BUFFER_SPAN);
1915
+ }
1916
+
1917
+ return skip;
1918
+ }
1919
+
1920
+
1921
+ /* htmlblock_end • checking end of HTML block : </tag>[ \t]*\n[ \t*]\n */
1922
+ /* returns the length on match, 0 otherwise */
1923
+ static size_t
1924
+ htmlblock_end_tag(
1925
+ const char *tag,
1926
+ size_t tag_len,
1927
+ struct sd_markdown *rndr,
1928
+ uint8_t *data,
1929
+ size_t size)
1930
+ {
1931
+ size_t i, w;
1932
+
1933
+ /* checking if tag is a match */
1934
+ if (tag_len + 3 >= size ||
1935
+ strncasecmp((char *)data + 2, tag, tag_len) != 0 ||
1936
+ data[tag_len + 2] != '>')
1937
+ return 0;
1938
+
1939
+ /* checking white lines */
1940
+ i = tag_len + 3;
1941
+ w = 0;
1942
+ if (i < size && (w = is_empty(data + i, size - i)) == 0)
1943
+ return 0; /* non-blank after tag */
1944
+ i += w;
1945
+ w = 0;
1946
+
1947
+ if (i < size)
1948
+ w = is_empty(data + i, size - i);
1949
+
1950
+ return i + w;
1951
+ }
1952
+
1953
+ static size_t
1954
+ htmlblock_end(const char *curtag,
1955
+ struct sd_markdown *rndr,
1956
+ uint8_t *data,
1957
+ size_t size,
1958
+ int start_of_line)
1959
+ {
1960
+ size_t tag_size = strlen(curtag);
1961
+ size_t i = 1, end_tag;
1962
+ int block_lines = 0;
1963
+
1964
+ while (i < size) {
1965
+ i++;
1966
+ while (i < size && !(data[i - 1] == '<' && data[i] == '/')) {
1967
+ if (data[i] == '\n')
1968
+ block_lines++;
1969
+
1970
+ i++;
1971
+ }
1972
+
1973
+ /* If we are only looking for unindented tags, skip the tag
1974
+ * if it doesn't follow a newline.
1975
+ *
1976
+ * The only exception to this is if the tag is still on the
1977
+ * initial line; in that case it still counts as a closing
1978
+ * tag
1979
+ */
1980
+ if (start_of_line && block_lines > 0 && data[i - 2] != '\n')
1981
+ continue;
1982
+
1983
+ if (i + 2 + tag_size >= size)
1984
+ break;
1985
+
1986
+ end_tag = htmlblock_end_tag(curtag, tag_size, rndr, data + i - 1, size - i + 1);
1987
+ if (end_tag)
1988
+ return i + end_tag - 1;
1989
+ }
1990
+
1991
+ return 0;
1992
+ }
1993
+
1994
+
1995
+ /* parse_htmlblock • parsing of inline HTML block */
1996
+ static size_t
1997
+ parse_htmlblock(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int do_render)
1998
+ {
1999
+ size_t i, j = 0, tag_end;
2000
+ const char *curtag = NULL;
2001
+ struct buf work = { data, 0, 0, 0 };
2002
+
2003
+ /* identification of the opening tag */
2004
+ if (size < 2 || data[0] != '<')
2005
+ return 0;
2006
+
2007
+ i = 1;
2008
+ while (i < size && data[i] != '>' && data[i] != ' ')
2009
+ i++;
2010
+
2011
+ if (i < size)
2012
+ curtag = find_block_tag((char *)data + 1, (int)i - 1);
2013
+
2014
+ /* handling of special cases */
2015
+ if (!curtag) {
2016
+
2017
+ /* HTML comment, laxist form */
2018
+ if (size > 5 && data[1] == '!' && data[2] == '-' && data[3] == '-') {
2019
+ i = 5;
2020
+
2021
+ while (i < size && !(data[i - 2] == '-' && data[i - 1] == '-' && data[i] == '>'))
2022
+ i++;
2023
+
2024
+ i++;
2025
+
2026
+ if (i < size)
2027
+ j = is_empty(data + i, size - i);
2028
+
2029
+ if (j) {
2030
+ work.size = i + j;
2031
+ if (do_render && rndr->cb.blockhtml)
2032
+ rndr->cb.blockhtml(ob, &work, rndr->opaque);
2033
+ return work.size;
2034
+ }
2035
+ }
2036
+
2037
+ /* HR, which is the only self-closing block tag considered */
2038
+ if (size > 4 && (data[1] == 'h' || data[1] == 'H') && (data[2] == 'r' || data[2] == 'R')) {
2039
+ i = 3;
2040
+ while (i < size && data[i] != '>')
2041
+ i++;
2042
+
2043
+ if (i + 1 < size) {
2044
+ i++;
2045
+ j = is_empty(data + i, size - i);
2046
+ if (j) {
2047
+ work.size = i + j;
2048
+ if (do_render && rndr->cb.blockhtml)
2049
+ rndr->cb.blockhtml(ob, &work, rndr->opaque);
2050
+ return work.size;
2051
+ }
2052
+ }
2053
+ }
2054
+
2055
+ /* no special case recognised */
2056
+ return 0;
2057
+ }
2058
+
2059
+ /* looking for an unindented matching closing tag */
2060
+ /* followed by a blank line */
2061
+ tag_end = htmlblock_end(curtag, rndr, data, size, 1);
2062
+
2063
+ /* if not found, trying a second pass looking for indented match */
2064
+ /* but not if tag is "ins" or "del" (following original Markdown.pl) */
2065
+ if (!tag_end && strcmp(curtag, "ins") != 0 && strcmp(curtag, "del") != 0) {
2066
+ tag_end = htmlblock_end(curtag, rndr, data, size, 0);
2067
+ }
2068
+
2069
+ if (!tag_end)
2070
+ return 0;
2071
+
2072
+ /* the end of the block has been found */
2073
+ work.size = tag_end;
2074
+ if (do_render && rndr->cb.blockhtml)
2075
+ rndr->cb.blockhtml(ob, &work, rndr->opaque);
2076
+
2077
+ return tag_end;
2078
+ }
2079
+
2080
+ static void
2081
+ parse_table_row(
2082
+ struct buf *ob,
2083
+ struct sd_markdown *rndr,
2084
+ uint8_t *data,
2085
+ size_t size,
2086
+ size_t columns,
2087
+ int *col_data,
2088
+ int header_flag)
2089
+ {
2090
+ size_t i = 0, col;
2091
+ struct buf *row_work = 0;
2092
+
2093
+ if (!rndr->cb.table_cell || !rndr->cb.table_row)
2094
+ return;
2095
+
2096
+ row_work = rndr_newbuf(rndr, BUFFER_SPAN);
2097
+
2098
+ if (i < size && data[i] == '|')
2099
+ i++;
2100
+
2101
+ for (col = 0; col < columns && i < size; ++col) {
2102
+ size_t cell_start, cell_end;
2103
+ struct buf *cell_work;
2104
+
2105
+ cell_work = rndr_newbuf(rndr, BUFFER_SPAN);
2106
+
2107
+ while (i < size && _isspace(data[i]))
2108
+ i++;
2109
+
2110
+ cell_start = i;
2111
+
2112
+ while (i < size && data[i] != '|')
2113
+ i++;
2114
+
2115
+ cell_end = i - 1;
2116
+
2117
+ while (cell_end > cell_start && _isspace(data[cell_end]))
2118
+ cell_end--;
2119
+
2120
+ parse_inline(cell_work, rndr, data + cell_start, 1 + cell_end - cell_start);
2121
+ rndr->cb.table_cell(row_work, cell_work, col_data[col] | header_flag, rndr->opaque);
2122
+
2123
+ rndr_popbuf(rndr, BUFFER_SPAN);
2124
+ i++;
2125
+ }
2126
+
2127
+ for (; col < columns; ++col) {
2128
+ struct buf empty_cell = { 0, 0, 0, 0 };
2129
+ rndr->cb.table_cell(row_work, &empty_cell, col_data[col] | header_flag, rndr->opaque);
2130
+ }
2131
+
2132
+ rndr->cb.table_row(ob, row_work, rndr->opaque);
2133
+
2134
+ rndr_popbuf(rndr, BUFFER_SPAN);
2135
+ }
2136
+
2137
+ static size_t
2138
+ parse_table_header(
2139
+ struct buf *ob,
2140
+ struct sd_markdown *rndr,
2141
+ uint8_t *data,
2142
+ size_t size,
2143
+ size_t *columns,
2144
+ int **column_data)
2145
+ {
2146
+ int pipes;
2147
+ size_t i = 0, col, header_end, under_end;
2148
+
2149
+ pipes = 0;
2150
+ while (i < size && data[i] != '\n')
2151
+ if (data[i++] == '|')
2152
+ pipes++;
2153
+
2154
+ if (i == size || pipes == 0)
2155
+ return 0;
2156
+
2157
+ header_end = i;
2158
+
2159
+ while (header_end > 0 && _isspace(data[header_end - 1]))
2160
+ header_end--;
2161
+
2162
+ if (data[0] == '|')
2163
+ pipes--;
2164
+
2165
+ if (header_end && data[header_end - 1] == '|')
2166
+ pipes--;
2167
+
2168
+ if (pipes < 0)
2169
+ return 0;
2170
+
2171
+ *columns = pipes + 1;
2172
+ *column_data = calloc(*columns, sizeof(int));
2173
+
2174
+ /* Parse the header underline */
2175
+ i++;
2176
+ if (i < size && data[i] == '|')
2177
+ i++;
2178
+
2179
+ under_end = i;
2180
+ while (under_end < size && data[under_end] != '\n')
2181
+ under_end++;
2182
+
2183
+ for (col = 0; col < *columns && i < under_end; ++col) {
2184
+ size_t dashes = 0;
2185
+
2186
+ while (i < under_end && data[i] == ' ')
2187
+ i++;
2188
+
2189
+ if (data[i] == ':') {
2190
+ i++; (*column_data)[col] |= MKD_TABLE_ALIGN_L;
2191
+ dashes++;
2192
+ }
2193
+
2194
+ while (i < under_end && data[i] == '-') {
2195
+ i++; dashes++;
2196
+ }
2197
+
2198
+ if (i < under_end && data[i] == ':') {
2199
+ i++; (*column_data)[col] |= MKD_TABLE_ALIGN_R;
2200
+ dashes++;
2201
+ }
2202
+
2203
+ while (i < under_end && data[i] == ' ')
2204
+ i++;
2205
+
2206
+ if (i < under_end && data[i] != '|')
2207
+ break;
2208
+
2209
+ if (dashes < 3)
2210
+ break;
2211
+
2212
+ i++;
2213
+ }
2214
+
2215
+ if (col < *columns)
2216
+ return 0;
2217
+
2218
+ parse_table_row(
2219
+ ob, rndr, data,
2220
+ header_end,
2221
+ *columns,
2222
+ *column_data,
2223
+ MKD_TABLE_HEADER
2224
+ );
2225
+
2226
+ return under_end + 1;
2227
+ }
2228
+
2229
+ static size_t
2230
+ parse_table(
2231
+ struct buf *ob,
2232
+ struct sd_markdown *rndr,
2233
+ uint8_t *data,
2234
+ size_t size)
2235
+ {
2236
+ size_t i;
2237
+
2238
+ struct buf *header_work = 0;
2239
+ struct buf *body_work = 0;
2240
+
2241
+ size_t columns;
2242
+ int *col_data = NULL;
2243
+
2244
+ header_work = rndr_newbuf(rndr, BUFFER_SPAN);
2245
+ body_work = rndr_newbuf(rndr, BUFFER_BLOCK);
2246
+
2247
+ i = parse_table_header(header_work, rndr, data, size, &columns, &col_data);
2248
+ if (i > 0) {
2249
+
2250
+ while (i < size) {
2251
+ size_t row_start;
2252
+ int pipes = 0;
2253
+
2254
+ row_start = i;
2255
+
2256
+ while (i < size && data[i] != '\n')
2257
+ if (data[i++] == '|')
2258
+ pipes++;
2259
+
2260
+ if (pipes == 0 || i == size) {
2261
+ i = row_start;
2262
+ break;
2263
+ }
2264
+
2265
+ parse_table_row(
2266
+ body_work,
2267
+ rndr,
2268
+ data + row_start,
2269
+ i - row_start,
2270
+ columns,
2271
+ col_data, 0
2272
+ );
2273
+
2274
+ i++;
2275
+ }
2276
+
2277
+ if (rndr->cb.table)
2278
+ rndr->cb.table(ob, header_work, body_work, rndr->opaque);
2279
+ }
2280
+
2281
+ free(col_data);
2282
+ rndr_popbuf(rndr, BUFFER_SPAN);
2283
+ rndr_popbuf(rndr, BUFFER_BLOCK);
2284
+ return i;
2285
+ }
2286
+
2287
+ /* parse_block • parsing of one block, returning next uint8_t to parse */
2288
+ static void
2289
+ parse_block(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, const src_map *map)
2290
+ {
2291
+ size_t beg, end, i, block_beg;
2292
+ uint8_t *txt_data;
2293
+ beg = 0;
2294
+
2295
+ if (rndr->work_bufs[BUFFER_SPAN].size +
2296
+ rndr->work_bufs[BUFFER_BLOCK].size > rndr->max_nesting)
2297
+ return;
2298
+
2299
+ while (beg < size) {
2300
+ size_t cur = 0;
2301
+ src_map *block_map = NULL;
2302
+
2303
+ block_beg = beg;
2304
+ txt_data = data + beg;
2305
+ end = size - beg;
2306
+
2307
+ /* source map */
2308
+ if (map) {
2309
+ range actual_range;
2310
+
2311
+ cur = src_map_location(map, beg);
2312
+ actual_range.loc = cur;
2313
+ actual_range.len = end;
2314
+
2315
+ block_map = src_map_new_submap(map, &actual_range);
2316
+ }
2317
+
2318
+ if (is_atxheader(rndr, txt_data, end))
2319
+ beg += parse_atxheader(ob, rndr, txt_data, end);
2320
+
2321
+ else if (data[beg] == '<' && rndr->cb.blockhtml &&
2322
+ (i = parse_htmlblock(ob, rndr, txt_data, end, 1)) != 0)
2323
+ beg += i;
2324
+
2325
+ else if ((i = is_empty(txt_data, end)) != 0) {
2326
+ beg += i;
2327
+ }
2328
+
2329
+ else if (is_hrule(txt_data, end)) {
2330
+ if (rndr->cb.hrule)
2331
+ rndr->cb.hrule(ob, rndr->opaque);
2332
+
2333
+ while (beg < size && data[beg] != '\n')
2334
+ beg++;
2335
+
2336
+ beg++;
2337
+ }
2338
+
2339
+ else if ((rndr->ext_flags & MKDEXT_FENCED_CODE) != 0 &&
2340
+ (i = parse_fencedcode(ob, rndr, txt_data, end)) != 0)
2341
+ beg += i;
2342
+
2343
+ else if ((rndr->ext_flags & MKDEXT_TABLES) != 0 &&
2344
+ (i = parse_table(ob, rndr, txt_data, end)) != 0)
2345
+ beg += i;
2346
+
2347
+ else if (prefix_quote(txt_data, end))
2348
+ beg += parse_blockquote(ob, rndr, txt_data, end, block_map);
2349
+
2350
+ else if (prefix_code(txt_data, end))
2351
+ beg += parse_blockcode(ob, rndr, txt_data, end);
2352
+
2353
+ else if (prefix_uli(txt_data, end))
2354
+ beg += parse_list(ob, rndr, txt_data, end, 0, block_map);
2355
+
2356
+ else if (prefix_oli(txt_data, end))
2357
+ beg += parse_list(ob, rndr, txt_data, end, MKD_LIST_ORDERED, block_map);
2358
+
2359
+ else
2360
+ beg += parse_paragraph(ob, rndr, txt_data, end);
2361
+
2362
+ /* source map */
2363
+ if (block_map) {
2364
+ if (rndr->cb.block_did_parse) {
2365
+ range parse_range = { cur, beg - block_beg };
2366
+ src_map *parse_map = src_map_new_submap(block_map, &parse_range);
2367
+
2368
+ rndr->cb.block_did_parse(parse_map, txt_data, beg - block_beg, rndr->opaque);
2369
+
2370
+ src_map_release(parse_map);
2371
+ }
2372
+ src_map_release(block_map);
2373
+ }
2374
+ }
2375
+ }
2376
+
2377
+ /*********************
2378
+ * REFERENCE PARSING *
2379
+ *********************/
2380
+
2381
+ /* is_ref • returns whether a line is a reference or not */
2382
+ static int
2383
+ is_ref(const uint8_t *data, size_t beg, size_t end, size_t *last, struct link_ref **refs)
2384
+ {
2385
+ /* int n; */
2386
+ size_t i = 0;
2387
+ size_t id_offset, id_end;
2388
+ size_t link_offset, link_end;
2389
+ size_t title_offset, title_end;
2390
+ size_t line_end;
2391
+
2392
+ /* up to 3 optional leading spaces */
2393
+ if (beg + 3 >= end) return 0;
2394
+ if (data[beg] == ' ') { i = 1;
2395
+ if (data[beg + 1] == ' ') { i = 2;
2396
+ if (data[beg + 2] == ' ') { i = 3;
2397
+ if (data[beg + 3] == ' ') return 0; } } }
2398
+ i += beg;
2399
+
2400
+ /* id part: anything but a newline between brackets */
2401
+ if (data[i] != '[') return 0;
2402
+ i++;
2403
+ id_offset = i;
2404
+ while (i < end && data[i] != '\n' && data[i] != '\r' && data[i] != ']')
2405
+ i++;
2406
+ if (i >= end || data[i] != ']') return 0;
2407
+ id_end = i;
2408
+
2409
+ /* spacer: colon (space | tab)* newline? (space | tab)* */
2410
+ i++;
2411
+ if (i >= end || data[i] != ':') return 0;
2412
+ i++;
2413
+ while (i < end && data[i] == ' ') i++;
2414
+ if (i < end && (data[i] == '\n' || data[i] == '\r')) {
2415
+ i++;
2416
+ if (i < end && data[i] == '\r' && data[i - 1] == '\n') i++; }
2417
+ while (i < end && data[i] == ' ') i++;
2418
+ if (i >= end) return 0;
2419
+
2420
+ /* link: whitespace-free sequence, optionally between angle brackets */
2421
+ if (data[i] == '<')
2422
+ i++;
2423
+
2424
+ link_offset = i;
2425
+
2426
+ while (i < end && data[i] != ' ' && data[i] != '\n' && data[i] != '\r')
2427
+ i++;
2428
+
2429
+ if (data[i - 1] == '>') link_end = i - 1;
2430
+ else link_end = i;
2431
+
2432
+ /* optional spacer: (space | tab)* (newline | '\'' | '"' | '(' ) */
2433
+ while (i < end && data[i] == ' ') i++;
2434
+ if (i < end && data[i] != '\n' && data[i] != '\r'
2435
+ && data[i] != '\'' && data[i] != '"' && data[i] != '(')
2436
+ return 0;
2437
+ line_end = 0;
2438
+ /* computing end-of-line */
2439
+ if (i >= end || data[i] == '\r' || data[i] == '\n') line_end = i;
2440
+ if (i + 1 < end && data[i] == '\n' && data[i + 1] == '\r')
2441
+ line_end = i + 1;
2442
+
2443
+ /* optional (space|tab)* spacer after a newline */
2444
+ if (line_end) {
2445
+ i = line_end + 1;
2446
+ while (i < end && data[i] == ' ') i++; }
2447
+
2448
+ /* optional title: any non-newline sequence enclosed in '"()
2449
+ alone on its line */
2450
+ title_offset = title_end = 0;
2451
+ if (i + 1 < end
2452
+ && (data[i] == '\'' || data[i] == '"' || data[i] == '(')) {
2453
+ i++;
2454
+ title_offset = i;
2455
+ /* looking for EOL */
2456
+ while (i < end && data[i] != '\n' && data[i] != '\r') i++;
2457
+ if (i + 1 < end && data[i] == '\n' && data[i + 1] == '\r')
2458
+ title_end = i + 1;
2459
+ else title_end = i;
2460
+ /* stepping back */
2461
+ i -= 1;
2462
+ while (i > title_offset && data[i] == ' ')
2463
+ i -= 1;
2464
+ if (i > title_offset
2465
+ && (data[i] == '\'' || data[i] == '"' || data[i] == ')')) {
2466
+ line_end = title_end;
2467
+ title_end = i; } }
2468
+
2469
+ if (!line_end || link_end == link_offset)
2470
+ return 0; /* garbage after the link empty link */
2471
+
2472
+ /* a valid ref has been found, filling-in return structures */
2473
+ if (last)
2474
+ *last = line_end;
2475
+
2476
+ if (refs) {
2477
+ struct link_ref *ref;
2478
+
2479
+ ref = add_link_ref(refs, data + id_offset, id_end - id_offset);
2480
+ if (!ref)
2481
+ return 0;
2482
+
2483
+ ref->link = bufnew(link_end - link_offset);
2484
+ bufput(ref->link, data + link_offset, link_end - link_offset);
2485
+
2486
+ if (title_end > title_offset) {
2487
+ ref->title = bufnew(title_end - title_offset);
2488
+ bufput(ref->title, data + title_offset, title_end - title_offset);
2489
+ }
2490
+ }
2491
+
2492
+ return 1;
2493
+ }
2494
+
2495
+ static void expand_tabs(struct buf *ob, const uint8_t *line, size_t size)
2496
+ {
2497
+ size_t i = 0, tab = 0;
2498
+
2499
+ while (i < size) {
2500
+ size_t org = i;
2501
+
2502
+ while (i < size && line[i] != '\t') {
2503
+ i++; tab++;
2504
+ }
2505
+
2506
+ if (i > org)
2507
+ bufput(ob, line + org, i - org);
2508
+
2509
+ if (i >= size)
2510
+ break;
2511
+
2512
+ do {
2513
+ bufputc(ob, ' '); tab++;
2514
+ } while (tab % 4);
2515
+
2516
+ i++;
2517
+ }
2518
+ }
2519
+
2520
+ /**********************
2521
+ * EXPORTED FUNCTIONS *
2522
+ **********************/
2523
+
2524
+ struct sd_markdown *
2525
+ sd_markdown_new(
2526
+ unsigned int extensions,
2527
+ size_t max_nesting,
2528
+ const struct sd_callbacks *callbacks,
2529
+ void *opaque)
2530
+ {
2531
+ struct sd_markdown *md = NULL;
2532
+
2533
+ assert(max_nesting > 0 && callbacks);
2534
+
2535
+ md = malloc(sizeof(struct sd_markdown));
2536
+ if (!md)
2537
+ return NULL;
2538
+
2539
+ memcpy(&md->cb, callbacks, sizeof(struct sd_callbacks));
2540
+
2541
+ stack_init(&md->work_bufs[BUFFER_BLOCK], 4);
2542
+ stack_init(&md->work_bufs[BUFFER_SPAN], 8);
2543
+
2544
+ memset(md->active_char, 0x0, 256);
2545
+
2546
+ if (md->cb.emphasis || md->cb.double_emphasis || md->cb.triple_emphasis) {
2547
+ md->active_char['*'] = MD_CHAR_EMPHASIS;
2548
+ md->active_char['_'] = MD_CHAR_EMPHASIS;
2549
+ if (extensions & MKDEXT_STRIKETHROUGH)
2550
+ md->active_char['~'] = MD_CHAR_EMPHASIS;
2551
+ }
2552
+
2553
+ if (md->cb.codespan)
2554
+ md->active_char['`'] = MD_CHAR_CODESPAN;
2555
+
2556
+ if (md->cb.linebreak)
2557
+ md->active_char['\n'] = MD_CHAR_LINEBREAK;
2558
+
2559
+ if (md->cb.image || md->cb.link)
2560
+ md->active_char['['] = MD_CHAR_LINK;
2561
+
2562
+ md->active_char['<'] = MD_CHAR_LANGLE;
2563
+ md->active_char['\\'] = MD_CHAR_ESCAPE;
2564
+ md->active_char['&'] = MD_CHAR_ENTITITY;
2565
+
2566
+ if (extensions & MKDEXT_AUTOLINK) {
2567
+ md->active_char[':'] = MD_CHAR_AUTOLINK_URL;
2568
+ md->active_char['@'] = MD_CHAR_AUTOLINK_EMAIL;
2569
+ md->active_char['w'] = MD_CHAR_AUTOLINK_WWW;
2570
+ }
2571
+
2572
+ if (extensions & MKDEXT_SUPERSCRIPT)
2573
+ md->active_char['^'] = MD_CHAR_SUPERSCRIPT;
2574
+
2575
+ /* Extension data */
2576
+ md->ext_flags = extensions;
2577
+ md->opaque = opaque;
2578
+ md->max_nesting = max_nesting;
2579
+ md->in_link_body = 0;
2580
+
2581
+ return md;
2582
+ }
2583
+
2584
+ void
2585
+ sd_markdown_render(struct buf *ob, const uint8_t *document, size_t doc_size, struct sd_markdown *md)
2586
+ {
2587
+ #define MARKDOWN_GROW(x) ((x) + ((x) >> 1))
2588
+ static const char UTF8_BOM[] = {0xEF, 0xBB, 0xBF};
2589
+
2590
+ struct buf *text;
2591
+ size_t beg, end;
2592
+ src_map *map;
2593
+
2594
+ /* source map */
2595
+ if (md->cb.block_did_parse)
2596
+ map = src_map_new();
2597
+ else
2598
+ map = NULL;
2599
+
2600
+ text = bufnew(64);
2601
+ if (!text)
2602
+ return;
2603
+
2604
+ /* Preallocate enough space for our buffer to avoid expanding while copying */
2605
+ bufgrow(text, doc_size);
2606
+
2607
+ /* reset the references table */
2608
+ memset(&md->refs, 0x0, REF_TABLE_SIZE * sizeof(void *));
2609
+
2610
+ /* first pass: looking for references, copying everything else */
2611
+ beg = 0;
2612
+
2613
+ /* Skip a possible UTF-8 BOM, even though the Unicode standard
2614
+ * discourages having these in UTF-8 documents */
2615
+ if (doc_size >= 3 && memcmp(document, UTF8_BOM, 3) == 0)
2616
+ beg += 3;
2617
+
2618
+ while (beg < doc_size) /* iterating over lines */
2619
+ if (is_ref(document, beg, doc_size, &end, md->refs))
2620
+ beg = end;
2621
+ else { /* skipping to the next line */
2622
+ end = beg;
2623
+ while (end < doc_size && document[end] != '\n' && document[end] != '\r')
2624
+ end++;
2625
+
2626
+ /* adding the line body if present */
2627
+ if (end > beg)
2628
+ expand_tabs(text, document + beg, end - beg);
2629
+
2630
+ while (end < doc_size && (document[end] == '\n' || document[end] == '\r')) {
2631
+ /* add one \n per newline */
2632
+ if (document[end] == '\n' || (end + 1 < doc_size && document[end + 1] != '\n'))
2633
+ bufputc(text, '\n');
2634
+ end++;
2635
+ }
2636
+
2637
+ beg = end;
2638
+ }
2639
+
2640
+ /* pre-grow the output buffer to minimize allocations */
2641
+ bufgrow(ob, MARKDOWN_GROW(text->size));
2642
+
2643
+ /* second pass: actual rendering */
2644
+ if (md->cb.doc_header)
2645
+ md->cb.doc_header(ob, md->opaque);
2646
+
2647
+ if (text->size) {
2648
+
2649
+ /* adding a final newline if not already present */
2650
+ if (text->data[text->size - 1] != '\n' && text->data[text->size - 1] != '\r')
2651
+ bufputc(text, '\n');
2652
+
2653
+ /* source map */
2654
+ if (map) {
2655
+ range rng = {0, text->size};
2656
+ src_map_append(map, &rng);
2657
+ }
2658
+
2659
+ parse_block(ob, md, text->data, text->size, map);
2660
+
2661
+ /* source map */
2662
+ src_map_release(map);
2663
+ }
2664
+
2665
+ if (md->cb.doc_footer)
2666
+ md->cb.doc_footer(ob, md->opaque);
2667
+
2668
+ /* clean-up */
2669
+ bufrelease(text);
2670
+ free_link_refs(md->refs);
2671
+
2672
+ assert(md->work_bufs[BUFFER_SPAN].size == 0);
2673
+ assert(md->work_bufs[BUFFER_BLOCK].size == 0);
2674
+ }
2675
+
2676
+ void
2677
+ sd_markdown_free(struct sd_markdown *md)
2678
+ {
2679
+ size_t i;
2680
+
2681
+ for (i = 0; i < (size_t)md->work_bufs[BUFFER_SPAN].asize; ++i)
2682
+ bufrelease(md->work_bufs[BUFFER_SPAN].item[i]);
2683
+
2684
+ for (i = 0; i < (size_t)md->work_bufs[BUFFER_BLOCK].asize; ++i)
2685
+ bufrelease(md->work_bufs[BUFFER_BLOCK].item[i]);
2686
+
2687
+ stack_free(&md->work_bufs[BUFFER_SPAN]);
2688
+ stack_free(&md->work_bufs[BUFFER_BLOCK]);
2689
+
2690
+ free(md);
2691
+ }
2692
+
2693
+ void
2694
+ sd_version(int *ver_major, int *ver_minor, int *ver_revision)
2695
+ {
2696
+ *ver_major = SUNDOWN_VER_MAJOR;
2697
+ *ver_minor = SUNDOWN_VER_MINOR;
2698
+ *ver_revision = SUNDOWN_VER_REVISION;
2699
+ }
2700
+
2701
+ /* vim: set filetype=c: */