redsnow 0.0.8

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (174) hide show
  1. checksums.yaml +7 -0
  2. data/.gitignore +34 -0
  3. data/.gitmodules +3 -0
  4. data/.travis.yml +20 -0
  5. data/CHANGELOG.md +4 -0
  6. data/Gemfile +4 -0
  7. data/LICENSE +21 -0
  8. data/README.md +62 -0
  9. data/Rakefile +36 -0
  10. data/Vagrantfile +20 -0
  11. data/ext/snowcrash/Makefile +64 -0
  12. data/ext/snowcrash/Vagrantfile +20 -0
  13. data/ext/snowcrash/bin/snowcrash +0 -0
  14. data/ext/snowcrash/common.gypi +163 -0
  15. data/ext/snowcrash/config.gypi +10 -0
  16. data/ext/snowcrash/config.mk +5 -0
  17. data/ext/snowcrash/configure +213 -0
  18. data/ext/snowcrash/provisioning.sh +15 -0
  19. data/ext/snowcrash/snowcrash.gyp +141 -0
  20. data/ext/snowcrash/src/ActionParser.h +503 -0
  21. data/ext/snowcrash/src/AssetParser.h +215 -0
  22. data/ext/snowcrash/src/BlockUtility.h +186 -0
  23. data/ext/snowcrash/src/Blueprint.h +283 -0
  24. data/ext/snowcrash/src/BlueprintParser.h +347 -0
  25. data/ext/snowcrash/src/BlueprintParserCore.h +190 -0
  26. data/ext/snowcrash/src/BlueprintSection.h +140 -0
  27. data/ext/snowcrash/src/BlueprintUtility.h +126 -0
  28. data/ext/snowcrash/src/CBlueprint.cc +600 -0
  29. data/ext/snowcrash/src/CBlueprint.h +354 -0
  30. data/ext/snowcrash/src/CSourceAnnotation.cc +140 -0
  31. data/ext/snowcrash/src/CSourceAnnotation.h +106 -0
  32. data/ext/snowcrash/src/CodeBlockUtility.h +189 -0
  33. data/ext/snowcrash/src/DescriptionSectionUtility.h +156 -0
  34. data/ext/snowcrash/src/HTTP.cc +46 -0
  35. data/ext/snowcrash/src/HTTP.h +105 -0
  36. data/ext/snowcrash/src/HeaderParser.h +289 -0
  37. data/ext/snowcrash/src/ListBlockUtility.h +273 -0
  38. data/ext/snowcrash/src/ListUtility.h +95 -0
  39. data/ext/snowcrash/src/MarkdownBlock.cc +176 -0
  40. data/ext/snowcrash/src/MarkdownBlock.h +93 -0
  41. data/ext/snowcrash/src/MarkdownParser.cc +266 -0
  42. data/ext/snowcrash/src/MarkdownParser.h +88 -0
  43. data/ext/snowcrash/src/ParameterDefinitonParser.h +570 -0
  44. data/ext/snowcrash/src/ParametersParser.h +252 -0
  45. data/ext/snowcrash/src/Parser.cc +71 -0
  46. data/ext/snowcrash/src/Parser.h +29 -0
  47. data/ext/snowcrash/src/ParserCore.cc +120 -0
  48. data/ext/snowcrash/src/ParserCore.h +82 -0
  49. data/ext/snowcrash/src/PayloadParser.h +672 -0
  50. data/ext/snowcrash/src/Platform.h +54 -0
  51. data/ext/snowcrash/src/RegexMatch.h +32 -0
  52. data/ext/snowcrash/src/ResourceGroupParser.h +195 -0
  53. data/ext/snowcrash/src/ResourceParser.h +584 -0
  54. data/ext/snowcrash/src/SectionUtility.h +142 -0
  55. data/ext/snowcrash/src/Serialize.cc +52 -0
  56. data/ext/snowcrash/src/Serialize.h +69 -0
  57. data/ext/snowcrash/src/SerializeJSON.cc +601 -0
  58. data/ext/snowcrash/src/SerializeJSON.h +21 -0
  59. data/ext/snowcrash/src/SerializeYAML.cc +336 -0
  60. data/ext/snowcrash/src/SerializeYAML.h +21 -0
  61. data/ext/snowcrash/src/SourceAnnotation.h +177 -0
  62. data/ext/snowcrash/src/StringUtility.h +109 -0
  63. data/ext/snowcrash/src/SymbolTable.h +83 -0
  64. data/ext/snowcrash/src/UriTemplateParser.cc +195 -0
  65. data/ext/snowcrash/src/UriTemplateParser.h +243 -0
  66. data/ext/snowcrash/src/Version.h +39 -0
  67. data/ext/snowcrash/src/csnowcrash.cc +23 -0
  68. data/ext/snowcrash/src/csnowcrash.h +38 -0
  69. data/ext/snowcrash/src/posix/RegexMatch.cc +99 -0
  70. data/ext/snowcrash/src/snowcrash.cc +18 -0
  71. data/ext/snowcrash/src/snowcrash.h +41 -0
  72. data/ext/snowcrash/src/snowcrash/snowcrash.cc +170 -0
  73. data/ext/snowcrash/src/win/RegexMatch.cc +78 -0
  74. data/ext/snowcrash/sundown/CONTRIBUTING.md +10 -0
  75. data/ext/snowcrash/sundown/Makefile +83 -0
  76. data/ext/snowcrash/sundown/Makefile.win +33 -0
  77. data/ext/snowcrash/sundown/examples/smartypants.c +72 -0
  78. data/ext/snowcrash/sundown/examples/sundown.c +80 -0
  79. data/ext/snowcrash/sundown/html/houdini.h +37 -0
  80. data/ext/snowcrash/sundown/html/houdini_href_e.c +108 -0
  81. data/ext/snowcrash/sundown/html/houdini_html_e.c +84 -0
  82. data/ext/snowcrash/sundown/html/html.c +647 -0
  83. data/ext/snowcrash/sundown/html/html.h +77 -0
  84. data/ext/snowcrash/sundown/html/html_smartypants.c +389 -0
  85. data/ext/snowcrash/sundown/html_block_names.txt +25 -0
  86. data/ext/snowcrash/sundown/src/autolink.c +297 -0
  87. data/ext/snowcrash/sundown/src/autolink.h +51 -0
  88. data/ext/snowcrash/sundown/src/buffer.c +225 -0
  89. data/ext/snowcrash/sundown/src/buffer.h +96 -0
  90. data/ext/snowcrash/sundown/src/html_blocks.h +206 -0
  91. data/ext/snowcrash/sundown/src/markdown.c +2701 -0
  92. data/ext/snowcrash/sundown/src/markdown.h +147 -0
  93. data/ext/snowcrash/sundown/src/src_map.c +200 -0
  94. data/ext/snowcrash/sundown/src/src_map.h +58 -0
  95. data/ext/snowcrash/sundown/src/stack.c +81 -0
  96. data/ext/snowcrash/sundown/src/stack.h +29 -0
  97. data/ext/snowcrash/sundown/sundown.def +20 -0
  98. data/ext/snowcrash/tools/gyp/AUTHORS +11 -0
  99. data/ext/snowcrash/tools/gyp/DEPS +24 -0
  100. data/ext/snowcrash/tools/gyp/OWNERS +1 -0
  101. data/ext/snowcrash/tools/gyp/PRESUBMIT.py +120 -0
  102. data/ext/snowcrash/tools/gyp/buildbot/buildbot_run.py +190 -0
  103. data/ext/snowcrash/tools/gyp/codereview.settings +10 -0
  104. data/ext/snowcrash/tools/gyp/data/win/large-pdb-shim.cc +12 -0
  105. data/ext/snowcrash/tools/gyp/gyp +8 -0
  106. data/ext/snowcrash/tools/gyp/gyp.bat +5 -0
  107. data/ext/snowcrash/tools/gyp/gyp_main.py +18 -0
  108. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSNew.py +340 -0
  109. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSProject.py +208 -0
  110. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSSettings.py +1063 -0
  111. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSToolFile.py +58 -0
  112. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSUserFile.py +147 -0
  113. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSUtil.py +267 -0
  114. data/ext/snowcrash/tools/gyp/pylib/gyp/MSVSVersion.py +409 -0
  115. data/ext/snowcrash/tools/gyp/pylib/gyp/__init__.py +537 -0
  116. data/ext/snowcrash/tools/gyp/pylib/gyp/__init__.pyc +0 -0
  117. data/ext/snowcrash/tools/gyp/pylib/gyp/common.py +521 -0
  118. data/ext/snowcrash/tools/gyp/pylib/gyp/common.pyc +0 -0
  119. data/ext/snowcrash/tools/gyp/pylib/gyp/easy_xml.py +157 -0
  120. data/ext/snowcrash/tools/gyp/pylib/gyp/flock_tool.py +49 -0
  121. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/__init__.py +0 -0
  122. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/__init__.pyc +0 -0
  123. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/android.py +1069 -0
  124. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/cmake.py +1143 -0
  125. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/dump_dependency_json.py +81 -0
  126. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/eclipse.py +335 -0
  127. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/gypd.py +87 -0
  128. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/gypsh.py +56 -0
  129. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/make.py +2181 -0
  130. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/make.pyc +0 -0
  131. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/msvs.py +3335 -0
  132. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/ninja.py +2156 -0
  133. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/xcode.py +1224 -0
  134. data/ext/snowcrash/tools/gyp/pylib/gyp/generator/xcode.pyc +0 -0
  135. data/ext/snowcrash/tools/gyp/pylib/gyp/input.py +2809 -0
  136. data/ext/snowcrash/tools/gyp/pylib/gyp/input.pyc +0 -0
  137. data/ext/snowcrash/tools/gyp/pylib/gyp/mac_tool.py +510 -0
  138. data/ext/snowcrash/tools/gyp/pylib/gyp/msvs_emulation.py +972 -0
  139. data/ext/snowcrash/tools/gyp/pylib/gyp/ninja_syntax.py +160 -0
  140. data/ext/snowcrash/tools/gyp/pylib/gyp/ordered_dict.py +289 -0
  141. data/ext/snowcrash/tools/gyp/pylib/gyp/win_tool.py +292 -0
  142. data/ext/snowcrash/tools/gyp/pylib/gyp/xcode_emulation.py +1440 -0
  143. data/ext/snowcrash/tools/gyp/pylib/gyp/xcode_emulation.pyc +0 -0
  144. data/ext/snowcrash/tools/gyp/pylib/gyp/xcodeproj_file.py +2889 -0
  145. data/ext/snowcrash/tools/gyp/pylib/gyp/xcodeproj_file.pyc +0 -0
  146. data/ext/snowcrash/tools/gyp/pylib/gyp/xml_fix.py +69 -0
  147. data/ext/snowcrash/tools/gyp/pylintrc +307 -0
  148. data/ext/snowcrash/tools/gyp/samples/samples +81 -0
  149. data/ext/snowcrash/tools/gyp/samples/samples.bat +5 -0
  150. data/ext/snowcrash/tools/gyp/setup.py +19 -0
  151. data/ext/snowcrash/tools/gyp/tools/Xcode/Specifications/gyp.pbfilespec +27 -0
  152. data/ext/snowcrash/tools/gyp/tools/Xcode/Specifications/gyp.xclangspec +226 -0
  153. data/ext/snowcrash/tools/gyp/tools/emacs/gyp.el +252 -0
  154. data/ext/snowcrash/tools/gyp/tools/graphviz.py +100 -0
  155. data/ext/snowcrash/tools/gyp/tools/pretty_gyp.py +155 -0
  156. data/ext/snowcrash/tools/gyp/tools/pretty_sln.py +168 -0
  157. data/ext/snowcrash/tools/gyp/tools/pretty_vcproj.py +329 -0
  158. data/ext/snowcrash/tools/homebrew/snowcrash.rb +11 -0
  159. data/ext/snowcrash/vcbuild.bat +184 -0
  160. data/lib/redsnow.rb +31 -0
  161. data/lib/redsnow/binding.rb +132 -0
  162. data/lib/redsnow/blueprint.rb +365 -0
  163. data/lib/redsnow/object.rb +18 -0
  164. data/lib/redsnow/parseresult.rb +107 -0
  165. data/lib/redsnow/version.rb +4 -0
  166. data/provisioning.sh +20 -0
  167. data/redsnow.gemspec +35 -0
  168. data/test/_helper.rb +15 -0
  169. data/test/fixtures/sample-api-ast.json +97 -0
  170. data/test/fixtures/sample-api.apib +20 -0
  171. data/test/redsnow_binding_test.rb +35 -0
  172. data/test/redsnow_parseresult_test.rb +50 -0
  173. data/test/redsnow_test.rb +285 -0
  174. metadata +358 -0
@@ -0,0 +1,96 @@
1
+ /*
2
+ * Copyright (c) 2008, Natacha Porté
3
+ * Copyright (c) 2011, Vicent Martí
4
+ *
5
+ * Permission to use, copy, modify, and distribute this software for any
6
+ * purpose with or without fee is hereby granted, provided that the above
7
+ * copyright notice and this permission notice appear in all copies.
8
+ *
9
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
10
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
11
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
12
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
13
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
14
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
15
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
16
+ */
17
+
18
+ #ifndef BUFFER_H__
19
+ #define BUFFER_H__
20
+
21
+ #include <stddef.h>
22
+ #include <stdarg.h>
23
+ #include <stdint.h>
24
+
25
+ #ifdef __cplusplus
26
+ extern "C" {
27
+ #endif
28
+
29
+ #if defined(_MSC_VER)
30
+ #define __attribute__(x)
31
+ #define inline
32
+ #endif
33
+
34
+ typedef enum {
35
+ BUF_OK = 0,
36
+ BUF_ENOMEM = -1
37
+ } buferror_t;
38
+
39
+ /* struct buf: character array buffer */
40
+ struct buf {
41
+ uint8_t *data; /* actual character data */
42
+ size_t size; /* size of the string */
43
+ size_t asize; /* allocated size (0 = volatile buffer) */
44
+ size_t unit; /* reallocation unit size (0 = read-only buffer) */
45
+ };
46
+
47
+ /* CONST_BUF: global buffer from a string litteral */
48
+ #define BUF_STATIC(string) \
49
+ { (uint8_t *)string, sizeof string -1, sizeof string, 0, 0 }
50
+
51
+ /* VOLATILE_BUF: macro for creating a volatile buffer on the stack */
52
+ #define BUF_VOLATILE(strname) \
53
+ { (uint8_t *)strname, strlen(strname), 0, 0, 0 }
54
+
55
+ /* BUFPUTSL: optimized bufputs of a string litteral */
56
+ #define BUFPUTSL(output, literal) \
57
+ bufput(output, literal, sizeof literal - 1)
58
+
59
+ /* bufgrow: increasing the allocated size to the given value */
60
+ int bufgrow(struct buf *, size_t);
61
+
62
+ /* bufnew: allocation of a new buffer */
63
+ struct buf *bufnew(size_t) __attribute__ ((malloc));
64
+
65
+ /* bufnullterm: NUL-termination of the string array (making a C-string) */
66
+ const char *bufcstr(struct buf *);
67
+
68
+ /* bufprefix: compare the beginning of a buffer with a string */
69
+ int bufprefix(const struct buf *buf, const char *prefix);
70
+
71
+ /* bufput: appends raw data to a buffer */
72
+ void bufput(struct buf *, const void *, size_t);
73
+
74
+ /* bufputs: appends a NUL-terminated string to a buffer */
75
+ void bufputs(struct buf *, const char *);
76
+
77
+ /* bufputc: appends a single char to a buffer */
78
+ void bufputc(struct buf *, int);
79
+
80
+ /* bufrelease: decrease the reference count and free the buffer if needed */
81
+ void bufrelease(struct buf *);
82
+
83
+ /* bufreset: frees internal data of the buffer */
84
+ void bufreset(struct buf *);
85
+
86
+ /* bufslurp: removes a given number of bytes from the head of the array */
87
+ void bufslurp(struct buf *, size_t);
88
+
89
+ /* bufprintf: formatted printing to a buffer */
90
+ void bufprintf(struct buf *, const char *, ...) __attribute__ ((format (printf, 2, 3)));
91
+
92
+ #ifdef __cplusplus
93
+ }
94
+ #endif
95
+
96
+ #endif
@@ -0,0 +1,206 @@
1
+ /* C code produced by gperf version 3.0.3 */
2
+ /* Command-line: gperf -N find_block_tag -H hash_block_tag -C -c -E --ignore-case html_block_names.txt */
3
+ /* Computed positions: -k'1-2' */
4
+
5
+ #if !((' ' == 32) && ('!' == 33) && ('"' == 34) && ('#' == 35) \
6
+ && ('%' == 37) && ('&' == 38) && ('\'' == 39) && ('(' == 40) \
7
+ && (')' == 41) && ('*' == 42) && ('+' == 43) && (',' == 44) \
8
+ && ('-' == 45) && ('.' == 46) && ('/' == 47) && ('0' == 48) \
9
+ && ('1' == 49) && ('2' == 50) && ('3' == 51) && ('4' == 52) \
10
+ && ('5' == 53) && ('6' == 54) && ('7' == 55) && ('8' == 56) \
11
+ && ('9' == 57) && (':' == 58) && (';' == 59) && ('<' == 60) \
12
+ && ('=' == 61) && ('>' == 62) && ('?' == 63) && ('A' == 65) \
13
+ && ('B' == 66) && ('C' == 67) && ('D' == 68) && ('E' == 69) \
14
+ && ('F' == 70) && ('G' == 71) && ('H' == 72) && ('I' == 73) \
15
+ && ('J' == 74) && ('K' == 75) && ('L' == 76) && ('M' == 77) \
16
+ && ('N' == 78) && ('O' == 79) && ('P' == 80) && ('Q' == 81) \
17
+ && ('R' == 82) && ('S' == 83) && ('T' == 84) && ('U' == 85) \
18
+ && ('V' == 86) && ('W' == 87) && ('X' == 88) && ('Y' == 89) \
19
+ && ('Z' == 90) && ('[' == 91) && ('\\' == 92) && (']' == 93) \
20
+ && ('^' == 94) && ('_' == 95) && ('a' == 97) && ('b' == 98) \
21
+ && ('c' == 99) && ('d' == 100) && ('e' == 101) && ('f' == 102) \
22
+ && ('g' == 103) && ('h' == 104) && ('i' == 105) && ('j' == 106) \
23
+ && ('k' == 107) && ('l' == 108) && ('m' == 109) && ('n' == 110) \
24
+ && ('o' == 111) && ('p' == 112) && ('q' == 113) && ('r' == 114) \
25
+ && ('s' == 115) && ('t' == 116) && ('u' == 117) && ('v' == 118) \
26
+ && ('w' == 119) && ('x' == 120) && ('y' == 121) && ('z' == 122) \
27
+ && ('{' == 123) && ('|' == 124) && ('}' == 125) && ('~' == 126))
28
+ /* The character set is not based on ISO-646. */
29
+ error "gperf generated tables don't work with this execution character set. Please report a bug to <bug-gnu-gperf@gnu.org>."
30
+ #endif
31
+
32
+ /* maximum key range = 37, duplicates = 0 */
33
+
34
+ #ifndef GPERF_DOWNCASE
35
+ #define GPERF_DOWNCASE 1
36
+ static unsigned char gperf_downcase[256] =
37
+ {
38
+ 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14,
39
+ 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29,
40
+ 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44,
41
+ 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59,
42
+ 60, 61, 62, 63, 64, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106,
43
+ 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121,
44
+ 122, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104,
45
+ 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119,
46
+ 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134,
47
+ 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149,
48
+ 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164,
49
+ 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179,
50
+ 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194,
51
+ 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209,
52
+ 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224,
53
+ 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239,
54
+ 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254,
55
+ 255
56
+ };
57
+ #endif
58
+
59
+ #ifndef GPERF_CASE_STRNCMP
60
+ #define GPERF_CASE_STRNCMP 1
61
+ static int
62
+ gperf_case_strncmp (s1, s2, n)
63
+ register const char *s1;
64
+ register const char *s2;
65
+ register unsigned int n;
66
+ {
67
+ for (; n > 0;)
68
+ {
69
+ unsigned char c1 = gperf_downcase[(unsigned char)*s1++];
70
+ unsigned char c2 = gperf_downcase[(unsigned char)*s2++];
71
+ if (c1 != 0 && c1 == c2)
72
+ {
73
+ n--;
74
+ continue;
75
+ }
76
+ return (int)c1 - (int)c2;
77
+ }
78
+ return 0;
79
+ }
80
+ #endif
81
+
82
+ #ifdef __GNUC__
83
+ __inline
84
+ #else
85
+ #ifdef __cplusplus
86
+ inline
87
+ #endif
88
+ #endif
89
+ static unsigned int
90
+ hash_block_tag (str, len)
91
+ register const char *str;
92
+ register unsigned int len;
93
+ {
94
+ static const unsigned char asso_values[] =
95
+ {
96
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
97
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
98
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
99
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
100
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
101
+ 8, 30, 25, 20, 15, 10, 38, 38, 38, 38,
102
+ 38, 38, 38, 38, 38, 38, 0, 38, 0, 38,
103
+ 5, 5, 5, 15, 0, 38, 38, 0, 15, 10,
104
+ 0, 38, 38, 15, 0, 5, 38, 38, 38, 38,
105
+ 38, 38, 38, 38, 38, 38, 38, 38, 0, 38,
106
+ 0, 38, 5, 5, 5, 15, 0, 38, 38, 0,
107
+ 15, 10, 0, 38, 38, 15, 0, 5, 38, 38,
108
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
109
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
110
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
111
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
112
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
113
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
114
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
115
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
116
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
117
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
118
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
119
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
120
+ 38, 38, 38, 38, 38, 38, 38, 38, 38, 38,
121
+ 38, 38, 38, 38, 38, 38, 38
122
+ };
123
+ register int hval = len;
124
+
125
+ switch (hval)
126
+ {
127
+ default:
128
+ hval += asso_values[(unsigned char)str[1]+1];
129
+ /*FALLTHROUGH*/
130
+ case 1:
131
+ hval += asso_values[(unsigned char)str[0]];
132
+ break;
133
+ }
134
+ return hval;
135
+ }
136
+
137
+ #ifdef __GNUC__
138
+ __inline
139
+ #ifdef __GNUC_STDC_INLINE__
140
+ __attribute__ ((__gnu_inline__))
141
+ #endif
142
+ #endif
143
+ const char *
144
+ find_block_tag (str, len)
145
+ register const char *str;
146
+ register unsigned int len;
147
+ {
148
+ enum
149
+ {
150
+ TOTAL_KEYWORDS = 24,
151
+ MIN_WORD_LENGTH = 1,
152
+ MAX_WORD_LENGTH = 10,
153
+ MIN_HASH_VALUE = 1,
154
+ MAX_HASH_VALUE = 37
155
+ };
156
+
157
+ static const char * const wordlist[] =
158
+ {
159
+ "",
160
+ "p",
161
+ "dl",
162
+ "div",
163
+ "math",
164
+ "table",
165
+ "",
166
+ "ul",
167
+ "del",
168
+ "form",
169
+ "blockquote",
170
+ "figure",
171
+ "ol",
172
+ "fieldset",
173
+ "",
174
+ "h1",
175
+ "",
176
+ "h6",
177
+ "pre",
178
+ "", "",
179
+ "script",
180
+ "h5",
181
+ "noscript",
182
+ "",
183
+ "style",
184
+ "iframe",
185
+ "h4",
186
+ "ins",
187
+ "", "", "",
188
+ "h3",
189
+ "", "", "", "",
190
+ "h2"
191
+ };
192
+
193
+ if (len <= MAX_WORD_LENGTH && len >= MIN_WORD_LENGTH)
194
+ {
195
+ register int key = hash_block_tag (str, len);
196
+
197
+ if (key <= MAX_HASH_VALUE && key >= 0)
198
+ {
199
+ register const char *s = wordlist[key];
200
+
201
+ if ((((unsigned char)*str ^ (unsigned char)*s) & ~32) == 0 && !gperf_case_strncmp (str, s, len) && s[len] == '\0')
202
+ return s;
203
+ }
204
+ }
205
+ return 0;
206
+ }
@@ -0,0 +1,2701 @@
1
+ /* markdown.c - generic markdown parser */
2
+
3
+ /*
4
+ * Copyright (c) 2009, Natacha Porté
5
+ * Copyright (c) 2011, Vicent Marti
6
+ *
7
+ * Permission to use, copy, modify, and distribute this software for any
8
+ * purpose with or without fee is hereby granted, provided that the above
9
+ * copyright notice and this permission notice appear in all copies.
10
+ *
11
+ * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
12
+ * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
13
+ * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
14
+ * ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
15
+ * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
16
+ * ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
17
+ * OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
18
+ */
19
+
20
+ #include "markdown.h"
21
+ #include "stack.h"
22
+ #include "src_map.h"
23
+
24
+ #include <assert.h>
25
+ #include <string.h>
26
+ #include <ctype.h>
27
+ #include <stdio.h>
28
+
29
+ #if defined(_WIN32)
30
+ #define strncasecmp _strnicmp
31
+ #endif
32
+
33
+ #define REF_TABLE_SIZE 8
34
+
35
+ #define BUFFER_BLOCK 0
36
+ #define BUFFER_SPAN 1
37
+
38
+ #define MKD_LI_END 8 /* internal list flag */
39
+
40
+ #define gperf_case_strncmp(s1, s2, n) strncasecmp(s1, s2, n)
41
+ #define GPERF_DOWNCASE 1
42
+ #define GPERF_CASE_STRNCMP 1
43
+ #include "html_blocks.h"
44
+
45
+ /***************
46
+ * LOCAL TYPES *
47
+ ***************/
48
+
49
+ /* link_ref: reference to a link */
50
+ struct link_ref {
51
+ unsigned int id;
52
+
53
+ struct buf *link;
54
+ struct buf *title;
55
+
56
+ struct link_ref *next;
57
+ };
58
+
59
+ /* char_trigger: function pointer to render active chars */
60
+ /* returns the number of chars taken care of */
61
+ /* data is the pointer of the beginning of the span */
62
+ /* offset is the number of valid chars before data */
63
+ struct sd_markdown;
64
+ typedef size_t
65
+ (*char_trigger)(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
66
+
67
+ static size_t char_emphasis(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
68
+ static size_t char_linebreak(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
69
+ static size_t char_codespan(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
70
+ static size_t char_escape(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
71
+ static size_t char_entity(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
72
+ static size_t char_langle_tag(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
73
+ static size_t char_autolink_url(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
74
+ static size_t char_autolink_email(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
75
+ static size_t char_autolink_www(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
76
+ static size_t char_link(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
77
+ static size_t char_superscript(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size);
78
+
79
+ enum markdown_char_t {
80
+ MD_CHAR_NONE = 0,
81
+ MD_CHAR_EMPHASIS,
82
+ MD_CHAR_CODESPAN,
83
+ MD_CHAR_LINEBREAK,
84
+ MD_CHAR_LINK,
85
+ MD_CHAR_LANGLE,
86
+ MD_CHAR_ESCAPE,
87
+ MD_CHAR_ENTITITY,
88
+ MD_CHAR_AUTOLINK_URL,
89
+ MD_CHAR_AUTOLINK_EMAIL,
90
+ MD_CHAR_AUTOLINK_WWW,
91
+ MD_CHAR_SUPERSCRIPT,
92
+ };
93
+
94
+ static char_trigger markdown_char_ptrs[] = {
95
+ NULL,
96
+ &char_emphasis,
97
+ &char_codespan,
98
+ &char_linebreak,
99
+ &char_link,
100
+ &char_langle_tag,
101
+ &char_escape,
102
+ &char_entity,
103
+ &char_autolink_url,
104
+ &char_autolink_email,
105
+ &char_autolink_www,
106
+ &char_superscript,
107
+ };
108
+
109
+ /* render • structure containing one particular render */
110
+ struct sd_markdown {
111
+ struct sd_callbacks cb;
112
+ void *opaque;
113
+
114
+ struct link_ref *refs[REF_TABLE_SIZE];
115
+ uint8_t active_char[256];
116
+ struct stack work_bufs[2];
117
+ unsigned int ext_flags;
118
+ size_t max_nesting;
119
+ int in_link_body;
120
+ };
121
+
122
+ /***************************
123
+ * HELPER FUNCTIONS *
124
+ ***************************/
125
+
126
+ static inline struct buf *
127
+ rndr_newbuf(struct sd_markdown *rndr, int type)
128
+ {
129
+ static const size_t buf_size[2] = {256, 64};
130
+ struct buf *work = NULL;
131
+ struct stack *pool = &rndr->work_bufs[type];
132
+
133
+ if (pool->size < pool->asize &&
134
+ pool->item[pool->size] != NULL) {
135
+ work = pool->item[pool->size++];
136
+ work->size = 0;
137
+ } else {
138
+ work = bufnew(buf_size[type]);
139
+ stack_push(pool, work);
140
+ }
141
+
142
+ return work;
143
+ }
144
+
145
+ static inline void
146
+ rndr_popbuf(struct sd_markdown *rndr, int type)
147
+ {
148
+ rndr->work_bufs[type].size--;
149
+ }
150
+
151
+ static void
152
+ unscape_text(struct buf *ob, struct buf *src)
153
+ {
154
+ size_t i = 0, org;
155
+ while (i < src->size) {
156
+ org = i;
157
+ while (i < src->size && src->data[i] != '\\')
158
+ i++;
159
+
160
+ if (i > org)
161
+ bufput(ob, src->data + org, i - org);
162
+
163
+ if (i + 1 >= src->size)
164
+ break;
165
+
166
+ bufputc(ob, src->data[i + 1]);
167
+ i += 2;
168
+ }
169
+ }
170
+
171
+ static unsigned int
172
+ hash_link_ref(const uint8_t *link_ref, size_t length)
173
+ {
174
+ size_t i;
175
+ unsigned int hash = 0;
176
+
177
+ for (i = 0; i < length; ++i)
178
+ hash = tolower(link_ref[i]) + (hash << 6) + (hash << 16) - hash;
179
+
180
+ return hash;
181
+ }
182
+
183
+ static struct link_ref *
184
+ add_link_ref(
185
+ struct link_ref **references,
186
+ const uint8_t *name, size_t name_size)
187
+ {
188
+ struct link_ref *ref = calloc(1, sizeof(struct link_ref));
189
+
190
+ if (!ref)
191
+ return NULL;
192
+
193
+ ref->id = hash_link_ref(name, name_size);
194
+ ref->next = references[ref->id % REF_TABLE_SIZE];
195
+
196
+ references[ref->id % REF_TABLE_SIZE] = ref;
197
+ return ref;
198
+ }
199
+
200
+ static struct link_ref *
201
+ find_link_ref(struct link_ref **references, uint8_t *name, size_t length)
202
+ {
203
+ unsigned int hash = hash_link_ref(name, length);
204
+ struct link_ref *ref = NULL;
205
+
206
+ ref = references[hash % REF_TABLE_SIZE];
207
+
208
+ while (ref != NULL) {
209
+ if (ref->id == hash)
210
+ return ref;
211
+
212
+ ref = ref->next;
213
+ }
214
+
215
+ return NULL;
216
+ }
217
+
218
+ static void
219
+ free_link_refs(struct link_ref **references)
220
+ {
221
+ size_t i;
222
+
223
+ for (i = 0; i < REF_TABLE_SIZE; ++i) {
224
+ struct link_ref *r = references[i];
225
+ struct link_ref *next;
226
+
227
+ while (r) {
228
+ next = r->next;
229
+ bufrelease(r->link);
230
+ bufrelease(r->title);
231
+ free(r);
232
+ r = next;
233
+ }
234
+ }
235
+ }
236
+
237
+ /*
238
+ * Check whether a char is a Markdown space.
239
+
240
+ * Right now we only consider spaces the actual
241
+ * space and a newline: tabs and carriage returns
242
+ * are filtered out during the preprocessing phase.
243
+ *
244
+ * If we wanted to actually be UTF-8 compliant, we
245
+ * should instead extract an Unicode codepoint from
246
+ * this character and check for space properties.
247
+ */
248
+ static inline int
249
+ _isspace(int c)
250
+ {
251
+ return c == ' ' || c == '\n';
252
+ }
253
+
254
+ /****************************
255
+ * INLINE PARSING FUNCTIONS *
256
+ ****************************/
257
+
258
+ /* is_mail_autolink • looks for the address part of a mail autolink and '>' */
259
+ /* this is less strict than the original markdown e-mail address matching */
260
+ static size_t
261
+ is_mail_autolink(uint8_t *data, size_t size)
262
+ {
263
+ size_t i = 0, nb = 0;
264
+
265
+ /* address is assumed to be: [-@._a-zA-Z0-9]+ with exactly one '@' */
266
+ for (i = 0; i < size; ++i) {
267
+ if (isalnum(data[i]))
268
+ continue;
269
+
270
+ switch (data[i]) {
271
+ case '@':
272
+ nb++;
273
+
274
+ case '-':
275
+ case '.':
276
+ case '_':
277
+ break;
278
+
279
+ case '>':
280
+ return (nb == 1) ? i + 1 : 0;
281
+
282
+ default:
283
+ return 0;
284
+ }
285
+ }
286
+
287
+ return 0;
288
+ }
289
+
290
+ /* tag_length • returns the length of the given tag, or 0 is it's not valid */
291
+ static size_t
292
+ tag_length(uint8_t *data, size_t size, enum mkd_autolink *autolink)
293
+ {
294
+ size_t i, j;
295
+
296
+ /* a valid tag can't be shorter than 3 chars */
297
+ if (size < 3) return 0;
298
+
299
+ /* begins with a '<' optionally followed by '/', followed by letter or number */
300
+ if (data[0] != '<') return 0;
301
+ i = (data[1] == '/') ? 2 : 1;
302
+
303
+ if (!isalnum(data[i]))
304
+ return 0;
305
+
306
+ /* scheme test */
307
+ *autolink = MKDA_NOT_AUTOLINK;
308
+
309
+ /* try to find the beginning of an URI */
310
+ while (i < size && (isalnum(data[i]) || data[i] == '.' || data[i] == '+' || data[i] == '-'))
311
+ i++;
312
+
313
+ if (i > 1 && data[i] == '@') {
314
+ if ((j = is_mail_autolink(data + i, size - i)) != 0) {
315
+ *autolink = MKDA_EMAIL;
316
+ return i + j;
317
+ }
318
+ }
319
+
320
+ if (i > 2 && data[i] == ':') {
321
+ *autolink = MKDA_NORMAL;
322
+ i++;
323
+ }
324
+
325
+ /* completing autolink test: no whitespace or ' or " */
326
+ if (i >= size)
327
+ *autolink = MKDA_NOT_AUTOLINK;
328
+
329
+ else if (*autolink) {
330
+ j = i;
331
+
332
+ while (i < size) {
333
+ if (data[i] == '\\') i += 2;
334
+ else if (data[i] == '>' || data[i] == '\'' ||
335
+ data[i] == '"' || data[i] == ' ' || data[i] == '\n')
336
+ break;
337
+ else i++;
338
+ }
339
+
340
+ if (i >= size) return 0;
341
+ if (i > j && data[i] == '>') return i + 1;
342
+ /* one of the forbidden chars has been found */
343
+ *autolink = MKDA_NOT_AUTOLINK;
344
+ }
345
+
346
+ /* looking for sometinhg looking like a tag end */
347
+ while (i < size && data[i] != '>') i++;
348
+ if (i >= size) return 0;
349
+ return i + 1;
350
+ }
351
+
352
+ /* parse_inline • parses inline markdown elements */
353
+ static void
354
+ parse_inline(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
355
+ {
356
+ size_t i = 0, end = 0;
357
+ uint8_t action = 0;
358
+ struct buf work = { 0, 0, 0, 0 };
359
+
360
+ if (rndr->work_bufs[BUFFER_SPAN].size +
361
+ rndr->work_bufs[BUFFER_BLOCK].size > rndr->max_nesting)
362
+ return;
363
+
364
+ while (i < size) {
365
+ /* copying inactive chars into the output */
366
+ while (end < size && (action = rndr->active_char[data[end]]) == 0) {
367
+ end++;
368
+ }
369
+
370
+ if (rndr->cb.normal_text) {
371
+ work.data = data + i;
372
+ work.size = end - i;
373
+ rndr->cb.normal_text(ob, &work, rndr->opaque);
374
+ }
375
+ else
376
+ bufput(ob, data + i, end - i);
377
+
378
+ if (end >= size) break;
379
+ i = end;
380
+
381
+ end = markdown_char_ptrs[(int)action](ob, rndr, data + i, i, size - i);
382
+ if (!end) /* no action from the callback */
383
+ end = i + 1;
384
+ else {
385
+ i += end;
386
+ end = i;
387
+ }
388
+ }
389
+ }
390
+
391
+ /* find_emph_char • looks for the next emph uint8_t, skipping other constructs */
392
+ static size_t
393
+ find_emph_char(uint8_t *data, size_t size, uint8_t c)
394
+ {
395
+ size_t i = 1;
396
+
397
+ while (i < size) {
398
+ while (i < size && data[i] != c && data[i] != '`' && data[i] != '[')
399
+ i++;
400
+
401
+ if (i == size)
402
+ return 0;
403
+
404
+ if (data[i] == c)
405
+ return i;
406
+
407
+ /* not counting escaped chars */
408
+ if (i && data[i - 1] == '\\') {
409
+ i++; continue;
410
+ }
411
+
412
+ if (data[i] == '`') {
413
+ size_t span_nb = 0, bt;
414
+ size_t tmp_i = 0;
415
+
416
+ /* counting the number of opening backticks */
417
+ while (i < size && data[i] == '`') {
418
+ i++; span_nb++;
419
+ }
420
+
421
+ if (i >= size) return 0;
422
+
423
+ /* finding the matching closing sequence */
424
+ bt = 0;
425
+ while (i < size && bt < span_nb) {
426
+ if (!tmp_i && data[i] == c) tmp_i = i;
427
+ if (data[i] == '`') bt++;
428
+ else bt = 0;
429
+ i++;
430
+ }
431
+
432
+ if (i >= size) return tmp_i;
433
+ }
434
+ /* skipping a link */
435
+ else if (data[i] == '[') {
436
+ size_t tmp_i = 0;
437
+ uint8_t cc;
438
+
439
+ i++;
440
+ while (i < size && data[i] != ']') {
441
+ if (!tmp_i && data[i] == c) tmp_i = i;
442
+ i++;
443
+ }
444
+
445
+ i++;
446
+ while (i < size && (data[i] == ' ' || data[i] == '\n'))
447
+ i++;
448
+
449
+ if (i >= size)
450
+ return tmp_i;
451
+
452
+ switch (data[i]) {
453
+ case '[':
454
+ cc = ']'; break;
455
+
456
+ case '(':
457
+ cc = ')'; break;
458
+
459
+ default:
460
+ if (tmp_i)
461
+ return tmp_i;
462
+ else
463
+ continue;
464
+ }
465
+
466
+ i++;
467
+ while (i < size && data[i] != cc) {
468
+ if (!tmp_i && data[i] == c) tmp_i = i;
469
+ i++;
470
+ }
471
+
472
+ if (i >= size)
473
+ return tmp_i;
474
+
475
+ i++;
476
+ }
477
+ }
478
+
479
+ return 0;
480
+ }
481
+
482
+ /* parse_emph1 • parsing single emphase */
483
+ /* closed by a symbol not preceded by whitespace and not followed by symbol */
484
+ static size_t
485
+ parse_emph1(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, uint8_t c)
486
+ {
487
+ size_t i = 0, len;
488
+ struct buf *work = 0;
489
+ int r;
490
+
491
+ if (!rndr->cb.emphasis) return 0;
492
+
493
+ /* skipping one symbol if coming from emph3 */
494
+ if (size > 1 && data[0] == c && data[1] == c) i = 1;
495
+
496
+ while (i < size) {
497
+ len = find_emph_char(data + i, size - i, c);
498
+ if (!len) return 0;
499
+ i += len;
500
+ if (i >= size) return 0;
501
+
502
+ if (data[i] == c && !_isspace(data[i - 1])) {
503
+
504
+ if (rndr->ext_flags & MKDEXT_NO_INTRA_EMPHASIS) {
505
+ if (i + 1 < size && isalnum(data[i + 1]))
506
+ continue;
507
+ }
508
+
509
+ work = rndr_newbuf(rndr, BUFFER_SPAN);
510
+ parse_inline(work, rndr, data, i);
511
+ r = rndr->cb.emphasis(ob, work, rndr->opaque);
512
+ rndr_popbuf(rndr, BUFFER_SPAN);
513
+ return r ? i + 1 : 0;
514
+ }
515
+ }
516
+
517
+ return 0;
518
+ }
519
+
520
+ /* parse_emph2 • parsing single emphase */
521
+ static size_t
522
+ parse_emph2(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, uint8_t c)
523
+ {
524
+ int (*render_method)(struct buf *ob, const struct buf *text, void *opaque);
525
+ size_t i = 0, len;
526
+ struct buf *work = 0;
527
+ int r;
528
+
529
+ render_method = (c == '~') ? rndr->cb.strikethrough : rndr->cb.double_emphasis;
530
+
531
+ if (!render_method)
532
+ return 0;
533
+
534
+ while (i < size) {
535
+ len = find_emph_char(data + i, size - i, c);
536
+ if (!len) return 0;
537
+ i += len;
538
+
539
+ if (i + 1 < size && data[i] == c && data[i + 1] == c && i && !_isspace(data[i - 1])) {
540
+ work = rndr_newbuf(rndr, BUFFER_SPAN);
541
+ parse_inline(work, rndr, data, i);
542
+ r = render_method(ob, work, rndr->opaque);
543
+ rndr_popbuf(rndr, BUFFER_SPAN);
544
+ return r ? i + 2 : 0;
545
+ }
546
+ i++;
547
+ }
548
+ return 0;
549
+ }
550
+
551
+ /* parse_emph3 • parsing single emphase */
552
+ /* finds the first closing tag, and delegates to the other emph */
553
+ static size_t
554
+ parse_emph3(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, uint8_t c)
555
+ {
556
+ size_t i = 0, len;
557
+ int r;
558
+
559
+ while (i < size) {
560
+ len = find_emph_char(data + i, size - i, c);
561
+ if (!len) return 0;
562
+ i += len;
563
+
564
+ /* skip whitespace preceded symbols */
565
+ if (data[i] != c || _isspace(data[i - 1]))
566
+ continue;
567
+
568
+ if (i + 2 < size && data[i + 1] == c && data[i + 2] == c && rndr->cb.triple_emphasis) {
569
+ /* triple symbol found */
570
+ struct buf *work = rndr_newbuf(rndr, BUFFER_SPAN);
571
+
572
+ parse_inline(work, rndr, data, i);
573
+ r = rndr->cb.triple_emphasis(ob, work, rndr->opaque);
574
+ rndr_popbuf(rndr, BUFFER_SPAN);
575
+ return r ? i + 3 : 0;
576
+
577
+ } else if (i + 1 < size && data[i + 1] == c) {
578
+ /* double symbol found, handing over to emph1 */
579
+ len = parse_emph1(ob, rndr, data - 2, size + 2, c);
580
+ if (!len) return 0;
581
+ else return len - 2;
582
+
583
+ } else {
584
+ /* single symbol found, handing over to emph2 */
585
+ len = parse_emph2(ob, rndr, data - 1, size + 1, c);
586
+ if (!len) return 0;
587
+ else return len - 1;
588
+ }
589
+ }
590
+ return 0;
591
+ }
592
+
593
+ /* char_emphasis • single and double emphasis parsing */
594
+ static size_t
595
+ char_emphasis(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
596
+ {
597
+ uint8_t c = data[0];
598
+ size_t ret;
599
+
600
+ if (rndr->ext_flags & MKDEXT_NO_INTRA_EMPHASIS) {
601
+ if (offset > 0 && !_isspace(data[-1]) && data[-1] != '>')
602
+ return 0;
603
+ }
604
+
605
+ if (size > 2 && data[1] != c) {
606
+ /* whitespace cannot follow an opening emphasis;
607
+ * strikethrough only takes two characters '~~' */
608
+ if (c == '~' || _isspace(data[1]) || (ret = parse_emph1(ob, rndr, data + 1, size - 1, c)) == 0)
609
+ return 0;
610
+
611
+ return ret + 1;
612
+ }
613
+
614
+ if (size > 3 && data[1] == c && data[2] != c) {
615
+ if (_isspace(data[2]) || (ret = parse_emph2(ob, rndr, data + 2, size - 2, c)) == 0)
616
+ return 0;
617
+
618
+ return ret + 2;
619
+ }
620
+
621
+ if (size > 4 && data[1] == c && data[2] == c && data[3] != c) {
622
+ if (c == '~' || _isspace(data[3]) || (ret = parse_emph3(ob, rndr, data + 3, size - 3, c)) == 0)
623
+ return 0;
624
+
625
+ return ret + 3;
626
+ }
627
+
628
+ return 0;
629
+ }
630
+
631
+
632
+ /* char_linebreak • '\n' preceded by two spaces (assuming linebreak != 0) */
633
+ static size_t
634
+ char_linebreak(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
635
+ {
636
+ if (offset < 2 || data[-1] != ' ' || data[-2] != ' ')
637
+ return 0;
638
+
639
+ /* removing the last space from ob and rendering */
640
+ while (ob->size && ob->data[ob->size - 1] == ' ')
641
+ ob->size--;
642
+
643
+ return rndr->cb.linebreak(ob, rndr->opaque) ? 1 : 0;
644
+ }
645
+
646
+
647
+ /* char_codespan • '`' parsing a code span (assuming codespan != 0) */
648
+ static size_t
649
+ char_codespan(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
650
+ {
651
+ size_t end, nb = 0, i, f_begin, f_end;
652
+
653
+ /* counting the number of backticks in the delimiter */
654
+ while (nb < size && data[nb] == '`')
655
+ nb++;
656
+
657
+ /* finding the next delimiter */
658
+ i = 0;
659
+ for (end = nb; end < size && i < nb; end++) {
660
+ if (data[end] == '`') i++;
661
+ else i = 0;
662
+ }
663
+
664
+ if (i < nb && end >= size)
665
+ return 0; /* no matching delimiter */
666
+
667
+ /* trimming outside whitespaces */
668
+ f_begin = nb;
669
+ while (f_begin < end && data[f_begin] == ' ')
670
+ f_begin++;
671
+
672
+ f_end = end - nb;
673
+ while (f_end > nb && data[f_end-1] == ' ')
674
+ f_end--;
675
+
676
+ /* real code span */
677
+ if (f_begin < f_end) {
678
+ struct buf work = { data + f_begin, f_end - f_begin, 0, 0 };
679
+ if (!rndr->cb.codespan(ob, &work, rndr->opaque))
680
+ end = 0;
681
+ } else {
682
+ if (!rndr->cb.codespan(ob, 0, rndr->opaque))
683
+ end = 0;
684
+ }
685
+
686
+ return end;
687
+ }
688
+
689
+
690
+ /* char_escape • '\\' backslash escape */
691
+ static size_t
692
+ char_escape(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
693
+ {
694
+ static const char *escape_chars = "\\`*_{}[]()#+-.!:|&<>^~";
695
+ struct buf work = { 0, 0, 0, 0 };
696
+
697
+ if (size > 1) {
698
+ if (strchr(escape_chars, data[1]) == NULL)
699
+ return 0;
700
+
701
+ if (rndr->cb.normal_text) {
702
+ work.data = data + 1;
703
+ work.size = 1;
704
+ rndr->cb.normal_text(ob, &work, rndr->opaque);
705
+ }
706
+ else bufputc(ob, data[1]);
707
+ } else if (size == 1) {
708
+ bufputc(ob, data[0]);
709
+ }
710
+
711
+ return 2;
712
+ }
713
+
714
+ /* char_entity • '&' escaped when it doesn't belong to an entity */
715
+ /* valid entities are assumed to be anything matching &#?[A-Za-z0-9]+; */
716
+ static size_t
717
+ char_entity(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
718
+ {
719
+ size_t end = 1;
720
+ struct buf work = { 0, 0, 0, 0 };
721
+
722
+ if (end < size && data[end] == '#')
723
+ end++;
724
+
725
+ while (end < size && isalnum(data[end]))
726
+ end++;
727
+
728
+ if (end < size && data[end] == ';')
729
+ end++; /* real entity */
730
+ else
731
+ return 0; /* lone '&' */
732
+
733
+ if (rndr->cb.entity) {
734
+ work.data = data;
735
+ work.size = end;
736
+ rndr->cb.entity(ob, &work, rndr->opaque);
737
+ }
738
+ else bufput(ob, data, end);
739
+
740
+ return end;
741
+ }
742
+
743
+ /* char_langle_tag • '<' when tags or autolinks are allowed */
744
+ static size_t
745
+ char_langle_tag(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
746
+ {
747
+ enum mkd_autolink altype = MKDA_NOT_AUTOLINK;
748
+ size_t end = tag_length(data, size, &altype);
749
+ struct buf work = { data, end, 0, 0 };
750
+ int ret = 0;
751
+
752
+ if (end > 2) {
753
+ if (rndr->cb.autolink && altype != MKDA_NOT_AUTOLINK) {
754
+ struct buf *u_link = rndr_newbuf(rndr, BUFFER_SPAN);
755
+ work.data = data + 1;
756
+ work.size = end - 2;
757
+ unscape_text(u_link, &work);
758
+ ret = rndr->cb.autolink(ob, u_link, altype, rndr->opaque);
759
+ rndr_popbuf(rndr, BUFFER_SPAN);
760
+ }
761
+ else if (rndr->cb.raw_html_tag)
762
+ ret = rndr->cb.raw_html_tag(ob, &work, rndr->opaque);
763
+ }
764
+
765
+ if (!ret) return 0;
766
+ else return end;
767
+ }
768
+
769
+ static size_t
770
+ char_autolink_www(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
771
+ {
772
+ struct buf *link, *link_url, *link_text;
773
+ size_t link_len, rewind;
774
+
775
+ if (!rndr->cb.link || rndr->in_link_body)
776
+ return 0;
777
+
778
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
779
+
780
+ if ((link_len = sd_autolink__www(&rewind, link, data, offset, size, 0)) > 0) {
781
+ link_url = rndr_newbuf(rndr, BUFFER_SPAN);
782
+ BUFPUTSL(link_url, "http://");
783
+ bufput(link_url, link->data, link->size);
784
+
785
+ ob->size -= rewind;
786
+ if (rndr->cb.normal_text) {
787
+ link_text = rndr_newbuf(rndr, BUFFER_SPAN);
788
+ rndr->cb.normal_text(link_text, link, rndr->opaque);
789
+ rndr->cb.link(ob, link_url, NULL, link_text, rndr->opaque);
790
+ rndr_popbuf(rndr, BUFFER_SPAN);
791
+ } else {
792
+ rndr->cb.link(ob, link_url, NULL, link, rndr->opaque);
793
+ }
794
+ rndr_popbuf(rndr, BUFFER_SPAN);
795
+ }
796
+
797
+ rndr_popbuf(rndr, BUFFER_SPAN);
798
+ return link_len;
799
+ }
800
+
801
+ static size_t
802
+ char_autolink_email(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
803
+ {
804
+ struct buf *link;
805
+ size_t link_len, rewind;
806
+
807
+ if (!rndr->cb.autolink || rndr->in_link_body)
808
+ return 0;
809
+
810
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
811
+
812
+ if ((link_len = sd_autolink__email(&rewind, link, data, offset, size, 0)) > 0) {
813
+ ob->size -= rewind;
814
+ rndr->cb.autolink(ob, link, MKDA_EMAIL, rndr->opaque);
815
+ }
816
+
817
+ rndr_popbuf(rndr, BUFFER_SPAN);
818
+ return link_len;
819
+ }
820
+
821
+ static size_t
822
+ char_autolink_url(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
823
+ {
824
+ struct buf *link;
825
+ size_t link_len, rewind;
826
+
827
+ if (!rndr->cb.autolink || rndr->in_link_body)
828
+ return 0;
829
+
830
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
831
+
832
+ if ((link_len = sd_autolink__url(&rewind, link, data, offset, size, 0)) > 0) {
833
+ ob->size -= rewind;
834
+ rndr->cb.autolink(ob, link, MKDA_NORMAL, rndr->opaque);
835
+ }
836
+
837
+ rndr_popbuf(rndr, BUFFER_SPAN);
838
+ return link_len;
839
+ }
840
+
841
+ /* char_link • '[': parsing a link or an image */
842
+ static size_t
843
+ char_link(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
844
+ {
845
+ int is_img = (offset && data[-1] == '!'), level;
846
+ size_t i = 1, txt_e, link_b = 0, link_e = 0, title_b = 0, title_e = 0;
847
+ struct buf *content = 0;
848
+ struct buf *link = 0;
849
+ struct buf *title = 0;
850
+ struct buf *u_link = 0;
851
+ size_t org_work_size = rndr->work_bufs[BUFFER_SPAN].size;
852
+ int text_has_nl = 0, ret = 0;
853
+ int in_title = 0, qtype = 0;
854
+
855
+ /* checking whether the correct renderer exists */
856
+ if ((is_img && !rndr->cb.image) || (!is_img && !rndr->cb.link))
857
+ goto cleanup;
858
+
859
+ /* looking for the matching closing bracket */
860
+ for (level = 1; i < size; i++) {
861
+ if (data[i] == '\n')
862
+ text_has_nl = 1;
863
+
864
+ else if (data[i - 1] == '\\')
865
+ continue;
866
+
867
+ else if (data[i] == '[')
868
+ level++;
869
+
870
+ else if (data[i] == ']') {
871
+ level--;
872
+ if (level <= 0)
873
+ break;
874
+ }
875
+ }
876
+
877
+ if (i >= size)
878
+ goto cleanup;
879
+
880
+ txt_e = i;
881
+ i++;
882
+
883
+ /* skip any amount of whitespace or newline */
884
+ /* (this is much more laxist than original markdown syntax) */
885
+ while (i < size && _isspace(data[i]))
886
+ i++;
887
+
888
+ /* inline style link */
889
+ if (i < size && data[i] == '(') {
890
+ /* skipping initial whitespace */
891
+ i++;
892
+
893
+ while (i < size && _isspace(data[i]))
894
+ i++;
895
+
896
+ link_b = i;
897
+
898
+ /* looking for link end: ' " ) */
899
+ while (i < size) {
900
+ if (data[i] == '\\') i += 2;
901
+ else if (data[i] == ')') break;
902
+ else if (i >= 1 && _isspace(data[i-1]) && (data[i] == '\'' || data[i] == '"')) break;
903
+ else i++;
904
+ }
905
+
906
+ if (i >= size) goto cleanup;
907
+ link_e = i;
908
+
909
+ /* looking for title end if present */
910
+ if (data[i] == '\'' || data[i] == '"') {
911
+ qtype = data[i];
912
+ in_title = 1;
913
+ i++;
914
+ title_b = i;
915
+
916
+ while (i < size) {
917
+ if (data[i] == '\\') i += 2;
918
+ else if (data[i] == qtype) {in_title = 0; i++;}
919
+ else if ((data[i] == ')') && !in_title) break;
920
+ else i++;
921
+ }
922
+
923
+ if (i >= size) goto cleanup;
924
+
925
+ /* skipping whitespaces after title */
926
+ title_e = i - 1;
927
+ while (title_e > title_b && _isspace(data[title_e]))
928
+ title_e--;
929
+
930
+ /* checking for closing quote presence */
931
+ if (data[title_e] != '\'' && data[title_e] != '"') {
932
+ title_b = title_e = 0;
933
+ link_e = i;
934
+ }
935
+ }
936
+
937
+ /* remove whitespace at the end of the link */
938
+ while (link_e > link_b && _isspace(data[link_e - 1]))
939
+ link_e--;
940
+
941
+ /* remove optional angle brackets around the link */
942
+ if (data[link_b] == '<') link_b++;
943
+ if (data[link_e - 1] == '>') link_e--;
944
+
945
+ /* building escaped link and title */
946
+ if (link_e > link_b) {
947
+ link = rndr_newbuf(rndr, BUFFER_SPAN);
948
+ bufput(link, data + link_b, link_e - link_b);
949
+ }
950
+
951
+ if (title_e > title_b) {
952
+ title = rndr_newbuf(rndr, BUFFER_SPAN);
953
+ bufput(title, data + title_b, title_e - title_b);
954
+ }
955
+
956
+ i++;
957
+ }
958
+
959
+ /* reference style link */
960
+ else if (i < size && data[i] == '[') {
961
+ struct buf id = { 0, 0, 0, 0 };
962
+ struct link_ref *lr;
963
+
964
+ /* looking for the id */
965
+ i++;
966
+ link_b = i;
967
+ while (i < size && data[i] != ']') i++;
968
+ if (i >= size) goto cleanup;
969
+ link_e = i;
970
+
971
+ /* finding the link_ref */
972
+ if (link_b == link_e) {
973
+ if (text_has_nl) {
974
+ struct buf *b = rndr_newbuf(rndr, BUFFER_SPAN);
975
+ size_t j;
976
+
977
+ for (j = 1; j < txt_e; j++) {
978
+ if (data[j] != '\n')
979
+ bufputc(b, data[j]);
980
+ else if (data[j - 1] != ' ')
981
+ bufputc(b, ' ');
982
+ }
983
+
984
+ id.data = b->data;
985
+ id.size = b->size;
986
+ } else {
987
+ id.data = data + 1;
988
+ id.size = txt_e - 1;
989
+ }
990
+ } else {
991
+ id.data = data + link_b;
992
+ id.size = link_e - link_b;
993
+ }
994
+
995
+ lr = find_link_ref(rndr->refs, id.data, id.size);
996
+ if (!lr)
997
+ goto cleanup;
998
+
999
+ /* keeping link and title from link_ref */
1000
+ link = lr->link;
1001
+ title = lr->title;
1002
+ i++;
1003
+ }
1004
+
1005
+ /* shortcut reference style link */
1006
+ else {
1007
+ struct buf id = { 0, 0, 0, 0 };
1008
+ struct link_ref *lr;
1009
+
1010
+ /* crafting the id */
1011
+ if (text_has_nl) {
1012
+ struct buf *b = rndr_newbuf(rndr, BUFFER_SPAN);
1013
+ size_t j;
1014
+
1015
+ for (j = 1; j < txt_e; j++) {
1016
+ if (data[j] != '\n')
1017
+ bufputc(b, data[j]);
1018
+ else if (data[j - 1] != ' ')
1019
+ bufputc(b, ' ');
1020
+ }
1021
+
1022
+ id.data = b->data;
1023
+ id.size = b->size;
1024
+ } else {
1025
+ id.data = data + 1;
1026
+ id.size = txt_e - 1;
1027
+ }
1028
+
1029
+ /* finding the link_ref */
1030
+ lr = find_link_ref(rndr->refs, id.data, id.size);
1031
+ if (!lr)
1032
+ goto cleanup;
1033
+
1034
+ /* keeping link and title from link_ref */
1035
+ link = lr->link;
1036
+ title = lr->title;
1037
+
1038
+ /* rewinding the whitespace */
1039
+ i = txt_e + 1;
1040
+ }
1041
+
1042
+ /* building content: img alt is escaped, link content is parsed */
1043
+ if (txt_e > 1) {
1044
+ content = rndr_newbuf(rndr, BUFFER_SPAN);
1045
+ if (is_img) {
1046
+ bufput(content, data + 1, txt_e - 1);
1047
+ } else {
1048
+ /* disable autolinking when parsing inline the
1049
+ * content of a link */
1050
+ rndr->in_link_body = 1;
1051
+ parse_inline(content, rndr, data + 1, txt_e - 1);
1052
+ rndr->in_link_body = 0;
1053
+ }
1054
+ }
1055
+
1056
+ if (link) {
1057
+ u_link = rndr_newbuf(rndr, BUFFER_SPAN);
1058
+ unscape_text(u_link, link);
1059
+ }
1060
+
1061
+ /* calling the relevant rendering function */
1062
+ if (is_img) {
1063
+ if (ob->size && ob->data[ob->size - 1] == '!')
1064
+ ob->size -= 1;
1065
+
1066
+ ret = rndr->cb.image(ob, u_link, title, content, rndr->opaque);
1067
+ } else {
1068
+ ret = rndr->cb.link(ob, u_link, title, content, rndr->opaque);
1069
+ }
1070
+
1071
+ /* cleanup */
1072
+ cleanup:
1073
+ rndr->work_bufs[BUFFER_SPAN].size = (int)org_work_size;
1074
+ return ret ? i : 0;
1075
+ }
1076
+
1077
+ static size_t
1078
+ char_superscript(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t offset, size_t size)
1079
+ {
1080
+ size_t sup_start, sup_len;
1081
+ struct buf *sup;
1082
+
1083
+ if (!rndr->cb.superscript)
1084
+ return 0;
1085
+
1086
+ if (size < 2)
1087
+ return 0;
1088
+
1089
+ if (data[1] == '(') {
1090
+ sup_start = sup_len = 2;
1091
+
1092
+ while (sup_len < size && data[sup_len] != ')' && data[sup_len - 1] != '\\')
1093
+ sup_len++;
1094
+
1095
+ if (sup_len == size)
1096
+ return 0;
1097
+ } else {
1098
+ sup_start = sup_len = 1;
1099
+
1100
+ while (sup_len < size && !_isspace(data[sup_len]))
1101
+ sup_len++;
1102
+ }
1103
+
1104
+ if (sup_len - sup_start == 0)
1105
+ return (sup_start == 2) ? 3 : 0;
1106
+
1107
+ sup = rndr_newbuf(rndr, BUFFER_SPAN);
1108
+ parse_inline(sup, rndr, data + sup_start, sup_len - sup_start);
1109
+ rndr->cb.superscript(ob, sup, rndr->opaque);
1110
+ rndr_popbuf(rndr, BUFFER_SPAN);
1111
+
1112
+ return (sup_start == 2) ? sup_len + 1 : sup_len;
1113
+ }
1114
+
1115
+ /*********************************
1116
+ * BLOCK-LEVEL PARSING FUNCTIONS *
1117
+ *********************************/
1118
+
1119
+ /* is_empty • returns the line length when it is empty, 0 otherwise */
1120
+ static size_t
1121
+ is_empty(uint8_t *data, size_t size)
1122
+ {
1123
+ size_t i;
1124
+
1125
+ for (i = 0; i < size && data[i] != '\n'; i++)
1126
+ if (data[i] != ' ')
1127
+ return 0;
1128
+
1129
+ return i + 1;
1130
+ }
1131
+
1132
+ /* is_hrule • returns whether a line is a horizontal rule */
1133
+ static int
1134
+ is_hrule(uint8_t *data, size_t size)
1135
+ {
1136
+ size_t i = 0, n = 0;
1137
+ uint8_t c;
1138
+
1139
+ /* skipping initial spaces */
1140
+ if (size < 3) return 0;
1141
+ if (data[0] == ' ') { i++;
1142
+ if (data[1] == ' ') { i++;
1143
+ if (data[2] == ' ') { i++; } } }
1144
+
1145
+ /* looking at the hrule uint8_t */
1146
+ if (i + 2 >= size
1147
+ || (data[i] != '*' && data[i] != '-' && data[i] != '_'))
1148
+ return 0;
1149
+ c = data[i];
1150
+
1151
+ /* the whole line must be the char or whitespace */
1152
+ while (i < size && data[i] != '\n') {
1153
+ if (data[i] == c) n++;
1154
+ else if (data[i] != ' ')
1155
+ return 0;
1156
+
1157
+ i++;
1158
+ }
1159
+
1160
+ return n >= 3;
1161
+ }
1162
+
1163
+ /* check if a line begins with a code fence; return the
1164
+ * width of the code fence */
1165
+ static size_t
1166
+ prefix_codefence(uint8_t *data, size_t size)
1167
+ {
1168
+ size_t i = 0, n = 0;
1169
+ uint8_t c;
1170
+
1171
+ /* skipping initial spaces */
1172
+ if (size < 3) return 0;
1173
+ if (data[0] == ' ') { i++;
1174
+ if (data[1] == ' ') { i++;
1175
+ if (data[2] == ' ') { i++; } } }
1176
+
1177
+ /* looking at the hrule uint8_t */
1178
+ if (i + 2 >= size || !(data[i] == '~' || data[i] == '`'))
1179
+ return 0;
1180
+
1181
+ c = data[i];
1182
+
1183
+ /* the whole line must be the uint8_t or whitespace */
1184
+ while (i < size && data[i] == c) {
1185
+ n++; i++;
1186
+ }
1187
+
1188
+ if (n < 3)
1189
+ return 0;
1190
+
1191
+ return i;
1192
+ }
1193
+
1194
+ /* check if a line is a code fence; return its size if it is */
1195
+ static size_t
1196
+ is_codefence(uint8_t *data, size_t size, struct buf *syntax)
1197
+ {
1198
+ size_t i = 0, syn_len = 0;
1199
+ uint8_t *syn_start;
1200
+
1201
+ i = prefix_codefence(data, size);
1202
+ if (i == 0)
1203
+ return 0;
1204
+
1205
+ while (i < size && data[i] == ' ')
1206
+ i++;
1207
+
1208
+ syn_start = data + i;
1209
+
1210
+ if (i < size && data[i] == '{') {
1211
+ i++; syn_start++;
1212
+
1213
+ while (i < size && data[i] != '}' && data[i] != '\n') {
1214
+ syn_len++; i++;
1215
+ }
1216
+
1217
+ if (i == size || data[i] != '}')
1218
+ return 0;
1219
+
1220
+ /* strip all whitespace at the beginning and the end
1221
+ * of the {} block */
1222
+ while (syn_len > 0 && _isspace(syn_start[0])) {
1223
+ syn_start++; syn_len--;
1224
+ }
1225
+
1226
+ while (syn_len > 0 && _isspace(syn_start[syn_len - 1]))
1227
+ syn_len--;
1228
+
1229
+ i++;
1230
+ } else {
1231
+ while (i < size && !_isspace(data[i])) {
1232
+ syn_len++; i++;
1233
+ }
1234
+ }
1235
+
1236
+ if (syntax) {
1237
+ syntax->data = syn_start;
1238
+ syntax->size = syn_len;
1239
+ }
1240
+
1241
+ while (i < size && data[i] != '\n') {
1242
+ if (!_isspace(data[i]))
1243
+ return 0;
1244
+
1245
+ i++;
1246
+ }
1247
+
1248
+ return i + 1;
1249
+ }
1250
+
1251
+ /* is_atxheader • returns whether the line is a hash-prefixed header */
1252
+ static int
1253
+ is_atxheader(struct sd_markdown *rndr, uint8_t *data, size_t size)
1254
+ {
1255
+ if (data[0] != '#')
1256
+ return 0;
1257
+
1258
+ if (rndr->ext_flags & MKDEXT_SPACE_HEADERS) {
1259
+ size_t level = 0;
1260
+
1261
+ while (level < size && level < 6 && data[level] == '#')
1262
+ level++;
1263
+
1264
+ if (level < size && data[level] != ' ')
1265
+ return 0;
1266
+ }
1267
+
1268
+ return 1;
1269
+ }
1270
+
1271
+ /* is_headerline • returns whether the line is a setext-style hdr underline */
1272
+ static int
1273
+ is_headerline(uint8_t *data, size_t size)
1274
+ {
1275
+ size_t i = 0;
1276
+
1277
+ /* test of level 1 header */
1278
+ if (data[i] == '=') {
1279
+ for (i = 1; i < size && data[i] == '='; i++);
1280
+ while (i < size && data[i] == ' ') i++;
1281
+ return (i >= size || data[i] == '\n') ? 1 : 0; }
1282
+
1283
+ /* test of level 2 header */
1284
+ if (data[i] == '-') {
1285
+ for (i = 1; i < size && data[i] == '-'; i++);
1286
+ while (i < size && data[i] == ' ') i++;
1287
+ return (i >= size || data[i] == '\n') ? 2 : 0; }
1288
+
1289
+ return 0;
1290
+ }
1291
+
1292
+ static int
1293
+ is_next_headerline(uint8_t *data, size_t size)
1294
+ {
1295
+ size_t i = 0;
1296
+
1297
+ while (i < size && data[i] != '\n')
1298
+ i++;
1299
+
1300
+ if (++i >= size)
1301
+ return 0;
1302
+
1303
+ return is_headerline(data + i, size - i);
1304
+ }
1305
+
1306
+ /* prefix_quote • returns blockquote prefix length */
1307
+ static size_t
1308
+ prefix_quote(uint8_t *data, size_t size)
1309
+ {
1310
+ size_t i = 0;
1311
+ if (i < size && data[i] == ' ') i++;
1312
+ if (i < size && data[i] == ' ') i++;
1313
+ if (i < size && data[i] == ' ') i++;
1314
+
1315
+ if (i < size && data[i] == '>') {
1316
+ if (i + 1 < size && data[i + 1] == ' ')
1317
+ return i + 2;
1318
+
1319
+ return i + 1;
1320
+ }
1321
+
1322
+ return 0;
1323
+ }
1324
+
1325
+ /* prefix_code • returns prefix length for block code*/
1326
+ static size_t
1327
+ prefix_code(uint8_t *data, size_t size)
1328
+ {
1329
+ if (size > 3 && data[0] == ' ' && data[1] == ' '
1330
+ && data[2] == ' ' && data[3] == ' ') return 4;
1331
+
1332
+ return 0;
1333
+ }
1334
+
1335
+ /* prefix_oli • returns ordered list item prefix */
1336
+ static size_t
1337
+ prefix_oli(uint8_t *data, size_t size)
1338
+ {
1339
+ size_t i = 0;
1340
+
1341
+ if (i < size && data[i] == ' ') i++;
1342
+ if (i < size && data[i] == ' ') i++;
1343
+ if (i < size && data[i] == ' ') i++;
1344
+
1345
+ if (i >= size || data[i] < '0' || data[i] > '9')
1346
+ return 0;
1347
+
1348
+ while (i < size && data[i] >= '0' && data[i] <= '9')
1349
+ i++;
1350
+
1351
+ if (i + 1 >= size || data[i] != '.' || data[i + 1] != ' ')
1352
+ return 0;
1353
+
1354
+ if (is_next_headerline(data + i, size - i))
1355
+ return 0;
1356
+
1357
+ return i + 2;
1358
+ }
1359
+
1360
+ /* prefix_uli • returns ordered list item prefix */
1361
+ static size_t
1362
+ prefix_uli(uint8_t *data, size_t size)
1363
+ {
1364
+ size_t i = 0;
1365
+
1366
+ if (i < size && data[i] == ' ') i++;
1367
+ if (i < size && data[i] == ' ') i++;
1368
+ if (i < size && data[i] == ' ') i++;
1369
+
1370
+ if (i + 1 >= size ||
1371
+ (data[i] != '*' && data[i] != '+' && data[i] != '-') ||
1372
+ data[i + 1] != ' ')
1373
+ return 0;
1374
+
1375
+ if (is_next_headerline(data + i, size - i))
1376
+ return 0;
1377
+
1378
+ return i + 2;
1379
+ }
1380
+
1381
+
1382
+ /* parse_block • parsing of one block, returning next uint8_t to parse */
1383
+ static void parse_block(struct buf *ob, struct sd_markdown *rndr,
1384
+ uint8_t *data, size_t size, const src_map *map);
1385
+
1386
+
1387
+ /* parse_blockquote • handles parsing of a blockquote fragment */
1388
+ static size_t
1389
+ parse_blockquote(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, const src_map *map)
1390
+ {
1391
+ size_t beg, end = 0, pre, work_size = 0;
1392
+ uint8_t *work_data = 0;
1393
+ struct buf *out = 0;
1394
+
1395
+ /* source map */
1396
+ src_map *block_map = NULL;
1397
+
1398
+ /* AST construction */
1399
+ if (rndr->cb.blockquote_begin)
1400
+ rndr->cb.blockquote_begin(rndr->opaque);
1401
+
1402
+ out = rndr_newbuf(rndr, BUFFER_BLOCK);
1403
+
1404
+ beg = 0;
1405
+ while (beg < size) {
1406
+ for (end = beg + 1; end < size && data[end - 1] != '\n'; end++);
1407
+
1408
+ pre = prefix_quote(data + beg, end - beg);
1409
+
1410
+ if (pre)
1411
+ beg += pre; /* skipping prefix */
1412
+
1413
+ /* empty line followed by non-quote line */
1414
+ else if (is_empty(data + beg, end - beg) &&
1415
+ (end >= size || (prefix_quote(data + end, size - end) == 0 &&
1416
+ !is_empty(data + end, size - end))))
1417
+ break;
1418
+
1419
+ if (beg < end) { /* copy into the in-place working buffer */
1420
+ /* bufput(work, data + beg, end - beg); */
1421
+ if (!work_data)
1422
+ work_data = data + beg;
1423
+ else if (data + beg != work_data + work_size)
1424
+ memmove(work_data + work_size, data + beg, end - beg);
1425
+
1426
+ /* source map */
1427
+ if (map) {
1428
+ size_t cur = src_map_location(map, beg);
1429
+ range actual_range = { cur, end - beg };
1430
+ if (!block_map) {
1431
+ block_map = src_map_new_submap(map, &actual_range);
1432
+ }
1433
+ else {
1434
+ src_map_append(block_map, &actual_range);
1435
+ }
1436
+ }
1437
+
1438
+ work_size += end - beg;
1439
+ }
1440
+ beg = end;
1441
+ }
1442
+
1443
+ parse_block(out, rndr, work_data, work_size, block_map);
1444
+
1445
+ /* source map */
1446
+ if (block_map)
1447
+ src_map_release(block_map);
1448
+
1449
+ if (rndr->cb.blockquote)
1450
+ rndr->cb.blockquote(ob, out, rndr->opaque);
1451
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1452
+ return end;
1453
+ }
1454
+
1455
+ static size_t
1456
+ parse_htmlblock(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int do_render);
1457
+
1458
+ /* parse_blockquote • handles parsing of a regular paragraph */
1459
+ static size_t
1460
+ parse_paragraph(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1461
+ {
1462
+ size_t i = 0, end = 0;
1463
+ int level = 0;
1464
+ struct buf work = { data, 0, 0, 0 };
1465
+
1466
+ while (i < size) {
1467
+ for (end = i + 1; end < size && data[end - 1] != '\n'; end++) /* empty */;
1468
+
1469
+ if (is_empty(data + i, size - i))
1470
+ break;
1471
+
1472
+ if ((level = is_headerline(data + i, size - i)) != 0)
1473
+ break;
1474
+
1475
+ if (is_atxheader(rndr, data + i, size - i) ||
1476
+ is_hrule(data + i, size - i) ||
1477
+ prefix_quote(data + i, size - i)) {
1478
+ end = i;
1479
+ break;
1480
+ }
1481
+
1482
+ /*
1483
+ * Early termination of a paragraph with the same logic
1484
+ * as Markdown 1.0.0. If this logic is applied, the
1485
+ * Markdown 1.0.3 test suite won't pass cleanly
1486
+ *
1487
+ * :: If the first character in a new line is not a letter,
1488
+ * let's check to see if there's some kind of block starting
1489
+ * here
1490
+ */
1491
+ if ((rndr->ext_flags & MKDEXT_LAX_SPACING) && !isalnum(data[i])) {
1492
+ if (prefix_oli(data + i, size - i) ||
1493
+ prefix_uli(data + i, size - i)) {
1494
+ end = i;
1495
+ break;
1496
+ }
1497
+
1498
+ /* see if an html block starts here */
1499
+ if (data[i] == '<' && rndr->cb.blockhtml &&
1500
+ parse_htmlblock(ob, rndr, data + i, size - i, 0)) {
1501
+ end = i;
1502
+ break;
1503
+ }
1504
+
1505
+ /* see if a code fence starts here */
1506
+ if ((rndr->ext_flags & MKDEXT_FENCED_CODE) != 0 &&
1507
+ is_codefence(data + i, size - i, NULL) != 0) {
1508
+ end = i;
1509
+ break;
1510
+ }
1511
+ }
1512
+
1513
+ i = end;
1514
+ }
1515
+
1516
+ work.size = i;
1517
+ while (work.size && data[work.size - 1] == '\n')
1518
+ work.size--;
1519
+
1520
+ if (!level) {
1521
+ struct buf *tmp = rndr_newbuf(rndr, BUFFER_BLOCK);
1522
+ parse_inline(tmp, rndr, work.data, work.size);
1523
+ if (rndr->cb.paragraph)
1524
+ rndr->cb.paragraph(ob, tmp, rndr->opaque);
1525
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1526
+ } else {
1527
+ struct buf *header_work;
1528
+
1529
+ if (work.size) {
1530
+ size_t beg;
1531
+ i = work.size;
1532
+ work.size -= 1;
1533
+
1534
+ while (work.size && data[work.size] != '\n')
1535
+ work.size -= 1;
1536
+
1537
+ beg = work.size + 1;
1538
+ while (work.size && data[work.size - 1] == '\n')
1539
+ work.size -= 1;
1540
+
1541
+ if (work.size > 0) {
1542
+ struct buf *tmp = rndr_newbuf(rndr, BUFFER_BLOCK);
1543
+ parse_inline(tmp, rndr, work.data, work.size);
1544
+
1545
+ if (rndr->cb.paragraph)
1546
+ rndr->cb.paragraph(ob, tmp, rndr->opaque);
1547
+
1548
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1549
+ work.data += beg;
1550
+ work.size = i - beg;
1551
+ }
1552
+ else work.size = i;
1553
+ }
1554
+
1555
+ header_work = rndr_newbuf(rndr, BUFFER_SPAN);
1556
+ parse_inline(header_work, rndr, work.data, work.size);
1557
+
1558
+ if (rndr->cb.header)
1559
+ rndr->cb.header(ob, header_work, (int)level, rndr->opaque);
1560
+
1561
+ rndr_popbuf(rndr, BUFFER_SPAN);
1562
+ }
1563
+
1564
+ return end;
1565
+ }
1566
+
1567
+ /* parse_fencedcode • handles parsing of a block-level code fragment */
1568
+ static size_t
1569
+ parse_fencedcode(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1570
+ {
1571
+ size_t beg, end;
1572
+ struct buf *work = 0;
1573
+ struct buf lang = { 0, 0, 0, 0 };
1574
+
1575
+ beg = is_codefence(data, size, &lang);
1576
+ if (beg == 0) return 0;
1577
+
1578
+ work = rndr_newbuf(rndr, BUFFER_BLOCK);
1579
+
1580
+ while (beg < size) {
1581
+ size_t fence_end;
1582
+ struct buf fence_trail = { 0, 0, 0, 0 };
1583
+
1584
+ fence_end = is_codefence(data + beg, size - beg, &fence_trail);
1585
+ if (fence_end != 0 && fence_trail.size == 0) {
1586
+ beg += fence_end;
1587
+ break;
1588
+ }
1589
+
1590
+ for (end = beg + 1; end < size && data[end - 1] != '\n'; end++);
1591
+
1592
+ if (beg < end) {
1593
+ /* verbatim copy to the working buffer,
1594
+ escaping entities */
1595
+ if (is_empty(data + beg, end - beg))
1596
+ bufputc(work, '\n');
1597
+ else bufput(work, data + beg, end - beg);
1598
+ }
1599
+ beg = end;
1600
+ }
1601
+
1602
+ if (work->size && work->data[work->size - 1] != '\n')
1603
+ bufputc(work, '\n');
1604
+
1605
+ if (rndr->cb.blockcode)
1606
+ rndr->cb.blockcode(ob, work, lang.size ? &lang : NULL, rndr->opaque);
1607
+
1608
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1609
+ return beg;
1610
+ }
1611
+
1612
+ static size_t
1613
+ parse_blockcode(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1614
+ {
1615
+ size_t beg, end, pre;
1616
+ struct buf *work = 0;
1617
+
1618
+ work = rndr_newbuf(rndr, BUFFER_BLOCK);
1619
+
1620
+ beg = 0;
1621
+ while (beg < size) {
1622
+ for (end = beg + 1; end < size && data[end - 1] != '\n'; end++) {};
1623
+ pre = prefix_code(data + beg, end - beg);
1624
+
1625
+ if (pre)
1626
+ beg += pre; /* skipping prefix */
1627
+ else if (!is_empty(data + beg, end - beg))
1628
+ /* non-empty non-prefixed line breaks the pre */
1629
+ break;
1630
+
1631
+ if (beg < end) {
1632
+ /* verbatim copy to the working buffer,
1633
+ escaping entities */
1634
+ if (is_empty(data + beg, end - beg))
1635
+ bufputc(work, '\n');
1636
+ else bufput(work, data + beg, end - beg);
1637
+ }
1638
+ beg = end;
1639
+ }
1640
+
1641
+ while (work->size && work->data[work->size - 1] == '\n')
1642
+ work->size -= 1;
1643
+
1644
+ bufputc(work, '\n');
1645
+
1646
+ if (rndr->cb.blockcode)
1647
+ rndr->cb.blockcode(ob, work, NULL, rndr->opaque);
1648
+
1649
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1650
+ return beg;
1651
+ }
1652
+
1653
+ /* parse_listitem • parsing of a single list item */
1654
+ /* assuming initial prefix is already removed */
1655
+ static size_t
1656
+ parse_listitem(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int *flags, const src_map *map)
1657
+ {
1658
+ struct buf *work = 0, *inter = 0;
1659
+ size_t beg = 0, end, pre, sublist = 0, orgpre = 0, i = 0;
1660
+ int in_empty = 0, has_inside_empty = 0, in_fence = 0;
1661
+ src_map *item_map = NULL;
1662
+
1663
+ /* keeping track of the first indentation prefix */
1664
+ while (orgpre < 3 && orgpre < size && data[orgpre] == ' ')
1665
+ orgpre++;
1666
+
1667
+ beg = prefix_uli(data, size);
1668
+ if (!beg)
1669
+ beg = prefix_oli(data, size);
1670
+
1671
+ if (!beg)
1672
+ return 0;
1673
+
1674
+ /* AST construction */
1675
+ if (rndr->cb.listitem_begin)
1676
+ rndr->cb.listitem_begin(*flags, rndr->opaque);
1677
+
1678
+ /* skipping to the beginning of the following line */
1679
+ end = beg;
1680
+ while (end < size && data[end - 1] != '\n')
1681
+ end++;
1682
+
1683
+ /* getting working buffers */
1684
+ work = rndr_newbuf(rndr, BUFFER_SPAN);
1685
+ inter = rndr_newbuf(rndr, BUFFER_SPAN);
1686
+
1687
+ /* source map */
1688
+ if (map) {
1689
+ size_t cur = src_map_location(map, beg);
1690
+ range item_range = { cur, end - beg };
1691
+ item_map = src_map_new_submap(map, &item_range);
1692
+ }
1693
+
1694
+ /* putting the first line into the working buffer */
1695
+ bufput(work, data + beg, end - beg);
1696
+ beg = end;
1697
+
1698
+ /* process the following lines */
1699
+ while (beg < size) {
1700
+ size_t has_next_uli = 0, has_next_oli = 0;
1701
+
1702
+ end++;
1703
+
1704
+ while (end < size && data[end - 1] != '\n')
1705
+ end++;
1706
+
1707
+ /* process an empty line */
1708
+ if (is_empty(data + beg, end - beg)) {
1709
+ in_empty = 1;
1710
+ beg = end;
1711
+ continue;
1712
+ }
1713
+
1714
+ /* calculating the indentation */
1715
+ i = 0;
1716
+ while (i < 4 && beg + i < end && data[beg + i] == ' ')
1717
+ i++;
1718
+
1719
+ pre = i;
1720
+
1721
+ if (rndr->ext_flags & MKDEXT_FENCED_CODE) {
1722
+ if (is_codefence(data + beg + i, end - beg - i, NULL) != 0)
1723
+ in_fence = !in_fence;
1724
+ }
1725
+
1726
+ /* Only check for new list items if we are **not** inside
1727
+ * a fenced code block */
1728
+ if (!in_fence) {
1729
+ has_next_uli = prefix_uli(data + beg + i, end - beg - i);
1730
+ has_next_oli = prefix_oli(data + beg + i, end - beg - i);
1731
+ }
1732
+
1733
+ /* checking for ul/ol switch */
1734
+ if (in_empty && (
1735
+ ((*flags & MKD_LIST_ORDERED) && has_next_uli) ||
1736
+ (!(*flags & MKD_LIST_ORDERED) && has_next_oli))){
1737
+ *flags |= MKD_LI_END;
1738
+ break; /* the following item must have same list type */
1739
+ }
1740
+
1741
+ /* checking for a new item */
1742
+ if ((has_next_uli && !is_hrule(data + beg + i, end - beg - i)) || has_next_oli) {
1743
+ if (in_empty)
1744
+ has_inside_empty = 1;
1745
+
1746
+ if (pre == orgpre) /* the following item must have */
1747
+ break; /* the same indentation */
1748
+
1749
+ if (!sublist)
1750
+ sublist = work->size;
1751
+ }
1752
+ /* joining only indented stuff after empty lines;
1753
+ * note that now we only require 1 space of indentation
1754
+ * to continue a list */
1755
+ else if (in_empty && pre == 0) {
1756
+ *flags |= MKD_LI_END;
1757
+ break;
1758
+ }
1759
+ else if (in_empty) {
1760
+ /* source map */
1761
+ if (item_map && item_map->size) {
1762
+ ((range *)item_map->item[item_map->size - 1])->len += 1;
1763
+ }
1764
+
1765
+ bufputc(work, '\n');
1766
+ has_inside_empty = 1;
1767
+ }
1768
+
1769
+ in_empty = 0;
1770
+
1771
+ /* source map */
1772
+ if (map) {
1773
+ size_t line_cur = src_map_location(map, beg + i);
1774
+ range line_range = { line_cur, end - beg - i };
1775
+ src_map_append(item_map, &line_range);
1776
+ }
1777
+
1778
+ /* adding the line without prefix into the working buffer */
1779
+ bufput(work, data + beg + i, end - beg - i);
1780
+ beg = end;
1781
+ }
1782
+
1783
+ /* render of li contents */
1784
+ if (has_inside_empty)
1785
+ *flags |= MKD_LI_BLOCK;
1786
+
1787
+ if (*flags & MKD_LI_BLOCK) {
1788
+ /* intermediate render of block li */
1789
+ if (sublist && sublist < work->size) {
1790
+ src_map *sublist_map = NULL;
1791
+
1792
+ parse_block(inter, rndr, work->data, sublist, item_map);
1793
+
1794
+ /* source map */
1795
+ if (item_map)
1796
+ sublist_map = src_map_new_tail(item_map, sublist);
1797
+
1798
+ parse_block(inter, rndr, work->data + sublist, work->size - sublist, sublist_map);
1799
+
1800
+ if (sublist_map)
1801
+ src_map_release(sublist_map);
1802
+ }
1803
+ else
1804
+ parse_block(inter, rndr, work->data, work->size, item_map);
1805
+ } else {
1806
+ /* intermediate render of inline li */
1807
+ if (sublist && sublist < work->size) {
1808
+ src_map *sublist_map = NULL;
1809
+
1810
+ parse_inline(inter, rndr, work->data, sublist);
1811
+
1812
+ /* source map */
1813
+ if (item_map)
1814
+ sublist_map = src_map_new_tail(item_map, sublist);
1815
+
1816
+ parse_block(inter, rndr, work->data + sublist, work->size - sublist, sublist_map);
1817
+
1818
+ if (sublist_map)
1819
+ src_map_release(sublist_map);
1820
+ }
1821
+ else
1822
+ parse_inline(inter, rndr, work->data, work->size);
1823
+ }
1824
+
1825
+ /* render of li itself */
1826
+ if (rndr->cb.listitem)
1827
+ rndr->cb.listitem(ob, inter, *flags, rndr->opaque);
1828
+
1829
+ /* source map */
1830
+ if (item_map) {
1831
+ if (rndr->cb.block_did_parse)
1832
+ rndr->cb.block_did_parse(item_map, data + i, size - i, rndr->opaque);
1833
+
1834
+ src_map_release(item_map);
1835
+ }
1836
+
1837
+ rndr_popbuf(rndr, BUFFER_SPAN);
1838
+ rndr_popbuf(rndr, BUFFER_SPAN);
1839
+ return beg;
1840
+ }
1841
+
1842
+
1843
+ /* parse_list • parsing ordered or unordered list block */
1844
+ static size_t
1845
+ parse_list(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int flags, const src_map *map)
1846
+ {
1847
+ struct buf *work = 0;
1848
+ size_t i = 0, j;
1849
+
1850
+ /* AST construction */
1851
+ if (rndr->cb.list_begin)
1852
+ rndr->cb.list_begin(flags, rndr->opaque);
1853
+
1854
+ work = rndr_newbuf(rndr, BUFFER_BLOCK);
1855
+
1856
+ while (i < size) {
1857
+
1858
+ /* source map */
1859
+ src_map *block_map = NULL;
1860
+
1861
+ if (map) {
1862
+ size_t cur = src_map_location(map, i);
1863
+ range actual_range = { cur, size - i };
1864
+ block_map = src_map_new_submap(map, &actual_range);
1865
+ }
1866
+
1867
+ j = parse_listitem(work, rndr, data + i, size - i, &flags, block_map);
1868
+
1869
+ /* source map */
1870
+ if (block_map) {
1871
+ src_map_release(block_map);
1872
+ }
1873
+
1874
+ i += j;
1875
+ if (!j || (flags & MKD_LI_END))
1876
+ break;
1877
+ }
1878
+
1879
+ if (rndr->cb.list)
1880
+ rndr->cb.list(ob, work, flags, rndr->opaque);
1881
+ rndr_popbuf(rndr, BUFFER_BLOCK);
1882
+ return i;
1883
+ }
1884
+
1885
+ /* parse_atxheader • parsing of atx-style headers */
1886
+ static size_t
1887
+ parse_atxheader(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size)
1888
+ {
1889
+ size_t level = 0;
1890
+ size_t i, end, skip;
1891
+
1892
+ while (level < size && level < 6 && data[level] == '#')
1893
+ level++;
1894
+
1895
+ for (i = level; i < size && data[i] == ' '; i++);
1896
+
1897
+ for (end = i; end < size && data[end] != '\n'; end++);
1898
+ skip = end;
1899
+
1900
+ while (end && data[end - 1] == '#')
1901
+ end--;
1902
+
1903
+ while (end && data[end - 1] == ' ')
1904
+ end--;
1905
+
1906
+ if (end > i) {
1907
+ struct buf *work = rndr_newbuf(rndr, BUFFER_SPAN);
1908
+
1909
+ parse_inline(work, rndr, data + i, end - i);
1910
+
1911
+ if (rndr->cb.header)
1912
+ rndr->cb.header(ob, work, (int)level, rndr->opaque);
1913
+
1914
+ rndr_popbuf(rndr, BUFFER_SPAN);
1915
+ }
1916
+
1917
+ return skip;
1918
+ }
1919
+
1920
+
1921
+ /* htmlblock_end • checking end of HTML block : </tag>[ \t]*\n[ \t*]\n */
1922
+ /* returns the length on match, 0 otherwise */
1923
+ static size_t
1924
+ htmlblock_end_tag(
1925
+ const char *tag,
1926
+ size_t tag_len,
1927
+ struct sd_markdown *rndr,
1928
+ uint8_t *data,
1929
+ size_t size)
1930
+ {
1931
+ size_t i, w;
1932
+
1933
+ /* checking if tag is a match */
1934
+ if (tag_len + 3 >= size ||
1935
+ strncasecmp((char *)data + 2, tag, tag_len) != 0 ||
1936
+ data[tag_len + 2] != '>')
1937
+ return 0;
1938
+
1939
+ /* checking white lines */
1940
+ i = tag_len + 3;
1941
+ w = 0;
1942
+ if (i < size && (w = is_empty(data + i, size - i)) == 0)
1943
+ return 0; /* non-blank after tag */
1944
+ i += w;
1945
+ w = 0;
1946
+
1947
+ if (i < size)
1948
+ w = is_empty(data + i, size - i);
1949
+
1950
+ return i + w;
1951
+ }
1952
+
1953
+ static size_t
1954
+ htmlblock_end(const char *curtag,
1955
+ struct sd_markdown *rndr,
1956
+ uint8_t *data,
1957
+ size_t size,
1958
+ int start_of_line)
1959
+ {
1960
+ size_t tag_size = strlen(curtag);
1961
+ size_t i = 1, end_tag;
1962
+ int block_lines = 0;
1963
+
1964
+ while (i < size) {
1965
+ i++;
1966
+ while (i < size && !(data[i - 1] == '<' && data[i] == '/')) {
1967
+ if (data[i] == '\n')
1968
+ block_lines++;
1969
+
1970
+ i++;
1971
+ }
1972
+
1973
+ /* If we are only looking for unindented tags, skip the tag
1974
+ * if it doesn't follow a newline.
1975
+ *
1976
+ * The only exception to this is if the tag is still on the
1977
+ * initial line; in that case it still counts as a closing
1978
+ * tag
1979
+ */
1980
+ if (start_of_line && block_lines > 0 && data[i - 2] != '\n')
1981
+ continue;
1982
+
1983
+ if (i + 2 + tag_size >= size)
1984
+ break;
1985
+
1986
+ end_tag = htmlblock_end_tag(curtag, tag_size, rndr, data + i - 1, size - i + 1);
1987
+ if (end_tag)
1988
+ return i + end_tag - 1;
1989
+ }
1990
+
1991
+ return 0;
1992
+ }
1993
+
1994
+
1995
+ /* parse_htmlblock • parsing of inline HTML block */
1996
+ static size_t
1997
+ parse_htmlblock(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, int do_render)
1998
+ {
1999
+ size_t i, j = 0, tag_end;
2000
+ const char *curtag = NULL;
2001
+ struct buf work = { data, 0, 0, 0 };
2002
+
2003
+ /* identification of the opening tag */
2004
+ if (size < 2 || data[0] != '<')
2005
+ return 0;
2006
+
2007
+ i = 1;
2008
+ while (i < size && data[i] != '>' && data[i] != ' ')
2009
+ i++;
2010
+
2011
+ if (i < size)
2012
+ curtag = find_block_tag((char *)data + 1, (int)i - 1);
2013
+
2014
+ /* handling of special cases */
2015
+ if (!curtag) {
2016
+
2017
+ /* HTML comment, laxist form */
2018
+ if (size > 5 && data[1] == '!' && data[2] == '-' && data[3] == '-') {
2019
+ i = 5;
2020
+
2021
+ while (i < size && !(data[i - 2] == '-' && data[i - 1] == '-' && data[i] == '>'))
2022
+ i++;
2023
+
2024
+ i++;
2025
+
2026
+ if (i < size)
2027
+ j = is_empty(data + i, size - i);
2028
+
2029
+ if (j) {
2030
+ work.size = i + j;
2031
+ if (do_render && rndr->cb.blockhtml)
2032
+ rndr->cb.blockhtml(ob, &work, rndr->opaque);
2033
+ return work.size;
2034
+ }
2035
+ }
2036
+
2037
+ /* HR, which is the only self-closing block tag considered */
2038
+ if (size > 4 && (data[1] == 'h' || data[1] == 'H') && (data[2] == 'r' || data[2] == 'R')) {
2039
+ i = 3;
2040
+ while (i < size && data[i] != '>')
2041
+ i++;
2042
+
2043
+ if (i + 1 < size) {
2044
+ i++;
2045
+ j = is_empty(data + i, size - i);
2046
+ if (j) {
2047
+ work.size = i + j;
2048
+ if (do_render && rndr->cb.blockhtml)
2049
+ rndr->cb.blockhtml(ob, &work, rndr->opaque);
2050
+ return work.size;
2051
+ }
2052
+ }
2053
+ }
2054
+
2055
+ /* no special case recognised */
2056
+ return 0;
2057
+ }
2058
+
2059
+ /* looking for an unindented matching closing tag */
2060
+ /* followed by a blank line */
2061
+ tag_end = htmlblock_end(curtag, rndr, data, size, 1);
2062
+
2063
+ /* if not found, trying a second pass looking for indented match */
2064
+ /* but not if tag is "ins" or "del" (following original Markdown.pl) */
2065
+ if (!tag_end && strcmp(curtag, "ins") != 0 && strcmp(curtag, "del") != 0) {
2066
+ tag_end = htmlblock_end(curtag, rndr, data, size, 0);
2067
+ }
2068
+
2069
+ if (!tag_end)
2070
+ return 0;
2071
+
2072
+ /* the end of the block has been found */
2073
+ work.size = tag_end;
2074
+ if (do_render && rndr->cb.blockhtml)
2075
+ rndr->cb.blockhtml(ob, &work, rndr->opaque);
2076
+
2077
+ return tag_end;
2078
+ }
2079
+
2080
+ static void
2081
+ parse_table_row(
2082
+ struct buf *ob,
2083
+ struct sd_markdown *rndr,
2084
+ uint8_t *data,
2085
+ size_t size,
2086
+ size_t columns,
2087
+ int *col_data,
2088
+ int header_flag)
2089
+ {
2090
+ size_t i = 0, col;
2091
+ struct buf *row_work = 0;
2092
+
2093
+ if (!rndr->cb.table_cell || !rndr->cb.table_row)
2094
+ return;
2095
+
2096
+ row_work = rndr_newbuf(rndr, BUFFER_SPAN);
2097
+
2098
+ if (i < size && data[i] == '|')
2099
+ i++;
2100
+
2101
+ for (col = 0; col < columns && i < size; ++col) {
2102
+ size_t cell_start, cell_end;
2103
+ struct buf *cell_work;
2104
+
2105
+ cell_work = rndr_newbuf(rndr, BUFFER_SPAN);
2106
+
2107
+ while (i < size && _isspace(data[i]))
2108
+ i++;
2109
+
2110
+ cell_start = i;
2111
+
2112
+ while (i < size && data[i] != '|')
2113
+ i++;
2114
+
2115
+ cell_end = i - 1;
2116
+
2117
+ while (cell_end > cell_start && _isspace(data[cell_end]))
2118
+ cell_end--;
2119
+
2120
+ parse_inline(cell_work, rndr, data + cell_start, 1 + cell_end - cell_start);
2121
+ rndr->cb.table_cell(row_work, cell_work, col_data[col] | header_flag, rndr->opaque);
2122
+
2123
+ rndr_popbuf(rndr, BUFFER_SPAN);
2124
+ i++;
2125
+ }
2126
+
2127
+ for (; col < columns; ++col) {
2128
+ struct buf empty_cell = { 0, 0, 0, 0 };
2129
+ rndr->cb.table_cell(row_work, &empty_cell, col_data[col] | header_flag, rndr->opaque);
2130
+ }
2131
+
2132
+ rndr->cb.table_row(ob, row_work, rndr->opaque);
2133
+
2134
+ rndr_popbuf(rndr, BUFFER_SPAN);
2135
+ }
2136
+
2137
+ static size_t
2138
+ parse_table_header(
2139
+ struct buf *ob,
2140
+ struct sd_markdown *rndr,
2141
+ uint8_t *data,
2142
+ size_t size,
2143
+ size_t *columns,
2144
+ int **column_data)
2145
+ {
2146
+ int pipes;
2147
+ size_t i = 0, col, header_end, under_end;
2148
+
2149
+ pipes = 0;
2150
+ while (i < size && data[i] != '\n')
2151
+ if (data[i++] == '|')
2152
+ pipes++;
2153
+
2154
+ if (i == size || pipes == 0)
2155
+ return 0;
2156
+
2157
+ header_end = i;
2158
+
2159
+ while (header_end > 0 && _isspace(data[header_end - 1]))
2160
+ header_end--;
2161
+
2162
+ if (data[0] == '|')
2163
+ pipes--;
2164
+
2165
+ if (header_end && data[header_end - 1] == '|')
2166
+ pipes--;
2167
+
2168
+ if (pipes < 0)
2169
+ return 0;
2170
+
2171
+ *columns = pipes + 1;
2172
+ *column_data = calloc(*columns, sizeof(int));
2173
+
2174
+ /* Parse the header underline */
2175
+ i++;
2176
+ if (i < size && data[i] == '|')
2177
+ i++;
2178
+
2179
+ under_end = i;
2180
+ while (under_end < size && data[under_end] != '\n')
2181
+ under_end++;
2182
+
2183
+ for (col = 0; col < *columns && i < under_end; ++col) {
2184
+ size_t dashes = 0;
2185
+
2186
+ while (i < under_end && data[i] == ' ')
2187
+ i++;
2188
+
2189
+ if (data[i] == ':') {
2190
+ i++; (*column_data)[col] |= MKD_TABLE_ALIGN_L;
2191
+ dashes++;
2192
+ }
2193
+
2194
+ while (i < under_end && data[i] == '-') {
2195
+ i++; dashes++;
2196
+ }
2197
+
2198
+ if (i < under_end && data[i] == ':') {
2199
+ i++; (*column_data)[col] |= MKD_TABLE_ALIGN_R;
2200
+ dashes++;
2201
+ }
2202
+
2203
+ while (i < under_end && data[i] == ' ')
2204
+ i++;
2205
+
2206
+ if (i < under_end && data[i] != '|')
2207
+ break;
2208
+
2209
+ if (dashes < 3)
2210
+ break;
2211
+
2212
+ i++;
2213
+ }
2214
+
2215
+ if (col < *columns)
2216
+ return 0;
2217
+
2218
+ parse_table_row(
2219
+ ob, rndr, data,
2220
+ header_end,
2221
+ *columns,
2222
+ *column_data,
2223
+ MKD_TABLE_HEADER
2224
+ );
2225
+
2226
+ return under_end + 1;
2227
+ }
2228
+
2229
+ static size_t
2230
+ parse_table(
2231
+ struct buf *ob,
2232
+ struct sd_markdown *rndr,
2233
+ uint8_t *data,
2234
+ size_t size)
2235
+ {
2236
+ size_t i;
2237
+
2238
+ struct buf *header_work = 0;
2239
+ struct buf *body_work = 0;
2240
+
2241
+ size_t columns;
2242
+ int *col_data = NULL;
2243
+
2244
+ header_work = rndr_newbuf(rndr, BUFFER_SPAN);
2245
+ body_work = rndr_newbuf(rndr, BUFFER_BLOCK);
2246
+
2247
+ i = parse_table_header(header_work, rndr, data, size, &columns, &col_data);
2248
+ if (i > 0) {
2249
+
2250
+ while (i < size) {
2251
+ size_t row_start;
2252
+ int pipes = 0;
2253
+
2254
+ row_start = i;
2255
+
2256
+ while (i < size && data[i] != '\n')
2257
+ if (data[i++] == '|')
2258
+ pipes++;
2259
+
2260
+ if (pipes == 0 || i == size) {
2261
+ i = row_start;
2262
+ break;
2263
+ }
2264
+
2265
+ parse_table_row(
2266
+ body_work,
2267
+ rndr,
2268
+ data + row_start,
2269
+ i - row_start,
2270
+ columns,
2271
+ col_data, 0
2272
+ );
2273
+
2274
+ i++;
2275
+ }
2276
+
2277
+ if (rndr->cb.table)
2278
+ rndr->cb.table(ob, header_work, body_work, rndr->opaque);
2279
+ }
2280
+
2281
+ free(col_data);
2282
+ rndr_popbuf(rndr, BUFFER_SPAN);
2283
+ rndr_popbuf(rndr, BUFFER_BLOCK);
2284
+ return i;
2285
+ }
2286
+
2287
+ /* parse_block • parsing of one block, returning next uint8_t to parse */
2288
+ static void
2289
+ parse_block(struct buf *ob, struct sd_markdown *rndr, uint8_t *data, size_t size, const src_map *map)
2290
+ {
2291
+ size_t beg, end, i, block_beg;
2292
+ uint8_t *txt_data;
2293
+ beg = 0;
2294
+
2295
+ if (rndr->work_bufs[BUFFER_SPAN].size +
2296
+ rndr->work_bufs[BUFFER_BLOCK].size > rndr->max_nesting)
2297
+ return;
2298
+
2299
+ while (beg < size) {
2300
+ size_t cur = 0;
2301
+ src_map *block_map = NULL;
2302
+
2303
+ block_beg = beg;
2304
+ txt_data = data + beg;
2305
+ end = size - beg;
2306
+
2307
+ /* source map */
2308
+ if (map) {
2309
+ range actual_range;
2310
+
2311
+ cur = src_map_location(map, beg);
2312
+ actual_range.loc = cur;
2313
+ actual_range.len = end;
2314
+
2315
+ block_map = src_map_new_submap(map, &actual_range);
2316
+ }
2317
+
2318
+ if (is_atxheader(rndr, txt_data, end))
2319
+ beg += parse_atxheader(ob, rndr, txt_data, end);
2320
+
2321
+ else if (data[beg] == '<' && rndr->cb.blockhtml &&
2322
+ (i = parse_htmlblock(ob, rndr, txt_data, end, 1)) != 0)
2323
+ beg += i;
2324
+
2325
+ else if ((i = is_empty(txt_data, end)) != 0) {
2326
+ beg += i;
2327
+ }
2328
+
2329
+ else if (is_hrule(txt_data, end)) {
2330
+ if (rndr->cb.hrule)
2331
+ rndr->cb.hrule(ob, rndr->opaque);
2332
+
2333
+ while (beg < size && data[beg] != '\n')
2334
+ beg++;
2335
+
2336
+ beg++;
2337
+ }
2338
+
2339
+ else if ((rndr->ext_flags & MKDEXT_FENCED_CODE) != 0 &&
2340
+ (i = parse_fencedcode(ob, rndr, txt_data, end)) != 0)
2341
+ beg += i;
2342
+
2343
+ else if ((rndr->ext_flags & MKDEXT_TABLES) != 0 &&
2344
+ (i = parse_table(ob, rndr, txt_data, end)) != 0)
2345
+ beg += i;
2346
+
2347
+ else if (prefix_quote(txt_data, end))
2348
+ beg += parse_blockquote(ob, rndr, txt_data, end, block_map);
2349
+
2350
+ else if (prefix_code(txt_data, end))
2351
+ beg += parse_blockcode(ob, rndr, txt_data, end);
2352
+
2353
+ else if (prefix_uli(txt_data, end))
2354
+ beg += parse_list(ob, rndr, txt_data, end, 0, block_map);
2355
+
2356
+ else if (prefix_oli(txt_data, end))
2357
+ beg += parse_list(ob, rndr, txt_data, end, MKD_LIST_ORDERED, block_map);
2358
+
2359
+ else
2360
+ beg += parse_paragraph(ob, rndr, txt_data, end);
2361
+
2362
+ /* source map */
2363
+ if (block_map) {
2364
+ if (rndr->cb.block_did_parse) {
2365
+ range parse_range = { cur, beg - block_beg };
2366
+ src_map *parse_map = src_map_new_submap(block_map, &parse_range);
2367
+
2368
+ rndr->cb.block_did_parse(parse_map, txt_data, beg - block_beg, rndr->opaque);
2369
+
2370
+ src_map_release(parse_map);
2371
+ }
2372
+ src_map_release(block_map);
2373
+ }
2374
+ }
2375
+ }
2376
+
2377
+ /*********************
2378
+ * REFERENCE PARSING *
2379
+ *********************/
2380
+
2381
+ /* is_ref • returns whether a line is a reference or not */
2382
+ static int
2383
+ is_ref(const uint8_t *data, size_t beg, size_t end, size_t *last, struct link_ref **refs)
2384
+ {
2385
+ /* int n; */
2386
+ size_t i = 0;
2387
+ size_t id_offset, id_end;
2388
+ size_t link_offset, link_end;
2389
+ size_t title_offset, title_end;
2390
+ size_t line_end;
2391
+
2392
+ /* up to 3 optional leading spaces */
2393
+ if (beg + 3 >= end) return 0;
2394
+ if (data[beg] == ' ') { i = 1;
2395
+ if (data[beg + 1] == ' ') { i = 2;
2396
+ if (data[beg + 2] == ' ') { i = 3;
2397
+ if (data[beg + 3] == ' ') return 0; } } }
2398
+ i += beg;
2399
+
2400
+ /* id part: anything but a newline between brackets */
2401
+ if (data[i] != '[') return 0;
2402
+ i++;
2403
+ id_offset = i;
2404
+ while (i < end && data[i] != '\n' && data[i] != '\r' && data[i] != ']')
2405
+ i++;
2406
+ if (i >= end || data[i] != ']') return 0;
2407
+ id_end = i;
2408
+
2409
+ /* spacer: colon (space | tab)* newline? (space | tab)* */
2410
+ i++;
2411
+ if (i >= end || data[i] != ':') return 0;
2412
+ i++;
2413
+ while (i < end && data[i] == ' ') i++;
2414
+ if (i < end && (data[i] == '\n' || data[i] == '\r')) {
2415
+ i++;
2416
+ if (i < end && data[i] == '\r' && data[i - 1] == '\n') i++; }
2417
+ while (i < end && data[i] == ' ') i++;
2418
+ if (i >= end) return 0;
2419
+
2420
+ /* link: whitespace-free sequence, optionally between angle brackets */
2421
+ if (data[i] == '<')
2422
+ i++;
2423
+
2424
+ link_offset = i;
2425
+
2426
+ while (i < end && data[i] != ' ' && data[i] != '\n' && data[i] != '\r')
2427
+ i++;
2428
+
2429
+ if (data[i - 1] == '>') link_end = i - 1;
2430
+ else link_end = i;
2431
+
2432
+ /* optional spacer: (space | tab)* (newline | '\'' | '"' | '(' ) */
2433
+ while (i < end && data[i] == ' ') i++;
2434
+ if (i < end && data[i] != '\n' && data[i] != '\r'
2435
+ && data[i] != '\'' && data[i] != '"' && data[i] != '(')
2436
+ return 0;
2437
+ line_end = 0;
2438
+ /* computing end-of-line */
2439
+ if (i >= end || data[i] == '\r' || data[i] == '\n') line_end = i;
2440
+ if (i + 1 < end && data[i] == '\n' && data[i + 1] == '\r')
2441
+ line_end = i + 1;
2442
+
2443
+ /* optional (space|tab)* spacer after a newline */
2444
+ if (line_end) {
2445
+ i = line_end + 1;
2446
+ while (i < end && data[i] == ' ') i++; }
2447
+
2448
+ /* optional title: any non-newline sequence enclosed in '"()
2449
+ alone on its line */
2450
+ title_offset = title_end = 0;
2451
+ if (i + 1 < end
2452
+ && (data[i] == '\'' || data[i] == '"' || data[i] == '(')) {
2453
+ i++;
2454
+ title_offset = i;
2455
+ /* looking for EOL */
2456
+ while (i < end && data[i] != '\n' && data[i] != '\r') i++;
2457
+ if (i + 1 < end && data[i] == '\n' && data[i + 1] == '\r')
2458
+ title_end = i + 1;
2459
+ else title_end = i;
2460
+ /* stepping back */
2461
+ i -= 1;
2462
+ while (i > title_offset && data[i] == ' ')
2463
+ i -= 1;
2464
+ if (i > title_offset
2465
+ && (data[i] == '\'' || data[i] == '"' || data[i] == ')')) {
2466
+ line_end = title_end;
2467
+ title_end = i; } }
2468
+
2469
+ if (!line_end || link_end == link_offset)
2470
+ return 0; /* garbage after the link empty link */
2471
+
2472
+ /* a valid ref has been found, filling-in return structures */
2473
+ if (last)
2474
+ *last = line_end;
2475
+
2476
+ if (refs) {
2477
+ struct link_ref *ref;
2478
+
2479
+ ref = add_link_ref(refs, data + id_offset, id_end - id_offset);
2480
+ if (!ref)
2481
+ return 0;
2482
+
2483
+ ref->link = bufnew(link_end - link_offset);
2484
+ bufput(ref->link, data + link_offset, link_end - link_offset);
2485
+
2486
+ if (title_end > title_offset) {
2487
+ ref->title = bufnew(title_end - title_offset);
2488
+ bufput(ref->title, data + title_offset, title_end - title_offset);
2489
+ }
2490
+ }
2491
+
2492
+ return 1;
2493
+ }
2494
+
2495
+ static void expand_tabs(struct buf *ob, const uint8_t *line, size_t size)
2496
+ {
2497
+ size_t i = 0, tab = 0;
2498
+
2499
+ while (i < size) {
2500
+ size_t org = i;
2501
+
2502
+ while (i < size && line[i] != '\t') {
2503
+ i++; tab++;
2504
+ }
2505
+
2506
+ if (i > org)
2507
+ bufput(ob, line + org, i - org);
2508
+
2509
+ if (i >= size)
2510
+ break;
2511
+
2512
+ do {
2513
+ bufputc(ob, ' '); tab++;
2514
+ } while (tab % 4);
2515
+
2516
+ i++;
2517
+ }
2518
+ }
2519
+
2520
+ /**********************
2521
+ * EXPORTED FUNCTIONS *
2522
+ **********************/
2523
+
2524
+ struct sd_markdown *
2525
+ sd_markdown_new(
2526
+ unsigned int extensions,
2527
+ size_t max_nesting,
2528
+ const struct sd_callbacks *callbacks,
2529
+ void *opaque)
2530
+ {
2531
+ struct sd_markdown *md = NULL;
2532
+
2533
+ assert(max_nesting > 0 && callbacks);
2534
+
2535
+ md = malloc(sizeof(struct sd_markdown));
2536
+ if (!md)
2537
+ return NULL;
2538
+
2539
+ memcpy(&md->cb, callbacks, sizeof(struct sd_callbacks));
2540
+
2541
+ stack_init(&md->work_bufs[BUFFER_BLOCK], 4);
2542
+ stack_init(&md->work_bufs[BUFFER_SPAN], 8);
2543
+
2544
+ memset(md->active_char, 0x0, 256);
2545
+
2546
+ if (md->cb.emphasis || md->cb.double_emphasis || md->cb.triple_emphasis) {
2547
+ md->active_char['*'] = MD_CHAR_EMPHASIS;
2548
+ md->active_char['_'] = MD_CHAR_EMPHASIS;
2549
+ if (extensions & MKDEXT_STRIKETHROUGH)
2550
+ md->active_char['~'] = MD_CHAR_EMPHASIS;
2551
+ }
2552
+
2553
+ if (md->cb.codespan)
2554
+ md->active_char['`'] = MD_CHAR_CODESPAN;
2555
+
2556
+ if (md->cb.linebreak)
2557
+ md->active_char['\n'] = MD_CHAR_LINEBREAK;
2558
+
2559
+ if (md->cb.image || md->cb.link)
2560
+ md->active_char['['] = MD_CHAR_LINK;
2561
+
2562
+ md->active_char['<'] = MD_CHAR_LANGLE;
2563
+ md->active_char['\\'] = MD_CHAR_ESCAPE;
2564
+ md->active_char['&'] = MD_CHAR_ENTITITY;
2565
+
2566
+ if (extensions & MKDEXT_AUTOLINK) {
2567
+ md->active_char[':'] = MD_CHAR_AUTOLINK_URL;
2568
+ md->active_char['@'] = MD_CHAR_AUTOLINK_EMAIL;
2569
+ md->active_char['w'] = MD_CHAR_AUTOLINK_WWW;
2570
+ }
2571
+
2572
+ if (extensions & MKDEXT_SUPERSCRIPT)
2573
+ md->active_char['^'] = MD_CHAR_SUPERSCRIPT;
2574
+
2575
+ /* Extension data */
2576
+ md->ext_flags = extensions;
2577
+ md->opaque = opaque;
2578
+ md->max_nesting = max_nesting;
2579
+ md->in_link_body = 0;
2580
+
2581
+ return md;
2582
+ }
2583
+
2584
+ void
2585
+ sd_markdown_render(struct buf *ob, const uint8_t *document, size_t doc_size, struct sd_markdown *md)
2586
+ {
2587
+ #define MARKDOWN_GROW(x) ((x) + ((x) >> 1))
2588
+ static const char UTF8_BOM[] = {0xEF, 0xBB, 0xBF};
2589
+
2590
+ struct buf *text;
2591
+ size_t beg, end;
2592
+ src_map *map;
2593
+
2594
+ /* source map */
2595
+ if (md->cb.block_did_parse)
2596
+ map = src_map_new();
2597
+ else
2598
+ map = NULL;
2599
+
2600
+ text = bufnew(64);
2601
+ if (!text)
2602
+ return;
2603
+
2604
+ /* Preallocate enough space for our buffer to avoid expanding while copying */
2605
+ bufgrow(text, doc_size);
2606
+
2607
+ /* reset the references table */
2608
+ memset(&md->refs, 0x0, REF_TABLE_SIZE * sizeof(void *));
2609
+
2610
+ /* first pass: looking for references, copying everything else */
2611
+ beg = 0;
2612
+
2613
+ /* Skip a possible UTF-8 BOM, even though the Unicode standard
2614
+ * discourages having these in UTF-8 documents */
2615
+ if (doc_size >= 3 && memcmp(document, UTF8_BOM, 3) == 0)
2616
+ beg += 3;
2617
+
2618
+ while (beg < doc_size) /* iterating over lines */
2619
+ if (is_ref(document, beg, doc_size, &end, md->refs))
2620
+ beg = end;
2621
+ else { /* skipping to the next line */
2622
+ end = beg;
2623
+ while (end < doc_size && document[end] != '\n' && document[end] != '\r')
2624
+ end++;
2625
+
2626
+ /* adding the line body if present */
2627
+ if (end > beg)
2628
+ expand_tabs(text, document + beg, end - beg);
2629
+
2630
+ while (end < doc_size && (document[end] == '\n' || document[end] == '\r')) {
2631
+ /* add one \n per newline */
2632
+ if (document[end] == '\n' || (end + 1 < doc_size && document[end + 1] != '\n'))
2633
+ bufputc(text, '\n');
2634
+ end++;
2635
+ }
2636
+
2637
+ beg = end;
2638
+ }
2639
+
2640
+ /* pre-grow the output buffer to minimize allocations */
2641
+ bufgrow(ob, MARKDOWN_GROW(text->size));
2642
+
2643
+ /* second pass: actual rendering */
2644
+ if (md->cb.doc_header)
2645
+ md->cb.doc_header(ob, md->opaque);
2646
+
2647
+ if (text->size) {
2648
+
2649
+ /* adding a final newline if not already present */
2650
+ if (text->data[text->size - 1] != '\n' && text->data[text->size - 1] != '\r')
2651
+ bufputc(text, '\n');
2652
+
2653
+ /* source map */
2654
+ if (map) {
2655
+ range rng = {0, text->size};
2656
+ src_map_append(map, &rng);
2657
+ }
2658
+
2659
+ parse_block(ob, md, text->data, text->size, map);
2660
+
2661
+ /* source map */
2662
+ src_map_release(map);
2663
+ }
2664
+
2665
+ if (md->cb.doc_footer)
2666
+ md->cb.doc_footer(ob, md->opaque);
2667
+
2668
+ /* clean-up */
2669
+ bufrelease(text);
2670
+ free_link_refs(md->refs);
2671
+
2672
+ assert(md->work_bufs[BUFFER_SPAN].size == 0);
2673
+ assert(md->work_bufs[BUFFER_BLOCK].size == 0);
2674
+ }
2675
+
2676
+ void
2677
+ sd_markdown_free(struct sd_markdown *md)
2678
+ {
2679
+ size_t i;
2680
+
2681
+ for (i = 0; i < (size_t)md->work_bufs[BUFFER_SPAN].asize; ++i)
2682
+ bufrelease(md->work_bufs[BUFFER_SPAN].item[i]);
2683
+
2684
+ for (i = 0; i < (size_t)md->work_bufs[BUFFER_BLOCK].asize; ++i)
2685
+ bufrelease(md->work_bufs[BUFFER_BLOCK].item[i]);
2686
+
2687
+ stack_free(&md->work_bufs[BUFFER_SPAN]);
2688
+ stack_free(&md->work_bufs[BUFFER_BLOCK]);
2689
+
2690
+ free(md);
2691
+ }
2692
+
2693
+ void
2694
+ sd_version(int *ver_major, int *ver_minor, int *ver_revision)
2695
+ {
2696
+ *ver_major = SUNDOWN_VER_MAJOR;
2697
+ *ver_minor = SUNDOWN_VER_MINOR;
2698
+ *ver_revision = SUNDOWN_VER_REVISION;
2699
+ }
2700
+
2701
+ /* vim: set filetype=c: */