@apitap/core 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (236) hide show
  1. package/LICENSE +60 -0
  2. package/README.md +362 -0
  3. package/SKILL.md +270 -0
  4. package/dist/auth/crypto.d.ts +31 -0
  5. package/dist/auth/crypto.js +66 -0
  6. package/dist/auth/crypto.js.map +1 -0
  7. package/dist/auth/handoff.d.ts +29 -0
  8. package/dist/auth/handoff.js +180 -0
  9. package/dist/auth/handoff.js.map +1 -0
  10. package/dist/auth/manager.d.ts +46 -0
  11. package/dist/auth/manager.js +127 -0
  12. package/dist/auth/manager.js.map +1 -0
  13. package/dist/auth/oauth-refresh.d.ts +16 -0
  14. package/dist/auth/oauth-refresh.js +91 -0
  15. package/dist/auth/oauth-refresh.js.map +1 -0
  16. package/dist/auth/refresh.d.ts +43 -0
  17. package/dist/auth/refresh.js +217 -0
  18. package/dist/auth/refresh.js.map +1 -0
  19. package/dist/capture/anti-bot.d.ts +15 -0
  20. package/dist/capture/anti-bot.js +43 -0
  21. package/dist/capture/anti-bot.js.map +1 -0
  22. package/dist/capture/blocklist.d.ts +6 -0
  23. package/dist/capture/blocklist.js +70 -0
  24. package/dist/capture/blocklist.js.map +1 -0
  25. package/dist/capture/body-diff.d.ts +8 -0
  26. package/dist/capture/body-diff.js +102 -0
  27. package/dist/capture/body-diff.js.map +1 -0
  28. package/dist/capture/body-variables.d.ts +13 -0
  29. package/dist/capture/body-variables.js +142 -0
  30. package/dist/capture/body-variables.js.map +1 -0
  31. package/dist/capture/domain.d.ts +8 -0
  32. package/dist/capture/domain.js +34 -0
  33. package/dist/capture/domain.js.map +1 -0
  34. package/dist/capture/entropy.d.ts +33 -0
  35. package/dist/capture/entropy.js +100 -0
  36. package/dist/capture/entropy.js.map +1 -0
  37. package/dist/capture/filter.d.ts +11 -0
  38. package/dist/capture/filter.js +49 -0
  39. package/dist/capture/filter.js.map +1 -0
  40. package/dist/capture/graphql.d.ts +21 -0
  41. package/dist/capture/graphql.js +99 -0
  42. package/dist/capture/graphql.js.map +1 -0
  43. package/dist/capture/idle.d.ts +23 -0
  44. package/dist/capture/idle.js +44 -0
  45. package/dist/capture/idle.js.map +1 -0
  46. package/dist/capture/monitor.d.ts +26 -0
  47. package/dist/capture/monitor.js +183 -0
  48. package/dist/capture/monitor.js.map +1 -0
  49. package/dist/capture/oauth-detector.d.ts +18 -0
  50. package/dist/capture/oauth-detector.js +96 -0
  51. package/dist/capture/oauth-detector.js.map +1 -0
  52. package/dist/capture/pagination.d.ts +9 -0
  53. package/dist/capture/pagination.js +40 -0
  54. package/dist/capture/pagination.js.map +1 -0
  55. package/dist/capture/parameterize.d.ts +17 -0
  56. package/dist/capture/parameterize.js +63 -0
  57. package/dist/capture/parameterize.js.map +1 -0
  58. package/dist/capture/scrubber.d.ts +5 -0
  59. package/dist/capture/scrubber.js +38 -0
  60. package/dist/capture/scrubber.js.map +1 -0
  61. package/dist/capture/session.d.ts +46 -0
  62. package/dist/capture/session.js +445 -0
  63. package/dist/capture/session.js.map +1 -0
  64. package/dist/capture/token-detector.d.ts +16 -0
  65. package/dist/capture/token-detector.js +62 -0
  66. package/dist/capture/token-detector.js.map +1 -0
  67. package/dist/capture/verifier.d.ts +17 -0
  68. package/dist/capture/verifier.js +147 -0
  69. package/dist/capture/verifier.js.map +1 -0
  70. package/dist/cli.d.ts +2 -0
  71. package/dist/cli.js +930 -0
  72. package/dist/cli.js.map +1 -0
  73. package/dist/discovery/auth.d.ts +17 -0
  74. package/dist/discovery/auth.js +81 -0
  75. package/dist/discovery/auth.js.map +1 -0
  76. package/dist/discovery/fetch.d.ts +17 -0
  77. package/dist/discovery/fetch.js +59 -0
  78. package/dist/discovery/fetch.js.map +1 -0
  79. package/dist/discovery/frameworks.d.ts +11 -0
  80. package/dist/discovery/frameworks.js +249 -0
  81. package/dist/discovery/frameworks.js.map +1 -0
  82. package/dist/discovery/index.d.ts +21 -0
  83. package/dist/discovery/index.js +219 -0
  84. package/dist/discovery/index.js.map +1 -0
  85. package/dist/discovery/openapi.d.ts +13 -0
  86. package/dist/discovery/openapi.js +175 -0
  87. package/dist/discovery/openapi.js.map +1 -0
  88. package/dist/discovery/probes.d.ts +9 -0
  89. package/dist/discovery/probes.js +70 -0
  90. package/dist/discovery/probes.js.map +1 -0
  91. package/dist/index.d.ts +25 -0
  92. package/dist/index.js +25 -0
  93. package/dist/index.js.map +1 -0
  94. package/dist/inspect/report.d.ts +52 -0
  95. package/dist/inspect/report.js +191 -0
  96. package/dist/inspect/report.js.map +1 -0
  97. package/dist/mcp.d.ts +8 -0
  98. package/dist/mcp.js +526 -0
  99. package/dist/mcp.js.map +1 -0
  100. package/dist/orchestration/browse.d.ts +38 -0
  101. package/dist/orchestration/browse.js +198 -0
  102. package/dist/orchestration/browse.js.map +1 -0
  103. package/dist/orchestration/cache.d.ts +15 -0
  104. package/dist/orchestration/cache.js +24 -0
  105. package/dist/orchestration/cache.js.map +1 -0
  106. package/dist/plugin.d.ts +17 -0
  107. package/dist/plugin.js +158 -0
  108. package/dist/plugin.js.map +1 -0
  109. package/dist/read/decoders/deepwiki.d.ts +2 -0
  110. package/dist/read/decoders/deepwiki.js +148 -0
  111. package/dist/read/decoders/deepwiki.js.map +1 -0
  112. package/dist/read/decoders/grokipedia.d.ts +2 -0
  113. package/dist/read/decoders/grokipedia.js +210 -0
  114. package/dist/read/decoders/grokipedia.js.map +1 -0
  115. package/dist/read/decoders/hackernews.d.ts +2 -0
  116. package/dist/read/decoders/hackernews.js +168 -0
  117. package/dist/read/decoders/hackernews.js.map +1 -0
  118. package/dist/read/decoders/index.d.ts +2 -0
  119. package/dist/read/decoders/index.js +12 -0
  120. package/dist/read/decoders/index.js.map +1 -0
  121. package/dist/read/decoders/reddit.d.ts +2 -0
  122. package/dist/read/decoders/reddit.js +142 -0
  123. package/dist/read/decoders/reddit.js.map +1 -0
  124. package/dist/read/decoders/twitter.d.ts +12 -0
  125. package/dist/read/decoders/twitter.js +187 -0
  126. package/dist/read/decoders/twitter.js.map +1 -0
  127. package/dist/read/decoders/wikipedia.d.ts +2 -0
  128. package/dist/read/decoders/wikipedia.js +66 -0
  129. package/dist/read/decoders/wikipedia.js.map +1 -0
  130. package/dist/read/decoders/youtube.d.ts +2 -0
  131. package/dist/read/decoders/youtube.js +69 -0
  132. package/dist/read/decoders/youtube.js.map +1 -0
  133. package/dist/read/extract.d.ts +25 -0
  134. package/dist/read/extract.js +320 -0
  135. package/dist/read/extract.js.map +1 -0
  136. package/dist/read/index.d.ts +14 -0
  137. package/dist/read/index.js +66 -0
  138. package/dist/read/index.js.map +1 -0
  139. package/dist/read/peek.d.ts +9 -0
  140. package/dist/read/peek.js +137 -0
  141. package/dist/read/peek.js.map +1 -0
  142. package/dist/read/types.d.ts +44 -0
  143. package/dist/read/types.js +3 -0
  144. package/dist/read/types.js.map +1 -0
  145. package/dist/replay/engine.d.ts +53 -0
  146. package/dist/replay/engine.js +441 -0
  147. package/dist/replay/engine.js.map +1 -0
  148. package/dist/replay/truncate.d.ts +16 -0
  149. package/dist/replay/truncate.js +92 -0
  150. package/dist/replay/truncate.js.map +1 -0
  151. package/dist/serve.d.ts +31 -0
  152. package/dist/serve.js +149 -0
  153. package/dist/serve.js.map +1 -0
  154. package/dist/skill/generator.d.ts +44 -0
  155. package/dist/skill/generator.js +419 -0
  156. package/dist/skill/generator.js.map +1 -0
  157. package/dist/skill/importer.d.ts +26 -0
  158. package/dist/skill/importer.js +80 -0
  159. package/dist/skill/importer.js.map +1 -0
  160. package/dist/skill/search.d.ts +19 -0
  161. package/dist/skill/search.js +51 -0
  162. package/dist/skill/search.js.map +1 -0
  163. package/dist/skill/signing.d.ts +16 -0
  164. package/dist/skill/signing.js +34 -0
  165. package/dist/skill/signing.js.map +1 -0
  166. package/dist/skill/ssrf.d.ts +27 -0
  167. package/dist/skill/ssrf.js +210 -0
  168. package/dist/skill/ssrf.js.map +1 -0
  169. package/dist/skill/store.d.ts +7 -0
  170. package/dist/skill/store.js +93 -0
  171. package/dist/skill/store.js.map +1 -0
  172. package/dist/stats/report.d.ts +26 -0
  173. package/dist/stats/report.js +157 -0
  174. package/dist/stats/report.js.map +1 -0
  175. package/dist/types.d.ts +214 -0
  176. package/dist/types.js +3 -0
  177. package/dist/types.js.map +1 -0
  178. package/package.json +58 -0
  179. package/src/auth/crypto.ts +92 -0
  180. package/src/auth/handoff.ts +229 -0
  181. package/src/auth/manager.ts +140 -0
  182. package/src/auth/oauth-refresh.ts +120 -0
  183. package/src/auth/refresh.ts +300 -0
  184. package/src/capture/anti-bot.ts +63 -0
  185. package/src/capture/blocklist.ts +75 -0
  186. package/src/capture/body-diff.ts +109 -0
  187. package/src/capture/body-variables.ts +156 -0
  188. package/src/capture/domain.ts +34 -0
  189. package/src/capture/entropy.ts +121 -0
  190. package/src/capture/filter.ts +56 -0
  191. package/src/capture/graphql.ts +124 -0
  192. package/src/capture/idle.ts +45 -0
  193. package/src/capture/monitor.ts +224 -0
  194. package/src/capture/oauth-detector.ts +106 -0
  195. package/src/capture/pagination.ts +49 -0
  196. package/src/capture/parameterize.ts +68 -0
  197. package/src/capture/scrubber.ts +49 -0
  198. package/src/capture/session.ts +502 -0
  199. package/src/capture/token-detector.ts +76 -0
  200. package/src/capture/verifier.ts +171 -0
  201. package/src/cli.ts +1031 -0
  202. package/src/discovery/auth.ts +99 -0
  203. package/src/discovery/fetch.ts +85 -0
  204. package/src/discovery/frameworks.ts +231 -0
  205. package/src/discovery/index.ts +256 -0
  206. package/src/discovery/openapi.ts +230 -0
  207. package/src/discovery/probes.ts +76 -0
  208. package/src/index.ts +26 -0
  209. package/src/inspect/report.ts +247 -0
  210. package/src/mcp.ts +618 -0
  211. package/src/orchestration/browse.ts +250 -0
  212. package/src/orchestration/cache.ts +37 -0
  213. package/src/plugin.ts +188 -0
  214. package/src/read/decoders/deepwiki.ts +180 -0
  215. package/src/read/decoders/grokipedia.ts +246 -0
  216. package/src/read/decoders/hackernews.ts +198 -0
  217. package/src/read/decoders/index.ts +15 -0
  218. package/src/read/decoders/reddit.ts +158 -0
  219. package/src/read/decoders/twitter.ts +211 -0
  220. package/src/read/decoders/wikipedia.ts +75 -0
  221. package/src/read/decoders/youtube.ts +75 -0
  222. package/src/read/extract.ts +396 -0
  223. package/src/read/index.ts +78 -0
  224. package/src/read/peek.ts +175 -0
  225. package/src/read/types.ts +37 -0
  226. package/src/replay/engine.ts +559 -0
  227. package/src/replay/truncate.ts +116 -0
  228. package/src/serve.ts +189 -0
  229. package/src/skill/generator.ts +473 -0
  230. package/src/skill/importer.ts +107 -0
  231. package/src/skill/search.ts +76 -0
  232. package/src/skill/signing.ts +36 -0
  233. package/src/skill/ssrf.ts +238 -0
  234. package/src/skill/store.ts +107 -0
  235. package/src/stats/report.ts +208 -0
  236. package/src/types.ts +233 -0
@@ -0,0 +1,187 @@
1
+ import { safeFetch } from '../../discovery/fetch.js';
2
+ const DEFAULT_API_BASE = 'https://api.fxtwitter.com';
3
+ function estimateTokens(text) {
4
+ return Math.ceil(text.length / 4);
5
+ }
6
+ /**
7
+ * Twitter/X decoder — uses fxtwitter.com public API as side channel.
8
+ *
9
+ * Handles:
10
+ * - Individual tweets/posts (with text, media, quotes, articles)
11
+ * - Profile URLs (basic profile info)
12
+ *
13
+ * fxtwitter API returns full tweet JSON including embedded articles,
14
+ * media URLs, quote tweets, and engagement metrics — all without auth.
15
+ */
16
+ export const twitterDecoder = {
17
+ name: 'twitter',
18
+ patterns: [
19
+ /(?:twitter\.com|x\.com)\/\w+\/status\/\d+/,
20
+ /(?:twitter\.com|x\.com)\/(\w+)\/?$/,
21
+ ],
22
+ async decode(url, options = {}) {
23
+ try {
24
+ const apiBase = options._apiBaseUrl || DEFAULT_API_BASE;
25
+ // Tweet/status URL
26
+ const statusMatch = url.match(/(?:twitter\.com|x\.com)\/(\w+)\/status\/(\d+)/);
27
+ if (statusMatch) {
28
+ return decodeTweet(apiBase, statusMatch[1], statusMatch[2], url, options);
29
+ }
30
+ // Profile URL
31
+ const profileMatch = url.match(/(?:twitter\.com|x\.com)\/(\w+)\/?$/);
32
+ if (profileMatch && !isReservedPath(profileMatch[1])) {
33
+ return decodeProfile(apiBase, profileMatch[1], url, options);
34
+ }
35
+ return null;
36
+ }
37
+ catch {
38
+ return null;
39
+ }
40
+ },
41
+ };
42
+ function isReservedPath(path) {
43
+ const reserved = new Set([
44
+ 'home', 'explore', 'search', 'notifications', 'messages',
45
+ 'settings', 'i', 'compose', 'hashtag', 'login', 'signup',
46
+ ]);
47
+ return reserved.has(path.toLowerCase());
48
+ }
49
+ async function decodeTweet(apiBase, username, tweetId, url, options) {
50
+ const apiUrl = `${apiBase}/${username}/status/${tweetId}`;
51
+ const result = await safeFetch(apiUrl, { skipSsrf: options.skipSsrf });
52
+ if (!result || result.status !== 200)
53
+ return null;
54
+ let data;
55
+ try {
56
+ data = JSON.parse(result.body);
57
+ }
58
+ catch {
59
+ return null;
60
+ }
61
+ const tweet = data?.tweet;
62
+ if (!tweet)
63
+ return null;
64
+ const author = tweet.author;
65
+ const authorName = author ? `${author.name} (@${author.screen_name})` : username;
66
+ // Build content
67
+ const parts = [];
68
+ // Author info
69
+ if (author) {
70
+ parts.push(`**${author.name}** (@${author.screen_name})`);
71
+ if (author.description)
72
+ parts.push(author.description);
73
+ if (author.followers)
74
+ parts.push(`Followers: ${Number(author.followers).toLocaleString()}`);
75
+ }
76
+ // Tweet text
77
+ const tweetText = tweet.text || tweet.raw_text?.text || '';
78
+ if (tweetText)
79
+ parts.push(`\n${tweetText}`);
80
+ // Engagement
81
+ const engagement = [];
82
+ if (tweet.likes)
83
+ engagement.push(`${Number(tweet.likes).toLocaleString()} likes`);
84
+ if (tweet.retweets)
85
+ engagement.push(`${Number(tweet.retweets).toLocaleString()} RTs`);
86
+ if (tweet.views)
87
+ engagement.push(`${Number(tweet.views).toLocaleString()} views`);
88
+ if (tweet.bookmarks)
89
+ engagement.push(`${Number(tweet.bookmarks).toLocaleString()} bookmarks`);
90
+ if (engagement.length > 0)
91
+ parts.push(engagement.join(' · '));
92
+ // Embedded article (X Articles / long-form posts)
93
+ if (tweet.article) {
94
+ const article = tweet.article;
95
+ parts.push(`\n## ${article.title || 'Article'}`);
96
+ if (article.content?.blocks) {
97
+ const articleText = extractArticleBlocks(article.content.blocks);
98
+ parts.push(articleText);
99
+ }
100
+ else if (article.preview_text) {
101
+ parts.push(article.preview_text);
102
+ }
103
+ }
104
+ // Quote tweet
105
+ if (tweet.quote) {
106
+ const q = tweet.quote;
107
+ const qAuthor = q.author ? `${q.author.name} (@${q.author.screen_name})` : 'Unknown';
108
+ const qText = q.text || '';
109
+ parts.push(`\n> Quoting ${qAuthor}:\n> ${qText}`);
110
+ }
111
+ const content = parts.join('\n');
112
+ // Links
113
+ const links = [];
114
+ if (author?.website?.url) {
115
+ links.push({ text: author.website.display_url || 'Website', href: author.website.url });
116
+ }
117
+ // Images
118
+ const images = [];
119
+ if (tweet.media?.photos) {
120
+ for (const photo of tweet.media.photos.slice(0, 4)) {
121
+ images.push({ alt: 'Tweet image', src: photo.url });
122
+ }
123
+ }
124
+ if (tweet.article?.cover_media?.media_info?.original_img_url) {
125
+ images.push({
126
+ alt: tweet.article.title || 'Article cover',
127
+ src: tweet.article.cover_media.media_info.original_img_url,
128
+ });
129
+ }
130
+ return {
131
+ url,
132
+ title: tweet.article?.title || (tweetText ? `${authorName}: ${tweetText.slice(0, 80)}${tweetText.length > 80 ? '…' : ''}` : `Tweet by ${authorName}`),
133
+ author: author?.name || username,
134
+ description: tweetText?.slice(0, 200) || null,
135
+ content,
136
+ links,
137
+ images,
138
+ metadata: {
139
+ type: tweet.article ? 'article' : 'social',
140
+ publishedAt: tweet.created_at || null,
141
+ source: 'twitter-fxtwitter',
142
+ canonical: url,
143
+ siteName: 'X (Twitter)',
144
+ },
145
+ cost: { tokens: estimateTokens(content) },
146
+ };
147
+ }
148
+ function extractArticleBlocks(blocks) {
149
+ const parts = [];
150
+ for (const block of blocks) {
151
+ const text = block.text || '';
152
+ if (!text)
153
+ continue;
154
+ switch (block.type) {
155
+ case 'header-one':
156
+ parts.push(`\n# ${text}`);
157
+ break;
158
+ case 'header-two':
159
+ parts.push(`\n## ${text}`);
160
+ break;
161
+ case 'header-three':
162
+ parts.push(`\n### ${text}`);
163
+ break;
164
+ case 'unordered-list-item':
165
+ parts.push(`• ${text}`);
166
+ break;
167
+ case 'ordered-list-item':
168
+ parts.push(`1. ${text}`);
169
+ break;
170
+ case 'blockquote':
171
+ parts.push(`> ${text}`);
172
+ break;
173
+ default:
174
+ parts.push(text);
175
+ break;
176
+ }
177
+ }
178
+ return parts.join('\n');
179
+ }
180
+ async function decodeProfile(apiBase, username, url, options) {
181
+ // fxtwitter doesn't have a dedicated profile endpoint,
182
+ // but we can get profile data from any tweet by the user.
183
+ // For now, return null and let generic decoder handle profiles.
184
+ // Profile data is included in tweet responses anyway.
185
+ return null;
186
+ }
187
+ //# sourceMappingURL=twitter.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"twitter.js","sourceRoot":"","sources":["../../../src/read/decoders/twitter.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,SAAS,EAAE,MAAM,0BAA0B,CAAC;AAErD,MAAM,gBAAgB,GAAG,2BAA2B,CAAC;AAErD,SAAS,cAAc,CAAC,IAAY;IAClC,OAAO,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AACpC,CAAC;AAED;;;;;;;;;GASG;AACH,MAAM,CAAC,MAAM,cAAc,GAAY;IACrC,IAAI,EAAE,SAAS;IACf,QAAQ,EAAE;QACR,2CAA2C;QAC3C,oCAAoC;KACrC;IAED,KAAK,CAAC,MAAM,CAAC,GAAW,EAAE,UAAsD,EAAE;QAChF,IAAI,CAAC;YACH,MAAM,OAAO,GAAG,OAAO,CAAC,WAAW,IAAI,gBAAgB,CAAC;YAExD,mBAAmB;YACnB,MAAM,WAAW,GAAG,GAAG,CAAC,KAAK,CAAC,+CAA+C,CAAC,CAAC;YAC/E,IAAI,WAAW,EAAE,CAAC;gBAChB,OAAO,WAAW,CAAC,OAAO,EAAE,WAAW,CAAC,CAAC,CAAC,EAAE,WAAW,CAAC,CAAC,CAAC,EAAE,GAAG,EAAE,OAAO,CAAC,CAAC;YAC5E,CAAC;YAED,cAAc;YACd,MAAM,YAAY,GAAG,GAAG,CAAC,KAAK,CAAC,oCAAoC,CAAC,CAAC;YACrE,IAAI,YAAY,IAAI,CAAC,cAAc,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC;gBACrD,OAAO,aAAa,CAAC,OAAO,EAAE,YAAY,CAAC,CAAC,CAAC,EAAE,GAAG,EAAE,OAAO,CAAC,CAAC;YAC/D,CAAC;YAED,OAAO,IAAI,CAAC;QACd,CAAC;QAAC,MAAM,CAAC;YACP,OAAO,IAAI,CAAC;QACd,CAAC;IACH,CAAC;CACF,CAAC;AAEF,SAAS,cAAc,CAAC,IAAY;IAClC,MAAM,QAAQ,GAAG,IAAI,GAAG,CAAC;QACvB,MAAM,EAAE,SAAS,EAAE,QAAQ,EAAE,eAAe,EAAE,UAAU;QACxD,UAAU,EAAE,GAAG,EAAE,SAAS,EAAE,SAAS,EAAE,OAAO,EAAE,QAAQ;KACzD,CAAC,CAAC;IACH,OAAO,QAAQ,CAAC,GAAG,CAAC,IAAI,CAAC,WAAW,EAAE,CAAC,CAAC;AAC1C,CAAC;AAED,KAAK,UAAU,WAAW,CACxB,OAAe,EACf,QAAgB,EAChB,OAAe,EACf,GAAW,EACX,OAAmD;IAEnD,MAAM,MAAM,GAAG,GAAG,OAAO,IAAI,QAAQ,WAAW,OAAO,EAAE,CAAC;IAC1D,MAAM,MAAM,GAAG,MAAM,SAAS,CAAC,MAAM,EAAE,EAAE,QAAQ,EAAE,OAAO,CAAC,QAAQ,EAAE,CAAC,CAAC;IACvE,IAAI,CAAC,MAAM,IAAI,MAAM,CAAC,MAAM,KAAK,GAAG;QAAE,OAAO,IAAI,CAAC;IAElD,IAAI,IAAS,CAAC;IACd,IAAI,CAAC;QACH,IAAI,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;IACjC,CAAC;IAAC,MAAM,CAAC;QACP,OAAO,IAAI,CAAC;IACd,CAAC;IAED,MAAM,KAAK,GAAG,IAAI,EAAE,KAAK,CAAC;IAC1B,IAAI,CAAC,KAAK;QAAE,OAAO,IAAI,CAAC;IAExB,MAAM,MAAM,GAAG,KAAK,CAAC,MAAM,CAAC;IAC5B,MAAM,UAAU,GAAG,MAAM,CAAC,CAAC,CAAC,GAAG,MAAM,CAAC,IAAI,MAAM,MAAM,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,QAAQ,CAAC;IAEjF,gBAAgB;IAChB,MAAM,KAAK,GAAa,EAAE,CAAC;IAE3B,cAAc;IACd,IAAI,MAAM,EAAE,CAAC;QACX,KAAK,CAAC,IAAI,CAAC,KAAK,MAAM,CAAC,IAAI,QAAQ,MAAM,CAAC,WAAW,GAAG,CAAC,CAAC;QAC1D,IAAI,MAAM,CAAC,WAAW;YAAE,KAAK,CAAC,IAAI,CAAC,MAAM,CAAC,WAAW,CAAC,CAAC;QACvD,IAAI,MAAM,CAAC,SAAS;YAAE,KAAK,CAAC,IAAI,CAAC,cAAc,MAAM,CAAC,MAAM,CAAC,SAAS,CAAC,CAAC,cAAc,EAAE,EAAE,CAAC,CAAC;IAC9F,CAAC;IAED,aAAa;IACb,MAAM,SAAS,GAAG,KAAK,CAAC,IAAI,IAAI,KAAK,CAAC,QAAQ,EAAE,IAAI,IAAI,EAAE,CAAC;IAC3D,IAAI,SAAS;QAAE,KAAK,CAAC,IAAI,CAAC,KAAK,SAAS,EAAE,CAAC,CAAC;IAE5C,aAAa;IACb,MAAM,UAAU,GAAa,EAAE,CAAC;IAChC,IAAI,KAAK,CAAC,KAAK;QAAE,UAAU,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,cAAc,EAAE,QAAQ,CAAC,CAAC;IAClF,IAAI,KAAK,CAAC,QAAQ;QAAE,UAAU,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,cAAc,EAAE,MAAM,CAAC,CAAC;IACtF,IAAI,KAAK,CAAC,KAAK;QAAE,UAAU,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,cAAc,EAAE,QAAQ,CAAC,CAAC;IAClF,IAAI,KAAK,CAAC,SAAS;QAAE,UAAU,CAAC,IAAI,CAAC,GAAG,MAAM,CAAC,KAAK,CAAC,SAAS,CAAC,CAAC,cAAc,EAAE,YAAY,CAAC,CAAC;IAC9F,IAAI,UAAU,CAAC,MAAM,GAAG,CAAC;QAAE,KAAK,CAAC,IAAI,CAAC,UAAU,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC,CAAC;IAE9D,kDAAkD;IAClD,IAAI,KAAK,CAAC,OAAO,EAAE,CAAC;QAClB,MAAM,OAAO,GAAG,KAAK,CAAC,OAAO,CAAC;QAC9B,KAAK,CAAC,IAAI,CAAC,QAAQ,OAAO,CAAC,KAAK,IAAI,SAAS,EAAE,CAAC,CAAC;QAEjD,IAAI,OAAO,CAAC,OAAO,EAAE,MAAM,EAAE,CAAC;YAC5B,MAAM,WAAW,GAAG,oBAAoB,CAAC,OAAO,CAAC,OAAO,CAAC,MAAM,CAAC,CAAC;YACjE,KAAK,CAAC,IAAI,CAAC,WAAW,CAAC,CAAC;QAC1B,CAAC;aAAM,IAAI,OAAO,CAAC,YAAY,EAAE,CAAC;YAChC,KAAK,CAAC,IAAI,CAAC,OAAO,CAAC,YAAY,CAAC,CAAC;QACnC,CAAC;IACH,CAAC;IAED,cAAc;IACd,IAAI,KAAK,CAAC,KAAK,EAAE,CAAC;QAChB,MAAM,CAAC,GAAG,KAAK,CAAC,KAAK,CAAC;QACtB,MAAM,OAAO,GAAG,CAAC,CAAC,MAAM,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,MAAM,CAAC,IAAI,MAAM,CAAC,CAAC,MAAM,CAAC,WAAW,GAAG,CAAC,CAAC,CAAC,SAAS,CAAC;QACrF,MAAM,KAAK,GAAG,CAAC,CAAC,IAAI,IAAI,EAAE,CAAC;QAC3B,KAAK,CAAC,IAAI,CAAC,eAAe,OAAO,QAAQ,KAAK,EAAE,CAAC,CAAC;IACpD,CAAC;IAED,MAAM,OAAO,GAAG,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;IAEjC,QAAQ;IACR,MAAM,KAAK,GAA0C,EAAE,CAAC;IACxD,IAAI,MAAM,EAAE,OAAO,EAAE,GAAG,EAAE,CAAC;QACzB,KAAK,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,MAAM,CAAC,OAAO,CAAC,WAAW,IAAI,SAAS,EAAE,IAAI,EAAE,MAAM,CAAC,OAAO,CAAC,GAAG,EAAE,CAAC,CAAC;IAC1F,CAAC;IAED,SAAS;IACT,MAAM,MAAM,GAAwC,EAAE,CAAC;IACvD,IAAI,KAAK,CAAC,KAAK,EAAE,MAAM,EAAE,CAAC;QACxB,KAAK,MAAM,KAAK,IAAI,KAAK,CAAC,KAAK,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,EAAE,CAAC;YACnD,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,aAAa,EAAE,GAAG,EAAE,KAAK,CAAC,GAAG,EAAE,CAAC,CAAC;QACtD,CAAC;IACH,CAAC;IACD,IAAI,KAAK,CAAC,OAAO,EAAE,WAAW,EAAE,UAAU,EAAE,gBAAgB,EAAE,CAAC;QAC7D,MAAM,CAAC,IAAI,CAAC;YACV,GAAG,EAAE,KAAK,CAAC,OAAO,CAAC,KAAK,IAAI,eAAe;YAC3C,GAAG,EAAE,KAAK,CAAC,OAAO,CAAC,WAAW,CAAC,UAAU,CAAC,gBAAgB;SAC3D,CAAC,CAAC;IACL,CAAC;IAED,OAAO;QACL,GAAG;QACH,KAAK,EAAE,KAAK,CAAC,OAAO,EAAE,KAAK,IAAI,CAAC,SAAS,CAAC,CAAC,CAAC,GAAG,UAAU,KAAK,SAAS,CAAC,KAAK,CAAC,CAAC,EAAE,EAAE,CAAC,GAAG,SAAS,CAAC,MAAM,GAAG,EAAE,CAAC,CAAC,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,EAAE,CAAC,CAAC,CAAC,YAAY,UAAU,EAAE,CAAC;QACrJ,MAAM,EAAE,MAAM,EAAE,IAAI,IAAI,QAAQ;QAChC,WAAW,EAAE,SAAS,EAAE,KAAK,CAAC,CAAC,EAAE,GAAG,CAAC,IAAI,IAAI;QAC7C,OAAO;QACP,KAAK;QACL,MAAM;QACN,QAAQ,EAAE;YACR,IAAI,EAAE,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,SAAS,CAAC,CAAC,CAAC,QAAQ;YAC1C,WAAW,EAAE,KAAK,CAAC,UAAU,IAAI,IAAI;YACrC,MAAM,EAAE,mBAAmB;YAC3B,SAAS,EAAE,GAAG;YACd,QAAQ,EAAE,aAAa;SACxB;QACD,IAAI,EAAE,EAAE,MAAM,EAAE,cAAc,CAAC,OAAO,CAAC,EAAE;KAC1C,CAAC;AACJ,CAAC;AAED,SAAS,oBAAoB,CAAC,MAAa;IACzC,MAAM,KAAK,GAAa,EAAE,CAAC;IAC3B,KAAK,MAAM,KAAK,IAAI,MAAM,EAAE,CAAC;QAC3B,MAAM,IAAI,GAAG,KAAK,CAAC,IAAI,IAAI,EAAE,CAAC;QAC9B,IAAI,CAAC,IAAI;YAAE,SAAS;QAEpB,QAAQ,KAAK,CAAC,IAAI,EAAE,CAAC;YACnB,KAAK,YAAY;gBACf,KAAK,CAAC,IAAI,CAAC,OAAO,IAAI,EAAE,CAAC,CAAC;gBAC1B,MAAM;YACR,KAAK,YAAY;gBACf,KAAK,CAAC,IAAI,CAAC,QAAQ,IAAI,EAAE,CAAC,CAAC;gBAC3B,MAAM;YACR,KAAK,cAAc;gBACjB,KAAK,CAAC,IAAI,CAAC,SAAS,IAAI,EAAE,CAAC,CAAC;gBAC5B,MAAM;YACR,KAAK,qBAAqB;gBACxB,KAAK,CAAC,IAAI,CAAC,KAAK,IAAI,EAAE,CAAC,CAAC;gBACxB,MAAM;YACR,KAAK,mBAAmB;gBACtB,KAAK,CAAC,IAAI,CAAC,MAAM,IAAI,EAAE,CAAC,CAAC;gBACzB,MAAM;YACR,KAAK,YAAY;gBACf,KAAK,CAAC,IAAI,CAAC,KAAK,IAAI,EAAE,CAAC,CAAC;gBACxB,MAAM;YACR;gBACE,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;gBACjB,MAAM;QACV,CAAC;IACH,CAAC;IACD,OAAO,KAAK,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;AAC1B,CAAC;AAED,KAAK,UAAU,aAAa,CAC1B,OAAe,EACf,QAAgB,EAChB,GAAW,EACX,OAAmD;IAEnD,uDAAuD;IACvD,0DAA0D;IAC1D,gEAAgE;IAChE,sDAAsD;IACtD,OAAO,IAAI,CAAC;AACd,CAAC"}
@@ -0,0 +1,2 @@
1
+ import type { Decoder } from '../types.js';
2
+ export declare const wikipediaDecoder: Decoder;
@@ -0,0 +1,66 @@
1
+ import { safeFetch } from '../../discovery/fetch.js';
2
+ function estimateTokens(text) {
3
+ return Math.ceil(text.length / 4);
4
+ }
5
+ export const wikipediaDecoder = {
6
+ name: 'wikipedia',
7
+ patterns: [
8
+ /([a-z]{2,3})\.wikipedia\.org\/wiki\/([^#?]+)/,
9
+ ],
10
+ async decode(url, options = {}) {
11
+ try {
12
+ const match = url.match(/([a-z]{2,3})\.wikipedia\.org\/wiki\/([^#?]+)/);
13
+ if (!match)
14
+ return null;
15
+ const lang = match[1];
16
+ const title = match[2];
17
+ const apiBase = options._apiBaseUrl || `https://${lang}.wikipedia.org`;
18
+ const apiUrl = `${apiBase}/api/rest_v1/page/summary/${title}`;
19
+ const result = await safeFetch(apiUrl, { skipSsrf: options.skipSsrf });
20
+ if (!result || result.status !== 200)
21
+ return null;
22
+ let data;
23
+ try {
24
+ data = JSON.parse(result.body);
25
+ }
26
+ catch {
27
+ return null;
28
+ }
29
+ if (!data)
30
+ return null;
31
+ const articleTitle = data.title || data.displaytitle || decodeURIComponent(title);
32
+ const extract = data.extract || '';
33
+ const description = data.description || null;
34
+ const content = extract;
35
+ const links = [];
36
+ if (data.content_urls?.desktop?.page) {
37
+ links.push({ text: 'Full article', href: data.content_urls.desktop.page });
38
+ }
39
+ const images = [];
40
+ if (data.thumbnail?.source) {
41
+ images.push({ alt: articleTitle, src: data.thumbnail.source });
42
+ }
43
+ return {
44
+ url,
45
+ title: articleTitle,
46
+ author: null,
47
+ description,
48
+ content,
49
+ links,
50
+ images,
51
+ metadata: {
52
+ type: 'article',
53
+ publishedAt: data.timestamp || null,
54
+ source: 'wikipedia-rest',
55
+ canonical: data.content_urls?.desktop?.page || null,
56
+ siteName: 'Wikipedia',
57
+ },
58
+ cost: { tokens: estimateTokens(content) },
59
+ };
60
+ }
61
+ catch {
62
+ return null;
63
+ }
64
+ },
65
+ };
66
+ //# sourceMappingURL=wikipedia.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"wikipedia.js","sourceRoot":"","sources":["../../../src/read/decoders/wikipedia.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,SAAS,EAAE,MAAM,0BAA0B,CAAC;AAErD,SAAS,cAAc,CAAC,IAAY;IAClC,OAAO,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AACpC,CAAC;AAED,MAAM,CAAC,MAAM,gBAAgB,GAAY;IACvC,IAAI,EAAE,WAAW;IACjB,QAAQ,EAAE;QACR,8CAA8C;KAC/C;IAED,KAAK,CAAC,MAAM,CAAC,GAAW,EAAE,UAAsD,EAAE;QAChF,IAAI,CAAC;YACH,MAAM,KAAK,GAAG,GAAG,CAAC,KAAK,CAAC,8CAA8C,CAAC,CAAC;YACxE,IAAI,CAAC,KAAK;gBAAE,OAAO,IAAI,CAAC;YAExB,MAAM,IAAI,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;YACtB,MAAM,KAAK,GAAG,KAAK,CAAC,CAAC,CAAC,CAAC;YAEvB,MAAM,OAAO,GAAG,OAAO,CAAC,WAAW,IAAI,WAAW,IAAI,gBAAgB,CAAC;YACvE,MAAM,MAAM,GAAG,GAAG,OAAO,6BAA6B,KAAK,EAAE,CAAC;YAE9D,MAAM,MAAM,GAAG,MAAM,SAAS,CAAC,MAAM,EAAE,EAAE,QAAQ,EAAE,OAAO,CAAC,QAAQ,EAAE,CAAC,CAAC;YACvE,IAAI,CAAC,MAAM,IAAI,MAAM,CAAC,MAAM,KAAK,GAAG;gBAAE,OAAO,IAAI,CAAC;YAElD,IAAI,IAAS,CAAC;YACd,IAAI,CAAC;gBACH,IAAI,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;YACjC,CAAC;YAAC,MAAM,CAAC;gBACP,OAAO,IAAI,CAAC;YACd,CAAC;YAED,IAAI,CAAC,IAAI;gBAAE,OAAO,IAAI,CAAC;YAEvB,MAAM,YAAY,GAAG,IAAI,CAAC,KAAK,IAAI,IAAI,CAAC,YAAY,IAAI,kBAAkB,CAAC,KAAK,CAAC,CAAC;YAClF,MAAM,OAAO,GAAG,IAAI,CAAC,OAAO,IAAI,EAAE,CAAC;YACnC,MAAM,WAAW,GAAG,IAAI,CAAC,WAAW,IAAI,IAAI,CAAC;YAE7C,MAAM,OAAO,GAAG,OAAO,CAAC;YAExB,MAAM,KAAK,GAA0C,EAAE,CAAC;YACxD,IAAI,IAAI,CAAC,YAAY,EAAE,OAAO,EAAE,IAAI,EAAE,CAAC;gBACrC,KAAK,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,cAAc,EAAE,IAAI,EAAE,IAAI,CAAC,YAAY,CAAC,OAAO,CAAC,IAAI,EAAE,CAAC,CAAC;YAC7E,CAAC;YAED,MAAM,MAAM,GAAwC,EAAE,CAAC;YACvD,IAAI,IAAI,CAAC,SAAS,EAAE,MAAM,EAAE,CAAC;gBAC3B,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,YAAY,EAAE,GAAG,EAAE,IAAI,CAAC,SAAS,CAAC,MAAM,EAAE,CAAC,CAAC;YACjE,CAAC;YAED,OAAO;gBACL,GAAG;gBACH,KAAK,EAAE,YAAY;gBACnB,MAAM,EAAE,IAAI;gBACZ,WAAW;gBACX,OAAO;gBACP,KAAK;gBACL,MAAM;gBACN,QAAQ,EAAE;oBACR,IAAI,EAAE,SAAS;oBACf,WAAW,EAAE,IAAI,CAAC,SAAS,IAAI,IAAI;oBACnC,MAAM,EAAE,gBAAgB;oBACxB,SAAS,EAAE,IAAI,CAAC,YAAY,EAAE,OAAO,EAAE,IAAI,IAAI,IAAI;oBACnD,QAAQ,EAAE,WAAW;iBACtB;gBACD,IAAI,EAAE,EAAE,MAAM,EAAE,cAAc,CAAC,OAAO,CAAC,EAAE;aAC1C,CAAC;QACJ,CAAC;QAAC,MAAM,CAAC;YACP,OAAO,IAAI,CAAC;QACd,CAAC;IACH,CAAC;CACF,CAAC"}
@@ -0,0 +1,2 @@
1
+ import type { Decoder } from '../types.js';
2
+ export declare const youtubeDecoder: Decoder;
@@ -0,0 +1,69 @@
1
+ import { safeFetch } from '../../discovery/fetch.js';
2
+ const DEFAULT_OEMBED_BASE = 'https://noembed.com';
3
+ function estimateTokens(text) {
4
+ return Math.ceil(text.length / 4);
5
+ }
6
+ export const youtubeDecoder = {
7
+ name: 'youtube',
8
+ patterns: [
9
+ /youtube\.com\/watch\?v=/,
10
+ /youtu\.be\//,
11
+ ],
12
+ async decode(url, options = {}) {
13
+ try {
14
+ const base = options._oembedBaseUrl || DEFAULT_OEMBED_BASE;
15
+ const oembedUrl = `${base}/embed?url=${encodeURIComponent(url)}`;
16
+ const result = await safeFetch(oembedUrl, { skipSsrf: options.skipSsrf });
17
+ if (!result || result.status !== 200)
18
+ return null;
19
+ let data;
20
+ try {
21
+ data = JSON.parse(result.body);
22
+ }
23
+ catch {
24
+ return null;
25
+ }
26
+ if (!data || !data.title)
27
+ return null;
28
+ const title = data.title || null;
29
+ const author = data.author_name || null;
30
+ const contentParts = [];
31
+ if (title)
32
+ contentParts.push(`Title: ${title}`);
33
+ if (author)
34
+ contentParts.push(`Author: ${author}`);
35
+ if (data.author_url)
36
+ contentParts.push(`Channel: ${data.author_url}`);
37
+ const content = contentParts.join('\n');
38
+ const links = [];
39
+ if (data.author_url) {
40
+ links.push({ text: author || 'Channel', href: data.author_url });
41
+ }
42
+ const images = [];
43
+ if (data.thumbnail_url) {
44
+ images.push({ alt: title || 'Thumbnail', src: data.thumbnail_url });
45
+ }
46
+ return {
47
+ url,
48
+ title,
49
+ author,
50
+ description: author ? `Video by ${author}` : 'YouTube video',
51
+ content,
52
+ links,
53
+ images,
54
+ metadata: {
55
+ type: 'video',
56
+ publishedAt: null,
57
+ source: 'youtube-oembed',
58
+ canonical: url,
59
+ siteName: 'YouTube',
60
+ },
61
+ cost: { tokens: estimateTokens(content) },
62
+ };
63
+ }
64
+ catch {
65
+ return null;
66
+ }
67
+ },
68
+ };
69
+ //# sourceMappingURL=youtube.js.map
@@ -0,0 +1 @@
1
+ {"version":3,"file":"youtube.js","sourceRoot":"","sources":["../../../src/read/decoders/youtube.ts"],"names":[],"mappings":"AAEA,OAAO,EAAE,SAAS,EAAE,MAAM,0BAA0B,CAAC;AAErD,MAAM,mBAAmB,GAAG,qBAAqB,CAAC;AAElD,SAAS,cAAc,CAAC,IAAY;IAClC,OAAO,IAAI,CAAC,IAAI,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AACpC,CAAC;AAED,MAAM,CAAC,MAAM,cAAc,GAAY;IACrC,IAAI,EAAE,SAAS;IACf,QAAQ,EAAE;QACR,yBAAyB;QACzB,aAAa;KACd;IAED,KAAK,CAAC,MAAM,CAAC,GAAW,EAAE,UAAsD,EAAE;QAChF,IAAI,CAAC;YACH,MAAM,IAAI,GAAG,OAAO,CAAC,cAAc,IAAI,mBAAmB,CAAC;YAC3D,MAAM,SAAS,GAAG,GAAG,IAAI,cAAc,kBAAkB,CAAC,GAAG,CAAC,EAAE,CAAC;YAEjE,MAAM,MAAM,GAAG,MAAM,SAAS,CAAC,SAAS,EAAE,EAAE,QAAQ,EAAE,OAAO,CAAC,QAAQ,EAAE,CAAC,CAAC;YAC1E,IAAI,CAAC,MAAM,IAAI,MAAM,CAAC,MAAM,KAAK,GAAG;gBAAE,OAAO,IAAI,CAAC;YAElD,IAAI,IAAS,CAAC;YACd,IAAI,CAAC;gBACH,IAAI,GAAG,IAAI,CAAC,KAAK,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;YACjC,CAAC;YAAC,MAAM,CAAC;gBACP,OAAO,IAAI,CAAC;YACd,CAAC;YAED,IAAI,CAAC,IAAI,IAAI,CAAC,IAAI,CAAC,KAAK;gBAAE,OAAO,IAAI,CAAC;YAEtC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,IAAI,IAAI,CAAC;YACjC,MAAM,MAAM,GAAG,IAAI,CAAC,WAAW,IAAI,IAAI,CAAC;YAExC,MAAM,YAAY,GAAa,EAAE,CAAC;YAClC,IAAI,KAAK;gBAAE,YAAY,CAAC,IAAI,CAAC,UAAU,KAAK,EAAE,CAAC,CAAC;YAChD,IAAI,MAAM;gBAAE,YAAY,CAAC,IAAI,CAAC,WAAW,MAAM,EAAE,CAAC,CAAC;YACnD,IAAI,IAAI,CAAC,UAAU;gBAAE,YAAY,CAAC,IAAI,CAAC,YAAY,IAAI,CAAC,UAAU,EAAE,CAAC,CAAC;YACtE,MAAM,OAAO,GAAG,YAAY,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;YAExC,MAAM,KAAK,GAA0C,EAAE,CAAC;YACxD,IAAI,IAAI,CAAC,UAAU,EAAE,CAAC;gBACpB,KAAK,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,MAAM,IAAI,SAAS,EAAE,IAAI,EAAE,IAAI,CAAC,UAAU,EAAE,CAAC,CAAC;YACnE,CAAC;YAED,MAAM,MAAM,GAAwC,EAAE,CAAC;YACvD,IAAI,IAAI,CAAC,aAAa,EAAE,CAAC;gBACvB,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,EAAE,KAAK,IAAI,WAAW,EAAE,GAAG,EAAE,IAAI,CAAC,aAAa,EAAE,CAAC,CAAC;YACtE,CAAC;YAED,OAAO;gBACL,GAAG;gBACH,KAAK;gBACL,MAAM;gBACN,WAAW,EAAE,MAAM,CAAC,CAAC,CAAC,YAAY,MAAM,EAAE,CAAC,CAAC,CAAC,eAAe;gBAC5D,OAAO;gBACP,KAAK;gBACL,MAAM;gBACN,QAAQ,EAAE;oBACR,IAAI,EAAE,OAAO;oBACb,WAAW,EAAE,IAAI;oBACjB,MAAM,EAAE,gBAAgB;oBACxB,SAAS,EAAE,GAAG;oBACd,QAAQ,EAAE,SAAS;iBACpB;gBACD,IAAI,EAAE,EAAE,MAAM,EAAE,cAAc,CAAC,OAAO,CAAC,EAAE;aAC1C,CAAC;QACJ,CAAC;QAAC,MAAM,CAAC;YACP,OAAO,IAAI,CAAC;QACd,CAAC;IACH,CAAC;CACF,CAAC"}
@@ -0,0 +1,25 @@
1
+ export interface HeadMeta {
2
+ title: string | null;
3
+ ogTitle: string | null;
4
+ ogDescription: string | null;
5
+ ogImage: string | null;
6
+ ogType: string | null;
7
+ ogSiteName: string | null;
8
+ canonical: string | null;
9
+ author: string | null;
10
+ publishedTime: string | null;
11
+ }
12
+ export interface ExtractResult {
13
+ content: string;
14
+ links: Array<{
15
+ text: string;
16
+ href: string;
17
+ }>;
18
+ images: Array<{
19
+ alt: string;
20
+ src: string;
21
+ }>;
22
+ isSpaShell: boolean;
23
+ }
24
+ export declare function parseHead(html: string): HeadMeta;
25
+ export declare function extractContent(html: string): ExtractResult;