@promptbook/remote-server 0.72.0-8 → 0.72.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (196) hide show
  1. package/README.md +8 -8
  2. package/esm/index.es.js +183 -78
  3. package/esm/index.es.js.map +1 -1
  4. package/esm/typings/src/_packages/browser.index.d.ts +2 -0
  5. package/esm/typings/src/_packages/cli.index.d.ts +20 -0
  6. package/esm/typings/src/_packages/core.index.d.ts +42 -30
  7. package/esm/typings/src/_packages/documents.index.d.ts +8 -0
  8. package/esm/typings/src/_packages/legacy-documents.index.d.ts +8 -0
  9. package/esm/typings/src/_packages/markdown-utils.index.d.ts +6 -0
  10. package/esm/typings/src/_packages/node.index.d.ts +12 -4
  11. package/esm/typings/src/_packages/pdf.index.d.ts +8 -0
  12. package/esm/typings/src/_packages/types.index.d.ts +33 -17
  13. package/esm/typings/src/_packages/utils.index.d.ts +2 -2
  14. package/esm/typings/src/_packages/website-crawler.index.d.ts +8 -0
  15. package/esm/typings/src/collection/PipelineCollection.d.ts +1 -1
  16. package/esm/typings/src/collection/SimplePipelineCollection.d.ts +2 -2
  17. package/esm/typings/src/collection/collectionToJson.d.ts +1 -1
  18. package/esm/typings/src/collection/constructors/createCollectionFromDirectory.d.ts +5 -3
  19. package/esm/typings/src/collection/constructors/createCollectionFromJson.d.ts +1 -1
  20. package/esm/typings/src/collection/constructors/createCollectionFromPromise.d.ts +1 -1
  21. package/esm/typings/src/commands/_common/types/CommandParser.d.ts +5 -5
  22. package/esm/typings/src/config.d.ts +26 -13
  23. package/esm/typings/src/conversion/pipelineStringToJson.d.ts +3 -1
  24. package/esm/typings/src/dialogs/callback/CallbackInterfaceToolsOptions.d.ts +2 -2
  25. package/esm/typings/src/dialogs/simple-prompt/SimplePromptInterfaceTools.d.ts +3 -3
  26. package/esm/typings/src/executables/$provideExecutablesForNode.d.ts +12 -0
  27. package/esm/typings/src/executables/apps/locateLibreoffice.d.ts +11 -0
  28. package/esm/typings/src/executables/apps/locatePandoc.d.ts +11 -0
  29. package/esm/typings/src/executables/locateApp.d.ts +33 -0
  30. package/esm/typings/src/executables/platforms/locateAppOnLinux.d.ts +12 -0
  31. package/esm/typings/src/executables/platforms/locateAppOnMacOs.d.ts +12 -0
  32. package/esm/typings/src/executables/platforms/locateAppOnWindows.d.ts +12 -0
  33. package/esm/typings/src/execution/{CommonExecutionToolsOptions.d.ts → CommonToolsOptions.d.ts} +1 -1
  34. package/esm/typings/src/execution/EmbeddingVector.d.ts +1 -1
  35. package/esm/typings/src/execution/Executables.d.ts +18 -0
  36. package/esm/typings/src/execution/ExecutionTools.d.ts +32 -6
  37. package/esm/typings/src/execution/FilesystemTools.d.ts +9 -0
  38. package/esm/typings/src/execution/LlmExecutionTools.d.ts +2 -2
  39. package/esm/typings/src/execution/PipelineExecutorResult.d.ts +2 -2
  40. package/esm/typings/src/execution/assertsExecutionSuccessful.d.ts +3 -2
  41. package/esm/typings/src/execution/createPipelineExecutor/00-CreatePipelineExecutorOptions.d.ts +29 -6
  42. package/esm/typings/src/execution/createPipelineExecutor/10-executePipeline.d.ts +3 -12
  43. package/esm/typings/src/execution/createPipelineExecutor/20-executeTemplate.d.ts +4 -18
  44. package/esm/typings/src/execution/createPipelineExecutor/40-executeAttempts.d.ts +9 -19
  45. package/esm/typings/src/execution/translation/automatic-translate/automatic-translators/LindatAutomaticTranslator.d.ts +11 -3
  46. package/esm/typings/src/execution/translation/automatic-translate/translateMessages.d.ts +1 -0
  47. package/esm/typings/src/execution/utils/$provideExecutionToolsForNode.d.ts +13 -0
  48. package/esm/typings/src/execution/utils/addUsage.d.ts +1 -1
  49. package/esm/typings/src/execution/utils/forEachAsync.d.ts +1 -1
  50. package/esm/typings/src/formats/_common/FormatDefinition.d.ts +2 -2
  51. package/esm/typings/src/formats/_common/FormatSubvalueDefinition.d.ts +2 -2
  52. package/esm/typings/src/llm-providers/_common/{$llmToolsMetadataRegister.d.ts → register/$llmToolsMetadataRegister.d.ts} +4 -1
  53. package/esm/typings/src/llm-providers/_common/{$llmToolsRegister.d.ts → register/$llmToolsRegister.d.ts} +5 -2
  54. package/esm/typings/src/llm-providers/_common/{createLlmToolsFromConfigurationFromEnv.d.ts → register/$provideLlmToolsConfigurationFromEnv.d.ts} +3 -3
  55. package/esm/typings/src/llm-providers/_common/{getLlmToolsForCli.d.ts → register/$provideLlmToolsForCli.d.ts} +4 -11
  56. package/esm/typings/src/llm-providers/_common/{getLlmToolsForTestingAndScriptsAndPlayground.d.ts → register/$provideLlmToolsForTestingAndScriptsAndPlayground.d.ts} +4 -3
  57. package/esm/typings/src/llm-providers/_common/{createLlmToolsFromEnv.d.ts → register/$provideLlmToolsFromEnv.d.ts} +6 -5
  58. package/esm/typings/src/llm-providers/_common/{$registeredLlmToolsMessage.d.ts → register/$registeredLlmToolsMessage.d.ts} +5 -2
  59. package/esm/typings/src/llm-providers/_common/{LlmToolsConfiguration.d.ts → register/LlmToolsConfiguration.d.ts} +6 -5
  60. package/esm/typings/src/llm-providers/_common/{LlmToolsMetadata.d.ts → register/LlmToolsMetadata.d.ts} +5 -4
  61. package/esm/typings/src/llm-providers/_common/{LlmToolsOptions.d.ts → register/LlmToolsOptions.d.ts} +4 -1
  62. package/esm/typings/src/llm-providers/_common/{createLlmToolsFromConfiguration.d.ts → register/createLlmToolsFromConfiguration.d.ts} +12 -4
  63. package/esm/typings/src/llm-providers/_common/utils/cache/CacheLlmToolsOptions.d.ts +4 -1
  64. package/esm/typings/src/llm-providers/anthropic-claude/AnthropicClaudeExecutionTools.d.ts +1 -1
  65. package/esm/typings/src/llm-providers/anthropic-claude/AnthropicClaudeExecutionToolsOptions.d.ts +5 -5
  66. package/esm/typings/src/llm-providers/anthropic-claude/anthropic-claude-models.d.ts +1 -1
  67. package/esm/typings/src/llm-providers/anthropic-claude/register-configuration.d.ts +4 -3
  68. package/esm/typings/src/llm-providers/anthropic-claude/register-constructor.d.ts +4 -3
  69. package/esm/typings/src/llm-providers/azure-openai/AzureOpenAiExecutionTools.d.ts +1 -1
  70. package/esm/typings/src/llm-providers/azure-openai/AzureOpenAiExecutionToolsOptions.d.ts +4 -3
  71. package/esm/typings/src/llm-providers/azure-openai/register-configuration.d.ts +4 -3
  72. package/esm/typings/src/llm-providers/azure-openai/register-constructor.d.ts +4 -3
  73. package/esm/typings/src/llm-providers/langtail/LangtailExecutionTools.d.ts +1 -1
  74. package/esm/typings/src/llm-providers/mocked/$fakeTextToExpectations.d.ts +1 -1
  75. package/esm/typings/src/llm-providers/mocked/MockedEchoLlmExecutionTools.d.ts +4 -4
  76. package/esm/typings/src/llm-providers/mocked/MockedFackedLlmExecutionTools.d.ts +4 -4
  77. package/esm/typings/src/llm-providers/multiple/MultipleLlmExecutionTools.d.ts +4 -4
  78. package/esm/typings/src/llm-providers/multiple/joinLlmExecutionTools.d.ts +1 -1
  79. package/esm/typings/src/llm-providers/openai/OpenAiAssistantExecutionTools.d.ts +0 -1
  80. package/esm/typings/src/llm-providers/openai/OpenAiExecutionTools.d.ts +2 -2
  81. package/esm/typings/src/llm-providers/openai/OpenAiExecutionToolsOptions.d.ts +4 -4
  82. package/esm/typings/src/llm-providers/openai/openai-models.d.ts +1 -1
  83. package/esm/typings/src/llm-providers/openai/register-configuration.d.ts +5 -4
  84. package/esm/typings/src/llm-providers/openai/register-constructor.d.ts +5 -4
  85. package/esm/typings/src/llm-providers/remote/RemoteLlmExecutionTools.d.ts +4 -4
  86. package/esm/typings/src/llm-providers/remote/interfaces/PromptbookServer_ListModels_Request.d.ts +16 -7
  87. package/esm/typings/src/llm-providers/remote/interfaces/PromptbookServer_ListModels_Response.d.ts +4 -4
  88. package/esm/typings/src/llm-providers/remote/interfaces/PromptbookServer_Prompt_Request.d.ts +7 -13
  89. package/esm/typings/src/llm-providers/remote/interfaces/PromptbookServer_Prompt_Response.d.ts +3 -3
  90. package/esm/typings/src/llm-providers/remote/interfaces/RemoteLlmExecutionToolsOptions.d.ts +11 -16
  91. package/esm/typings/src/llm-providers/remote/interfaces/RemoteServerOptions.d.ts +24 -9
  92. package/esm/typings/src/llm-providers/remote/startRemoteServer.d.ts +1 -1
  93. package/esm/typings/src/personas/preparePersona.d.ts +2 -1
  94. package/esm/typings/src/prepare/PrepareAndScrapeOptions.d.ts +10 -28
  95. package/esm/typings/src/prepare/preparePipeline.d.ts +2 -1
  96. package/esm/typings/src/prepare/prepareTemplates.d.ts +3 -2
  97. package/esm/typings/src/scrapers/_common/Converter.d.ts +4 -10
  98. package/esm/typings/src/scrapers/_common/Scraper.d.ts +5 -17
  99. package/esm/typings/src/scrapers/_common/prepareKnowledgePieces.d.ts +2 -1
  100. package/esm/typings/src/scrapers/_common/register/$provideFilesystemForNode.d.ts +11 -0
  101. package/esm/typings/src/scrapers/_common/register/$provideScrapersForBrowser.d.ts +12 -0
  102. package/esm/typings/src/scrapers/_common/register/$provideScrapersForNode.d.ts +15 -0
  103. package/esm/typings/src/scrapers/_common/register/$registeredScrapersMessage.d.ts +12 -0
  104. package/esm/typings/src/scrapers/_common/register/$scrapersMetadataRegister.d.ts +13 -0
  105. package/esm/typings/src/scrapers/_common/register/$scrapersRegister.d.ts +13 -0
  106. package/esm/typings/src/scrapers/_common/register/ScraperAndConverterMetadata.d.ts +41 -0
  107. package/esm/typings/src/scrapers/_common/register/ScraperConstructor.d.ts +12 -0
  108. package/esm/typings/src/scrapers/_common/utils/getScraperIntermediateSource.d.ts +3 -2
  109. package/esm/typings/src/scrapers/_common/utils/makeKnowledgeSourceHandler.d.ts +3 -2
  110. package/esm/typings/src/scrapers/document/{documentScraper.d.ts → DocumentScraper.d.ts} +18 -12
  111. package/esm/typings/src/scrapers/document/createDocumentScraper.d.ts +20 -0
  112. package/esm/typings/src/scrapers/document/register-constructor.d.ts +13 -0
  113. package/esm/typings/src/scrapers/document/register-metadata.d.ts +24 -0
  114. package/esm/typings/src/scrapers/document-legacy/LegacyDocumentScraper.d.ts +43 -0
  115. package/esm/typings/src/scrapers/document-legacy/createLegacyDocumentScraper.d.ts +20 -0
  116. package/esm/typings/src/scrapers/document-legacy/register-constructor.d.ts +13 -0
  117. package/esm/typings/src/scrapers/document-legacy/register-metadata.d.ts +24 -0
  118. package/esm/typings/src/scrapers/markdown/MarkdownScraper.d.ts +29 -0
  119. package/esm/typings/src/scrapers/markdown/createMarkdownScraper.d.ts +20 -0
  120. package/esm/typings/src/scrapers/markdown/register-constructor.d.ts +13 -0
  121. package/esm/typings/src/scrapers/markdown/register-metadata.d.ts +24 -0
  122. package/esm/typings/src/scrapers/pdf/PdfScraper.d.ts +40 -0
  123. package/esm/typings/src/scrapers/pdf/createPdfScraper.d.ts +20 -0
  124. package/esm/typings/src/scrapers/pdf/register-constructor.d.ts +13 -0
  125. package/esm/typings/src/scrapers/pdf/register-metadata.d.ts +24 -0
  126. package/esm/typings/src/scrapers/website/WebsiteScraper.d.ts +50 -0
  127. package/esm/typings/src/scrapers/website/createWebsiteScraper.d.ts +20 -0
  128. package/esm/typings/src/scrapers/website/register-constructor.d.ts +13 -0
  129. package/esm/typings/src/scrapers/website/register-metadata.d.ts +24 -0
  130. package/esm/typings/src/scrapers/website/utils/createShowdownConverter.d.ts +7 -0
  131. package/esm/typings/src/scripting/javascript/JavascriptExecutionToolsOptions.d.ts +2 -2
  132. package/esm/typings/src/scripting/javascript/utils/preserve.d.ts +1 -1
  133. package/esm/typings/src/scripting/python/PythonExecutionTools.d.ts +3 -3
  134. package/esm/typings/src/scripting/typescript/TypescriptExecutionTools.d.ts +3 -3
  135. package/esm/typings/src/storage/file-cache-storage/FileCacheStorage.d.ts +5 -3
  136. package/esm/typings/src/storage/file-cache-storage/utils/nameToSubfolderPath.d.ts +1 -1
  137. package/esm/typings/src/storage/{utils → memory/utils}/PrefixStorage.d.ts +1 -1
  138. package/esm/typings/src/storage/{utils → memory/utils}/makePromptbookStorageFromWebStorage.d.ts +1 -1
  139. package/esm/typings/src/types/Arrayable.d.ts +1 -1
  140. package/esm/typings/src/types/IntermediateFilesStrategy.d.ts +7 -0
  141. package/esm/typings/src/types/PipelineJson/KnowledgePieceJson.d.ts +4 -4
  142. package/esm/typings/src/types/PipelineJson/KnowledgeSourceJson.d.ts +1 -1
  143. package/esm/typings/src/types/PipelineJson/PersonaJson.d.ts +1 -1
  144. package/esm/typings/src/types/PipelineJson/TemplateJsonCommon.d.ts +2 -2
  145. package/esm/typings/src/types/Prompt.d.ts +2 -1
  146. package/esm/typings/src/types/execution-report/ExecutionReportJson.d.ts +1 -1
  147. package/esm/typings/src/types/typeAliases.d.ts +18 -8
  148. package/esm/typings/src/utils/$Register.d.ts +20 -7
  149. package/esm/typings/src/utils/FromtoItems.d.ts +1 -1
  150. package/esm/typings/src/utils/arrayableToArray.d.ts +1 -1
  151. package/esm/typings/src/utils/emojis.d.ts +1 -1
  152. package/esm/typings/src/utils/execCommand/$execCommand.d.ts +5 -3
  153. package/esm/typings/src/utils/execCommand/$execCommandNormalizeOptions.d.ts +12 -0
  154. package/esm/typings/src/utils/execCommand/$execCommands.d.ts +2 -1
  155. package/esm/typings/src/utils/execCommand/ExecCommandOptions.d.ts +45 -0
  156. package/esm/typings/src/utils/expectation-counters/countSentences.d.ts +1 -1
  157. package/esm/typings/src/utils/files/isDirectoryExisting.d.ts +14 -0
  158. package/esm/typings/src/utils/files/isExecutable.d.ts +11 -0
  159. package/esm/typings/src/utils/files/isFileExisting.d.ts +13 -0
  160. package/esm/typings/src/utils/files/isFileExisting.test.d.ts +1 -0
  161. package/esm/typings/src/utils/files/{$listAllFiles.d.ts → listAllFiles.d.ts} +3 -4
  162. package/esm/typings/src/utils/files/listAllFiles.test.d.ts +1 -0
  163. package/esm/typings/src/utils/markdown/extractAllBlocksFromMarkdown.d.ts +1 -1
  164. package/esm/typings/src/utils/markdown/splitMarkdownIntoSections.d.ts +1 -1
  165. package/esm/typings/src/utils/normalization/IKeywords.d.ts +2 -2
  166. package/esm/typings/src/utils/normalization/parseKeywords.d.ts +2 -2
  167. package/esm/typings/src/utils/normalization/parseKeywordsFromString.d.ts +2 -2
  168. package/esm/typings/src/utils/normalization/searchKeywords.d.ts +2 -2
  169. package/esm/typings/src/utils/organization/TODO_USE.d.ts +1 -1
  170. package/esm/typings/src/utils/organization/keepUnused.d.ts +1 -1
  171. package/esm/typings/src/utils/random/$randomSeed.d.ts +1 -1
  172. package/esm/typings/src/utils/sets/intersection.d.ts +1 -1
  173. package/esm/typings/src/utils/sets/union.d.ts +1 -1
  174. package/esm/typings/src/utils/unwrapResult.d.ts +4 -4
  175. package/package.json +4 -3
  176. package/umd/index.umd.js +183 -78
  177. package/umd/index.umd.js.map +1 -1
  178. package/esm/typings/src/execution/createPipelineExecutor/00-CreatePipelineExecutorSettings.d.ts +0 -29
  179. package/esm/typings/src/scrapers/document-legacy/legacyDocumentScraper.d.ts +0 -37
  180. package/esm/typings/src/scrapers/index.d.ts +0 -8
  181. package/esm/typings/src/scrapers/markdown/markdownScraper.d.ts +0 -29
  182. package/esm/typings/src/scrapers/pdf/pdfScraper.d.ts +0 -35
  183. package/esm/typings/src/scrapers/website/utils/markdownConverter.d.ts +0 -12
  184. package/esm/typings/src/scrapers/website/websiteScraper.d.ts +0 -43
  185. package/esm/typings/src/utils/execCommand/IExecCommandOptions.d.ts +0 -23
  186. package/esm/typings/src/utils/execCommand/execCommandNormalizeOptions.d.ts +0 -10
  187. package/esm/typings/src/utils/files/$isDirectoryExisting.d.ts +0 -15
  188. package/esm/typings/src/utils/files/$isFileExisting.d.ts +0 -14
  189. /package/esm/typings/src/{scrapers/website/utils/markdownConverter.test.d.ts → executables/apps/locateLibreoffice.test.d.ts} +0 -0
  190. /package/esm/typings/src/{scrapers/website/websiteScraper.test.d.ts → executables/apps/locatePandoc.test.d.ts} +0 -0
  191. /package/esm/typings/src/{utils/files/$isDirectoryExisting.test.d.ts → executables/locateApp.test.d.ts} +0 -0
  192. /package/esm/typings/src/scrapers/document/{documentScraper.test.d.ts → DocumentScraper.test.d.ts} +0 -0
  193. /package/esm/typings/src/scrapers/document-legacy/{legacyDocumentScraper.test.d.ts → LegacyDocumentScraper.test.d.ts} +0 -0
  194. /package/esm/typings/src/scrapers/markdown/{markdownScraper.test.d.ts → MarkdownScraper.test.d.ts} +0 -0
  195. /package/esm/typings/src/{utils/files/$isFileExisting.test.d.ts → scrapers/website/utils/createShowdownConverter.test.d.ts} +0 -0
  196. /package/esm/typings/src/utils/files/{$listAllFiles.test.d.ts → isDirectoryExisting.test.d.ts} +0 -0
@@ -1,14 +1,15 @@
1
- import type { CommonExecutionToolsOptions } from '../../../execution/CommonExecutionToolsOptions';
1
+ import type { CommonToolsOptions } from '../../../execution/CommonToolsOptions';
2
2
  import type { string_base_url } from '../../../types/typeAliases';
3
3
  import type { string_uri } from '../../../types/typeAliases';
4
4
  import type { string_user_id } from '../../../types/typeAliases';
5
- import type { LlmToolsConfiguration } from '../../_common/LlmToolsConfiguration';
5
+ import type { LlmToolsConfiguration } from '../../_common/register/LlmToolsConfiguration';
6
+ import type { CollectionRemoteServerClientOptions } from './RemoteServerOptions';
6
7
  /**
7
8
  * Options for `RemoteLlmExecutionTools`
8
9
  *
9
10
  * @public exported from `@promptbook/remote-client`
10
11
  */
11
- export type RemoteLlmExecutionToolsOptions = CommonExecutionToolsOptions & {
12
+ export type RemoteLlmExecutionToolsOptions<TCustomOptions> = CommonToolsOptions & {
12
13
  /**
13
14
  * URL of the remote PROMPTBOOK server
14
15
  * On this server will be connected to the socket.io server
@@ -29,7 +30,7 @@ export type RemoteLlmExecutionToolsOptions = CommonExecutionToolsOptions & {
29
30
  /**
30
31
  * Use anonymous server with anonymous mode
31
32
  */
32
- isAnonymous: true;
33
+ readonly isAnonymous: true;
33
34
  /**
34
35
  * Configuration for the LLM tools
35
36
  */
@@ -37,22 +38,16 @@ export type RemoteLlmExecutionToolsOptions = CommonExecutionToolsOptions & {
37
38
  /**
38
39
  * Identifier of the end user
39
40
  *
40
- * Note: this is passed to the certain model providers to identify misuse
41
- * Note: In anonymous mode it is not required to identify
41
+ * Note: This is passed to the certain model providers to identify misuse
42
+ * Note: In anonymous mode, there is no need to identify yourself, nor does it change the actual configuration of LLM Tools (unlike in application mode).
42
43
  */
43
- readonly userId?: string_user_id;
44
- } | {
44
+ readonly userId: string_user_id | null;
45
+ } | ({
45
46
  /**
46
47
  * Use anonymous server with client identification and fixed collection
47
48
  */
48
- isAnonymous: false;
49
- /**
50
- * Identifier of the end user
51
- *
52
- * Note: this is passed to the certain model providers to identify misuse
53
- */
54
- readonly userId: string_user_id;
55
- });
49
+ readonly isAnonymous: false;
50
+ } & CollectionRemoteServerClientOptions<TCustomOptions>));
56
51
  /**
57
52
  * TODO: [🧠][🛍] Maybe not `isAnonymous: boolean` BUT `mode: 'ANONYMOUS'|'COLLECTION'`
58
53
  * TODO: [🧠][🧜‍♂️] Maybe join remoteUrl and path into single value
@@ -1,6 +1,8 @@
1
+ import type { Promisable } from 'type-fest';
1
2
  import type { PipelineCollection } from '../../../collection/PipelineCollection';
2
- import type { CommonExecutionToolsOptions } from '../../../execution/CommonExecutionToolsOptions';
3
+ import type { CommonToolsOptions } from '../../../execution/CommonToolsOptions';
3
4
  import type { LlmExecutionTools } from '../../../execution/LlmExecutionTools';
5
+ import type { string_app_id } from '../../../types/typeAliases';
4
6
  import type { string_uri } from '../../../types/typeAliases';
5
7
  import type { string_user_id } from '../../../types/typeAliases';
6
8
  /**
@@ -8,7 +10,7 @@ import type { string_user_id } from '../../../types/typeAliases';
8
10
  *
9
11
  * There are two modes of remote server:
10
12
  *
11
- * 1) **Collection mode** Server will recieve `collection` and execute prompts only from this collection
13
+ * 1) **Application mode** Server will recieve `collection` and execute prompts only from this collection
12
14
  * 2) **Anonymous mode** Server will recieve full `LlmToolsConfiguration` (with api keys) and just acts as a proxy
13
15
  * In anonymous mode, `collection` will be ignored and any prompt will be executed
14
16
  *
@@ -17,7 +19,7 @@ import type { string_user_id } from '../../../types/typeAliases';
17
19
  * @public exported from `@promptbook/remote-client`
18
20
  * @public exported from `@promptbook/remote-server`
19
21
  */
20
- export type RemoteServerOptions = CommonExecutionToolsOptions & {
22
+ export type RemoteServerOptions<TCustomOptions> = CommonToolsOptions & {
21
23
  /**
22
24
  * Port on which the server will listen
23
25
  */
@@ -29,18 +31,18 @@ export type RemoteServerOptions = CommonExecutionToolsOptions & {
29
31
  * @example '/promptbook/socket.io'
30
32
  */
31
33
  readonly path: string_uri;
32
- } & (AnonymousRemoteServerOptions | CollectionRemoteServerOptions | (AnonymousRemoteServerOptions & CollectionRemoteServerOptions));
34
+ } & (AnonymousRemoteServerOptions | CollectionRemoteServerOptions<TCustomOptions> | (AnonymousRemoteServerOptions & CollectionRemoteServerOptions<TCustomOptions>));
33
35
  export type AnonymousRemoteServerOptions = {
34
36
  /**
35
37
  * Enable anonymous mode
36
38
  */
37
39
  readonly isAnonymousModeAllowed: true;
38
40
  };
39
- export type CollectionRemoteServerOptions = {
41
+ export type CollectionRemoteServerOptions<TCustomOptions> = {
40
42
  /**
41
- * Enable collection mode
43
+ * Enable application mode
42
44
  */
43
- readonly isCollectionModeAllowed: true;
45
+ readonly isApplicationModeAllowed: true;
44
46
  /**
45
47
  * Promptbook collection to use
46
48
  *
@@ -50,9 +52,22 @@ export type CollectionRemoteServerOptions = {
50
52
  /**
51
53
  * Creates llm execution tools for each client
52
54
  */
53
- createLlmExecutionTools(userId: string_user_id | undefined): LlmExecutionTools;
55
+ createLlmExecutionTools(options: CollectionRemoteServerClientOptions<TCustomOptions>): Promisable<LlmExecutionTools>;
56
+ };
57
+ export type CollectionRemoteServerClientOptions<TCustomOptions> = {
58
+ /**
59
+ * @@@
60
+ */
61
+ readonly appId: string_app_id | null;
62
+ /**
63
+ * @@@
64
+ */
65
+ readonly userId: string_user_id | null;
66
+ /**
67
+ * @@@
68
+ */
69
+ readonly customOptions?: TCustomOptions;
54
70
  };
55
71
  /**
56
72
  * TODO: Constrain anonymous mode for specific models / providers
57
- * TODO: [🧠][🤺] Remove `createLlmExecutionTools`, pass just `llmExecutionTools`
58
73
  */
@@ -9,7 +9,7 @@ import type { RemoteServerOptions } from './interfaces/RemoteServerOptions';
9
9
  * @see https://github.com/webgptorg/promptbook#remote-server
10
10
  * @public exported from `@promptbook/remote-server`
11
11
  */
12
- export declare function startRemoteServer(options: RemoteServerOptions): IDestroyable;
12
+ export declare function startRemoteServer<TCustomOptions = undefined>(options: RemoteServerOptions<TCustomOptions>): IDestroyable;
13
13
  /**
14
14
  * TODO: Maybe use `$asDeeplyFrozenSerializableJson`
15
15
  * TODO: [🧠][🛍] Maybe not `isAnonymous: boolean` BUT `mode: 'ANONYMOUS'|'COLLECTION'`
@@ -1,3 +1,4 @@
1
+ import type { ExecutionTools } from '../execution/ExecutionTools';
1
2
  import type { PrepareAndScrapeOptions } from '../prepare/PrepareAndScrapeOptions';
2
3
  import type { PersonaPreparedJson } from '../types/PipelineJson/PersonaJson';
3
4
  import type { string_persona_description } from '../types/typeAliases';
@@ -7,7 +8,7 @@ import type { string_persona_description } from '../types/typeAliases';
7
8
  * @see https://github.com/webgptorg/promptbook/discussions/22
8
9
  * @public exported from `@promptbook/core`
9
10
  */
10
- export declare function preparePersona(personaDescription: string_persona_description, options: PrepareAndScrapeOptions): Promise<PersonaPreparedJson['modelRequirements']>;
11
+ export declare function preparePersona(personaDescription: string_persona_description, tools: Pick<ExecutionTools, 'llm'>, options: PrepareAndScrapeOptions): Promise<PersonaPreparedJson['modelRequirements']>;
11
12
  /**
12
13
  * TODO: [🔃][main] !!!!! If the persona was prepared with different version or different set of models, prepare it once again
13
14
  * TODO: [🏢] !! Check validity of `modelName` in pipeline
@@ -1,20 +1,18 @@
1
- import type { LlmExecutionTools } from '../execution/LlmExecutionTools';
1
+ import type { IntermediateFilesStrategy } from '../types/IntermediateFilesStrategy';
2
2
  import type { string_dirname } from '../types/typeAliases';
3
3
  /**
4
4
  * Options for preparation of the pipeline
5
5
  */
6
6
  export type PrepareAndScrapeOptions = {
7
- /**
8
- * LLM tools
9
- */
10
- readonly llmTools?: LlmExecutionTools;
11
7
  /**
12
8
  * Path to the root folder of the pipeline
13
9
  *
14
10
  * Note: When the pipeline is not created from files, it is `null`
15
- * Note: This folder must exist
11
+ * Note: This folder must exist (=it is not created recursively)
12
+ *
13
+ * @default process.cwd()
16
14
  */
17
- readonly rootDirname: string_dirname | null;
15
+ readonly rootDirname?: string_dirname | null;
18
16
  /**
19
17
  * Path to the cache folder
20
18
  *
@@ -24,12 +22,11 @@ export type PrepareAndScrapeOptions = {
24
22
  */
25
23
  readonly cacheDirname?: string_dirname;
26
24
  /**
27
- * If true, the cache is cleaned after the scraping
25
+ * Strategy for caching the intermediate results for knowledge source
28
26
  *
29
- *
30
- * @default false // <- TODO: !!!!!! Change to `cacheStrategy`/`intermediateFiles`, Put to global config, change to `true` and explicitly set to `false` in all playgrounds
27
+ * @default DEFAULT_INTERMEDIATE_FILES_STRATEGY
31
28
  */
32
- readonly isCacheCleaned?: boolean;
29
+ readonly intermediateFilesStrategy?: IntermediateFilesStrategy;
33
30
  /**
34
31
  * Maximum number of tasks running in parallel
35
32
  *
@@ -37,24 +34,9 @@ export type PrepareAndScrapeOptions = {
37
34
  */
38
35
  readonly maxParallelCount?: number;
39
36
  /**
40
- * Path to the external programs executables
41
- *
42
- * TODO: !!!!!! Transform to scrapers and make them Classy
37
+ * If true, the missing software is automatically installed
43
38
  */
44
- readonly externalProgramsPaths?: {
45
- /**
46
- * Path to the `pandoc` executable
47
- *
48
- * @example 'C:/Users/me/AppData/Local/Pandoc/pandoc.exe'
49
- */
50
- readonly pandocPath?: string;
51
- /**
52
- * Path to the LibreOffice executable
53
- *
54
- * @example 'C:/Program Files/LibreOffice/program/swriter.exe'
55
- */
56
- readonly libreOfficePath?: string;
57
- };
39
+ readonly isAutoInstalled?: boolean;
58
40
  /**
59
41
  * If true, the preparation logs additional information
60
42
  *
@@ -1,3 +1,4 @@
1
+ import type { ExecutionTools } from '../execution/ExecutionTools';
1
2
  import type { PipelineJson } from '../types/PipelineJson/PipelineJson';
2
3
  import type { PrepareAndScrapeOptions } from './PrepareAndScrapeOptions';
3
4
  /**
@@ -8,7 +9,7 @@ import type { PrepareAndScrapeOptions } from './PrepareAndScrapeOptions';
8
9
  * Note: When the pipeline is already prepared, it returns the same pipeline
9
10
  * @public exported from `@promptbook/core`
10
11
  */
11
- export declare function preparePipeline(pipeline: PipelineJson, options: PrepareAndScrapeOptions): Promise<PipelineJson>;
12
+ export declare function preparePipeline(pipeline: PipelineJson, tools: Pick<ExecutionTools, 'llm' | 'fs' | 'scrapers'>, options: PrepareAndScrapeOptions): Promise<PipelineJson>;
12
13
  /**
13
14
  * TODO: Write tests for `preparePipeline`
14
15
  * TODO: [🏏] Leverage the batch API and build queues @see https://platform.openai.com/docs/guides/batch
@@ -1,3 +1,4 @@
1
+ import type { ExecutionTools } from '../execution/ExecutionTools';
1
2
  import type { PipelineJson } from '../types/PipelineJson/PipelineJson';
2
3
  import type { TemplateJson } from '../types/PipelineJson/TemplateJson';
3
4
  import type { PrepareAndScrapeOptions } from './PrepareAndScrapeOptions';
@@ -11,14 +12,14 @@ type PreparedTemplates = {
11
12
  /**
12
13
  * @@@ Sequence of templates that are chained together to form a pipeline
13
14
  */
14
- readonly templatesPrepared: Array<TemplateJson>;
15
+ readonly templatesPrepared: ReadonlyArray<TemplateJson>;
15
16
  };
16
17
  /**
17
18
  * @@@
18
19
  *
19
20
  * @public exported from `@promptbook/core`
20
21
  */
21
- export declare function prepareTemplates(pipeline: PrepareTemplateInput, options: PrepareAndScrapeOptions): Promise<PreparedTemplates>;
22
+ export declare function prepareTemplates(pipeline: PrepareTemplateInput, tools: Pick<ExecutionTools, 'llm' | 'fs' | 'scrapers'>, options: PrepareAndScrapeOptions): Promise<PreparedTemplates>;
22
23
  export {};
23
24
  /**
24
25
  * TODO: [🧠] Add context to each template (if missing)
@@ -1,6 +1,4 @@
1
- import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
2
- import type { string_mime_type } from '../../types/typeAliases';
3
- import type { string_promptbook_documentation_url } from '../../types/typeAliases';
1
+ import type { ScraperAndConverterMetadata } from './register/ScraperAndConverterMetadata';
4
2
  import type { ScraperSourceHandler } from './Scraper';
5
3
  import type { ScraperIntermediateSource } from './ScraperIntermediateSource';
6
4
  /**
@@ -9,13 +7,9 @@ import type { ScraperIntermediateSource } from './ScraperIntermediateSource';
9
7
  */
10
8
  export type Converter = {
11
9
  /**
12
- * Mime types that this scraper can handle
10
+ * Metadata of the converter which includes title, mime types, etc.
13
11
  */
14
- readonly mimeTypes: Array<string_mime_type>;
15
- /**
16
- * Link to documentation
17
- */
18
- readonly documentationUrl: string_promptbook_documentation_url;
12
+ readonly metadata: ScraperAndConverterMetadata;
19
13
  /**
20
14
  * Convert the the file and returns intermediate source or `null` if it can't convert it
21
15
  *
@@ -24,5 +18,5 @@ export type Converter = {
24
18
  *
25
19
  * Note: `$` is used to indicate that this function is not a pure function - it leaves files on the disk and you are responsible for cleaning them by calling `destroy` method of returned object
26
20
  */
27
- $convert(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<ScraperIntermediateSource>;
21
+ $convert(source: ScraperSourceHandler): Promise<ScraperIntermediateSource>;
28
22
  };
@@ -1,28 +1,23 @@
1
1
  import type { Promisable } from 'type-fest';
2
- import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
3
2
  import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
4
3
  import type { string_filename } from '../../types/typeAliases';
5
4
  import type { string_knowledge_source_link } from '../../types/typeAliases';
6
5
  import type { string_mime_type } from '../../types/typeAliases';
7
- import type { string_promptbook_documentation_url } from '../../types/typeAliases';
8
6
  import type { string_url } from '../../types/typeAliases';
7
+ import type { ScraperAndConverterMetadata } from './register/ScraperAndConverterMetadata';
9
8
  /**
10
9
  * @@@
11
10
  *
12
11
  */
13
12
  export type Scraper = {
14
13
  /**
15
- * Mime types that this scraper can handle
14
+ * Metadata of the scraper which includes title, mime types, etc.
16
15
  */
17
- readonly mimeTypes: Array<string_mime_type>;
18
- /**
19
- * Link to documentation
20
- */
21
- readonly documentationUrl: string_promptbook_documentation_url;
16
+ readonly metadata: ScraperAndConverterMetadata;
22
17
  /**
23
18
  * Scrapes the markdown file and returns the knowledge pieces or `null` if it can't scrape it
24
19
  */
25
- scrape(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promisable<Array<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
20
+ scrape(source: ScraperSourceHandler): Promisable<ReadonlyArray<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
26
21
  };
27
22
  /**
28
23
  * @@@
@@ -56,16 +51,9 @@ export type ScraperSourceHandler = {
56
51
  * Get the content as a utf-8 string
57
52
  */
58
53
  asText(): Promisable<string>;
59
- /**
60
- * Get the content as a blob
61
- */
62
- asBlob(): Promisable<Blob>;
63
54
  };
64
55
  /**
56
+ * TODO: [🥽] Add ` asBlob(): Promisable<Blob>;` or asFile
65
57
  * TODO: [🐝] @@@ Annotate all
66
58
  * TODO: [🔼] Export via types
67
59
  */
68
- /**
69
- * TODO: !!!!!! Test that this is catched
70
- * Note: [⚫] Code in this file should never be published in any package
71
- */
@@ -1,13 +1,14 @@
1
1
  import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
2
2
  import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
3
3
  import type { KnowledgeSourceJson } from '../../types/PipelineJson/KnowledgeSourceJson';
4
+ import type { ExecutionTools } from '../../execution/ExecutionTools';
4
5
  /**
5
6
  * Prepares the knowle
6
7
  *
7
8
  * @see https://github.com/webgptorg/promptbook/discussions/41
8
9
  * @public exported from `@promptbook/core`
9
10
  */
10
- export declare function prepareKnowledgePieces(knowledgeSources: Array<KnowledgeSourceJson>, options: PrepareAndScrapeOptions): Promise<Array<Omit<KnowledgePiecePreparedJson, 'preparationIds'>>>;
11
+ export declare function prepareKnowledgePieces(knowledgeSources: ReadonlyArray<KnowledgeSourceJson>, tools: Pick<ExecutionTools, 'llm' | 'fs' | 'scrapers'>, options: PrepareAndScrapeOptions): Promise<ReadonlyArray<Omit<KnowledgePiecePreparedJson, 'preparationIds'>>>;
11
12
  /**
12
13
  * TODO: [🧊] In future one preparation can take data from previous preparation and save tokens and time
13
14
  * Put `knowledgePieces` into `PrepareKnowledgeOptions`
@@ -0,0 +1,11 @@
1
+ import type { FilesystemTools } from '../../../execution/FilesystemTools';
2
+ import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
3
+ /**
4
+ * @@@
5
+ *
6
+ * @public exported from `@promptbook/node`
7
+ */
8
+ export declare function $provideFilesystemForNode(options?: Pick<PrepareAndScrapeOptions, 'isVerbose'>): FilesystemTools;
9
+ /**
10
+ * Note: [🟢] Code in this file should never be never released in packages that could be imported into browser environment
11
+ */
@@ -0,0 +1,12 @@
1
+ import type { ExecutionTools } from '../../../execution/ExecutionTools';
2
+ import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
3
+ import type { Scraper } from '../Scraper';
4
+ /**
5
+ * @@@
6
+ *
7
+ * 1) @@@
8
+ * 2) @@@
9
+ *
10
+ * @public exported from `@promptbook/browser`
11
+ */
12
+ export declare function $provideScrapersForBrowser(tools: Pick<ExecutionTools, 'llm'>, options?: PrepareAndScrapeOptions): Promise<ReadonlyArray<Scraper>>;
@@ -0,0 +1,15 @@
1
+ import type { ExecutionTools } from '../../../execution/ExecutionTools';
2
+ import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
3
+ import type { Scraper } from '../Scraper';
4
+ /**
5
+ * @@@
6
+ *
7
+ * 1) @@@
8
+ * 2) @@@
9
+ *
10
+ * @public exported from `@promptbook/node`
11
+ */
12
+ export declare function $provideScrapersForNode(tools: Pick<ExecutionTools, 'fs' | 'llm' | 'executables'>, options?: PrepareAndScrapeOptions): Promise<ReadonlyArray<Scraper>>;
13
+ /**
14
+ * Note: [🟢] Code in this file should never be never released in packages that could be imported into browser environment
15
+ */
@@ -0,0 +1,12 @@
1
+ import type { string_markdown } from '../../../types/typeAliases';
2
+ /**
3
+ * Creates a message with all registered scrapers
4
+ *
5
+ * Note: This function is used to create a (error) message when there is no scraper for particular mime type
6
+ *
7
+ * @private internal function of `createScrapersFromConfiguration` and `createScrapersFromEnv`
8
+ */
9
+ export declare function $registeredScrapersMessage(): string_markdown;
10
+ /**
11
+ * TODO: [®] DRY Register logic
12
+ */
@@ -0,0 +1,13 @@
1
+ import { $Register } from '../../../utils/$Register';
2
+ import type { ScraperAndConverterMetadata } from './ScraperAndConverterMetadata';
3
+ /**
4
+ * @@@
5
+ *
6
+ * Note: `$` is used to indicate that this interacts with the global scope
7
+ * @singleton Only one instance of each register is created per build, but thare can be more @@@
8
+ * @public exported from `@promptbook/core`
9
+ */
10
+ export declare const $scrapersMetadataRegister: $Register<ScraperAndConverterMetadata>;
11
+ /**
12
+ * TODO: [®] DRY Register logic
13
+ */
@@ -0,0 +1,13 @@
1
+ import { $Register } from '../../../utils/$Register';
2
+ import type { ScraperConstructor } from './ScraperConstructor';
3
+ /**
4
+ * @@@
5
+ *
6
+ * Note: `$` is used to indicate that this interacts with the global scope
7
+ * @singleton Only one instance of each register is created per build, but thare can be more @@@
8
+ * @public exported from `@promptbook/core`
9
+ */
10
+ export declare const $scrapersRegister: $Register<ScraperConstructor>;
11
+ /**
12
+ * TODO: [®] DRY Register logic
13
+ */
@@ -0,0 +1,41 @@
1
+ import type { Executables } from '../../../execution/Executables';
2
+ import type { string_mime_type } from '../../../types/typeAliases';
3
+ import type { string_promptbook_documentation_url } from '../../../types/typeAliases';
4
+ import type { string_title } from '../../../types/typeAliases';
5
+ import type { Registered } from '../../../utils/$Register';
6
+ /**
7
+ * @@@
8
+ *
9
+ * @@@
10
+ * x) `Scraper`
11
+ * x) `Converter`
12
+ * x) `ScraperConstructor`
13
+ * x) `Registered`
14
+ * x) `ExecutionTools`
15
+ * x) `ScraperAndConverterMetadata`
16
+ * x) `PrepareAndScrapeOptions`
17
+ * x) `ScraperConfiguration`
18
+ * x) `ScraperOptions`
19
+ */
20
+ export type ScraperAndConverterMetadata = Registered & {
21
+ /**
22
+ * @@@
23
+ */
24
+ readonly title: string_title;
25
+ /**
26
+ * Mime types that this scraper can handle
27
+ */
28
+ readonly mimeTypes: ReadonlyArray<string_mime_type>;
29
+ /**
30
+ * @@@
31
+ */
32
+ readonly isAvilableInBrowser: boolean;
33
+ /**
34
+ * @@@
35
+ */
36
+ readonly requiredExecutables: ReadonlyArray<Capitalize<keyof Executables extends `${infer N}Path` ? N : never>>;
37
+ /**
38
+ * Link to documentation
39
+ */
40
+ readonly documentationUrl: string_promptbook_documentation_url;
41
+ };
@@ -0,0 +1,12 @@
1
+ import type { ExecutionTools } from '../../../execution/ExecutionTools';
2
+ import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
3
+ import type { Registered } from '../../../utils/$Register';
4
+ import type { Scraper } from '../Scraper';
5
+ import type { ScraperAndConverterMetadata } from './ScraperAndConverterMetadata';
6
+ /**
7
+ * @@@
8
+ */
9
+ export type ScraperConstructor = Registered & ScraperAndConverterMetadata & ((tools: Pick<ExecutionTools, 'llm'>, options: PrepareAndScrapeOptions) => Scraper);
10
+ /**
11
+ * TODO: [🎶] Naming "constructor" vs "creator" vs "factory"
12
+ */
@@ -13,7 +13,7 @@ type GetScraperIntermediateSourceSource = Pick<ScraperSourceHandler, 'filename'
13
13
  *
14
14
  * @private internal utility of `getScraperIntermediateSource`
15
15
  */
16
- type GetScraperIntermediateSourceHandler = Required<Pick<PrepareAndScrapeOptions, 'rootDirname' | 'cacheDirname' | 'isCacheCleaned' | 'isVerbose'>> & {
16
+ type GetScraperIntermediateSourceHandler = Required<Pick<PrepareAndScrapeOptions, 'rootDirname' | 'cacheDirname' | 'intermediateFilesStrategy' | 'isVerbose'>> & {
17
17
  readonly extension: string_file_extension;
18
18
  };
19
19
  /**
@@ -28,6 +28,7 @@ export {};
28
28
  /**
29
29
  * Note: Not using `FileCacheStorage` for two reasons:
30
30
  * 1) Need to store more than serialized JSONs
31
- * 2) Need to switch between a `rootDirname` and `cacheDirname` <- TODO: !!!!
31
+ * 2) Need to switch between a `rootDirname` and `cacheDirname` <- TODO: [😡]
32
32
  * TODO: [🐱‍🐉][🧠] Make some smart crop
33
+ * Note: [🟢] Code in this file should never be never released in packages that could be imported into browser environment
33
34
  */
@@ -1,10 +1,11 @@
1
1
  import type { SetOptional } from 'type-fest';
2
+ import type { ExecutionTools } from '../../../execution/ExecutionTools';
2
3
  import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
3
4
  import type { KnowledgeSourceJson } from '../../../types/PipelineJson/KnowledgeSourceJson';
4
5
  import type { ScraperSourceHandler } from '../Scraper';
5
6
  /**
6
7
  * @@@
7
8
  *
8
- * @private for scraper utilities
9
+ * @public exported from `@promptbook/core`
9
10
  */
10
- export declare function makeKnowledgeSourceHandler(knowledgeSource: SetOptional<KnowledgeSourceJson, 'name'>, options?: Pick<PrepareAndScrapeOptions, 'rootDirname' | 'isVerbose'>): Promise<ScraperSourceHandler>;
11
+ export declare function makeKnowledgeSourceHandler(knowledgeSource: SetOptional<KnowledgeSourceJson, 'name'>, tools: Pick<ExecutionTools, 'fs'>, options?: Pick<PrepareAndScrapeOptions, 'rootDirname' | 'isVerbose'>): Promise<ScraperSourceHandler>;
@@ -1,37 +1,43 @@
1
- import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
2
1
  import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
2
+ import type { ExecutionTools } from '../../execution/ExecutionTools';
3
+ import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
4
+ import type { Converter } from '../_common/Converter';
5
+ import type { ScraperAndConverterMetadata } from '../_common/register/ScraperAndConverterMetadata';
6
+ import type { Scraper } from '../_common/Scraper';
3
7
  import type { ScraperSourceHandler } from '../_common/Scraper';
4
8
  import type { ScraperIntermediateSource } from '../_common/ScraperIntermediateSource';
5
9
  /**
6
10
  * Scraper of .docx and .odt files
7
11
  *
8
12
  * @see `documentationUrl` for more details
9
- * @public exported from `@promptbook/core`
13
+ * @public exported from `@promptbook/documents`
10
14
  */
11
- export declare const documentScraper: {
15
+ export declare class DocumentScraper implements Converter, Scraper {
16
+ private readonly tools;
17
+ private readonly options;
12
18
  /**
13
- * Mime types that this scraper can handle
19
+ * Metadata of the scraper which includes title, mime types, etc.
14
20
  */
15
- mimeTypes: string[];
21
+ get metadata(): ScraperAndConverterMetadata;
16
22
  /**
17
- * Link to documentation
23
+ * Markdown scraper is used internally
18
24
  */
19
- documentationUrl: "https://github.com/webgptorg/promptbook/discussions/@@";
25
+ private readonly markdownScraper;
26
+ constructor(tools: Pick<ExecutionTools, 'fs' | 'llm' | 'executables'>, options: PrepareAndScrapeOptions);
20
27
  /**
21
28
  * Convert the `.docx` or `.odt` to `.md` file and returns intermediate source
22
29
  *
23
30
  * Note: `$` is used to indicate that this function is not a pure function - it leaves files on the disk and you are responsible for cleaning them by calling `destroy` method of returned object
24
31
  */
25
- $convert(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<ScraperIntermediateSource>;
32
+ $convert(source: ScraperSourceHandler): Promise<ScraperIntermediateSource>;
26
33
  /**
27
34
  * Scrapes the docx file and returns the knowledge pieces or `null` if it can't scrape it
28
35
  */
29
- scrape(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<Array<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
30
- };
36
+ scrape(source: ScraperSourceHandler): Promise<ReadonlyArray<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
37
+ }
31
38
  /**
32
39
  * TODO: [👣] Converted documents can act as cached items - there is no need to run conversion each time
33
- * TODO: [🦖] Make some system for putting scrapers to separete packages
34
40
  * TODO: [🪂] Do it in parallel 11:11
35
- * TODO: [🦷] Ideally use `as const satisfies Converter & Scraper` BUT this combination throws errors
36
41
  * Note: No need to aggregate usage here, it is done by intercepting the llmTools
42
+ * Note: [🟢] Code in this file should never be never released in packages that could be imported into browser environment
37
43
  */
@@ -0,0 +1,20 @@
1
+ import type { ExecutionTools } from '../../execution/ExecutionTools';
2
+ import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
3
+ import { DocumentScraper } from './DocumentScraper';
4
+ /**
5
+ * @@@
6
+ *
7
+ * @public exported from `@promptbook/documents`
8
+ */
9
+ export declare const createDocumentScraper: ((tools: Pick<ExecutionTools, 'llm'>, options: PrepareAndScrapeOptions) => DocumentScraper) & import("type-fest/source/readonly-deep").ReadonlyObjectDeep<{
10
+ title: string;
11
+ packageName: string;
12
+ className: string;
13
+ mimeTypes: string[];
14
+ documentationUrl: "https://github.com/webgptorg/promptbook/discussions/@@";
15
+ isAvilableInBrowser: false;
16
+ requiredExecutables: "Pandoc"[];
17
+ }>;
18
+ /**
19
+ * TODO: [🎶] Naming "constructor" vs "creator" vs "factory"
20
+ */
@@ -0,0 +1,13 @@
1
+ import type { Registration } from '../../utils/$Register';
2
+ /**
3
+ * Registration of known scraper
4
+ *
5
+ * Warning: This is not useful for the end user, it is just a side effect of the mechanism that handles all available known scrapers
6
+ *
7
+ * @public exported from `@promptbook/documents`
8
+ * @public exported from `@promptbook/cli`
9
+ */
10
+ export declare const _DocumentScraperRegistration: Registration;
11
+ /**
12
+ * TODO: [🎶] Naming "constructor" vs "creator" vs "factory"
13
+ */