@promptbook/cli 0.72.0-5 → 0.72.0-7
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +6 -0
- package/esm/index.es.js +2554 -1370
- package/esm/index.es.js.map +1 -1
- package/esm/typings/src/_packages/browser.index.d.ts +1 -1
- package/esm/typings/src/_packages/core.index.d.ts +24 -10
- package/esm/typings/src/_packages/node.index.d.ts +6 -2
- package/esm/typings/src/_packages/types.index.d.ts +28 -20
- package/esm/typings/src/cli/cli-commands/about.d.ts +1 -1
- package/esm/typings/src/cli/cli-commands/hello.d.ts +2 -1
- package/esm/typings/src/cli/cli-commands/make.d.ts +1 -1
- package/esm/typings/src/cli/cli-commands/prettify.d.ts +2 -1
- package/esm/typings/src/cli/cli-commands/test-command.d.ts +13 -0
- package/esm/typings/src/cli/main.d.ts +1 -1
- package/esm/typings/src/cli/promptbookCli.d.ts +1 -1
- package/esm/typings/src/collection/constructors/createCollectionFromDirectory.d.ts +8 -5
- package/esm/typings/src/commands/EXPECT/expectCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/FOREACH/foreachCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/FORMAT/formatCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/JOKER/jokerCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/KNOWLEDGE/knowledgeCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/KNOWLEDGE/utils/sourceContentToName.d.ts +11 -0
- package/esm/typings/src/commands/KNOWLEDGE/utils/sourceContentToName.test.d.ts +4 -0
- package/esm/typings/src/commands/MODEL/modelCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/PARAMETER/parameterCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/PERSONA/personaCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/POSTPROCESS/postprocessCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/PROMPTBOOK_VERSION/promptbookVersionCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/TEMPLATE/templateCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/URL/urlCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/X_ACTION/actionCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/X_INSTRUMENT/instrumentCommandParser.d.ts +1 -1
- package/esm/typings/src/commands/_BOILERPLATE/boilerplateCommandParser.d.ts +1 -1
- package/esm/typings/src/config.d.ts +10 -0
- package/esm/typings/src/conversion/pipelineStringToJson.d.ts +2 -15
- package/esm/typings/src/conversion/validation/_importPipeline.d.ts +1 -1
- package/esm/typings/src/conversion/validation/validatePipeline.d.ts +5 -5
- package/esm/typings/src/{knowledge/dialogs → dialogs}/callback/CallbackInterfaceTools.d.ts +2 -2
- package/esm/typings/src/{knowledge/dialogs → dialogs}/callback/CallbackInterfaceToolsOptions.d.ts +2 -2
- package/esm/typings/src/{knowledge/dialogs → dialogs}/simple-prompt/SimplePromptInterfaceTools.d.ts +4 -4
- package/esm/typings/src/errors/KnowledgeScrapeError.d.ts +9 -0
- package/esm/typings/src/errors/MissingToolsError.d.ts +9 -0
- package/esm/typings/src/execution/ExecutionTools.d.ts +3 -3
- package/esm/typings/src/execution/createPipelineExecutor/00-CreatePipelineExecutorOptions.d.ts +5 -2
- package/esm/typings/src/execution/createPipelineExecutor/00-CreatePipelineExecutorSettings.d.ts +2 -13
- package/esm/typings/src/execution/createPipelineExecutor/00-createPipelineExecutor.d.ts +1 -1
- package/esm/typings/src/execution/createPipelineExecutor/10-executePipeline.d.ts +1 -1
- package/esm/typings/src/execution/translation/automatic-translate/translateMessages.d.ts +3 -0
- package/esm/typings/src/execution/utils/forEachAsync.d.ts +1 -0
- package/esm/typings/src/llm-providers/_common/createLlmToolsFromConfigurationFromEnv.d.ts +1 -1
- package/esm/typings/src/llm-providers/_common/createLlmToolsFromEnv.d.ts +1 -1
- package/esm/typings/src/llm-providers/_common/getLlmToolsForCli.d.ts +1 -1
- package/esm/typings/src/llm-providers/anthropic-claude/playground/playground.d.ts +1 -0
- package/esm/typings/src/llm-providers/azure-openai/AzureOpenAiExecutionTools.d.ts +6 -0
- package/esm/typings/src/llm-providers/azure-openai/playground/playground.d.ts +1 -0
- package/esm/typings/src/llm-providers/langtail/playground/playground.d.ts +3 -0
- package/esm/typings/src/llm-providers/multiple/playground/playground.d.ts +3 -0
- package/esm/typings/src/llm-providers/openai/playground/playground.d.ts +1 -0
- package/esm/typings/src/llm-providers/remote/playground/playground.d.ts +3 -0
- package/esm/typings/src/personas/preparePersona.d.ts +2 -2
- package/esm/typings/src/prepare/PrepareAndScrapeOptions.d.ts +67 -0
- package/esm/typings/src/prepare/preparePipeline.d.ts +2 -2
- package/esm/typings/src/prepare/prepareTemplates.d.ts +2 -2
- package/esm/typings/src/scrapers/_common/Converter.d.ts +28 -0
- package/esm/typings/src/scrapers/_common/Scraper.d.ts +71 -0
- package/esm/typings/src/scrapers/_common/ScraperIntermediateSource.d.ts +11 -0
- package/esm/typings/src/{knowledge/prepare-knowledge → scrapers}/_common/prepareKnowledgePieces.d.ts +4 -4
- package/esm/typings/src/scrapers/_common/utils/getScraperIntermediateSource.d.ts +33 -0
- package/esm/typings/src/scrapers/_common/utils/getScraperIntermediateSource.test.d.ts +4 -0
- package/esm/typings/src/scrapers/_common/utils/makeKnowledgeSourceHandler.d.ts +10 -0
- package/esm/typings/src/scrapers/document/documentScraper.d.ts +37 -0
- package/esm/typings/src/scrapers/document/documentScraper.test.d.ts +4 -0
- package/esm/typings/src/scrapers/document/playground/document-scraper-playground.d.ts +5 -0
- package/esm/typings/src/scrapers/document-legacy/legacyDocumentScraper.d.ts +37 -0
- package/esm/typings/src/scrapers/document-legacy/legacyDocumentScraper.test.d.ts +4 -0
- package/esm/typings/src/scrapers/document-legacy/playground/legacy-document-scraper-playground.d.ts +5 -0
- package/esm/typings/src/scrapers/index.d.ts +7 -0
- package/esm/typings/src/scrapers/markdown/markdownScraper.d.ts +29 -0
- package/esm/typings/src/scrapers/markdown/playground/markdown-scraper-playground.d.ts +5 -0
- package/esm/typings/src/scrapers/pdf/pdfScraper.d.ts +35 -0
- package/esm/typings/src/scrapers/pdf/playground/pdf-scraper-playground.d.ts +5 -0
- package/esm/typings/src/scrapers/website/playground/website-scraper-playground.d.ts +5 -0
- package/esm/typings/src/scrapers/website/utils/markdownConverter.d.ts +12 -0
- package/esm/typings/src/scrapers/website/websiteScraper.d.ts +43 -0
- package/esm/typings/src/storage/{files-storage/FilesStorage.d.ts → file-cache-storage/FileCacheStorage.d.ts} +5 -5
- package/esm/typings/src/storage/file-cache-storage/FileCacheStorageOptions.d.ts +10 -0
- package/esm/typings/src/storage/{files-storage → file-cache-storage}/utils/nameToSubfolderPath.d.ts +1 -1
- package/esm/typings/src/storage/file-cache-storage/utils/nameToSubfolderPath.test.d.ts +1 -0
- package/esm/typings/src/storage/local-storage/getLocalStorage.d.ts +1 -1
- package/esm/typings/src/storage/local-storage/getSessionStorage.d.ts +1 -1
- package/esm/typings/src/types/PipelineJson/KnowledgeSourceJson.d.ts +9 -2
- package/esm/typings/src/types/PipelineJson/PipelineJson.d.ts +2 -2
- package/esm/typings/src/types/typeAliases.d.ts +8 -11
- package/esm/typings/src/utils/execCommand/$execCommand.d.ts +14 -0
- package/esm/typings/src/utils/execCommand/$execCommands.d.ts +17 -0
- package/esm/typings/src/utils/execCommand/IExecCommandOptions.d.ts +23 -0
- package/esm/typings/src/utils/execCommand/execCommand.test.d.ts +1 -0
- package/esm/typings/src/utils/execCommand/execCommandNormalizeOptions.d.ts +10 -0
- package/esm/typings/src/utils/execCommand/execCommandNormalizeOptions.test.d.ts +1 -0
- package/esm/typings/src/utils/files/$isDirectoryExisting.d.ts +3 -3
- package/esm/typings/src/utils/files/$isFileExisting.d.ts +3 -3
- package/esm/typings/src/utils/files/$listAllFiles.d.ts +5 -4
- package/esm/typings/src/utils/files/extensionToMimeType.d.ts +8 -0
- package/esm/typings/src/utils/files/extensionToMimeType.test.d.ts +1 -0
- package/esm/typings/src/utils/files/getFileExtension.d.ts +8 -0
- package/esm/typings/src/utils/files/getFileExtension.test.d.ts +1 -0
- package/esm/typings/src/utils/validators/filePath/isValidFilePath.d.ts +2 -2
- package/package.json +5 -1
- package/umd/index.umd.js +2552 -1373
- package/umd/index.umd.js.map +1 -1
- package/esm/typings/src/knowledge/prepare-knowledge/_common/Scraper.d.ts +0 -37
- package/esm/typings/src/knowledge/prepare-knowledge/markdown/playground/markdown-knowledge-playground.d.ts +0 -2
- package/esm/typings/src/knowledge/prepare-knowledge/markdown/prepareKnowledgeFromMarkdown.d.ts +0 -14
- package/esm/typings/src/knowledge/prepare-knowledge/pdf/prepareKnowledgeFromPdf.d.ts +0 -15
- package/esm/typings/src/prepare/PrepareOptions.d.ts +0 -22
- package/esm/typings/src/storage/files-storage/FilesStorageOptions.d.ts +0 -10
- /package/esm/typings/src/{knowledge/dialogs → dialogs}/user-interface-execution-tools.test.d.ts +0 -0
- /package/esm/typings/src/{knowledge/prepare-knowledge → scrapers}/_common/prepareKnowledgePieces.test.d.ts +0 -0
- /package/esm/typings/src/{knowledge/prepare-knowledge/markdown/prepareKnowledgeFromMarkdown.test.d.ts → scrapers/markdown/markdownScraper.test.d.ts} +0 -0
- /package/esm/typings/src/{knowledge/prepare-knowledge/pdf/prepareKnowledgeFromPdf.test.d.ts → scrapers/website/utils/markdownConverter.test.d.ts} +0 -0
- /package/esm/typings/src/{storage/files-storage/utils/nameToSubfolderPath.test.d.ts → scrapers/website/websiteScraper.test.d.ts} +0 -0
package/esm/typings/src/{knowledge/dialogs → dialogs}/callback/CallbackInterfaceToolsOptions.d.ts
RENAMED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
import type { Promisable } from 'type-fest';
|
|
2
|
-
import type { CommonExecutionToolsOptions } from '
|
|
3
|
-
import type { UserInterfaceToolsPromptDialogOptions } from '
|
|
2
|
+
import type { CommonExecutionToolsOptions } from '../../execution/CommonExecutionToolsOptions';
|
|
3
|
+
import type { UserInterfaceToolsPromptDialogOptions } from '../../execution/UserInterfaceTools';
|
|
4
4
|
/**
|
|
5
5
|
* Options for `CallbackInterfaceTools`
|
|
6
6
|
*
|
package/esm/typings/src/{knowledge/dialogs → dialogs}/simple-prompt/SimplePromptInterfaceTools.d.ts
RENAMED
|
@@ -1,6 +1,6 @@
|
|
|
1
|
-
import type { CommonExecutionToolsOptions } from '
|
|
2
|
-
import type { UserInterfaceTools } from '
|
|
3
|
-
import type { UserInterfaceToolsPromptDialogOptions } from '
|
|
1
|
+
import type { CommonExecutionToolsOptions } from '../../execution/CommonExecutionToolsOptions';
|
|
2
|
+
import type { UserInterfaceTools } from '../../execution/UserInterfaceTools';
|
|
3
|
+
import type { UserInterfaceToolsPromptDialogOptions } from '../../execution/UserInterfaceTools';
|
|
4
4
|
/**
|
|
5
5
|
* Wrapper around `window.prompt` synchronous function that interacts with the user via browser prompt
|
|
6
6
|
*
|
|
@@ -18,5 +18,5 @@ export declare class SimplePromptInterfaceTools implements UserInterfaceTools {
|
|
|
18
18
|
promptDialog(options: UserInterfaceToolsPromptDialogOptions): Promise<string>;
|
|
19
19
|
}
|
|
20
20
|
/**
|
|
21
|
-
* Note: [🔵]
|
|
21
|
+
* Note: [🔵] Code in this file should never be published outside of `@promptbook/browser`
|
|
22
22
|
*/
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* This error indicates that the promptbook can not retrieve knowledge from external sources
|
|
3
|
+
*
|
|
4
|
+
* @public exported from `@promptbook/core`
|
|
5
|
+
*/
|
|
6
|
+
export declare class KnowledgeScrapeError extends Error {
|
|
7
|
+
readonly name = "KnowledgeScrapeError";
|
|
8
|
+
constructor(message: string);
|
|
9
|
+
}
|
|
@@ -0,0 +1,9 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* This error type indicates that some tools are missing for pipeline execution or preparation
|
|
3
|
+
*
|
|
4
|
+
* @public exported from `@promptbook/core`
|
|
5
|
+
*/
|
|
6
|
+
export declare class MissingToolsError extends Error {
|
|
7
|
+
readonly name = "MissingToolsError";
|
|
8
|
+
constructor(message: string);
|
|
9
|
+
}
|
|
@@ -14,7 +14,7 @@ export type ExecutionTools = {
|
|
|
14
14
|
* Tip: Use `createLlmToolsFromEnv()` to use all available LLM providers you configured
|
|
15
15
|
* @see https://github.com/webgptorg/promptbook/?tab=readme-ov-file#llm-execution-tools
|
|
16
16
|
*/
|
|
17
|
-
llm?: Arrayable<LlmExecutionTools>;
|
|
17
|
+
readonly llm?: Arrayable<LlmExecutionTools>;
|
|
18
18
|
/**
|
|
19
19
|
* Tools for executing scripts
|
|
20
20
|
*
|
|
@@ -25,12 +25,12 @@ export type ExecutionTools = {
|
|
|
25
25
|
* @see https://github.com/webgptorg/promptbook/?tab=readme-ov-file#script-execution-tools
|
|
26
26
|
* @default [] - If not provided, no script execution will be possible
|
|
27
27
|
*/
|
|
28
|
-
script?: Arrayable<ScriptExecutionTools>;
|
|
28
|
+
readonly script?: Arrayable<ScriptExecutionTools>;
|
|
29
29
|
/**
|
|
30
30
|
* Tools for interacting with the user
|
|
31
31
|
*
|
|
32
32
|
* Note: When undefined, the user interface is disabled and promptbook which requires user interaction will fail
|
|
33
33
|
* @see https://github.com/webgptorg/promptbook/?tab=readme-ov-file#user-interface-tools
|
|
34
34
|
*/
|
|
35
|
-
userInterface?: UserInterfaceTools;
|
|
35
|
+
readonly userInterface?: UserInterfaceTools;
|
|
36
36
|
};
|
package/esm/typings/src/execution/createPipelineExecutor/00-CreatePipelineExecutorOptions.d.ts
CHANGED
|
@@ -4,7 +4,7 @@ import type { CreatePipelineExecutorSettings } from './00-CreatePipelineExecutor
|
|
|
4
4
|
/**
|
|
5
5
|
* Options for `createPipelineExecutor`
|
|
6
6
|
*/
|
|
7
|
-
export
|
|
7
|
+
export type CreatePipelineExecutorOptions = {
|
|
8
8
|
/**
|
|
9
9
|
* The pipeline to be executed
|
|
10
10
|
*/
|
|
@@ -17,4 +17,7 @@ export interface CreatePipelineExecutorOptions {
|
|
|
17
17
|
* Optional settings for the pipeline executor
|
|
18
18
|
*/
|
|
19
19
|
readonly settings?: Partial<CreatePipelineExecutorSettings>;
|
|
20
|
-
}
|
|
20
|
+
};
|
|
21
|
+
/**
|
|
22
|
+
* TODO: !!!!!! Unite `CreatePipelineExecutorOptions` and `CreatePipelineExecutorSettings` OR describe the difference
|
|
23
|
+
*/
|
package/esm/typings/src/execution/createPipelineExecutor/00-CreatePipelineExecutorSettings.d.ts
CHANGED
|
@@ -1,23 +1,12 @@
|
|
|
1
1
|
import type { CsvSettings } from '../../formats/csv/CsvSettings';
|
|
2
|
-
|
|
2
|
+
import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
|
|
3
|
+
export type CreatePipelineExecutorSettings = Omit<PrepareAndScrapeOptions, 'llmTools'> & {
|
|
3
4
|
/**
|
|
4
5
|
* When executor does not satisfy expectations it will be retried this amount of times
|
|
5
6
|
*
|
|
6
7
|
* @default MAX_EXECUTION_ATTEMPTS
|
|
7
8
|
*/
|
|
8
9
|
readonly maxExecutionAttempts: number;
|
|
9
|
-
/**
|
|
10
|
-
* Maximum number of tasks running in parallel
|
|
11
|
-
*
|
|
12
|
-
* @default MAX_PARALLEL_COUNT
|
|
13
|
-
*/
|
|
14
|
-
readonly maxParallelCount: number;
|
|
15
|
-
/**
|
|
16
|
-
* If true, the preparation logs additional information
|
|
17
|
-
*
|
|
18
|
-
* @default false
|
|
19
|
-
*/
|
|
20
|
-
readonly isVerbose: boolean;
|
|
21
10
|
/**
|
|
22
11
|
* Settings for CSV format
|
|
23
12
|
*
|
|
@@ -10,4 +10,4 @@ import type { CreatePipelineExecutorOptions } from './00-CreatePipelineExecutorO
|
|
|
10
10
|
export declare function createPipelineExecutor(options: CreatePipelineExecutorOptions): PipelineExecutor;
|
|
11
11
|
/**
|
|
12
12
|
* TODO: [🐚] Change onProgress to object that represents the running execution, can be subscribed via RxJS to and also awaited
|
|
13
|
-
*/
|
|
13
|
+
*/
|
|
@@ -6,3 +6,6 @@ import type { TranslatorOptions } from './automatic-translators/TranslatorOption
|
|
|
6
6
|
export declare function translateMessages({ automaticTranslator, from, to, }: {
|
|
7
7
|
automaticTranslator: AutomaticTranslator;
|
|
8
8
|
} & TranslatorOptions): Promise<void>;
|
|
9
|
+
/**
|
|
10
|
+
* TODO: [😶] Unite floder listing
|
|
11
|
+
*/
|
|
@@ -14,6 +14,7 @@ type ForEachAsyncOptions = {
|
|
|
14
14
|
* @param options - Options for the function
|
|
15
15
|
* @param callbackfunction - Function to call for each item
|
|
16
16
|
* @public exported from `@promptbook/utils`
|
|
17
|
+
* @deprecated [🪂] Use queues instead
|
|
17
18
|
*/
|
|
18
19
|
export declare function forEachAsync<TItem>(array: Array<TItem>, options: ForEachAsyncOptions, callbackfunction: (value: TItem, index: number, array: Array<TItem>) => Promisable<void>): Promise<void>;
|
|
19
20
|
export {};
|
|
@@ -17,7 +17,7 @@ export declare function createLlmToolsFromConfigurationFromEnv(): LlmToolsConfig
|
|
|
17
17
|
* TODO: Add Azure OpenAI
|
|
18
18
|
* TODO: [🧠][🍛]
|
|
19
19
|
* TODO: [🧠] Is there some meaningfull way how to test this util
|
|
20
|
-
* Note: [🟢]
|
|
20
|
+
* Note: [🟢] Code in this file should never be published outside of `@promptbook/node` and `@promptbook/cli`
|
|
21
21
|
* TODO: [👷♂️] @@@ Manual about construction of llmTools
|
|
22
22
|
* TODO: This should be maybe not under `_common` but under `utils`
|
|
23
23
|
* TODO: [🧠] Maybe pass env as argument
|
|
@@ -19,7 +19,7 @@ export declare function createLlmToolsFromEnv(options?: CreateLlmToolsFromConfig
|
|
|
19
19
|
* TODO: @@@ write `createLlmToolsFromEnv` vs `createLlmToolsFromConfigurationFromEnv` vs `createLlmToolsFromConfiguration`
|
|
20
20
|
* TODO: [🧠][🍛] Which name is better `createLlmToolsFromEnv` or `createLlmToolsFromEnvironment`?
|
|
21
21
|
* TODO: [🧠] Is there some meaningfull way how to test this util
|
|
22
|
-
* Note: [🟢]
|
|
22
|
+
* Note: [🟢] Code in this file should never be published outside of `@promptbook/node` and `@promptbook/cli`
|
|
23
23
|
* TODO: [🥃] Allow `ptbk make` without llm tools
|
|
24
24
|
* TODO: This should be maybe not under `_common` but under `utils`
|
|
25
25
|
*/
|
|
@@ -15,7 +15,7 @@ type GetLlmToolsForCliOptions = {
|
|
|
15
15
|
export declare function getLlmToolsForCli(options?: GetLlmToolsForCliOptions): LlmExecutionToolsWithTotalUsage;
|
|
16
16
|
export {};
|
|
17
17
|
/**
|
|
18
|
-
* Note: [🟡]
|
|
18
|
+
* Note: [🟡] Code in this file should never be published outside of `@promptbook/cli`
|
|
19
19
|
* TODO: [👷♂️] @@@ Manual about construction of llmTools
|
|
20
20
|
* TODO: [🥃] Allow `ptbk make` without llm tools
|
|
21
21
|
* TODO: This should be maybe not under `_common` but under `utils-internal` / `utils/internal`
|
|
@@ -3,4 +3,5 @@ export {};
|
|
|
3
3
|
/**
|
|
4
4
|
* TODO: [main] !!! Playground with WebGPT / Promptbook.studio anonymous server
|
|
5
5
|
* TODO: [main] !!! Test here that `systemMessage`, `temperature` and `seed` are working correctly
|
|
6
|
+
* Note: [⚫] Code in this file should never be published in any package
|
|
6
7
|
*/
|
|
@@ -44,6 +44,12 @@ export declare class AzureOpenAiExecutionTools implements LlmExecutionTools {
|
|
|
44
44
|
* Calls Azure OpenAI API to use a complete model.
|
|
45
45
|
*/
|
|
46
46
|
callCompletionModel(prompt: Pick<Prompt, 'content' | 'parameters' | 'modelRequirements'>): Promise<CompletionPromptResult>;
|
|
47
|
+
/**
|
|
48
|
+
* Library `@azure/openai` has bug/weird behavior that it does not throw error but hangs forever
|
|
49
|
+
*
|
|
50
|
+
* This method wraps the promise with timeout
|
|
51
|
+
*/
|
|
52
|
+
private withTimeout;
|
|
47
53
|
/**
|
|
48
54
|
* Changes Azure error (which is not propper Error but object) to propper Error
|
|
49
55
|
*/
|
|
@@ -1,4 +1,4 @@
|
|
|
1
|
-
import type {
|
|
1
|
+
import type { PrepareAndScrapeOptions } from '../prepare/PrepareAndScrapeOptions';
|
|
2
2
|
import type { PersonaPreparedJson } from '../types/PipelineJson/PersonaJson';
|
|
3
3
|
import type { string_persona_description } from '../types/typeAliases';
|
|
4
4
|
/**
|
|
@@ -7,7 +7,7 @@ import type { string_persona_description } from '../types/typeAliases';
|
|
|
7
7
|
* @see https://github.com/webgptorg/promptbook/discussions/22
|
|
8
8
|
* @public exported from `@promptbook/core`
|
|
9
9
|
*/
|
|
10
|
-
export declare function preparePersona(personaDescription: string_persona_description, options:
|
|
10
|
+
export declare function preparePersona(personaDescription: string_persona_description, options: PrepareAndScrapeOptions): Promise<PersonaPreparedJson['modelRequirements']>;
|
|
11
11
|
/**
|
|
12
12
|
* TODO: [🔃][main] !!!!! If the persona was prepared with different version or different set of models, prepare it once again
|
|
13
13
|
* TODO: [🏢] !! Check validity of `modelName` in pipeline
|
|
@@ -0,0 +1,67 @@
|
|
|
1
|
+
import type { LlmExecutionTools } from '../execution/LlmExecutionTools';
|
|
2
|
+
import type { string_dirname } from '../types/typeAliases';
|
|
3
|
+
/**
|
|
4
|
+
* Options for preparation of the pipeline
|
|
5
|
+
*/
|
|
6
|
+
export type PrepareAndScrapeOptions = {
|
|
7
|
+
/**
|
|
8
|
+
* LLM tools
|
|
9
|
+
*/
|
|
10
|
+
readonly llmTools?: LlmExecutionTools;
|
|
11
|
+
/**
|
|
12
|
+
* Path to the root folder of the pipeline
|
|
13
|
+
*
|
|
14
|
+
* Note: When the pipeline is not created from files, it is `null`
|
|
15
|
+
* Note: This folder must exist
|
|
16
|
+
*/
|
|
17
|
+
readonly rootDirname: string_dirname | null;
|
|
18
|
+
/**
|
|
19
|
+
* Path to the cache folder
|
|
20
|
+
*
|
|
21
|
+
* Note: When the folder does not exist, it is created recursively
|
|
22
|
+
*
|
|
23
|
+
* @default SCRAPE_CACHE_DIRNAME
|
|
24
|
+
*/
|
|
25
|
+
readonly cacheDirname?: string_dirname;
|
|
26
|
+
/**
|
|
27
|
+
* If true, the cache is cleaned after the scraping
|
|
28
|
+
*
|
|
29
|
+
*
|
|
30
|
+
* @default false // <- TODO: !!!!!! Change to `cacheStrategy`/`intermediateFiles`, Put to global config, change to `true` and explicitly set to `false` in all playgrounds
|
|
31
|
+
*/
|
|
32
|
+
readonly isCacheCleaned?: boolean;
|
|
33
|
+
/**
|
|
34
|
+
* Maximum number of tasks running in parallel
|
|
35
|
+
*
|
|
36
|
+
* @default MAX_PARALLEL_COUNT
|
|
37
|
+
*/
|
|
38
|
+
readonly maxParallelCount?: number;
|
|
39
|
+
/**
|
|
40
|
+
* Path to the external programs executables
|
|
41
|
+
*
|
|
42
|
+
* TODO: !!!!!! Transform to scrapers and make them Classy
|
|
43
|
+
*/
|
|
44
|
+
readonly externalProgramsPaths?: {
|
|
45
|
+
/**
|
|
46
|
+
* Path to the `pandoc` executable
|
|
47
|
+
*
|
|
48
|
+
* @example 'C:/Users/me/AppData/Local/Pandoc/pandoc.exe'
|
|
49
|
+
*/
|
|
50
|
+
readonly pandocPath?: string;
|
|
51
|
+
/**
|
|
52
|
+
* Path to the LibreOffice executable
|
|
53
|
+
*
|
|
54
|
+
* @example 'C:/Program Files/LibreOffice/program/swriter.exe'
|
|
55
|
+
*/
|
|
56
|
+
readonly libreOfficePath?: string;
|
|
57
|
+
};
|
|
58
|
+
/**
|
|
59
|
+
* If true, the preparation logs additional information
|
|
60
|
+
*
|
|
61
|
+
* @default false
|
|
62
|
+
*/
|
|
63
|
+
readonly isVerbose?: boolean;
|
|
64
|
+
};
|
|
65
|
+
/**
|
|
66
|
+
* TODO: [🧠] Maybe split `PrepareAndScrapeOptions` and `ScrapeOptions` (`ScrapeOptions` should be extended from `PrepareAndScrapeOptions`)
|
|
67
|
+
*/
|
|
@@ -1,5 +1,5 @@
|
|
|
1
1
|
import type { PipelineJson } from '../types/PipelineJson/PipelineJson';
|
|
2
|
-
import type {
|
|
2
|
+
import type { PrepareAndScrapeOptions } from './PrepareAndScrapeOptions';
|
|
3
3
|
/**
|
|
4
4
|
* Prepare pipeline from string (markdown) format to JSON format
|
|
5
5
|
*
|
|
@@ -8,7 +8,7 @@ import type { PrepareOptions } from './PrepareOptions';
|
|
|
8
8
|
* Note: When the pipeline is already prepared, it returns the same pipeline
|
|
9
9
|
* @public exported from `@promptbook/core`
|
|
10
10
|
*/
|
|
11
|
-
export declare function preparePipeline(pipeline: PipelineJson, options:
|
|
11
|
+
export declare function preparePipeline(pipeline: PipelineJson, options: PrepareAndScrapeOptions): Promise<PipelineJson>;
|
|
12
12
|
/**
|
|
13
13
|
* TODO: Write tests for `preparePipeline`
|
|
14
14
|
* TODO: [🏏] Leverage the batch API and build queues @see https://platform.openai.com/docs/guides/batch
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
import type { PipelineJson } from '../types/PipelineJson/PipelineJson';
|
|
2
2
|
import type { TemplateJson } from '../types/PipelineJson/TemplateJson';
|
|
3
|
-
import type {
|
|
3
|
+
import type { PrepareAndScrapeOptions } from './PrepareAndScrapeOptions';
|
|
4
4
|
type PrepareTemplateInput = Pick<PipelineJson, 'templates' | 'parameters'> & {
|
|
5
5
|
/**
|
|
6
6
|
* @@@
|
|
@@ -18,7 +18,7 @@ type PreparedTemplates = {
|
|
|
18
18
|
*
|
|
19
19
|
* @public exported from `@promptbook/core`
|
|
20
20
|
*/
|
|
21
|
-
export declare function prepareTemplates(pipeline: PrepareTemplateInput, options:
|
|
21
|
+
export declare function prepareTemplates(pipeline: PrepareTemplateInput, options: PrepareAndScrapeOptions): Promise<PreparedTemplates>;
|
|
22
22
|
export {};
|
|
23
23
|
/**
|
|
24
24
|
* TODO: [🧠] Add context to each template (if missing)
|
|
@@ -0,0 +1,28 @@
|
|
|
1
|
+
import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
|
|
2
|
+
import type { string_mime_type } from '../../types/typeAliases';
|
|
3
|
+
import type { string_promptbook_documentation_url } from '../../types/typeAliases';
|
|
4
|
+
import type { ScraperSourceHandler } from './Scraper';
|
|
5
|
+
import type { ScraperIntermediateSource } from './ScraperIntermediateSource';
|
|
6
|
+
/**
|
|
7
|
+
* @@@
|
|
8
|
+
*
|
|
9
|
+
*/
|
|
10
|
+
export type Converter = {
|
|
11
|
+
/**
|
|
12
|
+
* Mime types that this scraper can handle
|
|
13
|
+
*/
|
|
14
|
+
readonly mimeTypes: Array<string_mime_type>;
|
|
15
|
+
/**
|
|
16
|
+
* Link to documentation
|
|
17
|
+
*/
|
|
18
|
+
readonly documentationUrl: string_promptbook_documentation_url;
|
|
19
|
+
/**
|
|
20
|
+
* Convert the the file and returns intermediate source or `null` if it can't convert it
|
|
21
|
+
*
|
|
22
|
+
* For example, convert a `.docx` to `.doc` file
|
|
23
|
+
* Or convert a `.pdf` to `.md` file
|
|
24
|
+
*
|
|
25
|
+
* Note: `$` is used to indicate that this function is not a pure function - it leaves files on the disk and you are responsible for cleaning them by calling `destroy` method of returned object
|
|
26
|
+
*/
|
|
27
|
+
$convert(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<ScraperIntermediateSource>;
|
|
28
|
+
};
|
|
@@ -0,0 +1,71 @@
|
|
|
1
|
+
import type { Promisable } from 'type-fest';
|
|
2
|
+
import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
|
|
3
|
+
import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
|
|
4
|
+
import type { string_filename } from '../../types/typeAliases';
|
|
5
|
+
import type { string_knowledge_source_link } from '../../types/typeAliases';
|
|
6
|
+
import type { string_mime_type } from '../../types/typeAliases';
|
|
7
|
+
import type { string_promptbook_documentation_url } from '../../types/typeAliases';
|
|
8
|
+
import type { string_url } from '../../types/typeAliases';
|
|
9
|
+
/**
|
|
10
|
+
* @@@
|
|
11
|
+
*
|
|
12
|
+
*/
|
|
13
|
+
export type Scraper = {
|
|
14
|
+
/**
|
|
15
|
+
* Mime types that this scraper can handle
|
|
16
|
+
*/
|
|
17
|
+
readonly mimeTypes: Array<string_mime_type>;
|
|
18
|
+
/**
|
|
19
|
+
* Link to documentation
|
|
20
|
+
*/
|
|
21
|
+
readonly documentationUrl: string_promptbook_documentation_url;
|
|
22
|
+
/**
|
|
23
|
+
* Scrapes the markdown file and returns the knowledge pieces or `null` if it can't scrape it
|
|
24
|
+
*/
|
|
25
|
+
scrape(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promisable<Array<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
|
|
26
|
+
};
|
|
27
|
+
/**
|
|
28
|
+
* @@@
|
|
29
|
+
*/
|
|
30
|
+
export type ScraperSourceHandler = {
|
|
31
|
+
/**
|
|
32
|
+
* The source of the knowledge
|
|
33
|
+
*/
|
|
34
|
+
readonly source: string_knowledge_source_link;
|
|
35
|
+
/**
|
|
36
|
+
* The path to the file, if it is a file
|
|
37
|
+
*
|
|
38
|
+
* Note: Typically one of the `filename` or `url` is set and the other is `null`
|
|
39
|
+
*/
|
|
40
|
+
readonly filename: string_filename | null;
|
|
41
|
+
/**
|
|
42
|
+
* The URL, if it is online
|
|
43
|
+
*
|
|
44
|
+
* Note: Typically one of the `filename` or `url` is set and the other is `null`
|
|
45
|
+
*/
|
|
46
|
+
readonly url: string_url | null;
|
|
47
|
+
/**
|
|
48
|
+
* Mime type of the source
|
|
49
|
+
*/
|
|
50
|
+
readonly mimeType: string_mime_type;
|
|
51
|
+
/**
|
|
52
|
+
* Get the content as parsed JSON
|
|
53
|
+
*/
|
|
54
|
+
asJson(): Promisable<unknown>;
|
|
55
|
+
/**
|
|
56
|
+
* Get the content as a utf-8 string
|
|
57
|
+
*/
|
|
58
|
+
asText(): Promisable<string>;
|
|
59
|
+
/**
|
|
60
|
+
* Get the content as a blob
|
|
61
|
+
*/
|
|
62
|
+
asBlob(): Promisable<Blob>;
|
|
63
|
+
};
|
|
64
|
+
/**
|
|
65
|
+
* TODO: [🐝] @@@ Annotate all
|
|
66
|
+
* TODO: [🔼] Export via types
|
|
67
|
+
*/
|
|
68
|
+
/**
|
|
69
|
+
* TODO: !!!!!! Test that this is catched
|
|
70
|
+
* Note: [⚫] Code in this file should never be published in any package
|
|
71
|
+
*/
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
import type { IDestroyable } from 'destroyable';
|
|
2
|
+
import type { string_absolute_filename } from '../../types/typeAliases';
|
|
3
|
+
/**
|
|
4
|
+
* @@@
|
|
5
|
+
*/
|
|
6
|
+
export type ScraperIntermediateSource = IDestroyable & {
|
|
7
|
+
/**
|
|
8
|
+
* @@@
|
|
9
|
+
*/
|
|
10
|
+
readonly filename: string_absolute_filename;
|
|
11
|
+
};
|
package/esm/typings/src/{knowledge/prepare-knowledge → scrapers}/_common/prepareKnowledgePieces.d.ts
RENAMED
|
@@ -1,13 +1,13 @@
|
|
|
1
|
-
import type {
|
|
2
|
-
import type { KnowledgePiecePreparedJson } from '
|
|
3
|
-
import type { KnowledgeSourceJson } from '
|
|
1
|
+
import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
|
|
2
|
+
import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
|
|
3
|
+
import type { KnowledgeSourceJson } from '../../types/PipelineJson/KnowledgeSourceJson';
|
|
4
4
|
/**
|
|
5
5
|
* Prepares the knowle
|
|
6
6
|
*
|
|
7
7
|
* @see https://github.com/webgptorg/promptbook/discussions/41
|
|
8
8
|
* @public exported from `@promptbook/core`
|
|
9
9
|
*/
|
|
10
|
-
export declare function prepareKnowledgePieces(knowledgeSources: Array<KnowledgeSourceJson>, options:
|
|
10
|
+
export declare function prepareKnowledgePieces(knowledgeSources: Array<KnowledgeSourceJson>, options: PrepareAndScrapeOptions): Promise<Array<Omit<KnowledgePiecePreparedJson, 'preparationIds'>>>;
|
|
11
11
|
/**
|
|
12
12
|
* TODO: [🧊] In future one preparation can take data from previous preparation and save tokens and time
|
|
13
13
|
* Put `knowledgePieces` into `PrepareKnowledgeOptions`
|
|
@@ -0,0 +1,33 @@
|
|
|
1
|
+
import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
|
|
2
|
+
import type { string_file_extension } from '../../../types/typeAliases';
|
|
3
|
+
import type { ScraperSourceHandler } from '../Scraper';
|
|
4
|
+
import type { ScraperIntermediateSource } from '../ScraperIntermediateSource';
|
|
5
|
+
/**
|
|
6
|
+
* @@@
|
|
7
|
+
*
|
|
8
|
+
* @private internal utility of `getScraperIntermediateSource`
|
|
9
|
+
*/
|
|
10
|
+
type GetScraperIntermediateSourceSource = Pick<ScraperSourceHandler, 'filename' | 'url'>;
|
|
11
|
+
/**
|
|
12
|
+
* @@@
|
|
13
|
+
*
|
|
14
|
+
* @private internal utility of `getScraperIntermediateSource`
|
|
15
|
+
*/
|
|
16
|
+
type GetScraperIntermediateSourceHandler = Required<Pick<PrepareAndScrapeOptions, 'rootDirname' | 'cacheDirname' | 'isCacheCleaned' | 'isVerbose'>> & {
|
|
17
|
+
readonly extension: string_file_extension;
|
|
18
|
+
};
|
|
19
|
+
/**
|
|
20
|
+
* Create a filename for intermediate cache for scrapers
|
|
21
|
+
*
|
|
22
|
+
* Note: It also checks if directory exists and creates it if not
|
|
23
|
+
*
|
|
24
|
+
* @private as internal utility for scrapers
|
|
25
|
+
*/
|
|
26
|
+
export declare function getScraperIntermediateSource(source: GetScraperIntermediateSourceSource, options: GetScraperIntermediateSourceHandler): Promise<ScraperIntermediateSource>;
|
|
27
|
+
export {};
|
|
28
|
+
/**
|
|
29
|
+
* Note: Not using `FileCacheStorage` for two reasons:
|
|
30
|
+
* 1) Need to store more than serialized JSONs
|
|
31
|
+
* 2) Need to switch between a `rootDirname` and `cacheDirname` <- TODO: !!!!
|
|
32
|
+
* TODO: [🐱🐉][🧠] Make some smart crop
|
|
33
|
+
*/
|
|
@@ -0,0 +1,10 @@
|
|
|
1
|
+
import type { SetOptional } from 'type-fest';
|
|
2
|
+
import type { PrepareAndScrapeOptions } from '../../../prepare/PrepareAndScrapeOptions';
|
|
3
|
+
import type { KnowledgeSourceJson } from '../../../types/PipelineJson/KnowledgeSourceJson';
|
|
4
|
+
import type { ScraperSourceHandler } from '../Scraper';
|
|
5
|
+
/**
|
|
6
|
+
* @@@
|
|
7
|
+
*
|
|
8
|
+
* @private for scraper utilities
|
|
9
|
+
*/
|
|
10
|
+
export declare function makeKnowledgeSourceHandler(knowledgeSource: SetOptional<KnowledgeSourceJson, 'name'>, options?: Pick<PrepareAndScrapeOptions, 'rootDirname' | 'isVerbose'>): Promise<ScraperSourceHandler>;
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
|
|
2
|
+
import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
|
|
3
|
+
import type { ScraperSourceHandler } from '../_common/Scraper';
|
|
4
|
+
import type { ScraperIntermediateSource } from '../_common/ScraperIntermediateSource';
|
|
5
|
+
/**
|
|
6
|
+
* Scraper of .docx and .odt files
|
|
7
|
+
*
|
|
8
|
+
* @see `documentationUrl` for more details
|
|
9
|
+
* @public exported from `@promptbook/core`
|
|
10
|
+
*/
|
|
11
|
+
export declare const documentScraper: {
|
|
12
|
+
/**
|
|
13
|
+
* Mime types that this scraper can handle
|
|
14
|
+
*/
|
|
15
|
+
mimeTypes: string[];
|
|
16
|
+
/**
|
|
17
|
+
* Link to documentation
|
|
18
|
+
*/
|
|
19
|
+
documentationUrl: "https://github.com/webgptorg/promptbook/discussions/@@";
|
|
20
|
+
/**
|
|
21
|
+
* Convert the `.docx` or `.odt` to `.md` file and returns intermediate source
|
|
22
|
+
*
|
|
23
|
+
* Note: `$` is used to indicate that this function is not a pure function - it leaves files on the disk and you are responsible for cleaning them by calling `destroy` method of returned object
|
|
24
|
+
*/
|
|
25
|
+
$convert(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<ScraperIntermediateSource>;
|
|
26
|
+
/**
|
|
27
|
+
* Scrapes the docx file and returns the knowledge pieces or `null` if it can't scrape it
|
|
28
|
+
*/
|
|
29
|
+
scrape(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<Array<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
|
|
30
|
+
};
|
|
31
|
+
/**
|
|
32
|
+
* TODO: [👣] Converted documents can act as cached items - there is no need to run conversion each time
|
|
33
|
+
* TODO: [🦖] Make some system for putting scrapers to separete packages
|
|
34
|
+
* TODO: [🪂] Do it in parallel 11:11
|
|
35
|
+
* TODO: [🦷] Ideally use `as const satisfies Converter & Scraper` BUT this combination throws errors
|
|
36
|
+
* Note: No need to aggregate usage here, it is done by intercepting the llmTools
|
|
37
|
+
*/
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
import type { PrepareAndScrapeOptions } from '../../prepare/PrepareAndScrapeOptions';
|
|
2
|
+
import type { KnowledgePiecePreparedJson } from '../../types/PipelineJson/KnowledgePieceJson';
|
|
3
|
+
import type { ScraperSourceHandler } from '../_common/Scraper';
|
|
4
|
+
import type { ScraperIntermediateSource } from '../_common/ScraperIntermediateSource';
|
|
5
|
+
/**
|
|
6
|
+
* Scraper for .docx files
|
|
7
|
+
*
|
|
8
|
+
* @see `documentationUrl` for more details
|
|
9
|
+
* @public exported from `@promptbook/core`
|
|
10
|
+
*/
|
|
11
|
+
export declare const legacyDocumentScraper: {
|
|
12
|
+
/**
|
|
13
|
+
* Mime types that this scraper can handle
|
|
14
|
+
*/
|
|
15
|
+
mimeTypes: string[];
|
|
16
|
+
/**
|
|
17
|
+
* Link to documentation
|
|
18
|
+
*/
|
|
19
|
+
documentationUrl: "https://github.com/webgptorg/promptbook/discussions/@@";
|
|
20
|
+
/**
|
|
21
|
+
* Convert the `.doc` or `.rtf` to `.doc` file and returns intermediate source
|
|
22
|
+
*
|
|
23
|
+
* Note: `$` is used to indicate that this function is not a pure function - it leaves files on the disk and you are responsible for cleaning them by calling `destroy` method of returned object
|
|
24
|
+
*/
|
|
25
|
+
$convert(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<ScraperIntermediateSource>;
|
|
26
|
+
/**
|
|
27
|
+
* Scrapes the `.doc` or `.rtf` file and returns the knowledge pieces or `null` if it can't scrape it
|
|
28
|
+
*/
|
|
29
|
+
scrape(source: ScraperSourceHandler, options: PrepareAndScrapeOptions): Promise<Array<Omit<KnowledgePiecePreparedJson, 'sources' | 'preparationIds'>> | null>;
|
|
30
|
+
};
|
|
31
|
+
/**
|
|
32
|
+
* TODO: [👣] Converted documents can act as cached items - there is no need to run conversion each time
|
|
33
|
+
* TODO: [🦖] Make some system for putting scrapers to separete packages
|
|
34
|
+
* TODO: [🪂] Do it in parallel 11:11
|
|
35
|
+
* TODO: [🦷] Ideally use `as const satisfies Converter & Scraper` BUT this combination throws errors
|
|
36
|
+
* Note: No need to aggregate usage here, it is done by intercepting the llmTools
|
|
37
|
+
*/
|