@promptbook/markdown-utils 0.84.0-11 → 0.84.0-13
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/esm/index.es.js +136 -90
- package/esm/index.es.js.map +1 -1
- package/esm/typings/src/_packages/core.index.d.ts +4 -2
- package/esm/typings/src/config.d.ts +9 -1
- package/esm/typings/src/execution/FilesystemTools.d.ts +1 -1
- package/esm/typings/src/wizzard/wizzard.d.ts +7 -1
- package/package.json +1 -1
- package/umd/index.umd.js +138 -92
- package/umd/index.umd.js.map +1 -1
|
@@ -19,7 +19,8 @@ import { DEFAULT_MAX_EXECUTION_ATTEMPTS } from '../config';
|
|
|
19
19
|
import { DEFAULT_MAX_KNOWLEDGE_SOURCES_SCRAPING_DEPTH } from '../config';
|
|
20
20
|
import { DEFAULT_MAX_KNOWLEDGE_SOURCES_SCRAPING_TOTAL } from '../config';
|
|
21
21
|
import { DEFAULT_BOOKS_DIRNAME } from '../config';
|
|
22
|
-
import {
|
|
22
|
+
import { DEFAULT_DOWNLOAD_CACHE_DIRNAME } from '../config';
|
|
23
|
+
import { DEFAULT_EXECUTION_CACHE_DIRNAME } from '../config';
|
|
23
24
|
import { DEFAULT_SCRAPE_CACHE_DIRNAME } from '../config';
|
|
24
25
|
import { DEFAULT_PIPELINE_COLLECTION_BASE_FILENAME } from '../config';
|
|
25
26
|
import { DEFAULT_REMOTE_URL } from '../config';
|
|
@@ -145,7 +146,8 @@ export { DEFAULT_MAX_EXECUTION_ATTEMPTS };
|
|
|
145
146
|
export { DEFAULT_MAX_KNOWLEDGE_SOURCES_SCRAPING_DEPTH };
|
|
146
147
|
export { DEFAULT_MAX_KNOWLEDGE_SOURCES_SCRAPING_TOTAL };
|
|
147
148
|
export { DEFAULT_BOOKS_DIRNAME };
|
|
148
|
-
export {
|
|
149
|
+
export { DEFAULT_DOWNLOAD_CACHE_DIRNAME };
|
|
150
|
+
export { DEFAULT_EXECUTION_CACHE_DIRNAME };
|
|
149
151
|
export { DEFAULT_SCRAPE_CACHE_DIRNAME };
|
|
150
152
|
export { DEFAULT_PIPELINE_COLLECTION_BASE_FILENAME };
|
|
151
153
|
export { DEFAULT_REMOTE_URL };
|
|
@@ -166,6 +166,14 @@ export declare const DEFAULT_MAX_KNOWLEDGE_SOURCES_SCRAPING_TOTAL = 200;
|
|
|
166
166
|
* @public exported from `@promptbook/core`
|
|
167
167
|
*/
|
|
168
168
|
export declare const DEFAULT_BOOKS_DIRNAME = "./books";
|
|
169
|
+
/**
|
|
170
|
+
* Where to store the temporary downloads
|
|
171
|
+
*
|
|
172
|
+
* Note: When the folder does not exist, it is created recursively
|
|
173
|
+
*
|
|
174
|
+
* @public exported from `@promptbook/core`
|
|
175
|
+
*/
|
|
176
|
+
export declare const DEFAULT_DOWNLOAD_CACHE_DIRNAME = "./.promptbook/download-cache";
|
|
169
177
|
/**
|
|
170
178
|
* Where to store the cache of executions for promptbook CLI
|
|
171
179
|
*
|
|
@@ -173,7 +181,7 @@ export declare const DEFAULT_BOOKS_DIRNAME = "./books";
|
|
|
173
181
|
*
|
|
174
182
|
* @public exported from `@promptbook/core`
|
|
175
183
|
*/
|
|
176
|
-
export declare const
|
|
184
|
+
export declare const DEFAULT_EXECUTION_CACHE_DIRNAME = "./.promptbook/execution-cache";
|
|
177
185
|
/**
|
|
178
186
|
* Where to store the scrape cache
|
|
179
187
|
*
|
|
@@ -3,7 +3,7 @@ import type fs from 'fs/promises';
|
|
|
3
3
|
/**
|
|
4
4
|
* Container for all the tools needed to manipulate the filesystem
|
|
5
5
|
*/
|
|
6
|
-
export type FilesystemTools = Pick<typeof fs, 'access' | 'constants' | 'readFile' | 'writeFile' | 'stat' | 'readdir'>;
|
|
6
|
+
export type FilesystemTools = Pick<typeof fs, 'access' | 'constants' | 'readFile' | 'writeFile' | 'stat' | 'readdir' | 'mkdir'>;
|
|
7
7
|
/**
|
|
8
8
|
* TODO: Implement destroyable pattern to free resources
|
|
9
9
|
*/
|
|
@@ -6,6 +6,7 @@ import type { PipelineString } from '../pipeline/PipelineString';
|
|
|
6
6
|
import type { TaskProgress } from '../types/TaskProgress';
|
|
7
7
|
import type { InputParameters } from '../types/typeAliases';
|
|
8
8
|
import type { string_filename } from '../types/typeAliases';
|
|
9
|
+
import type { string_parameter_value } from '../types/typeAliases';
|
|
9
10
|
import type { string_pipeline_url } from '../types/typeAliases';
|
|
10
11
|
/**
|
|
11
12
|
* Wizzard for simple usage of the Promptbook
|
|
@@ -27,7 +28,12 @@ declare class Wizzard {
|
|
|
27
28
|
*
|
|
28
29
|
* Note: This works similarly to the `ptbk run` command
|
|
29
30
|
*/
|
|
30
|
-
execute(book: string_pipeline_url | string_filename | PipelineString, inputParameters: InputParameters, onProgress?: (taskProgress: TaskProgress) => Promisable<void>): Promise<
|
|
31
|
+
execute(book: string_pipeline_url | string_filename | PipelineString, inputParameters: InputParameters, onProgress?: (taskProgress: TaskProgress) => Promisable<void>): Promise<{
|
|
32
|
+
/**
|
|
33
|
+
* Simple result of the execution
|
|
34
|
+
*/
|
|
35
|
+
result: string_parameter_value;
|
|
36
|
+
} & PipelineExecutorResult>;
|
|
31
37
|
private executionTools;
|
|
32
38
|
/**
|
|
33
39
|
* Provides the tools automatically for the Node.js environment
|
package/package.json
CHANGED
package/umd/index.umd.js
CHANGED
|
@@ -1,14 +1,15 @@
|
|
|
1
1
|
(function (global, factory) {
|
|
2
|
-
typeof exports === 'object' && typeof module !== 'undefined' ? factory(exports, require('spacetrim'), require('prettier'), require('prettier/parser-html'), require('waitasecond'), require('
|
|
3
|
-
typeof define === 'function' && define.amd ? define(['exports', 'spacetrim', 'prettier', 'prettier/parser-html', 'waitasecond', '
|
|
4
|
-
(global = typeof globalThis !== 'undefined' ? globalThis : global || self, factory(global["promptbook-markdown-utils"] = {}, global.spaceTrim, global.prettier, global.parserHtml, global.waitasecond, global.
|
|
5
|
-
})(this, (function (exports, spaceTrim, prettier, parserHtml, waitasecond, path, cryptoJs,
|
|
2
|
+
typeof exports === 'object' && typeof module !== 'undefined' ? factory(exports, require('spacetrim'), require('prettier'), require('prettier/parser-html'), require('waitasecond'), require('crypto-js/enc-hex'), require('crypto-js/sha256'), require('path'), require('crypto-js'), require('mime-types'), require('papaparse')) :
|
|
3
|
+
typeof define === 'function' && define.amd ? define(['exports', 'spacetrim', 'prettier', 'prettier/parser-html', 'waitasecond', 'crypto-js/enc-hex', 'crypto-js/sha256', 'path', 'crypto-js', 'mime-types', 'papaparse'], factory) :
|
|
4
|
+
(global = typeof globalThis !== 'undefined' ? globalThis : global || self, factory(global["promptbook-markdown-utils"] = {}, global.spaceTrim, global.prettier, global.parserHtml, global.waitasecond, global.hexEncoder, global.sha256, global.path, global.cryptoJs, global.mimeTypes, global.papaparse));
|
|
5
|
+
})(this, (function (exports, spaceTrim, prettier, parserHtml, waitasecond, hexEncoder, sha256, path, cryptoJs, mimeTypes, papaparse) { 'use strict';
|
|
6
6
|
|
|
7
7
|
function _interopDefaultLegacy (e) { return e && typeof e === 'object' && 'default' in e ? e : { 'default': e }; }
|
|
8
8
|
|
|
9
9
|
var spaceTrim__default = /*#__PURE__*/_interopDefaultLegacy(spaceTrim);
|
|
10
10
|
var parserHtml__default = /*#__PURE__*/_interopDefaultLegacy(parserHtml);
|
|
11
11
|
var hexEncoder__default = /*#__PURE__*/_interopDefaultLegacy(hexEncoder);
|
|
12
|
+
var sha256__default = /*#__PURE__*/_interopDefaultLegacy(sha256);
|
|
12
13
|
|
|
13
14
|
// ⚠️ WARNING: This code has been generated so that any manual changes will be overwritten
|
|
14
15
|
/**
|
|
@@ -24,7 +25,7 @@
|
|
|
24
25
|
* @generated
|
|
25
26
|
* @see https://github.com/webgptorg/promptbook
|
|
26
27
|
*/
|
|
27
|
-
var PROMPTBOOK_ENGINE_VERSION = '0.84.0-
|
|
28
|
+
var PROMPTBOOK_ENGINE_VERSION = '0.84.0-12';
|
|
28
29
|
/**
|
|
29
30
|
* TODO: string_promptbook_version should be constrained to the all versions of Promptbook engine
|
|
30
31
|
* Note: [💞] Ignore a discrepancy between file name and entity name
|
|
@@ -810,6 +811,12 @@
|
|
|
810
811
|
* @private within the repository - too low-level in comparison with other `MAX_...`
|
|
811
812
|
*/
|
|
812
813
|
var IMMEDIATE_TIME = 10;
|
|
814
|
+
/**
|
|
815
|
+
* The maximum length of the (generated) filename
|
|
816
|
+
*
|
|
817
|
+
* @public exported from `@promptbook/core`
|
|
818
|
+
*/
|
|
819
|
+
var MAX_FILENAME_LENGTH = 30;
|
|
813
820
|
/**
|
|
814
821
|
* Strategy for caching the intermediate results for knowledge sources
|
|
815
822
|
*
|
|
@@ -829,6 +836,15 @@
|
|
|
829
836
|
* @public exported from `@promptbook/core`
|
|
830
837
|
*/
|
|
831
838
|
var DEFAULT_MAX_EXECUTION_ATTEMPTS = 3; // <- TODO: [🤹♂️]
|
|
839
|
+
// <- TODO: [🕝] Make also `BOOKS_DIRNAME_ALTERNATIVES`
|
|
840
|
+
/**
|
|
841
|
+
* Where to store the temporary downloads
|
|
842
|
+
*
|
|
843
|
+
* Note: When the folder does not exist, it is created recursively
|
|
844
|
+
*
|
|
845
|
+
* @public exported from `@promptbook/core`
|
|
846
|
+
*/
|
|
847
|
+
var DEFAULT_DOWNLOAD_CACHE_DIRNAME = './.promptbook/download-cache';
|
|
832
848
|
/**
|
|
833
849
|
* Where to store the scrape cache
|
|
834
850
|
*
|
|
@@ -3536,6 +3552,15 @@
|
|
|
3536
3552
|
* TODO: [🐱🐉][🧠] Make some smart crop NOT source-i-m-pavol-a-develop-... BUT source-i-m-pavol-a-developer-...
|
|
3537
3553
|
*/
|
|
3538
3554
|
|
|
3555
|
+
/**
|
|
3556
|
+
* Maps a name to a two-level subfolder path made of its first and second characters, lowercased
|
|
3557
|
+
*
|
|
3558
|
+
* @private for `FileCacheStorage`
|
|
3559
|
+
*/
|
|
3560
|
+
function nameToSubfolderPath(name) {
|
|
3561
|
+
return [name.substr(0, 1).toLowerCase(), name.substr(1, 1).toLowerCase()];
|
|
3562
|
+
}
|
|
3563
|
+
|
|
3539
3564
|
/**
|
|
3540
3565
|
* Convert file extension to mime type
|
|
3541
3566
|
*
|
|
@@ -3591,6 +3616,46 @@
|
|
|
3591
3616
|
* TODO: [🖇] What about symlinks?
|
|
3592
3617
|
*/
|
|
3593
3618
|
|
|
3619
|
+
/**
|
|
3620
|
+
* Removes emojis from a string (including emoji modifiers, variation selectors and ZWJ sequences)
|
|
3621
|
+
*
|
|
3622
|
+
* @param text with emojis
|
|
3623
|
+
* @returns text without emojis
|
|
3624
|
+
* @public exported from `@promptbook/utils`
|
|
3625
|
+
*/
|
|
3626
|
+
function removeEmojis(text) {
|
|
3627
|
+
// Strip emoji modifiers, variation selectors and ZWJ sequences, then remove the emojis themselves
|
|
3628
|
+
text = text.replace(/(\p{Extended_Pictographic})\p{Modifier_Symbol}/gu, '$1');
|
|
3629
|
+
text = text.replace(/(\p{Extended_Pictographic})[\u{FE00}-\u{FE0F}]/gu, '$1');
|
|
3630
|
+
text = text.replace(/(\p{Extended_Pictographic})(\u{200D}\p{Extended_Pictographic})*/gu, '$1');
|
|
3631
|
+
text = text.replace(/\p{Extended_Pictographic}/gu, '');
|
|
3632
|
+
return text;
|
|
3633
|
+
}
|
|
3634
|
+
|
|
3635
|
+
/**
|
|
3636
|
+
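* Turns a title, URL or file path into a name: strips the URL protocol and `.html` suffix or takes the file basename, replaces slashes with hyphens, removes emojis and passes the result through `normalizeToKebabCase`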
|
|
3637
|
+
*
|
|
3638
|
+
* @param value @@@
|
|
3639
|
+
* @returns @@@
|
|
3640
|
+
* @example @@@
|
|
3641
|
+
* @public exported from `@promptbook/utils`
|
|
3642
|
+
*/
|
|
3643
|
+
function titleToName(value) {
|
|
3644
|
+
if (isValidUrl(value)) {
|
|
3645
|
+
value = value.replace(/^https?:\/\//, '');
|
|
3646
|
+
value = value.replace(/\.html$/, '');
|
|
3647
|
+
}
|
|
3648
|
+
else if (isValidFilePath(value)) {
|
|
3649
|
+
value = path.basename(value);
|
|
3650
|
+
// Note: Keeping extension in the name
|
|
3651
|
+
}
|
|
3652
|
+
value = value.split('/').join('-');
|
|
3653
|
+
value = removeEmojis(value);
|
|
3654
|
+
value = normalizeToKebabCase(value);
|
|
3655
|
+
// TODO: [🧠] Maybe warn or add some padding to short name which are not good identifiers
|
|
3656
|
+
return value;
|
|
3657
|
+
}
|
|
3658
|
+
|
|
3594
3659
|
/**
|
|
3595
3660
|
* The built-in `fetch` function with a lightweight error handling wrapper as default fetch function used in Promptbook scrapers
|
|
3596
3661
|
*
|
|
@@ -3626,10 +3691,11 @@
|
|
|
3626
3691
|
function makeKnowledgeSourceHandler(knowledgeSource, tools, options) {
|
|
3627
3692
|
var _a;
|
|
3628
3693
|
return __awaiter(this, void 0, void 0, function () {
|
|
3629
|
-
var _b, fetch, knowledgeSourceContent, name, _c, _d, rootDirname, url, response_1, mimeType, filename_1, fileExtension, mimeType;
|
|
3630
|
-
return __generator(this, function (
|
|
3631
|
-
switch (
|
|
3694
|
+
var _b, fetch, knowledgeSourceContent, name, _c, _d, rootDirname, url, response_1, mimeType, basename, hash, rootDirname_1, filepath, _f, _g, _h, _j, _k, filename_1, fileExtension, mimeType;
|
|
3695
|
+
return __generator(this, function (_l) {
|
|
3696
|
+
switch (_l.label) {
|
|
3632
3697
|
case 0:
|
|
3698
|
+
console.log('!!! makeKnowledgeSourceHandler', knowledgeSource);
|
|
3633
3699
|
_b = tools.fetch, fetch = _b === void 0 ? scraperFetch : _b;
|
|
3634
3700
|
knowledgeSourceContent = knowledgeSource.knowledgeSourceContent;
|
|
3635
3701
|
name = knowledgeSource.name;
|
|
@@ -3637,54 +3703,74 @@
|
|
|
3637
3703
|
if (!name) {
|
|
3638
3704
|
name = knowledgeSourceContentToName(knowledgeSourceContent);
|
|
3639
3705
|
}
|
|
3640
|
-
if (!isValidUrl(knowledgeSourceContent)) return [3 /*break*/,
|
|
3706
|
+
if (!isValidUrl(knowledgeSourceContent)) return [3 /*break*/, 5];
|
|
3641
3707
|
url = knowledgeSourceContent;
|
|
3642
3708
|
return [4 /*yield*/, fetch(url)];
|
|
3643
3709
|
case 1:
|
|
3644
|
-
response_1 =
|
|
3710
|
+
response_1 = _l.sent();
|
|
3645
3711
|
mimeType = ((_a = response_1.headers.get('content-type')) === null || _a === void 0 ? void 0 : _a.split(';')[0]) || 'text/html';
|
|
3646
|
-
|
|
3647
|
-
|
|
3648
|
-
|
|
3649
|
-
|
|
3650
|
-
|
|
3651
|
-
|
|
3652
|
-
|
|
3653
|
-
|
|
3654
|
-
|
|
3655
|
-
|
|
3656
|
-
|
|
3657
|
-
|
|
3658
|
-
|
|
3659
|
-
|
|
3660
|
-
|
|
3661
|
-
|
|
3662
|
-
|
|
3663
|
-
|
|
3664
|
-
|
|
3665
|
-
|
|
3666
|
-
|
|
3667
|
-
|
|
3668
|
-
|
|
3712
|
+
if (tools.fs === undefined || !url.endsWith('.pdf')) {
|
|
3713
|
+
return [2 /*return*/, {
|
|
3714
|
+
source: name,
|
|
3715
|
+
filename: null,
|
|
3716
|
+
url: url,
|
|
3717
|
+
mimeType: mimeType,
|
|
3718
|
+
/*
|
|
3719
|
+
TODO: [🥽]
|
|
3720
|
+
> async asBlob() {
|
|
3721
|
+
> // TODO: [👨🏻🤝👨🏻] This can be called multiple times BUT when called second time, response in already consumed
|
|
3722
|
+
> const content = await response.blob();
|
|
3723
|
+
> return content;
|
|
3724
|
+
> },
|
|
3725
|
+
*/
|
|
3726
|
+
asJson: function () {
|
|
3727
|
+
return __awaiter(this, void 0, void 0, function () {
|
|
3728
|
+
var content;
|
|
3729
|
+
return __generator(this, function (_a) {
|
|
3730
|
+
switch (_a.label) {
|
|
3731
|
+
case 0: return [4 /*yield*/, response_1.json()];
|
|
3732
|
+
case 1:
|
|
3733
|
+
content = _a.sent();
|
|
3734
|
+
return [2 /*return*/, content];
|
|
3735
|
+
}
|
|
3736
|
+
});
|
|
3669
3737
|
});
|
|
3670
|
-
}
|
|
3671
|
-
|
|
3672
|
-
|
|
3673
|
-
|
|
3674
|
-
|
|
3675
|
-
|
|
3676
|
-
|
|
3677
|
-
|
|
3678
|
-
|
|
3679
|
-
|
|
3680
|
-
|
|
3681
|
-
}
|
|
3738
|
+
},
|
|
3739
|
+
asText: function () {
|
|
3740
|
+
return __awaiter(this, void 0, void 0, function () {
|
|
3741
|
+
var content;
|
|
3742
|
+
return __generator(this, function (_a) {
|
|
3743
|
+
switch (_a.label) {
|
|
3744
|
+
case 0: return [4 /*yield*/, response_1.text()];
|
|
3745
|
+
case 1:
|
|
3746
|
+
content = _a.sent();
|
|
3747
|
+
return [2 /*return*/, content];
|
|
3748
|
+
}
|
|
3749
|
+
});
|
|
3682
3750
|
});
|
|
3683
|
-
}
|
|
3684
|
-
}
|
|
3685
|
-
|
|
3751
|
+
},
|
|
3752
|
+
}];
|
|
3753
|
+
}
|
|
3754
|
+
basename = url.split('/').pop() || titleToName(url);
|
|
3755
|
+
hash = sha256__default["default"](hexEncoder__default["default"].parse(url)).toString( /* hex */);
|
|
3756
|
+
rootDirname_1 = path.join(process.cwd(), DEFAULT_DOWNLOAD_CACHE_DIRNAME);
|
|
3757
|
+
filepath = path.join.apply(void 0, __spreadArray(__spreadArray([], __read(nameToSubfolderPath(hash /* <- TODO: [🎎] Maybe add some SHA256 prefix */)), false), ["".concat(basename.substring(0, MAX_FILENAME_LENGTH), ".pdf")], false));
|
|
3758
|
+
return [4 /*yield*/, tools.fs.mkdir(path.dirname(path.join(rootDirname_1, filepath)), { recursive: true })];
|
|
3686
3759
|
case 2:
|
|
3687
|
-
|
|
3760
|
+
_l.sent();
|
|
3761
|
+
_g = (_f = tools.fs).writeFile;
|
|
3762
|
+
_h = [path.join(rootDirname_1, filepath)];
|
|
3763
|
+
_k = (_j = Buffer).from;
|
|
3764
|
+
return [4 /*yield*/, response_1.arrayBuffer()];
|
|
3765
|
+
case 3: return [4 /*yield*/, _g.apply(_f, _h.concat([_k.apply(_j, [_l.sent()])]))];
|
|
3766
|
+
case 4:
|
|
3767
|
+
_l.sent();
|
|
3768
|
+
// TODO: !!!!!!!! Check the file security
|
|
3769
|
+
// TODO: !!!!!!!! Check the file size (if it is not too big)
|
|
3770
|
+
// TODO: !!!!!!!! Delete the file
|
|
3771
|
+
return [2 /*return*/, makeKnowledgeSourceHandler({ name: name, knowledgeSourceContent: filepath }, tools, __assign(__assign({}, options), { rootDirname: rootDirname_1 }))];
|
|
3772
|
+
case 5:
|
|
3773
|
+
if (!isValidFilePath(knowledgeSourceContent)) return [3 /*break*/, 7];
|
|
3688
3774
|
if (tools.fs === undefined) {
|
|
3689
3775
|
throw new EnvironmentMismatchError('Can not import file knowledge without filesystem tools');
|
|
3690
3776
|
// <- TODO: [🧠] What is the best error type here?
|
|
@@ -3697,8 +3783,8 @@
|
|
|
3697
3783
|
fileExtension = getFileExtension(filename_1);
|
|
3698
3784
|
mimeType = extensionToMimeType(fileExtension || '');
|
|
3699
3785
|
return [4 /*yield*/, isFileExisting(filename_1, tools.fs)];
|
|
3700
|
-
case
|
|
3701
|
-
if (!(
|
|
3786
|
+
case 6:
|
|
3787
|
+
if (!(_l.sent())) {
|
|
3702
3788
|
throw new NotFoundError(spaceTrim__default["default"](function (block) { return "\n Can not make source handler for file which does not exist:\n\n File:\n ".concat(block(knowledgeSourceContent), "\n\n Full file path:\n ").concat(block(filename_1), "\n "); }));
|
|
3703
3789
|
}
|
|
3704
3790
|
// TODO: [🧠][😿] Test security file - file is scoped to the project (BUT maybe do this in `filesystemTools`)
|
|
@@ -3744,7 +3830,7 @@
|
|
|
3744
3830
|
});
|
|
3745
3831
|
},
|
|
3746
3832
|
}];
|
|
3747
|
-
case
|
|
3833
|
+
case 7: return [2 /*return*/, {
|
|
3748
3834
|
source: name,
|
|
3749
3835
|
filename: null,
|
|
3750
3836
|
url: null,
|
|
@@ -5974,46 +6060,6 @@
|
|
|
5974
6060
|
* TODO: [🐚] Change onProgress to object that represents the running execution, can be subscribed via RxJS to and also awaited
|
|
5975
6061
|
*/
|
|
5976
6062
|
|
|
5977
|
-
/**
|
|
5978
|
-
* Removes emojis from a string and fix whitespaces
|
|
5979
|
-
*
|
|
5980
|
-
* @param text with emojis
|
|
5981
|
-
* @returns text without emojis
|
|
5982
|
-
* @public exported from `@promptbook/utils`
|
|
5983
|
-
*/
|
|
5984
|
-
function removeEmojis(text) {
|
|
5985
|
-
// Replace emojis (and also ZWJ sequence) with hyphens
|
|
5986
|
-
text = text.replace(/(\p{Extended_Pictographic})\p{Modifier_Symbol}/gu, '$1');
|
|
5987
|
-
text = text.replace(/(\p{Extended_Pictographic})[\u{FE00}-\u{FE0F}]/gu, '$1');
|
|
5988
|
-
text = text.replace(/(\p{Extended_Pictographic})(\u{200D}\p{Extended_Pictographic})*/gu, '$1');
|
|
5989
|
-
text = text.replace(/\p{Extended_Pictographic}/gu, '');
|
|
5990
|
-
return text;
|
|
5991
|
-
}
|
|
5992
|
-
|
|
5993
|
-
/**
|
|
5994
|
-
* @@@
|
|
5995
|
-
*
|
|
5996
|
-
* @param value @@@
|
|
5997
|
-
* @returns @@@
|
|
5998
|
-
* @example @@@
|
|
5999
|
-
* @public exported from `@promptbook/utils`
|
|
6000
|
-
*/
|
|
6001
|
-
function titleToName(value) {
|
|
6002
|
-
if (isValidUrl(value)) {
|
|
6003
|
-
value = value.replace(/^https?:\/\//, '');
|
|
6004
|
-
value = value.replace(/\.html$/, '');
|
|
6005
|
-
}
|
|
6006
|
-
else if (isValidFilePath(value)) {
|
|
6007
|
-
value = path.basename(value);
|
|
6008
|
-
// Note: Keeping extension in the name
|
|
6009
|
-
}
|
|
6010
|
-
value = value.split('/').join('-');
|
|
6011
|
-
value = removeEmojis(value);
|
|
6012
|
-
value = normalizeToKebabCase(value);
|
|
6013
|
-
// TODO: [🧠] Maybe warn or add some padding to short name which are not good identifiers
|
|
6014
|
-
return value;
|
|
6015
|
-
}
|
|
6016
|
-
|
|
6017
6063
|
/**
|
|
6018
6064
|
* Metadata of the scraper
|
|
6019
6065
|
*
|