marlarky 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +489 -0
- package/dist/adapters/faker-js-adapter.d.ts +44 -0
- package/dist/adapters/faker-js-adapter.d.ts.map +1 -0
- package/dist/adapters/faker-js-adapter.js +46 -0
- package/dist/adapters/faker-js-adapter.js.map +1 -0
- package/dist/adapters/index.d.ts +3 -0
- package/dist/adapters/index.d.ts.map +1 -0
- package/dist/adapters/index.js +3 -0
- package/dist/adapters/index.js.map +1 -0
- package/dist/adapters/simple-faker-adapter.d.ts +22 -0
- package/dist/adapters/simple-faker-adapter.d.ts.map +1 -0
- package/dist/adapters/simple-faker-adapter.js +54 -0
- package/dist/adapters/simple-faker-adapter.js.map +1 -0
- package/dist/cli.d.ts +7 -0
- package/dist/cli.d.ts.map +1 -0
- package/dist/cli.js +588 -0
- package/dist/cli.js.map +1 -0
- package/dist/defaults/index.d.ts +2 -0
- package/dist/defaults/index.d.ts.map +1 -0
- package/dist/defaults/index.js +2 -0
- package/dist/defaults/index.js.map +1 -0
- package/dist/defaults/word-lists.d.ts +22 -0
- package/dist/defaults/word-lists.d.ts.map +1 -0
- package/dist/defaults/word-lists.js +124 -0
- package/dist/defaults/word-lists.js.map +1 -0
- package/dist/generator/index.d.ts +2 -0
- package/dist/generator/index.d.ts.map +1 -0
- package/dist/generator/index.js +2 -0
- package/dist/generator/index.js.map +1 -0
- package/dist/generator/text-generator.d.ts +93 -0
- package/dist/generator/text-generator.d.ts.map +1 -0
- package/dist/generator/text-generator.js +411 -0
- package/dist/generator/text-generator.js.map +1 -0
- package/dist/generator/text-generator.test.d.ts +2 -0
- package/dist/generator/text-generator.test.d.ts.map +1 -0
- package/dist/generator/text-generator.test.js +151 -0
- package/dist/generator/text-generator.test.js.map +1 -0
- package/dist/grammar/index.d.ts +5 -0
- package/dist/grammar/index.d.ts.map +1 -0
- package/dist/grammar/index.js +3 -0
- package/dist/grammar/index.js.map +1 -0
- package/dist/grammar/phrase-builders.d.ts +72 -0
- package/dist/grammar/phrase-builders.d.ts.map +1 -0
- package/dist/grammar/phrase-builders.js +241 -0
- package/dist/grammar/phrase-builders.js.map +1 -0
- package/dist/grammar/sentence-templates.d.ts +67 -0
- package/dist/grammar/sentence-templates.d.ts.map +1 -0
- package/dist/grammar/sentence-templates.js +272 -0
- package/dist/grammar/sentence-templates.js.map +1 -0
- package/dist/index.d.ts +17 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +40 -0
- package/dist/index.js.map +1 -0
- package/dist/interfaces/faker-adapter.d.ts +25 -0
- package/dist/interfaces/faker-adapter.d.ts.map +1 -0
- package/dist/interfaces/faker-adapter.js +2 -0
- package/dist/interfaces/faker-adapter.js.map +1 -0
- package/dist/interfaces/index.d.ts +4 -0
- package/dist/interfaces/index.d.ts.map +1 -0
- package/dist/interfaces/index.js +2 -0
- package/dist/interfaces/index.js.map +1 -0
- package/dist/interfaces/lexicon-store.d.ts +39 -0
- package/dist/interfaces/lexicon-store.d.ts.map +1 -0
- package/dist/interfaces/lexicon-store.js +2 -0
- package/dist/interfaces/lexicon-store.js.map +1 -0
- package/dist/interfaces/rng.d.ts +25 -0
- package/dist/interfaces/rng.d.ts.map +1 -0
- package/dist/interfaces/rng.js +2 -0
- package/dist/interfaces/rng.js.map +1 -0
- package/dist/lexicon/index.d.ts +4 -0
- package/dist/lexicon/index.d.ts.map +1 -0
- package/dist/lexicon/index.js +4 -0
- package/dist/lexicon/index.js.map +1 -0
- package/dist/lexicon/loader.d.ts +24 -0
- package/dist/lexicon/loader.d.ts.map +1 -0
- package/dist/lexicon/loader.js +47 -0
- package/dist/lexicon/loader.js.map +1 -0
- package/dist/lexicon/store.d.ts +39 -0
- package/dist/lexicon/store.d.ts.map +1 -0
- package/dist/lexicon/store.js +291 -0
- package/dist/lexicon/store.js.map +1 -0
- package/dist/lexicon/validator.d.ts +10 -0
- package/dist/lexicon/validator.d.ts.map +1 -0
- package/dist/lexicon/validator.js +273 -0
- package/dist/lexicon/validator.js.map +1 -0
- package/dist/morphology/articles.d.ts +17 -0
- package/dist/morphology/articles.d.ts.map +1 -0
- package/dist/morphology/articles.js +66 -0
- package/dist/morphology/articles.js.map +1 -0
- package/dist/morphology/articles.test.d.ts +2 -0
- package/dist/morphology/articles.test.d.ts.map +1 -0
- package/dist/morphology/articles.test.js +56 -0
- package/dist/morphology/articles.test.js.map +1 -0
- package/dist/morphology/conjugate.d.ts +46 -0
- package/dist/morphology/conjugate.d.ts.map +1 -0
- package/dist/morphology/conjugate.js +337 -0
- package/dist/morphology/conjugate.js.map +1 -0
- package/dist/morphology/conjugate.test.d.ts +2 -0
- package/dist/morphology/conjugate.test.d.ts.map +1 -0
- package/dist/morphology/conjugate.test.js +168 -0
- package/dist/morphology/conjugate.test.js.map +1 -0
- package/dist/morphology/index.d.ts +6 -0
- package/dist/morphology/index.d.ts.map +1 -0
- package/dist/morphology/index.js +9 -0
- package/dist/morphology/index.js.map +1 -0
- package/dist/morphology/normalize.d.ts +52 -0
- package/dist/morphology/normalize.d.ts.map +1 -0
- package/dist/morphology/normalize.js +127 -0
- package/dist/morphology/normalize.js.map +1 -0
- package/dist/morphology/pluralize.d.ts +17 -0
- package/dist/morphology/pluralize.d.ts.map +1 -0
- package/dist/morphology/pluralize.js +186 -0
- package/dist/morphology/pluralize.js.map +1 -0
- package/dist/morphology/pluralize.test.d.ts +2 -0
- package/dist/morphology/pluralize.test.d.ts.map +1 -0
- package/dist/morphology/pluralize.test.js +86 -0
- package/dist/morphology/pluralize.test.js.map +1 -0
- package/dist/providers/index.d.ts +2 -0
- package/dist/providers/index.d.ts.map +1 -0
- package/dist/providers/index.js +2 -0
- package/dist/providers/index.js.map +1 -0
- package/dist/providers/word-provider.d.ts +125 -0
- package/dist/providers/word-provider.d.ts.map +1 -0
- package/dist/providers/word-provider.js +266 -0
- package/dist/providers/word-provider.js.map +1 -0
- package/dist/rng/index.d.ts +2 -0
- package/dist/rng/index.d.ts.map +1 -0
- package/dist/rng/index.js +2 -0
- package/dist/rng/index.js.map +1 -0
- package/dist/rng/seedable-rng.d.ts +19 -0
- package/dist/rng/seedable-rng.d.ts.map +1 -0
- package/dist/rng/seedable-rng.js +77 -0
- package/dist/rng/seedable-rng.js.map +1 -0
- package/dist/rng/seedable-rng.test.d.ts +2 -0
- package/dist/rng/seedable-rng.test.d.ts.map +1 -0
- package/dist/rng/seedable-rng.test.js +165 -0
- package/dist/rng/seedable-rng.test.js.map +1 -0
- package/dist/rules/index.d.ts +3 -0
- package/dist/rules/index.d.ts.map +1 -0
- package/dist/rules/index.js +2 -0
- package/dist/rules/index.js.map +1 -0
- package/dist/rules/rule-engine.d.ts +78 -0
- package/dist/rules/rule-engine.d.ts.map +1 -0
- package/dist/rules/rule-engine.js +271 -0
- package/dist/rules/rule-engine.js.map +1 -0
- package/dist/transforms/config-merge.d.ts +19 -0
- package/dist/transforms/config-merge.d.ts.map +1 -0
- package/dist/transforms/config-merge.js +88 -0
- package/dist/transforms/config-merge.js.map +1 -0
- package/dist/transforms/config-merge.test.d.ts +2 -0
- package/dist/transforms/config-merge.test.d.ts.map +1 -0
- package/dist/transforms/config-merge.test.js +91 -0
- package/dist/transforms/config-merge.test.js.map +1 -0
- package/dist/transforms/default-registry.d.ts +10 -0
- package/dist/transforms/default-registry.d.ts.map +1 -0
- package/dist/transforms/default-registry.js +17 -0
- package/dist/transforms/default-registry.js.map +1 -0
- package/dist/transforms/index.d.ts +15 -0
- package/dist/transforms/index.d.ts.map +1 -0
- package/dist/transforms/index.js +20 -0
- package/dist/transforms/index.js.map +1 -0
- package/dist/transforms/pipeline.d.ts +28 -0
- package/dist/transforms/pipeline.d.ts.map +1 -0
- package/dist/transforms/pipeline.js +176 -0
- package/dist/transforms/pipeline.js.map +1 -0
- package/dist/transforms/pipeline.test.d.ts +2 -0
- package/dist/transforms/pipeline.test.d.ts.map +1 -0
- package/dist/transforms/pipeline.test.js +175 -0
- package/dist/transforms/pipeline.test.js.map +1 -0
- package/dist/transforms/protection.d.ts +16 -0
- package/dist/transforms/protection.d.ts.map +1 -0
- package/dist/transforms/protection.js +97 -0
- package/dist/transforms/protection.js.map +1 -0
- package/dist/transforms/protection.test.d.ts +2 -0
- package/dist/transforms/protection.test.d.ts.map +1 -0
- package/dist/transforms/protection.test.js +79 -0
- package/dist/transforms/protection.test.js.map +1 -0
- package/dist/transforms/registry.d.ts +25 -0
- package/dist/transforms/registry.d.ts.map +1 -0
- package/dist/transforms/registry.js +32 -0
- package/dist/transforms/registry.js.map +1 -0
- package/dist/transforms/registry.test.d.ts +2 -0
- package/dist/transforms/registry.test.d.ts.map +1 -0
- package/dist/transforms/registry.test.js +64 -0
- package/dist/transforms/registry.test.js.map +1 -0
- package/dist/transforms/tokenizer.d.ts +26 -0
- package/dist/transforms/tokenizer.d.ts.map +1 -0
- package/dist/transforms/tokenizer.js +137 -0
- package/dist/transforms/tokenizer.js.map +1 -0
- package/dist/transforms/tokenizer.test.d.ts +2 -0
- package/dist/transforms/tokenizer.test.d.ts.map +1 -0
- package/dist/transforms/tokenizer.test.js +85 -0
- package/dist/transforms/tokenizer.test.js.map +1 -0
- package/dist/transforms/transforms/biz-jargon.d.ts +7 -0
- package/dist/transforms/transforms/biz-jargon.d.ts.map +1 -0
- package/dist/transforms/transforms/biz-jargon.js +117 -0
- package/dist/transforms/transforms/biz-jargon.js.map +1 -0
- package/dist/transforms/transforms/emoji.d.ts +7 -0
- package/dist/transforms/transforms/emoji.d.ts.map +1 -0
- package/dist/transforms/transforms/emoji.js +127 -0
- package/dist/transforms/transforms/emoji.js.map +1 -0
- package/dist/transforms/transforms/index.d.ts +17 -0
- package/dist/transforms/transforms/index.d.ts.map +1 -0
- package/dist/transforms/transforms/index.js +37 -0
- package/dist/transforms/transforms/index.js.map +1 -0
- package/dist/transforms/transforms/leet.d.ts +7 -0
- package/dist/transforms/transforms/leet.d.ts.map +1 -0
- package/dist/transforms/transforms/leet.js +109 -0
- package/dist/transforms/transforms/leet.js.map +1 -0
- package/dist/transforms/transforms/mock-case.d.ts +7 -0
- package/dist/transforms/transforms/mock-case.d.ts.map +1 -0
- package/dist/transforms/transforms/mock-case.js +116 -0
- package/dist/transforms/transforms/mock-case.js.map +1 -0
- package/dist/transforms/transforms/pig-latin.d.ts +7 -0
- package/dist/transforms/transforms/pig-latin.d.ts.map +1 -0
- package/dist/transforms/transforms/pig-latin.js +132 -0
- package/dist/transforms/transforms/pig-latin.js.map +1 -0
- package/dist/transforms/transforms/pig-latin.test.d.ts +2 -0
- package/dist/transforms/transforms/pig-latin.test.d.ts.map +1 -0
- package/dist/transforms/transforms/pig-latin.test.js +77 -0
- package/dist/transforms/transforms/pig-latin.test.js.map +1 -0
- package/dist/transforms/transforms/pirate.d.ts +7 -0
- package/dist/transforms/transforms/pirate.d.ts.map +1 -0
- package/dist/transforms/transforms/pirate.js +150 -0
- package/dist/transforms/transforms/pirate.js.map +1 -0
- package/dist/transforms/transforms/redact.d.ts +7 -0
- package/dist/transforms/transforms/redact.d.ts.map +1 -0
- package/dist/transforms/transforms/redact.js +109 -0
- package/dist/transforms/transforms/redact.js.map +1 -0
- package/dist/transforms/transforms/reverse-words.d.ts +7 -0
- package/dist/transforms/transforms/reverse-words.d.ts.map +1 -0
- package/dist/transforms/transforms/reverse-words.js +88 -0
- package/dist/transforms/transforms/reverse-words.js.map +1 -0
- package/dist/transforms/transforms/transforms.test.d.ts +11 -0
- package/dist/transforms/transforms/transforms.test.d.ts.map +1 -0
- package/dist/transforms/transforms/transforms.test.js +489 -0
- package/dist/transforms/transforms/transforms.test.js.map +1 -0
- package/dist/transforms/transforms/ubbi-dubbi.d.ts +7 -0
- package/dist/transforms/transforms/ubbi-dubbi.d.ts.map +1 -0
- package/dist/transforms/transforms/ubbi-dubbi.js +120 -0
- package/dist/transforms/transforms/ubbi-dubbi.js.map +1 -0
- package/dist/transforms/transforms/uwu.d.ts +7 -0
- package/dist/transforms/transforms/uwu.d.ts.map +1 -0
- package/dist/transforms/transforms/uwu.js +106 -0
- package/dist/transforms/transforms/uwu.js.map +1 -0
- package/dist/transforms/types.d.ts +159 -0
- package/dist/transforms/types.d.ts.map +1 -0
- package/dist/transforms/types.js +22 -0
- package/dist/transforms/types.js.map +1 -0
- package/dist/types/api.d.ts +158 -0
- package/dist/types/api.d.ts.map +1 -0
- package/dist/types/api.js +6 -0
- package/dist/types/api.js.map +1 -0
- package/dist/types/config.d.ts +86 -0
- package/dist/types/config.d.ts.map +1 -0
- package/dist/types/config.js +66 -0
- package/dist/types/config.js.map +1 -0
- package/dist/types/context.d.ts +74 -0
- package/dist/types/context.d.ts.map +1 -0
- package/dist/types/context.js +83 -0
- package/dist/types/context.js.map +1 -0
- package/dist/types/index.d.ts +7 -0
- package/dist/types/index.d.ts.map +1 -0
- package/dist/types/index.js +3 -0
- package/dist/types/index.js.map +1 -0
- package/dist/types/lexicon.d.ts +247 -0
- package/dist/types/lexicon.d.ts.map +1 -0
- package/dist/types/lexicon.js +6 -0
- package/dist/types/lexicon.js.map +1 -0
- package/examples/basic-usage.ts +48 -0
- package/examples/corporate-lexicon.ts +71 -0
- package/examples/lexicons/corporate-min.json +200 -0
- package/examples/with-tracing.ts +85 -0
- package/package.json +70 -0
|
@@ -0,0 +1,137 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Output Transform Tokenizer & Renderer
|
|
3
|
+
* Single-pass O(n) tokenizer that preserves exact whitespace and punctuation.
|
|
4
|
+
* Re-rendering via render() is lossless.
|
|
5
|
+
*/
|
|
6
|
+
/** Punctuation characters recognized as their own tokens */
|
|
7
|
+
const PUNCTUATION_CHARS = new Set([
|
|
8
|
+
'.', ',', ';', ':', '!', '?', "'", '"',
|
|
9
|
+
'(', ')', '[', ']', '{', '}',
|
|
10
|
+
'\u2026', // …
|
|
11
|
+
'\u2014', // —
|
|
12
|
+
'-',
|
|
13
|
+
]);
|
|
14
|
+
/** Check if a character is a letter (ASCII A-Z, a-z) */
|
|
15
|
+
function isLetter(ch) {
|
|
16
|
+
const c = ch.charCodeAt(0);
|
|
17
|
+
return (c >= 65 && c <= 90) || (c >= 97 && c <= 122);
|
|
18
|
+
}
|
|
19
|
+
/** Check if a character is a digit */
|
|
20
|
+
function isDigit(ch) {
|
|
21
|
+
const c = ch.charCodeAt(0);
|
|
22
|
+
return c >= 48 && c <= 57;
|
|
23
|
+
}
|
|
24
|
+
/** Check if a character is whitespace */
|
|
25
|
+
function isWhitespace(ch) {
|
|
26
|
+
return ch === ' ' || ch === '\t' || ch === '\n' || ch === '\r';
|
|
27
|
+
}
|
|
28
|
+
/**
|
|
29
|
+
* Tokenize a string into Token[] in a single pass.
|
|
30
|
+
*
|
|
31
|
+
* Token types:
|
|
32
|
+
* - word: sequences of ASCII letters, may include internal apostrophes (e.g., "don't")
|
|
33
|
+
* - number: digits with optional decimals/percent (e.g., "12", "3.14", "60%")
|
|
34
|
+
* - punct: individual punctuation characters
|
|
35
|
+
* - whitespace: sequences of whitespace characters
|
|
36
|
+
* - symbol: anything else
|
|
37
|
+
*/
|
|
38
|
+
export function tokenize(input) {
|
|
39
|
+
const tokens = [];
|
|
40
|
+
const len = input.length;
|
|
41
|
+
let i = 0;
|
|
42
|
+
while (i < len) {
|
|
43
|
+
const ch = input[i];
|
|
44
|
+
// Whitespace token
|
|
45
|
+
if (isWhitespace(ch)) {
|
|
46
|
+
const start = i;
|
|
47
|
+
while (i < len && isWhitespace(input[i])) {
|
|
48
|
+
i++;
|
|
49
|
+
}
|
|
50
|
+
tokens.push({ type: 'whitespace', value: input.slice(start, i) });
|
|
51
|
+
continue;
|
|
52
|
+
}
|
|
53
|
+
// Word token: starts with letter
|
|
54
|
+
if (isLetter(ch)) {
|
|
55
|
+
const start = i;
|
|
56
|
+
i++;
|
|
57
|
+
while (i < len) {
|
|
58
|
+
const c = input[i];
|
|
59
|
+
if (isLetter(c)) {
|
|
60
|
+
i++;
|
|
61
|
+
}
|
|
62
|
+
else if (c === "'" && i + 1 < len && isLetter(input[i + 1])) {
|
|
63
|
+
// Internal apostrophe (e.g., "don't", "manager's")
|
|
64
|
+
i += 2; // skip apostrophe + next letter
|
|
65
|
+
}
|
|
66
|
+
else {
|
|
67
|
+
break;
|
|
68
|
+
}
|
|
69
|
+
}
|
|
70
|
+
tokens.push({ type: 'word', value: input.slice(start, i) });
|
|
71
|
+
continue;
|
|
72
|
+
}
|
|
73
|
+
// Number token: starts with digit
|
|
74
|
+
if (isDigit(ch)) {
|
|
75
|
+
const start = i;
|
|
76
|
+
i++;
|
|
77
|
+
while (i < len && isDigit(input[i])) {
|
|
78
|
+
i++;
|
|
79
|
+
}
|
|
80
|
+
// Optional decimal
|
|
81
|
+
if (i < len && input[i] === '.' && i + 1 < len && isDigit(input[i + 1])) {
|
|
82
|
+
i++; // skip '.'
|
|
83
|
+
while (i < len && isDigit(input[i])) {
|
|
84
|
+
i++;
|
|
85
|
+
}
|
|
86
|
+
}
|
|
87
|
+
// Optional percent
|
|
88
|
+
if (i < len && input[i] === '%') {
|
|
89
|
+
i++;
|
|
90
|
+
}
|
|
91
|
+
tokens.push({ type: 'number', value: input.slice(start, i) });
|
|
92
|
+
continue;
|
|
93
|
+
}
|
|
94
|
+
// Punctuation token
|
|
95
|
+
if (PUNCTUATION_CHARS.has(ch)) {
|
|
96
|
+
// Handle multi-char ellipsis "..."
|
|
97
|
+
if (ch === '.' && i + 2 < len && input[i + 1] === '.' && input[i + 2] === '.') {
|
|
98
|
+
tokens.push({ type: 'punct', value: '...' });
|
|
99
|
+
i += 3;
|
|
100
|
+
}
|
|
101
|
+
else {
|
|
102
|
+
tokens.push({ type: 'punct', value: ch });
|
|
103
|
+
i++;
|
|
104
|
+
}
|
|
105
|
+
continue;
|
|
106
|
+
}
|
|
107
|
+
// Symbol token: anything else, one character at a time
|
|
108
|
+
tokens.push({ type: 'symbol', value: ch });
|
|
109
|
+
i++;
|
|
110
|
+
}
|
|
111
|
+
return tokens;
|
|
112
|
+
}
|
|
113
|
+
/**
|
|
114
|
+
* Render tokens back to a string. Lossless: render(tokenize(s)) === s
|
|
115
|
+
*/
|
|
116
|
+
export function render(tokens) {
|
|
117
|
+
let result = '';
|
|
118
|
+
for (const token of tokens) {
|
|
119
|
+
result += token.value;
|
|
120
|
+
}
|
|
121
|
+
return result;
|
|
122
|
+
}
|
|
123
|
+
/**
|
|
124
|
+
* Get the type classification of a single character (utility).
|
|
125
|
+
*/
|
|
126
|
+
export function classifyChar(ch) {
|
|
127
|
+
if (isWhitespace(ch))
|
|
128
|
+
return 'whitespace';
|
|
129
|
+
if (isLetter(ch))
|
|
130
|
+
return 'word';
|
|
131
|
+
if (isDigit(ch))
|
|
132
|
+
return 'number';
|
|
133
|
+
if (PUNCTUATION_CHARS.has(ch))
|
|
134
|
+
return 'punct';
|
|
135
|
+
return 'symbol';
|
|
136
|
+
}
|
|
137
|
+
//# sourceMappingURL=tokenizer.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tokenizer.js","sourceRoot":"","sources":["../../src/transforms/tokenizer.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAIH,4DAA4D;AAC5D,MAAM,iBAAiB,GAAG,IAAI,GAAG,CAAC;IAChC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG;IACtC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG;IAC5B,QAAQ,EAAE,IAAI;IACd,QAAQ,EAAE,IAAI;IACd,GAAG;CACJ,CAAC,CAAC;AAEH,wDAAwD;AACxD,SAAS,QAAQ,CAAC,EAAU;IAC1B,MAAM,CAAC,GAAG,EAAE,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;IAC3B,OAAO,CAAC,CAAC,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,CAAC,IAAI,CAAC,CAAC,IAAI,EAAE,IAAI,CAAC,IAAI,GAAG,CAAC,CAAC;AACvD,CAAC;AAED,sCAAsC;AACtC,SAAS,OAAO,CAAC,EAAU;IACzB,MAAM,CAAC,GAAG,EAAE,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;IAC3B,OAAO,CAAC,IAAI,EAAE,IAAI,CAAC,IAAI,EAAE,CAAC;AAC5B,CAAC;AAED,yCAAyC;AACzC,SAAS,YAAY,CAAC,EAAU;IAC9B,OAAO,EAAE,KAAK,GAAG,IAAI,EAAE,KAAK,IAAI,IAAI,EAAE,KAAK,IAAI,IAAI,EAAE,KAAK,IAAI,CAAC;AACjE,CAAC;AAED;;;;;;;;;GASG;AACH,MAAM,UAAU,QAAQ,CAAC,KAAa;IACpC,MAAM,MAAM,GAAY,EAAE,CAAC;IAC3B,MAAM,GAAG,GAAG,KAAK,CAAC,MAAM,CAAC;IACzB,IAAI,CAAC,GAAG,CAAC,CAAC;IAEV,OAAO,CAAC,GAAG,GAAG,EAAE,CAAC;QACf,MAAM,EAAE,GAAG,KAAK,CAAC,CAAC,CAAE,CAAC;QAErB,mBAAmB;QACnB,IAAI,YAAY,CAAC,EAAE,CAAC,EAAE,CAAC;YACrB,MAAM,KAAK,GAAG,CAAC,CAAC;YAChB,OAAO,CAAC,GAAG,GAAG,IAAI,YAAY,CAAC,KAAK,CAAC,CAAC,CAAE,CAAC,EAAE,CAAC;gBAC1C,CAAC,EAAE,CAAC;YACN,CAAC;YACD,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,YAAY,EAAE,KAAK,EAAE,KAAK,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC;YAClE,SAAS;QACX,CAAC;QAED,iCAAiC;QACjC,IAAI,QAAQ,CAAC,EAAE,CAAC,EAAE,CAAC;YACjB,MAAM,KAAK,GAAG,CAAC,CAAC;YAChB,CAAC,EAAE,CAAC;YACJ,OAAO,CAAC,GAAG,GAAG,EAAE,CAAC;gBACf,MAAM,CAAC,GAAG,KAAK,CAAC,CAAC,CAAE,CAAC;gBACpB,IAAI,QAAQ,CAAC,CAAC,CAAC,EAAE,CAAC;oBAChB,CAAC,EAAE,CAAC;gBACN,CAAC;qBAAM,IAAI,CAAC,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,GAAG,GAAG,IAAI,QAAQ,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAE,CAAC,EAAE,CAAC;oBAC/D,mDAAmD;oBACnD,CAAC,IAAI,CAAC,CAAC,CAAC,gCAAgC;gBAC1C,CAAC;qBAAM,CAAC;oBACN,MAAM;gBACR,CAAC;YACH,CAAC;YACD,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,KAAK,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC;YAC5D,SAAS;QACX,CAAC;QAED,kCAAkC;QAClC,IAAI,OAAO,CAAC,EAAE,CAAC,EAAE,CAAC;YAChB,MAAM,KAAK,GAAG,CAAC,CAAC;YAChB,CAAC,EAAE,CAAC;YACJ,OAAO,CAAC,GAAG,GAAG,IAAI,OAAO,CAAC,KAAK,CAAC,CAAC,CAAE,CAAC,EAAE,CAAC;gBACrC,CAAC,EAAE,CAAC;YACN,CAAC;YACD,mBAAmB;YACnB,IAAI,CAAC,GAAG,GAAG,IAAI,KAAK,CAAC,CAAC,CAAC,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,GAAG,GAAG,IAAI,OAAO,CAAC,KAAK,CAAC,CAAC,GAAG,CAAC,CAAE,CAAC,EAAE,CAAC;gBACzE,CAAC,EAAE,CAAC,CAAC,WAAW;gBAChB,OAAO,CAAC,GAAG,GAAG,IAAI,OAAO,CAAC,KAAK,CAAC,CAAC,CAAE,CAAC,EAAE,CAAC;oBACrC,CAAC,EAAE,CAAC;gBACN,CAAC;YACH,CAAC;YACD,mBAAmB;YACnB,IAAI,CAAC,GAAG,GAAG,IAAI,KAAK,CAAC,CAAC,CAAC,KAAK,GAAG,EAAE,CAAC;gBAChC,CAAC,EAAE,CAAC;YACN,CAAC;YACD,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,KAAK,EAAE,KAAK,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,CAAC,EAAE,CAAC,CAAC;YAC9D,SAAS;QACX,CAAC;QAED,oBAAoB;QACpB,IAAI,iBAAiB,CAAC,GAAG,CAAC,EAAE,CAAC,EAAE,CAAC;YAC9B,mCAAmC;YACnC,IAAI,EAAE,KAAK,GAAG,IAAI,CAAC,GAAG,CAAC,GAAG,GAAG,IAAI,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,GAAG,IAAI,KAAK,CAAC,CAAC,GAAG,CAAC,CAAC,KAAK,GAAG,EAAE,CAAC;gBAC9E,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,KAAK,EAAE,CAAC,CAAC;gBAC7C,CAAC,IAAI,CAAC,CAAC;YACT,CAAC;iBAAM,CAAC;gBACN,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,EAAE,EAAE,CAAC,CAAC;gBAC1C,CAAC,EAAE,CAAC;YACN,CAAC;YACD,SAAS;QACX,CAAC;QAED,uDAAuD;QACvD,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,KAAK,EAAE,EAAE,EAAE,CAAC,CAAC;QAC3C,CAAC,EAAE,CAAC;IACN,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;GAEG;AACH,MAAM,UAAU,MAAM,CAAC,MAAe;IACpC,IAAI,MAAM,GAAG,EAAE,CAAC;IAChB,KAAK,MAAM,KAAK,IAAI,MAAM,EAAE,CAAC;QAC3B,MAAM,IAAI,KAAK,CAAC,KAAK,CAAC;IACxB,CAAC;IACD,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;GAEG;AACH,MAAM,UAAU,YAAY,CAAC,EAAU;IACrC,IAAI,YAAY,CAAC,EAAE,CAAC;QAAE,OAAO,YAAY,CAAC;IAC1C,IAAI,QAAQ,CAAC,EAAE,CAAC;QAAE,OAAO,MAAM,CAAC;IAChC,IAAI,OAAO,CAAC,EAAE,CAAC;QAAE,OAAO,QAAQ,CAAC;IACjC,IAAI,iBAAiB,CAAC,GAAG,CAAC,EAAE,CAAC;QAAE,OAAO,OAAO,CAAC;IAC9C,OAAO,QAAQ,CAAC;AAClB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tokenizer.test.d.ts","sourceRoot":"","sources":["../../src/transforms/tokenizer.test.ts"],"names":[],"mappings":""}
|
|
@@ -0,0 +1,85 @@
|
|
|
1
|
+
import { describe, it, expect } from 'vitest';
|
|
2
|
+
import { tokenize, render } from './tokenizer.js';
|
|
3
|
+
describe('Tokenizer', () => {
|
|
4
|
+
describe('tokenize', () => {
|
|
5
|
+
it('should tokenize a simple sentence', () => {
|
|
6
|
+
const tokens = tokenize('Hello world.');
|
|
7
|
+
expect(tokens).toHaveLength(4);
|
|
8
|
+
expect(tokens[0]).toEqual({ type: 'word', value: 'Hello' });
|
|
9
|
+
expect(tokens[1]).toEqual({ type: 'whitespace', value: ' ' });
|
|
10
|
+
expect(tokens[2]).toEqual({ type: 'word', value: 'world' });
|
|
11
|
+
expect(tokens[3]).toEqual({ type: 'punct', value: '.' });
|
|
12
|
+
});
|
|
13
|
+
it('should handle words with internal apostrophes', () => {
|
|
14
|
+
const tokens = tokenize("don't manager's");
|
|
15
|
+
expect(tokens).toHaveLength(3);
|
|
16
|
+
expect(tokens[0]).toEqual({ type: 'word', value: "don't" });
|
|
17
|
+
expect(tokens[1]).toEqual({ type: 'whitespace', value: ' ' });
|
|
18
|
+
expect(tokens[2]).toEqual({ type: 'word', value: "manager's" });
|
|
19
|
+
});
|
|
20
|
+
it('should tokenize numbers with decimals and percent', () => {
|
|
21
|
+
const tokens = tokenize('12 3.14 60%');
|
|
22
|
+
expect(tokens).toHaveLength(5);
|
|
23
|
+
expect(tokens[0]).toEqual({ type: 'number', value: '12' });
|
|
24
|
+
expect(tokens[2]).toEqual({ type: 'number', value: '3.14' });
|
|
25
|
+
expect(tokens[4]).toEqual({ type: 'number', value: '60%' });
|
|
26
|
+
});
|
|
27
|
+
it('should tokenize punctuation as separate tokens', () => {
|
|
28
|
+
const tokens = tokenize('Hello, world! "Yes."');
|
|
29
|
+
const punctTokens = tokens.filter(t => t.type === 'punct');
|
|
30
|
+
expect(punctTokens.map(t => t.value)).toEqual([',', '!', '"', '.', '"']);
|
|
31
|
+
});
|
|
32
|
+
it('should tokenize ellipsis as single token', () => {
|
|
33
|
+
const tokens = tokenize('Wait...');
|
|
34
|
+
expect(tokens[1]).toEqual({ type: 'punct', value: '...' });
|
|
35
|
+
});
|
|
36
|
+
it('should handle multiple whitespace types', () => {
|
|
37
|
+
const tokens = tokenize("Hello\t\nworld");
|
|
38
|
+
expect(tokens[1]).toEqual({ type: 'whitespace', value: '\t\n' });
|
|
39
|
+
});
|
|
40
|
+
it('should tokenize symbol characters', () => {
|
|
41
|
+
const tokens = tokenize('@#$');
|
|
42
|
+
expect(tokens.every(t => t.type === 'symbol')).toBe(true);
|
|
43
|
+
});
|
|
44
|
+
it('should handle empty string', () => {
|
|
45
|
+
const tokens = tokenize('');
|
|
46
|
+
expect(tokens).toHaveLength(0);
|
|
47
|
+
});
|
|
48
|
+
it('should handle multi-sentence text', () => {
|
|
49
|
+
const tokens = tokenize('Hello world. How are you?');
|
|
50
|
+
const words = tokens.filter(t => t.type === 'word');
|
|
51
|
+
expect(words).toHaveLength(5);
|
|
52
|
+
});
|
|
53
|
+
it('should handle em dash correctly', () => {
|
|
54
|
+
const tokens = tokenize('yes\u2014no');
|
|
55
|
+
expect(tokens[1]).toEqual({ type: 'punct', value: '\u2014' });
|
|
56
|
+
});
|
|
57
|
+
});
|
|
58
|
+
describe('render', () => {
|
|
59
|
+
it('should be lossless: render(tokenize(s)) === s', () => {
|
|
60
|
+
const inputs = [
|
|
61
|
+
'Hello world.',
|
|
62
|
+
"Don't stop! The manager's plan is 60% done.",
|
|
63
|
+
'Wait... really?',
|
|
64
|
+
'A, B, and C.',
|
|
65
|
+
' multiple spaces ',
|
|
66
|
+
'@user #hashtag $100',
|
|
67
|
+
'',
|
|
68
|
+
'Hello\tworld\nnewline.',
|
|
69
|
+
'Wow! "Yes," he said.',
|
|
70
|
+
];
|
|
71
|
+
for (const input of inputs) {
|
|
72
|
+
expect(render(tokenize(input))).toBe(input);
|
|
73
|
+
}
|
|
74
|
+
});
|
|
75
|
+
it('should handle complex punctuation losslessly', () => {
|
|
76
|
+
const input = 'She said, "Hello!" (and waved).';
|
|
77
|
+
expect(render(tokenize(input))).toBe(input);
|
|
78
|
+
});
|
|
79
|
+
it('should preserve exact whitespace', () => {
|
|
80
|
+
const input = 'Hello world ';
|
|
81
|
+
expect(render(tokenize(input))).toBe(input);
|
|
82
|
+
});
|
|
83
|
+
});
|
|
84
|
+
});
|
|
85
|
+
//# sourceMappingURL=tokenizer.test.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"tokenizer.test.js","sourceRoot":"","sources":["../../src/transforms/tokenizer.test.ts"],"names":[],"mappings":"AAAA,OAAO,EAAE,QAAQ,EAAE,EAAE,EAAE,MAAM,EAAE,MAAM,QAAQ,CAAC;AAC9C,OAAO,EAAE,QAAQ,EAAE,MAAM,EAAE,MAAM,gBAAgB,CAAC;AAElD,QAAQ,CAAC,WAAW,EAAE,GAAG,EAAE;IACzB,QAAQ,CAAC,UAAU,EAAE,GAAG,EAAE;QACxB,EAAE,CAAC,mCAAmC,EAAE,GAAG,EAAE;YAC3C,MAAM,MAAM,GAAG,QAAQ,CAAC,cAAc,CAAC,CAAC;YACxC,MAAM,CAAC,MAAM,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;YAC/B,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,OAAO,EAAE,CAAC,CAAC;YAC5D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,YAAY,EAAE,KAAK,EAAE,GAAG,EAAE,CAAC,CAAC;YAC9D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,OAAO,EAAE,CAAC,CAAC;YAC5D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,GAAG,EAAE,CAAC,CAAC;QAC3D,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,+CAA+C,EAAE,GAAG,EAAE;YACvD,MAAM,MAAM,GAAG,QAAQ,CAAC,iBAAiB,CAAC,CAAC;YAC3C,MAAM,CAAC,MAAM,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;YAC/B,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,OAAO,EAAE,CAAC,CAAC;YAC5D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,YAAY,EAAE,KAAK,EAAE,GAAG,EAAE,CAAC,CAAC;YAC9D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,WAAW,EAAE,CAAC,CAAC;QAClE,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,mDAAmD,EAAE,GAAG,EAAE;YAC3D,MAAM,MAAM,GAAG,QAAQ,CAAC,aAAa,CAAC,CAAC;YACvC,MAAM,CAAC,MAAM,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;YAC/B,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,KAAK,EAAE,IAAI,EAAE,CAAC,CAAC;YAC3D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,KAAK,EAAE,MAAM,EAAE,CAAC,CAAC;YAC7D,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,QAAQ,EAAE,KAAK,EAAE,KAAK,EAAE,CAAC,CAAC;QAC9D,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,gDAAgD,EAAE,GAAG,EAAE;YACxD,MAAM,MAAM,GAAG,QAAQ,CAAC,sBAAsB,CAAC,CAAC;YAChD,MAAM,WAAW,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,OAAO,CAAC,CAAC;YAC3D,MAAM,CAAC,WAAW,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,KAAK,CAAC,CAAC,CAAC,OAAO,CAAC,CAAC,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,EAAE,GAAG,CAAC,CAAC,CAAC;QAC3E,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,0CAA0C,EAAE,GAAG,EAAE;YAClD,MAAM,MAAM,GAAG,QAAQ,CAAC,SAAS,CAAC,CAAC;YACnC,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,KAAK,EAAE,CAAC,CAAC;QAC7D,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,yCAAyC,EAAE,GAAG,EAAE;YACjD,MAAM,MAAM,GAAG,QAAQ,CAAC,gBAAgB,CAAC,CAAC;YAC1C,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,YAAY,EAAE,KAAK,EAAE,MAAM,EAAE,CAAC,CAAC;QACnE,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,mCAAmC,EAAE,GAAG,EAAE;YAC3C,MAAM,MAAM,GAAG,QAAQ,CAAC,KAAK,CAAC,CAAC;YAC/B,MAAM,CAAC,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,QAAQ,CAAC,CAAC,CAAC,IAAI,CAAC,IAAI,CAAC,CAAC;QAC5D,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,4BAA4B,EAAE,GAAG,EAAE;YACpC,MAAM,MAAM,GAAG,QAAQ,CAAC,EAAE,CAAC,CAAC;YAC5B,MAAM,CAAC,MAAM,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;QACjC,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,mCAAmC,EAAE,GAAG,EAAE;YAC3C,MAAM,MAAM,GAAG,QAAQ,CAAC,2BAA2B,CAAC,CAAC;YACrD,MAAM,KAAK,GAAG,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,MAAM,CAAC,CAAC;YACpD,MAAM,CAAC,KAAK,CAAC,CAAC,YAAY,CAAC,CAAC,CAAC,CAAC;QAChC,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,iCAAiC,EAAE,GAAG,EAAE;YACzC,MAAM,MAAM,GAAG,QAAQ,CAAC,aAAa,CAAC,CAAC;YACvC,MAAM,CAAC,MAAM,CAAC,CAAC,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,IAAI,EAAE,OAAO,EAAE,KAAK,EAAE,QAAQ,EAAE,CAAC,CAAC;QAChE,CAAC,CAAC,CAAC;IACL,CAAC,CAAC,CAAC;IAEH,QAAQ,CAAC,QAAQ,EAAE,GAAG,EAAE;QACtB,EAAE,CAAC,+CAA+C,EAAE,GAAG,EAAE;YACvD,MAAM,MAAM,GAAG;gBACb,cAAc;gBACd,6CAA6C;gBAC7C,iBAAiB;gBACjB,cAAc;gBACd,sBAAsB;gBACtB,qBAAqB;gBACrB,EAAE;gBACF,wBAAwB;gBACxB,sBAAsB;aACvB,CAAC;YAEF,KAAK,MAAM,KAAK,IAAI,MAAM,EAAE,CAAC;gBAC3B,MAAM,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;YAC9C,CAAC;QACH,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,8CAA8C,EAAE,GAAG,EAAE;YACtD,MAAM,KAAK,GAAG,iCAAiC,CAAC;YAChD,MAAM,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAC9C,CAAC,CAAC,CAAC;QAEH,EAAE,CAAC,kCAAkC,EAAE,GAAG,EAAE;YAC1C,MAAM,KAAK,GAAG,iBAAiB,CAAC;YAChC,MAAM,CAAC,MAAM,CAAC,QAAQ,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,CAAC;QAC9C,CAAC,CAAC,CAAC;IACL,CAAC,CAAC,CAAC;AACL,CAAC,CAAC,CAAC"}
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Corporate Jargon Transform (id="bizJargon")
|
|
3
|
+
* Replace common verbs/adjectives with corporate synonyms.
|
|
4
|
+
*/
|
|
5
|
+
import type { IOutputTransform } from '../types.js';
|
|
6
|
+
export declare const bizJargonTransform: IOutputTransform;
|
|
7
|
+
//# sourceMappingURL=biz-jargon.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"biz-jargon.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/biz-jargon.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,gBAAgB,EAMjB,MAAM,aAAa,CAAC;AAiErB,eAAO,MAAM,kBAAkB,EAAE,gBAgEhC,CAAC"}
|
|
@@ -0,0 +1,117 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Corporate Jargon Transform (id="bizJargon")
|
|
3
|
+
* Replace common verbs/adjectives with corporate synonyms.
|
|
4
|
+
*/
|
|
5
|
+
import { isProtected } from '../protection.js';
|
|
6
|
+
const DEFAULT_MAP = {
|
|
7
|
+
'use': ['leverage', 'utilize'],
|
|
8
|
+
'help': ['enable', 'empower', 'facilitate'],
|
|
9
|
+
'change': ['drive', 'pivot', 'transform'],
|
|
10
|
+
'start': ['kick off', 'greenlight', 'initiate'],
|
|
11
|
+
'plan': ['roadmap', 'strategize'],
|
|
12
|
+
'talk': ['align', 'sync', 'circle back'],
|
|
13
|
+
'meet': ['sync', 'connect', 'huddle'],
|
|
14
|
+
'ask': ['reach out', 'ping', 'loop in'],
|
|
15
|
+
'work': ['collaborate', 'execute', 'operationalize'],
|
|
16
|
+
'think': ['ideate', 'brainstorm', 'synergize'],
|
|
17
|
+
'try': ['iterate', 'explore', 'pilot'],
|
|
18
|
+
'make': ['build', 'architect', 'craft'],
|
|
19
|
+
'improve': ['optimize', 'uplevel', 'enhance'],
|
|
20
|
+
'show': ['showcase', 'demo', 'surface'],
|
|
21
|
+
'give': ['deliver', 'provide', 'offer'],
|
|
22
|
+
'get': ['secure', 'acquire', 'obtain'],
|
|
23
|
+
'tell': ['communicate', 'message', 'brief'],
|
|
24
|
+
'end': ['sunset', 'deprecate', 'wind down'],
|
|
25
|
+
'fix': ['remediate', 'resolve', 'address'],
|
|
26
|
+
'move': ['transition', 'migrate', 'shift'],
|
|
27
|
+
'big': ['scalable', 'enterprise-grade', 'robust'],
|
|
28
|
+
'good': ['best-in-class', 'world-class', 'premium'],
|
|
29
|
+
'new': ['innovative', 'cutting-edge', 'next-gen'],
|
|
30
|
+
'fast': ['agile', 'nimble', 'rapid'],
|
|
31
|
+
'important': ['mission-critical', 'high-priority', 'key'],
|
|
32
|
+
'hard': ['challenging', 'complex', 'non-trivial'],
|
|
33
|
+
'problem': ['challenge', 'opportunity', 'pain point'],
|
|
34
|
+
'idea': ['initiative', 'value proposition', 'thought leadership'],
|
|
35
|
+
'result': ['outcome', 'deliverable', 'KPI'],
|
|
36
|
+
'effect': ['impact', 'value-add', 'ROI'],
|
|
37
|
+
'team': ['squad', 'pod', 'task force'],
|
|
38
|
+
'goal': ['OKR', 'north star', 'target'],
|
|
39
|
+
'money': ['capital', 'budget', 'resources'],
|
|
40
|
+
'way': ['methodology', 'framework', 'approach'],
|
|
41
|
+
};
|
|
42
|
+
const DEFAULT_PARAMS = {
|
|
43
|
+
rate: 0.18,
|
|
44
|
+
map: DEFAULT_MAP,
|
|
45
|
+
caseInsensitive: true,
|
|
46
|
+
preserveCase: true,
|
|
47
|
+
};
|
|
48
|
+
function matchCase(source, target) {
|
|
49
|
+
if (source.length === 0 || target.length === 0)
|
|
50
|
+
return target;
|
|
51
|
+
if (source === source.toUpperCase() && source !== source.toLowerCase()) {
|
|
52
|
+
return target.toUpperCase();
|
|
53
|
+
}
|
|
54
|
+
if (source[0] >= 'A' && source[0] <= 'Z') {
|
|
55
|
+
return target[0].toUpperCase() + target.slice(1);
|
|
56
|
+
}
|
|
57
|
+
return target.toLowerCase();
|
|
58
|
+
}
|
|
59
|
+
export const bizJargonTransform = {
|
|
60
|
+
id: 'bizJargon',
|
|
61
|
+
version: '1.0.0',
|
|
62
|
+
capabilities: {
|
|
63
|
+
requiresTrace: false,
|
|
64
|
+
posAware: false,
|
|
65
|
+
deterministic: true,
|
|
66
|
+
safeToStack: true,
|
|
67
|
+
preferredOrder: 10,
|
|
68
|
+
},
|
|
69
|
+
validateParams(params) {
|
|
70
|
+
const errors = [];
|
|
71
|
+
if (params && typeof params === 'object') {
|
|
72
|
+
const p = params;
|
|
73
|
+
if (p.rate !== undefined) {
|
|
74
|
+
const rate = p.rate;
|
|
75
|
+
if (typeof rate !== 'number' || rate < 0 || rate > 1) {
|
|
76
|
+
errors.push('rate must be between 0 and 1');
|
|
77
|
+
}
|
|
78
|
+
}
|
|
79
|
+
if (p.map !== undefined && (typeof p.map !== 'object' || p.map === null)) {
|
|
80
|
+
errors.push('map must be an object');
|
|
81
|
+
}
|
|
82
|
+
}
|
|
83
|
+
return { valid: errors.length === 0, errors };
|
|
84
|
+
},
|
|
85
|
+
apply(input) {
|
|
86
|
+
const params = {
|
|
87
|
+
...DEFAULT_PARAMS,
|
|
88
|
+
...input.params,
|
|
89
|
+
map: {
|
|
90
|
+
...DEFAULT_MAP,
|
|
91
|
+
...(input.params.map ?? {}),
|
|
92
|
+
},
|
|
93
|
+
};
|
|
94
|
+
const tokens = [];
|
|
95
|
+
// Build lookup
|
|
96
|
+
const lowerMap = new Map();
|
|
97
|
+
for (const [k, v] of Object.entries(params.map)) {
|
|
98
|
+
lowerMap.set(params.caseInsensitive ? k.toLowerCase() : k, v);
|
|
99
|
+
}
|
|
100
|
+
for (const token of input.tokens) {
|
|
101
|
+
if (token.type === 'word' && !isProtected(token)) {
|
|
102
|
+
const lookupKey = params.caseInsensitive ? token.value.toLowerCase() : token.value;
|
|
103
|
+
const replacements = lowerMap.get(lookupKey);
|
|
104
|
+
if (replacements && replacements.length > 0 && input.rng.chance(params.rate)) {
|
|
105
|
+
// Deterministic selection: use first option
|
|
106
|
+
const replacement = replacements[0];
|
|
107
|
+
const cased = params.preserveCase ? matchCase(token.value, replacement) : replacement;
|
|
108
|
+
tokens.push({ ...token, value: cased });
|
|
109
|
+
continue;
|
|
110
|
+
}
|
|
111
|
+
}
|
|
112
|
+
tokens.push({ ...token });
|
|
113
|
+
}
|
|
114
|
+
return { tokens };
|
|
115
|
+
},
|
|
116
|
+
};
|
|
117
|
+
//# sourceMappingURL=biz-jargon.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"biz-jargon.js","sourceRoot":"","sources":["../../../src/transforms/transforms/biz-jargon.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAUH,OAAO,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAS/C,MAAM,WAAW,GAA6B;IAC5C,KAAK,EAAE,CAAC,UAAU,EAAE,SAAS,CAAC;IAC9B,MAAM,EAAE,CAAC,QAAQ,EAAE,SAAS,EAAE,YAAY,CAAC;IAC3C,QAAQ,EAAE,CAAC,OAAO,EAAE,OAAO,EAAE,WAAW,CAAC;IACzC,OAAO,EAAE,CAAC,UAAU,EAAE,YAAY,EAAE,UAAU,CAAC;IAC/C,MAAM,EAAE,CAAC,SAAS,EAAE,YAAY,CAAC;IACjC,MAAM,EAAE,CAAC,OAAO,EAAE,MAAM,EAAE,aAAa,CAAC;IACxC,MAAM,EAAE,CAAC,MAAM,EAAE,SAAS,EAAE,QAAQ,CAAC;IACrC,KAAK,EAAE,CAAC,WAAW,EAAE,MAAM,EAAE,SAAS,CAAC;IACvC,MAAM,EAAE,CAAC,aAAa,EAAE,SAAS,EAAE,gBAAgB,CAAC;IACpD,OAAO,EAAE,CAAC,QAAQ,EAAE,YAAY,EAAE,WAAW,CAAC;IAC9C,KAAK,EAAE,CAAC,SAAS,EAAE,SAAS,EAAE,OAAO,CAAC;IACtC,MAAM,EAAE,CAAC,OAAO,EAAE,WAAW,EAAE,OAAO,CAAC;IACvC,SAAS,EAAE,CAAC,UAAU,EAAE,SAAS,EAAE,SAAS,CAAC;IAC7C,MAAM,EAAE,CAAC,UAAU,EAAE,MAAM,EAAE,SAAS,CAAC;IACvC,MAAM,EAAE,CAAC,SAAS,EAAE,SAAS,EAAE,OAAO,CAAC;IACvC,KAAK,EAAE,CAAC,QAAQ,EAAE,SAAS,EAAE,QAAQ,CAAC;IACtC,MAAM,EAAE,CAAC,aAAa,EAAE,SAAS,EAAE,OAAO,CAAC;IAC3C,KAAK,EAAE,CAAC,QAAQ,EAAE,WAAW,EAAE,WAAW,CAAC;IAC3C,KAAK,EAAE,CAAC,WAAW,EAAE,SAAS,EAAE,SAAS,CAAC;IAC1C,MAAM,EAAE,CAAC,YAAY,EAAE,SAAS,EAAE,OAAO,CAAC;IAC1C,KAAK,EAAE,CAAC,UAAU,EAAE,kBAAkB,EAAE,QAAQ,CAAC;IACjD,MAAM,EAAE,CAAC,eAAe,EAAE,aAAa,EAAE,SAAS,CAAC;IACnD,KAAK,EAAE,CAAC,YAAY,EAAE,cAAc,EAAE,UAAU,CAAC;IACjD,MAAM,EAAE,CAAC,OAAO,EAAE,QAAQ,EAAE,OAAO,CAAC;IACpC,WAAW,EAAE,CAAC,kBAAkB,EAAE,eAAe,EAAE,KAAK,CAAC;IACzD,MAAM,EAAE,CAAC,aAAa,EAAE,SAAS,EAAE,aAAa,CAAC;IACjD,SAAS,EAAE,CAAC,WAAW,EAAE,aAAa,EAAE,YAAY,CAAC;IACrD,MAAM,EAAE,CAAC,YAAY,EAAE,mBAAmB,EAAE,oBAAoB,CAAC;IACjE,QAAQ,EAAE,CAAC,SAAS,EAAE,aAAa,EAAE,KAAK,CAAC;IAC3C,QAAQ,EAAE,CAAC,QAAQ,EAAE,WAAW,EAAE,KAAK,CAAC;IACxC,MAAM,EAAE,CAAC,OAAO,EAAE,KAAK,EAAE,YAAY,CAAC;IACtC,MAAM,EAAE,CAAC,KAAK,EAAE,YAAY,EAAE,QAAQ,CAAC;IACvC,OAAO,EAAE,CAAC,SAAS,EAAE,QAAQ,EAAE,WAAW,CAAC;IAC3C,KAAK,EAAE,CAAC,aAAa,EAAE,WAAW,EAAE,UAAU,CAAC;CAChD,CAAC;AAEF,MAAM,cAAc,GAAoB;IACtC,IAAI,EAAE,IAAI;IACV,GAAG,EAAE,WAAW;IAChB,eAAe,EAAE,IAAI;IACrB,YAAY,EAAE,IAAI;CACnB,CAAC;AAEF,SAAS,SAAS,CAAC,MAAc,EAAE,MAAc;IAC/C,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,MAAM,CAAC;IAC9D,IAAI,MAAM,KAAK,MAAM,CAAC,WAAW,EAAE,IAAI,MAAM,KAAK,MAAM,CAAC,WAAW,EAAE,EAAE,CAAC;QACvE,OAAO,MAAM,CAAC,WAAW,EAAE,CAAC;IAC9B,CAAC;IACD,IAAI,MAAM,CAAC,CAAC,CAAE,IAAI,GAAG,IAAI,MAAM,CAAC,CAAC,CAAE,IAAI,GAAG,EAAE,CAAC;QAC3C,OAAO,MAAM,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;IACpD,CAAC;IACD,OAAO,MAAM,CAAC,WAAW,EAAE,CAAC;AAC9B,CAAC;AAED,MAAM,CAAC,MAAM,kBAAkB,GAAqB;IAClD,EAAE,EAAE,WAAW;IACf,OAAO,EAAE,OAAO;IAChB,YAAY,EAAE;QACZ,aAAa,EAAE,KAAK;QACpB,QAAQ,EAAE,KAAK;QACf,aAAa,EAAE,IAAI;QACnB,WAAW,EAAE,IAAI;QACjB,cAAc,EAAE,EAAE;KACa;IAEjC,cAAc,CAAC,MAAe;QAC5B,MAAM,MAAM,GAAa,EAAE,CAAC;QAC5B,IAAI,MAAM,IAAI,OAAO,MAAM,KAAK,QAAQ,EAAE,CAAC;YACzC,MAAM,CAAC,GAAG,MAAiC,CAAC;YAC5C,IAAI,CAAC,CAAC,IAAI,KAAK,SAAS,EAAE,CAAC;gBACzB,MAAM,IAAI,GAAG,CAAC,CAAC,IAAc,CAAC;gBAC9B,IAAI,OAAO,IAAI,KAAK,QAAQ,IAAI,IAAI,GAAG,CAAC,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;oBACrD,MAAM,CAAC,IAAI,CAAC,8BAA8B,CAAC,CAAC;gBAC9C,CAAC;YACH,CAAC;YACD,IAAI,CAAC,CAAC,GAAG,KAAK,SAAS,IAAI,CAAC,OAAO,CAAC,CAAC,GAAG,KAAK,QAAQ,IAAI,CAAC,CAAC,GAAG,KAAK,IAAI,CAAC,EAAE,CAAC;gBACzE,MAAM,CAAC,IAAI,CAAC,uBAAuB,CAAC,CAAC;YACvC,CAAC;QACH,CAAC;QACD,OAAO,EAAE,KAAK,EAAE,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;IAChD,CAAC;IAED,KAAK,CAAC,KAAqB;QACzB,MAAM,MAAM,GAAoB;YAC9B,GAAG,cAAc;YACjB,GAAI,KAAK,CAAC,MAAmC;YAC7C,GAAG,EAAE;gBACH,GAAG,WAAW;gBACd,GAAG,CAAE,KAAK,CAAC,MAAmC,CAAC,GAAG,IAAI,EAAE,CAAC;aAC1D;SACF,CAAC;QACF,MAAM,MAAM,GAAY,EAAE,CAAC;QAE3B,eAAe;QACf,MAAM,QAAQ,GAAG,IAAI,GAAG,EAAoB,CAAC;QAC7C,KAAK,MAAM,CAAC,CAAC,EAAE,CAAC,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC;YAChD,QAAQ,CAAC,GAAG,CAAC,MAAM,CAAC,eAAe,CAAC,CAAC,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC;QAChE,CAAC;QAED,KAAK,MAAM,KAAK,IAAI,KAAK,CAAC,MAAM,EAAE,CAAC;YACjC,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;gBACjD,MAAM,SAAS,GAAG,MAAM,CAAC,eAAe,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC;gBACnF,MAAM,YAAY,GAAG,QAAQ,CAAC,GAAG,CAAC,SAAS,CAAC,CAAC;gBAE7C,IAAI,YAAY,IAAI,YAAY,CAAC,MAAM,GAAG,CAAC,IAAI,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,CAAC;oBAC7E,4CAA4C;oBAC5C,MAAM,WAAW,GAAG,YAAY,CAAC,CAAC,CAAE,CAAC;oBACrC,MAAM,KAAK,GAAG,MAAM,CAAC,YAAY,CAAC,CAAC,CAAC,SAAS,CAAC,KAAK,CAAC,KAAK,EAAE,WAAW,CAAC,CAAC,CAAC,CAAC,WAAW,CAAC;oBACtF,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,KAAK,EAAE,CAAC,CAAC;oBACxC,SAAS;gBACX,CAAC;YACH,CAAC;YAED,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,CAAC,CAAC;QAC5B,CAAC;QAED,OAAO,EAAE,MAAM,EAAE,CAAC;IACpB,CAAC;CACF,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"emoji.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/emoji.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,gBAAgB,EAMjB,MAAM,aAAa,CAAC;AAwErB,eAAO,MAAM,cAAc,EAAE,gBAoE5B,CAAC"}
|
|
@@ -0,0 +1,127 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Emoji-speak Transform (id="emoji")
|
|
3
|
+
* Replace certain words with emojis using mapping tables.
|
|
4
|
+
*/
|
|
5
|
+
import { isProtected } from '../protection.js';
|
|
6
|
+
const DEFAULT_MAP = {
|
|
7
|
+
'happy': ['\uD83D\uDE0A', '\uD83D\uDE04'],
|
|
8
|
+
'sad': ['\uD83D\uDE22', '\uD83D\uDE1E'],
|
|
9
|
+
'love': ['\u2764\uFE0F', '\uD83D\uDC95'],
|
|
10
|
+
'heart': ['\u2764\uFE0F', '\uD83D\uDC96'],
|
|
11
|
+
'fire': ['\uD83D\uDD25'],
|
|
12
|
+
'money': ['\uD83D\uDCB0', '\uD83D\uDCB5'],
|
|
13
|
+
'star': ['\u2B50', '\uD83C\uDF1F'],
|
|
14
|
+
'sun': ['\u2600\uFE0F', '\uD83C\uDF1E'],
|
|
15
|
+
'moon': ['\uD83C\uDF19'],
|
|
16
|
+
'rain': ['\uD83C\uDF27\uFE0F'],
|
|
17
|
+
'snow': ['\u2744\uFE0F'],
|
|
18
|
+
'tree': ['\uD83C\uDF33'],
|
|
19
|
+
'flower': ['\uD83C\uDF38', '\uD83C\uDF3A'],
|
|
20
|
+
'dog': ['\uD83D\uDC36'],
|
|
21
|
+
'cat': ['\uD83D\uDC31'],
|
|
22
|
+
'car': ['\uD83D\uDE97'],
|
|
23
|
+
'house': ['\uD83C\uDFE0'],
|
|
24
|
+
'book': ['\uD83D\uDCDA', '\uD83D\uDCD6'],
|
|
25
|
+
'music': ['\uD83C\uDFB5', '\uD83C\uDFB6'],
|
|
26
|
+
'food': ['\uD83C\uDF54', '\uD83C\uDF55'],
|
|
27
|
+
'water': ['\uD83D\uDCA7'],
|
|
28
|
+
'time': ['\u23F0', '\u231A'],
|
|
29
|
+
'world': ['\uD83C\uDF0D'],
|
|
30
|
+
'phone': ['\uD83D\uDCF1'],
|
|
31
|
+
'computer': ['\uD83D\uDCBB'],
|
|
32
|
+
'rocket': ['\uD83D\uDE80'],
|
|
33
|
+
'idea': ['\uD83D\uDCA1'],
|
|
34
|
+
'check': ['\u2705'],
|
|
35
|
+
'cross': ['\u274C'],
|
|
36
|
+
'warning': ['\u26A0\uFE0F'],
|
|
37
|
+
'laugh': ['\uD83D\uDE02'],
|
|
38
|
+
'think': ['\uD83E\uDD14'],
|
|
39
|
+
'cool': ['\uD83D\uDE0E'],
|
|
40
|
+
'strong': ['\uD83D\uDCAA'],
|
|
41
|
+
'fast': ['\u26A1'],
|
|
42
|
+
'slow': ['\uD83D\uDC22'],
|
|
43
|
+
'big': ['\uD83D\uDCAF'],
|
|
44
|
+
'small': ['\uD83E\uDD0F'],
|
|
45
|
+
'good': ['\uD83D\uDC4D'],
|
|
46
|
+
'bad': ['\uD83D\uDC4E'],
|
|
47
|
+
'yes': ['\u2705'],
|
|
48
|
+
'no': ['\u274C'],
|
|
49
|
+
'king': ['\uD83D\uDC51'],
|
|
50
|
+
'queen': ['\uD83D\uDC51'],
|
|
51
|
+
'sleep': ['\uD83D\uDE34'],
|
|
52
|
+
'wave': ['\uD83D\uDC4B'],
|
|
53
|
+
'party': ['\uD83C\uDF89'],
|
|
54
|
+
'brain': ['\uD83E\uDDE0'],
|
|
55
|
+
'eyes': ['\uD83D\uDC40'],
|
|
56
|
+
'hand': ['\u270B'],
|
|
57
|
+
};
|
|
58
|
+
const DEFAULT_PARAMS = {
|
|
59
|
+
rate: 0.12,
|
|
60
|
+
map: DEFAULT_MAP,
|
|
61
|
+
fallbackToNone: true,
|
|
62
|
+
preserveWordAlongsideEmoji: false,
|
|
63
|
+
caseInsensitive: true,
|
|
64
|
+
};
|
|
65
|
+
export const emojiTransform = {
|
|
66
|
+
id: 'emoji',
|
|
67
|
+
version: '1.0.0',
|
|
68
|
+
capabilities: {
|
|
69
|
+
requiresTrace: false,
|
|
70
|
+
posAware: false,
|
|
71
|
+
deterministic: true,
|
|
72
|
+
safeToStack: true,
|
|
73
|
+
preferredOrder: 10,
|
|
74
|
+
},
|
|
75
|
+
validateParams(params) {
|
|
76
|
+
const errors = [];
|
|
77
|
+
if (params && typeof params === 'object') {
|
|
78
|
+
const p = params;
|
|
79
|
+
if (p.rate !== undefined) {
|
|
80
|
+
const rate = p.rate;
|
|
81
|
+
if (typeof rate !== 'number' || rate < 0 || rate > 1) {
|
|
82
|
+
errors.push('rate must be between 0 and 1');
|
|
83
|
+
}
|
|
84
|
+
}
|
|
85
|
+
if (p.map !== undefined && (typeof p.map !== 'object' || p.map === null)) {
|
|
86
|
+
errors.push('map must be an object');
|
|
87
|
+
}
|
|
88
|
+
}
|
|
89
|
+
return { valid: errors.length === 0, errors };
|
|
90
|
+
},
|
|
91
|
+
apply(input) {
|
|
92
|
+
const params = {
|
|
93
|
+
...DEFAULT_PARAMS,
|
|
94
|
+
...input.params,
|
|
95
|
+
map: {
|
|
96
|
+
...DEFAULT_MAP,
|
|
97
|
+
...(input.params.map ?? {}),
|
|
98
|
+
},
|
|
99
|
+
};
|
|
100
|
+
const tokens = [];
|
|
101
|
+
// Build lookup map
|
|
102
|
+
const lowerMap = new Map();
|
|
103
|
+
for (const [k, v] of Object.entries(params.map)) {
|
|
104
|
+
lowerMap.set(params.caseInsensitive ? k.toLowerCase() : k, v);
|
|
105
|
+
}
|
|
106
|
+
for (const token of input.tokens) {
|
|
107
|
+
if (token.type === 'word' && !isProtected(token)) {
|
|
108
|
+
const lookupKey = params.caseInsensitive ? token.value.toLowerCase() : token.value;
|
|
109
|
+
const emojis = lowerMap.get(lookupKey);
|
|
110
|
+
if (emojis && emojis.length > 0 && input.rng.chance(params.rate)) {
|
|
111
|
+
// Deterministic emoji selection
|
|
112
|
+
const emoji = emojis[0];
|
|
113
|
+
if (params.preserveWordAlongsideEmoji) {
|
|
114
|
+
tokens.push({ ...token, value: token.value + ' ' + emoji });
|
|
115
|
+
}
|
|
116
|
+
else {
|
|
117
|
+
tokens.push({ ...token, value: emoji, type: 'symbol' });
|
|
118
|
+
}
|
|
119
|
+
continue;
|
|
120
|
+
}
|
|
121
|
+
}
|
|
122
|
+
tokens.push({ ...token });
|
|
123
|
+
}
|
|
124
|
+
return { tokens };
|
|
125
|
+
},
|
|
126
|
+
};
|
|
127
|
+
//# sourceMappingURL=emoji.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"emoji.js","sourceRoot":"","sources":["../../../src/transforms/transforms/emoji.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAUH,OAAO,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAU/C,MAAM,WAAW,GAA6B;IAC5C,OAAO,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACzC,KAAK,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACvC,MAAM,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACxC,OAAO,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACzC,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,OAAO,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACzC,MAAM,EAAE,CAAC,QAAQ,EAAE,cAAc,CAAC;IAClC,KAAK,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACvC,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,MAAM,EAAE,CAAC,oBAAoB,CAAC;IAC9B,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,QAAQ,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IAC1C,KAAK,EAAE,CAAC,cAAc,CAAC;IACvB,KAAK,EAAE,CAAC,cAAc,CAAC;IACvB,KAAK,EAAE,CAAC,cAAc,CAAC;IACvB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,MAAM,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACxC,OAAO,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACzC,MAAM,EAAE,CAAC,cAAc,EAAE,cAAc,CAAC;IACxC,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,MAAM,EAAE,CAAC,QAAQ,EAAE,QAAQ,CAAC;IAC5B,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,UAAU,EAAE,CAAC,cAAc,CAAC;IAC5B,QAAQ,EAAE,CAAC,cAAc,CAAC;IAC1B,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,OAAO,EAAE,CAAC,QAAQ,CAAC;IACnB,OAAO,EAAE,CAAC,QAAQ,CAAC;IACnB,SAAS,EAAE,CAAC,cAAc,CAAC;IAC3B,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,QAAQ,EAAE,CAAC,cAAc,CAAC;IAC1B,MAAM,EAAE,CAAC,QAAQ,CAAC;IAClB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,KAAK,EAAE,CAAC,cAAc,CAAC;IACvB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,KAAK,EAAE,CAAC,cAAc,CAAC;IACvB,KAAK,EAAE,CAAC,QAAQ,CAAC;IACjB,IAAI,EAAE,CAAC,QAAQ,CAAC;IAChB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,OAAO,EAAE,CAAC,cAAc,CAAC;IACzB,MAAM,EAAE,CAAC,cAAc,CAAC;IACxB,MAAM,EAAE,CAAC,QAAQ,CAAC;CACnB,CAAC;AAEF,MAAM,cAAc,GAAgB;IAClC,IAAI,EAAE,IAAI;IACV,GAAG,EAAE,WAAW;IAChB,cAAc,EAAE,IAAI;IACpB,0BAA0B,EAAE,KAAK;IACjC,eAAe,EAAE,IAAI;CACtB,CAAC;AAEF,MAAM,CAAC,MAAM,cAAc,GAAqB;IAC9C,EAAE,EAAE,OAAO;IACX,OAAO,EAAE,OAAO;IAChB,YAAY,EAAE;QACZ,aAAa,EAAE,KAAK;QACpB,QAAQ,EAAE,KAAK;QACf,aAAa,EAAE,IAAI;QACnB,WAAW,EAAE,IAAI;QACjB,cAAc,EAAE,EAAE;KACa;IAEjC,cAAc,CAAC,MAAe;QAC5B,MAAM,MAAM,GAAa,EAAE,CAAC;QAC5B,IAAI,MAAM,IAAI,OAAO,MAAM,KAAK,QAAQ,EAAE,CAAC;YACzC,MAAM,CAAC,GAAG,MAAiC,CAAC;YAC5C,IAAI,CAAC,CAAC,IAAI,KAAK,SAAS,EAAE,CAAC;gBACzB,MAAM,IAAI,GAAG,CAAC,CAAC,IAAc,CAAC;gBAC9B,IAAI,OAAO,IAAI,KAAK,QAAQ,IAAI,IAAI,GAAG,CAAC,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;oBACrD,MAAM,CAAC,IAAI,CAAC,8BAA8B,CAAC,CAAC;gBAC9C,CAAC;YACH,CAAC;YACD,IAAI,CAAC,CAAC,GAAG,KAAK,SAAS,IAAI,CAAC,OAAO,CAAC,CAAC,GAAG,KAAK,QAAQ,IAAI,CAAC,CAAC,GAAG,KAAK,IAAI,CAAC,EAAE,CAAC;gBACzE,MAAM,CAAC,IAAI,CAAC,uBAAuB,CAAC,CAAC;YACvC,CAAC;QACH,CAAC;QACD,OAAO,EAAE,KAAK,EAAE,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;IAChD,CAAC;IAED,KAAK,CAAC,KAAqB;QACzB,MAAM,MAAM,GAAgB;YAC1B,GAAG,cAAc;YACjB,GAAI,KAAK,CAAC,MAA+B;YACzC,GAAG,EAAE;gBACH,GAAG,WAAW;gBACd,GAAG,CAAE,KAAK,CAAC,MAA+B,CAAC,GAAG,IAAI,EAAE,CAAC;aACtD;SACF,CAAC;QACF,MAAM,MAAM,GAAY,EAAE,CAAC;QAE3B,mBAAmB;QACnB,MAAM,QAAQ,GAAG,IAAI,GAAG,EAAoB,CAAC;QAC7C,KAAK,MAAM,CAAC,CAAC,EAAE,CAAC,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,GAAG,CAAC,EAAE,CAAC;YAChD,QAAQ,CAAC,GAAG,CAAC,MAAM,CAAC,eAAe,CAAC,CAAC,CAAC,CAAC,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC;QAChE,CAAC;QAED,KAAK,MAAM,KAAK,IAAI,KAAK,CAAC,MAAM,EAAE,CAAC;YACjC,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;gBACjD,MAAM,SAAS,GAAG,MAAM,CAAC,eAAe,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC,WAAW,EAAE,CAAC,CAAC,CAAC,KAAK,CAAC,KAAK,CAAC;gBACnF,MAAM,MAAM,GAAG,QAAQ,CAAC,GAAG,CAAC,SAAS,CAAC,CAAC;gBAEvC,IAAI,MAAM,IAAI,MAAM,CAAC,MAAM,GAAG,CAAC,IAAI,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,CAAC;oBACjE,gCAAgC;oBAChC,MAAM,KAAK,GAAG,MAAM,CAAC,CAAC,CAAE,CAAC;oBAEzB,IAAI,MAAM,CAAC,0BAA0B,EAAE,CAAC;wBACtC,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,KAAK,CAAC,KAAK,GAAG,GAAG,GAAG,KAAK,EAAE,CAAC,CAAC;oBAC9D,CAAC;yBAAM,CAAC;wBACN,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,KAAK,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,CAAC;oBAC1D,CAAC;oBACD,SAAS;gBACX,CAAC;YACH,CAAC;YAED,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,CAAC,CAAC;QAC5B,CAAC;QAED,OAAO,EAAE,MAAM,EAAE,CAAC;IACpB,CAAC;CACF,CAAC"}
|
|
@@ -0,0 +1,17 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* V1 Transform Pack - All built-in transforms
|
|
3
|
+
*/
|
|
4
|
+
export { pigLatinTransform } from './pig-latin.js';
|
|
5
|
+
export { ubbiDubbiTransform } from './ubbi-dubbi.js';
|
|
6
|
+
export { leetTransform } from './leet.js';
|
|
7
|
+
export { uwuTransform } from './uwu.js';
|
|
8
|
+
export { pirateTransform } from './pirate.js';
|
|
9
|
+
export { redactTransform } from './redact.js';
|
|
10
|
+
export { emojiTransform } from './emoji.js';
|
|
11
|
+
export { mockCaseTransform } from './mock-case.js';
|
|
12
|
+
export { reverseWordsTransform } from './reverse-words.js';
|
|
13
|
+
export { bizJargonTransform } from './biz-jargon.js';
|
|
14
|
+
import type { IOutputTransform } from '../types.js';
|
|
15
|
+
/** All V1 built-in transforms */
|
|
16
|
+
export declare const V1_TRANSFORMS: IOutputTransform[];
|
|
17
|
+
//# sourceMappingURL=index.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/index.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,OAAO,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACnD,OAAO,EAAE,kBAAkB,EAAE,MAAM,iBAAiB,CAAC;AACrD,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AACxC,OAAO,EAAE,eAAe,EAAE,MAAM,aAAa,CAAC;AAC9C,OAAO,EAAE,eAAe,EAAE,MAAM,aAAa,CAAC;AAC9C,OAAO,EAAE,cAAc,EAAE,MAAM,YAAY,CAAC;AAC5C,OAAO,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACnD,OAAO,EAAE,qBAAqB,EAAE,MAAM,oBAAoB,CAAC;AAC3D,OAAO,EAAE,kBAAkB,EAAE,MAAM,iBAAiB,CAAC;AAYrD,OAAO,KAAK,EAAE,gBAAgB,EAAE,MAAM,aAAa,CAAC;AAEpD,iCAAiC;AACjC,eAAO,MAAM,aAAa,EAAE,gBAAgB,EAW3C,CAAC"}
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* V1 Transform Pack - All built-in transforms
|
|
3
|
+
*/
|
|
4
|
+
export { pigLatinTransform } from './pig-latin.js';
|
|
5
|
+
export { ubbiDubbiTransform } from './ubbi-dubbi.js';
|
|
6
|
+
export { leetTransform } from './leet.js';
|
|
7
|
+
export { uwuTransform } from './uwu.js';
|
|
8
|
+
export { pirateTransform } from './pirate.js';
|
|
9
|
+
export { redactTransform } from './redact.js';
|
|
10
|
+
export { emojiTransform } from './emoji.js';
|
|
11
|
+
export { mockCaseTransform } from './mock-case.js';
|
|
12
|
+
export { reverseWordsTransform } from './reverse-words.js';
|
|
13
|
+
export { bizJargonTransform } from './biz-jargon.js';
|
|
14
|
+
import { pigLatinTransform } from './pig-latin.js';
|
|
15
|
+
import { ubbiDubbiTransform } from './ubbi-dubbi.js';
|
|
16
|
+
import { leetTransform } from './leet.js';
|
|
17
|
+
import { uwuTransform } from './uwu.js';
|
|
18
|
+
import { pirateTransform } from './pirate.js';
|
|
19
|
+
import { redactTransform } from './redact.js';
|
|
20
|
+
import { emojiTransform } from './emoji.js';
|
|
21
|
+
import { mockCaseTransform } from './mock-case.js';
|
|
22
|
+
import { reverseWordsTransform } from './reverse-words.js';
|
|
23
|
+
import { bizJargonTransform } from './biz-jargon.js';
|
|
24
|
+
/** All V1 built-in transforms */
|
|
25
|
+
export const V1_TRANSFORMS = [
|
|
26
|
+
pigLatinTransform,
|
|
27
|
+
ubbiDubbiTransform,
|
|
28
|
+
leetTransform,
|
|
29
|
+
uwuTransform,
|
|
30
|
+
pirateTransform,
|
|
31
|
+
redactTransform,
|
|
32
|
+
emojiTransform,
|
|
33
|
+
mockCaseTransform,
|
|
34
|
+
reverseWordsTransform,
|
|
35
|
+
bizJargonTransform,
|
|
36
|
+
];
|
|
37
|
+
//# sourceMappingURL=index.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../../src/transforms/transforms/index.ts"],"names":[],"mappings":"AAAA;;GAEG;AAEH,OAAO,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACnD,OAAO,EAAE,kBAAkB,EAAE,MAAM,iBAAiB,CAAC;AACrD,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AACxC,OAAO,EAAE,eAAe,EAAE,MAAM,aAAa,CAAC;AAC9C,OAAO,EAAE,eAAe,EAAE,MAAM,aAAa,CAAC;AAC9C,OAAO,EAAE,cAAc,EAAE,MAAM,YAAY,CAAC;AAC5C,OAAO,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACnD,OAAO,EAAE,qBAAqB,EAAE,MAAM,oBAAoB,CAAC;AAC3D,OAAO,EAAE,kBAAkB,EAAE,MAAM,iBAAiB,CAAC;AAErD,OAAO,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACnD,OAAO,EAAE,kBAAkB,EAAE,MAAM,iBAAiB,CAAC;AACrD,OAAO,EAAE,aAAa,EAAE,MAAM,WAAW,CAAC;AAC1C,OAAO,EAAE,YAAY,EAAE,MAAM,UAAU,CAAC;AACxC,OAAO,EAAE,eAAe,EAAE,MAAM,aAAa,CAAC;AAC9C,OAAO,EAAE,eAAe,EAAE,MAAM,aAAa,CAAC;AAC9C,OAAO,EAAE,cAAc,EAAE,MAAM,YAAY,CAAC;AAC5C,OAAO,EAAE,iBAAiB,EAAE,MAAM,gBAAgB,CAAC;AACnD,OAAO,EAAE,qBAAqB,EAAE,MAAM,oBAAoB,CAAC;AAC3D,OAAO,EAAE,kBAAkB,EAAE,MAAM,iBAAiB,CAAC;AAGrD,iCAAiC;AACjC,MAAM,CAAC,MAAM,aAAa,GAAuB;IAC/C,iBAAiB;IACjB,kBAAkB;IAClB,aAAa;IACb,YAAY;IACZ,eAAe;IACf,eAAe;IACf,cAAc;IACd,iBAAiB;IACjB,qBAAqB;IACrB,kBAAkB;CACnB,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"leet.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/leet.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,gBAAgB,EAMjB,MAAM,aAAa,CAAC;AAyErB,eAAO,MAAM,aAAa,EAAE,gBAiD3B,CAAC"}
|