marlarky 1.0.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +489 -0
- package/dist/adapters/faker-js-adapter.d.ts +44 -0
- package/dist/adapters/faker-js-adapter.d.ts.map +1 -0
- package/dist/adapters/faker-js-adapter.js +46 -0
- package/dist/adapters/faker-js-adapter.js.map +1 -0
- package/dist/adapters/index.d.ts +3 -0
- package/dist/adapters/index.d.ts.map +1 -0
- package/dist/adapters/index.js +3 -0
- package/dist/adapters/index.js.map +1 -0
- package/dist/adapters/simple-faker-adapter.d.ts +22 -0
- package/dist/adapters/simple-faker-adapter.d.ts.map +1 -0
- package/dist/adapters/simple-faker-adapter.js +54 -0
- package/dist/adapters/simple-faker-adapter.js.map +1 -0
- package/dist/cli.d.ts +7 -0
- package/dist/cli.d.ts.map +1 -0
- package/dist/cli.js +588 -0
- package/dist/cli.js.map +1 -0
- package/dist/defaults/index.d.ts +2 -0
- package/dist/defaults/index.d.ts.map +1 -0
- package/dist/defaults/index.js +2 -0
- package/dist/defaults/index.js.map +1 -0
- package/dist/defaults/word-lists.d.ts +22 -0
- package/dist/defaults/word-lists.d.ts.map +1 -0
- package/dist/defaults/word-lists.js +124 -0
- package/dist/defaults/word-lists.js.map +1 -0
- package/dist/generator/index.d.ts +2 -0
- package/dist/generator/index.d.ts.map +1 -0
- package/dist/generator/index.js +2 -0
- package/dist/generator/index.js.map +1 -0
- package/dist/generator/text-generator.d.ts +93 -0
- package/dist/generator/text-generator.d.ts.map +1 -0
- package/dist/generator/text-generator.js +411 -0
- package/dist/generator/text-generator.js.map +1 -0
- package/dist/generator/text-generator.test.d.ts +2 -0
- package/dist/generator/text-generator.test.d.ts.map +1 -0
- package/dist/generator/text-generator.test.js +151 -0
- package/dist/generator/text-generator.test.js.map +1 -0
- package/dist/grammar/index.d.ts +5 -0
- package/dist/grammar/index.d.ts.map +1 -0
- package/dist/grammar/index.js +3 -0
- package/dist/grammar/index.js.map +1 -0
- package/dist/grammar/phrase-builders.d.ts +72 -0
- package/dist/grammar/phrase-builders.d.ts.map +1 -0
- package/dist/grammar/phrase-builders.js +241 -0
- package/dist/grammar/phrase-builders.js.map +1 -0
- package/dist/grammar/sentence-templates.d.ts +67 -0
- package/dist/grammar/sentence-templates.d.ts.map +1 -0
- package/dist/grammar/sentence-templates.js +272 -0
- package/dist/grammar/sentence-templates.js.map +1 -0
- package/dist/index.d.ts +17 -0
- package/dist/index.d.ts.map +1 -0
- package/dist/index.js +40 -0
- package/dist/index.js.map +1 -0
- package/dist/interfaces/faker-adapter.d.ts +25 -0
- package/dist/interfaces/faker-adapter.d.ts.map +1 -0
- package/dist/interfaces/faker-adapter.js +2 -0
- package/dist/interfaces/faker-adapter.js.map +1 -0
- package/dist/interfaces/index.d.ts +4 -0
- package/dist/interfaces/index.d.ts.map +1 -0
- package/dist/interfaces/index.js +2 -0
- package/dist/interfaces/index.js.map +1 -0
- package/dist/interfaces/lexicon-store.d.ts +39 -0
- package/dist/interfaces/lexicon-store.d.ts.map +1 -0
- package/dist/interfaces/lexicon-store.js +2 -0
- package/dist/interfaces/lexicon-store.js.map +1 -0
- package/dist/interfaces/rng.d.ts +25 -0
- package/dist/interfaces/rng.d.ts.map +1 -0
- package/dist/interfaces/rng.js +2 -0
- package/dist/interfaces/rng.js.map +1 -0
- package/dist/lexicon/index.d.ts +4 -0
- package/dist/lexicon/index.d.ts.map +1 -0
- package/dist/lexicon/index.js +4 -0
- package/dist/lexicon/index.js.map +1 -0
- package/dist/lexicon/loader.d.ts +24 -0
- package/dist/lexicon/loader.d.ts.map +1 -0
- package/dist/lexicon/loader.js +47 -0
- package/dist/lexicon/loader.js.map +1 -0
- package/dist/lexicon/store.d.ts +39 -0
- package/dist/lexicon/store.d.ts.map +1 -0
- package/dist/lexicon/store.js +291 -0
- package/dist/lexicon/store.js.map +1 -0
- package/dist/lexicon/validator.d.ts +10 -0
- package/dist/lexicon/validator.d.ts.map +1 -0
- package/dist/lexicon/validator.js +273 -0
- package/dist/lexicon/validator.js.map +1 -0
- package/dist/morphology/articles.d.ts +17 -0
- package/dist/morphology/articles.d.ts.map +1 -0
- package/dist/morphology/articles.js +66 -0
- package/dist/morphology/articles.js.map +1 -0
- package/dist/morphology/articles.test.d.ts +2 -0
- package/dist/morphology/articles.test.d.ts.map +1 -0
- package/dist/morphology/articles.test.js +56 -0
- package/dist/morphology/articles.test.js.map +1 -0
- package/dist/morphology/conjugate.d.ts +46 -0
- package/dist/morphology/conjugate.d.ts.map +1 -0
- package/dist/morphology/conjugate.js +337 -0
- package/dist/morphology/conjugate.js.map +1 -0
- package/dist/morphology/conjugate.test.d.ts +2 -0
- package/dist/morphology/conjugate.test.d.ts.map +1 -0
- package/dist/morphology/conjugate.test.js +168 -0
- package/dist/morphology/conjugate.test.js.map +1 -0
- package/dist/morphology/index.d.ts +6 -0
- package/dist/morphology/index.d.ts.map +1 -0
- package/dist/morphology/index.js +9 -0
- package/dist/morphology/index.js.map +1 -0
- package/dist/morphology/normalize.d.ts +52 -0
- package/dist/morphology/normalize.d.ts.map +1 -0
- package/dist/morphology/normalize.js +127 -0
- package/dist/morphology/normalize.js.map +1 -0
- package/dist/morphology/pluralize.d.ts +17 -0
- package/dist/morphology/pluralize.d.ts.map +1 -0
- package/dist/morphology/pluralize.js +186 -0
- package/dist/morphology/pluralize.js.map +1 -0
- package/dist/morphology/pluralize.test.d.ts +2 -0
- package/dist/morphology/pluralize.test.d.ts.map +1 -0
- package/dist/morphology/pluralize.test.js +86 -0
- package/dist/morphology/pluralize.test.js.map +1 -0
- package/dist/providers/index.d.ts +2 -0
- package/dist/providers/index.d.ts.map +1 -0
- package/dist/providers/index.js +2 -0
- package/dist/providers/index.js.map +1 -0
- package/dist/providers/word-provider.d.ts +125 -0
- package/dist/providers/word-provider.d.ts.map +1 -0
- package/dist/providers/word-provider.js +266 -0
- package/dist/providers/word-provider.js.map +1 -0
- package/dist/rng/index.d.ts +2 -0
- package/dist/rng/index.d.ts.map +1 -0
- package/dist/rng/index.js +2 -0
- package/dist/rng/index.js.map +1 -0
- package/dist/rng/seedable-rng.d.ts +19 -0
- package/dist/rng/seedable-rng.d.ts.map +1 -0
- package/dist/rng/seedable-rng.js +77 -0
- package/dist/rng/seedable-rng.js.map +1 -0
- package/dist/rng/seedable-rng.test.d.ts +2 -0
- package/dist/rng/seedable-rng.test.d.ts.map +1 -0
- package/dist/rng/seedable-rng.test.js +165 -0
- package/dist/rng/seedable-rng.test.js.map +1 -0
- package/dist/rules/index.d.ts +3 -0
- package/dist/rules/index.d.ts.map +1 -0
- package/dist/rules/index.js +2 -0
- package/dist/rules/index.js.map +1 -0
- package/dist/rules/rule-engine.d.ts +78 -0
- package/dist/rules/rule-engine.d.ts.map +1 -0
- package/dist/rules/rule-engine.js +271 -0
- package/dist/rules/rule-engine.js.map +1 -0
- package/dist/transforms/config-merge.d.ts +19 -0
- package/dist/transforms/config-merge.d.ts.map +1 -0
- package/dist/transforms/config-merge.js +88 -0
- package/dist/transforms/config-merge.js.map +1 -0
- package/dist/transforms/config-merge.test.d.ts +2 -0
- package/dist/transforms/config-merge.test.d.ts.map +1 -0
- package/dist/transforms/config-merge.test.js +91 -0
- package/dist/transforms/config-merge.test.js.map +1 -0
- package/dist/transforms/default-registry.d.ts +10 -0
- package/dist/transforms/default-registry.d.ts.map +1 -0
- package/dist/transforms/default-registry.js +17 -0
- package/dist/transforms/default-registry.js.map +1 -0
- package/dist/transforms/index.d.ts +15 -0
- package/dist/transforms/index.d.ts.map +1 -0
- package/dist/transforms/index.js +20 -0
- package/dist/transforms/index.js.map +1 -0
- package/dist/transforms/pipeline.d.ts +28 -0
- package/dist/transforms/pipeline.d.ts.map +1 -0
- package/dist/transforms/pipeline.js +176 -0
- package/dist/transforms/pipeline.js.map +1 -0
- package/dist/transforms/pipeline.test.d.ts +2 -0
- package/dist/transforms/pipeline.test.d.ts.map +1 -0
- package/dist/transforms/pipeline.test.js +175 -0
- package/dist/transforms/pipeline.test.js.map +1 -0
- package/dist/transforms/protection.d.ts +16 -0
- package/dist/transforms/protection.d.ts.map +1 -0
- package/dist/transforms/protection.js +97 -0
- package/dist/transforms/protection.js.map +1 -0
- package/dist/transforms/protection.test.d.ts +2 -0
- package/dist/transforms/protection.test.d.ts.map +1 -0
- package/dist/transforms/protection.test.js +79 -0
- package/dist/transforms/protection.test.js.map +1 -0
- package/dist/transforms/registry.d.ts +25 -0
- package/dist/transforms/registry.d.ts.map +1 -0
- package/dist/transforms/registry.js +32 -0
- package/dist/transforms/registry.js.map +1 -0
- package/dist/transforms/registry.test.d.ts +2 -0
- package/dist/transforms/registry.test.d.ts.map +1 -0
- package/dist/transforms/registry.test.js +64 -0
- package/dist/transforms/registry.test.js.map +1 -0
- package/dist/transforms/tokenizer.d.ts +26 -0
- package/dist/transforms/tokenizer.d.ts.map +1 -0
- package/dist/transforms/tokenizer.js +137 -0
- package/dist/transforms/tokenizer.js.map +1 -0
- package/dist/transforms/tokenizer.test.d.ts +2 -0
- package/dist/transforms/tokenizer.test.d.ts.map +1 -0
- package/dist/transforms/tokenizer.test.js +85 -0
- package/dist/transforms/tokenizer.test.js.map +1 -0
- package/dist/transforms/transforms/biz-jargon.d.ts +7 -0
- package/dist/transforms/transforms/biz-jargon.d.ts.map +1 -0
- package/dist/transforms/transforms/biz-jargon.js +117 -0
- package/dist/transforms/transforms/biz-jargon.js.map +1 -0
- package/dist/transforms/transforms/emoji.d.ts +7 -0
- package/dist/transforms/transforms/emoji.d.ts.map +1 -0
- package/dist/transforms/transforms/emoji.js +127 -0
- package/dist/transforms/transforms/emoji.js.map +1 -0
- package/dist/transforms/transforms/index.d.ts +17 -0
- package/dist/transforms/transforms/index.d.ts.map +1 -0
- package/dist/transforms/transforms/index.js +37 -0
- package/dist/transforms/transforms/index.js.map +1 -0
- package/dist/transforms/transforms/leet.d.ts +7 -0
- package/dist/transforms/transforms/leet.d.ts.map +1 -0
- package/dist/transforms/transforms/leet.js +109 -0
- package/dist/transforms/transforms/leet.js.map +1 -0
- package/dist/transforms/transforms/mock-case.d.ts +7 -0
- package/dist/transforms/transforms/mock-case.d.ts.map +1 -0
- package/dist/transforms/transforms/mock-case.js +116 -0
- package/dist/transforms/transforms/mock-case.js.map +1 -0
- package/dist/transforms/transforms/pig-latin.d.ts +7 -0
- package/dist/transforms/transforms/pig-latin.d.ts.map +1 -0
- package/dist/transforms/transforms/pig-latin.js +132 -0
- package/dist/transforms/transforms/pig-latin.js.map +1 -0
- package/dist/transforms/transforms/pig-latin.test.d.ts +2 -0
- package/dist/transforms/transforms/pig-latin.test.d.ts.map +1 -0
- package/dist/transforms/transforms/pig-latin.test.js +77 -0
- package/dist/transforms/transforms/pig-latin.test.js.map +1 -0
- package/dist/transforms/transforms/pirate.d.ts +7 -0
- package/dist/transforms/transforms/pirate.d.ts.map +1 -0
- package/dist/transforms/transforms/pirate.js +150 -0
- package/dist/transforms/transforms/pirate.js.map +1 -0
- package/dist/transforms/transforms/redact.d.ts +7 -0
- package/dist/transforms/transforms/redact.d.ts.map +1 -0
- package/dist/transforms/transforms/redact.js +109 -0
- package/dist/transforms/transforms/redact.js.map +1 -0
- package/dist/transforms/transforms/reverse-words.d.ts +7 -0
- package/dist/transforms/transforms/reverse-words.d.ts.map +1 -0
- package/dist/transforms/transforms/reverse-words.js +88 -0
- package/dist/transforms/transforms/reverse-words.js.map +1 -0
- package/dist/transforms/transforms/transforms.test.d.ts +11 -0
- package/dist/transforms/transforms/transforms.test.d.ts.map +1 -0
- package/dist/transforms/transforms/transforms.test.js +489 -0
- package/dist/transforms/transforms/transforms.test.js.map +1 -0
- package/dist/transforms/transforms/ubbi-dubbi.d.ts +7 -0
- package/dist/transforms/transforms/ubbi-dubbi.d.ts.map +1 -0
- package/dist/transforms/transforms/ubbi-dubbi.js +120 -0
- package/dist/transforms/transforms/ubbi-dubbi.js.map +1 -0
- package/dist/transforms/transforms/uwu.d.ts +7 -0
- package/dist/transforms/transforms/uwu.d.ts.map +1 -0
- package/dist/transforms/transforms/uwu.js +106 -0
- package/dist/transforms/transforms/uwu.js.map +1 -0
- package/dist/transforms/types.d.ts +159 -0
- package/dist/transforms/types.d.ts.map +1 -0
- package/dist/transforms/types.js +22 -0
- package/dist/transforms/types.js.map +1 -0
- package/dist/types/api.d.ts +158 -0
- package/dist/types/api.d.ts.map +1 -0
- package/dist/types/api.js +6 -0
- package/dist/types/api.js.map +1 -0
- package/dist/types/config.d.ts +86 -0
- package/dist/types/config.d.ts.map +1 -0
- package/dist/types/config.js +66 -0
- package/dist/types/config.js.map +1 -0
- package/dist/types/context.d.ts +74 -0
- package/dist/types/context.d.ts.map +1 -0
- package/dist/types/context.js +83 -0
- package/dist/types/context.js.map +1 -0
- package/dist/types/index.d.ts +7 -0
- package/dist/types/index.d.ts.map +1 -0
- package/dist/types/index.js +3 -0
- package/dist/types/index.js.map +1 -0
- package/dist/types/lexicon.d.ts +247 -0
- package/dist/types/lexicon.d.ts.map +1 -0
- package/dist/types/lexicon.js +6 -0
- package/dist/types/lexicon.js.map +1 -0
- package/examples/basic-usage.ts +48 -0
- package/examples/corporate-lexicon.ts +71 -0
- package/examples/lexicons/corporate-min.json +200 -0
- package/examples/with-tracing.ts +85 -0
- package/package.json +70 -0
|
@@ -0,0 +1,150 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Pirate Transform (id="pirate")
|
|
3
|
+
* Phrase substitutions + interjections.
|
|
4
|
+
*/
|
|
5
|
+
import { isProtected } from '../protection.js';
|
|
6
|
+
const DEFAULT_PHRASE_MAP = {
|
|
7
|
+
'my': 'me',
|
|
8
|
+
'you': 'ye',
|
|
9
|
+
'your': 'yer',
|
|
10
|
+
'is': 'be',
|
|
11
|
+
'are': 'be',
|
|
12
|
+
'am': 'be',
|
|
13
|
+
'friend': 'matey',
|
|
14
|
+
'friends': 'mateys',
|
|
15
|
+
'hello': 'ahoy',
|
|
16
|
+
'hi': 'ahoy',
|
|
17
|
+
'the': 'th\'',
|
|
18
|
+
'money': 'booty',
|
|
19
|
+
'treasure': 'booty',
|
|
20
|
+
'man': 'landlubber',
|
|
21
|
+
'woman': 'lass',
|
|
22
|
+
'boy': 'lad',
|
|
23
|
+
'girl': 'lass',
|
|
24
|
+
'sir': 'cap\'n',
|
|
25
|
+
'madam': 'lass',
|
|
26
|
+
'fight': 'duel',
|
|
27
|
+
'food': 'grub',
|
|
28
|
+
'drink': 'grog',
|
|
29
|
+
'ocean': 'sea',
|
|
30
|
+
'jail': 'brig',
|
|
31
|
+
'stupid': 'scurvy',
|
|
32
|
+
'old': 'barnacled',
|
|
33
|
+
};
|
|
34
|
+
const DEFAULT_INTERJECTIONS = ['Arr!', 'Yo-ho-ho!', 'Ahoy!', 'Shiver me timbers!', 'Blimey!'];
|
|
35
|
+
const DEFAULT_PARAMS = {
|
|
36
|
+
phraseMap: DEFAULT_PHRASE_MAP,
|
|
37
|
+
interjections: DEFAULT_INTERJECTIONS,
|
|
38
|
+
interjectionRate: 0.05,
|
|
39
|
+
preserveCase: true,
|
|
40
|
+
};
|
|
41
|
+
function matchCase(source, target) {
|
|
42
|
+
if (source.length === 0 || target.length === 0)
|
|
43
|
+
return target;
|
|
44
|
+
// All uppercase
|
|
45
|
+
if (source === source.toUpperCase() && source !== source.toLowerCase()) {
|
|
46
|
+
return target.toUpperCase();
|
|
47
|
+
}
|
|
48
|
+
// Title case (first letter uppercase)
|
|
49
|
+
if (source[0] >= 'A' && source[0] <= 'Z') {
|
|
50
|
+
return target[0].toUpperCase() + target.slice(1);
|
|
51
|
+
}
|
|
52
|
+
return target.toLowerCase();
|
|
53
|
+
}
|
|
54
|
+
export const pirateTransform = {
|
|
55
|
+
id: 'pirate',
|
|
56
|
+
version: '1.0.0',
|
|
57
|
+
capabilities: {
|
|
58
|
+
requiresTrace: false,
|
|
59
|
+
posAware: false,
|
|
60
|
+
deterministic: true,
|
|
61
|
+
safeToStack: true,
|
|
62
|
+
preferredOrder: 10,
|
|
63
|
+
},
|
|
64
|
+
validateParams(params) {
|
|
65
|
+
const errors = [];
|
|
66
|
+
if (params && typeof params === 'object') {
|
|
67
|
+
const p = params;
|
|
68
|
+
if (p.interjectionRate !== undefined) {
|
|
69
|
+
const rate = p.interjectionRate;
|
|
70
|
+
if (typeof rate !== 'number' || rate < 0 || rate > 1) {
|
|
71
|
+
errors.push('interjectionRate must be between 0 and 1');
|
|
72
|
+
}
|
|
73
|
+
}
|
|
74
|
+
if (p.phraseMap !== undefined && (typeof p.phraseMap !== 'object' || p.phraseMap === null)) {
|
|
75
|
+
errors.push('phraseMap must be an object');
|
|
76
|
+
}
|
|
77
|
+
if (p.interjections !== undefined && !Array.isArray(p.interjections)) {
|
|
78
|
+
errors.push('interjections must be an array');
|
|
79
|
+
}
|
|
80
|
+
}
|
|
81
|
+
return { valid: errors.length === 0, errors };
|
|
82
|
+
},
|
|
83
|
+
apply(input) {
|
|
84
|
+
const params = {
|
|
85
|
+
...DEFAULT_PARAMS,
|
|
86
|
+
...input.params,
|
|
87
|
+
phraseMap: {
|
|
88
|
+
...DEFAULT_PHRASE_MAP,
|
|
89
|
+
...(input.params.phraseMap ?? {}),
|
|
90
|
+
},
|
|
91
|
+
};
|
|
92
|
+
const tokens = [];
|
|
93
|
+
// Build lowercase lookup
|
|
94
|
+
const lowerMap = new Map();
|
|
95
|
+
for (const [k, v] of Object.entries(params.phraseMap)) {
|
|
96
|
+
lowerMap.set(k.toLowerCase(), v);
|
|
97
|
+
}
|
|
98
|
+
// Maybe prepend interjection at start of sentence
|
|
99
|
+
let insertedInterjection = false;
|
|
100
|
+
if (params.interjections.length > 0 && input.rng.chance(params.interjectionRate)) {
|
|
101
|
+
// Find first word token
|
|
102
|
+
const firstWordIdx = input.tokens.findIndex(t => t.type === 'word');
|
|
103
|
+
if (firstWordIdx >= 0) {
|
|
104
|
+
insertedInterjection = true;
|
|
105
|
+
}
|
|
106
|
+
}
|
|
107
|
+
// Process tokens
|
|
108
|
+
let isFirst = true;
|
|
109
|
+
for (let i = 0; i < input.tokens.length; i++) {
|
|
110
|
+
const token = input.tokens[i];
|
|
111
|
+
// Insert interjection before first word
|
|
112
|
+
if (insertedInterjection && isFirst && token.type === 'word') {
|
|
113
|
+
const interjection = input.rng.pick(params.interjections);
|
|
114
|
+
tokens.push({ type: 'word', value: interjection });
|
|
115
|
+
tokens.push({ type: 'whitespace', value: ' ' });
|
|
116
|
+
// Lowercase the formerly-capitalized first word since interjection takes the capital
|
|
117
|
+
if (params.preserveCase && token.value[0] >= 'A' && token.value[0] <= 'Z') {
|
|
118
|
+
const lowerFirst = token.value[0].toLowerCase() + token.value.slice(1);
|
|
119
|
+
const replacement = lowerMap.get(lowerFirst.toLowerCase());
|
|
120
|
+
if (replacement && !isProtected(token)) {
|
|
121
|
+
tokens.push({ ...token, value: replacement });
|
|
122
|
+
}
|
|
123
|
+
else {
|
|
124
|
+
tokens.push({ ...token, value: lowerFirst });
|
|
125
|
+
}
|
|
126
|
+
isFirst = false;
|
|
127
|
+
continue;
|
|
128
|
+
}
|
|
129
|
+
}
|
|
130
|
+
if (token.type === 'word' && !isProtected(token)) {
|
|
131
|
+
const lower = token.value.toLowerCase();
|
|
132
|
+
const replacement = lowerMap.get(lower);
|
|
133
|
+
if (replacement) {
|
|
134
|
+
const cased = params.preserveCase ? matchCase(token.value, replacement) : replacement;
|
|
135
|
+
tokens.push({ ...token, value: cased });
|
|
136
|
+
}
|
|
137
|
+
else {
|
|
138
|
+
tokens.push({ ...token });
|
|
139
|
+
}
|
|
140
|
+
}
|
|
141
|
+
else {
|
|
142
|
+
tokens.push({ ...token });
|
|
143
|
+
}
|
|
144
|
+
if (token.type === 'word')
|
|
145
|
+
isFirst = false;
|
|
146
|
+
}
|
|
147
|
+
return { tokens };
|
|
148
|
+
},
|
|
149
|
+
};
|
|
150
|
+
//# sourceMappingURL=pirate.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"pirate.js","sourceRoot":"","sources":["../../../src/transforms/transforms/pirate.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAUH,OAAO,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAS/C,MAAM,kBAAkB,GAA2B;IACjD,IAAI,EAAE,IAAI;IACV,KAAK,EAAE,IAAI;IACX,MAAM,EAAE,KAAK;IACb,IAAI,EAAE,IAAI;IACV,KAAK,EAAE,IAAI;IACX,IAAI,EAAE,IAAI;IACV,QAAQ,EAAE,OAAO;IACjB,SAAS,EAAE,QAAQ;IACnB,OAAO,EAAE,MAAM;IACf,IAAI,EAAE,MAAM;IACZ,KAAK,EAAE,MAAM;IACb,OAAO,EAAE,OAAO;IAChB,UAAU,EAAE,OAAO;IACnB,KAAK,EAAE,YAAY;IACnB,OAAO,EAAE,MAAM;IACf,KAAK,EAAE,KAAK;IACZ,MAAM,EAAE,MAAM;IACd,KAAK,EAAE,QAAQ;IACf,OAAO,EAAE,MAAM;IACf,OAAO,EAAE,MAAM;IACf,MAAM,EAAE,MAAM;IACd,OAAO,EAAE,MAAM;IACf,OAAO,EAAE,KAAK;IACd,MAAM,EAAE,MAAM;IACd,QAAQ,EAAE,QAAQ;IAClB,KAAK,EAAE,WAAW;CACnB,CAAC;AAEF,MAAM,qBAAqB,GAAG,CAAC,MAAM,EAAE,WAAW,EAAE,OAAO,EAAE,oBAAoB,EAAE,SAAS,CAAC,CAAC;AAE9F,MAAM,cAAc,GAAiB;IACnC,SAAS,EAAE,kBAAkB;IAC7B,aAAa,EAAE,qBAAqB;IACpC,gBAAgB,EAAE,IAAI;IACtB,YAAY,EAAE,IAAI;CACnB,CAAC;AAEF,SAAS,SAAS,CAAC,MAAc,EAAE,MAAc;IAC/C,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC,IAAI,MAAM,CAAC,MAAM,KAAK,CAAC;QAAE,OAAO,MAAM,CAAC;IAC9D,gBAAgB;IAChB,IAAI,MAAM,KAAK,MAAM,CAAC,WAAW,EAAE,IAAI,MAAM,KAAK,MAAM,CAAC,WAAW,EAAE,EAAE,CAAC;QACvE,OAAO,MAAM,CAAC,WAAW,EAAE,CAAC;IAC9B,CAAC;IACD,sCAAsC;IACtC,IAAI,MAAM,CAAC,CAAC,CAAE,IAAI,GAAG,IAAI,MAAM,CAAC,CAAC,CAAE,IAAI,GAAG,EAAE,CAAC;QAC3C,OAAO,MAAM,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,GAAG,MAAM,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;IACpD,CAAC;IACD,OAAO,MAAM,CAAC,WAAW,EAAE,CAAC;AAC9B,CAAC;AAED,MAAM,CAAC,MAAM,eAAe,GAAqB;IAC/C,EAAE,EAAE,QAAQ;IACZ,OAAO,EAAE,OAAO;IAChB,YAAY,EAAE;QACZ,aAAa,EAAE,KAAK;QACpB,QAAQ,EAAE,KAAK;QACf,aAAa,EAAE,IAAI;QACnB,WAAW,EAAE,IAAI;QACjB,cAAc,EAAE,EAAE;KACa;IAEjC,cAAc,CAAC,MAAe;QAC5B,MAAM,MAAM,GAAa,EAAE,CAAC;QAC5B,IAAI,MAAM,IAAI,OAAO,MAAM,KAAK,QAAQ,EAAE,CAAC;YACzC,MAAM,CAAC,GAAG,MAAiC,CAAC;YAC5C,IAAI,CAAC,CAAC,gBAAgB,KAAK,SAAS,EAAE,CAAC;gBACrC,MAAM,IAAI,GAAG,CAAC,CAAC,gBAA0B,CAAC;gBAC1C,IAAI,OAAO,IAAI,KAAK,QAAQ,IAAI,IAAI,GAAG,CAAC,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;oBACrD,MAAM,CAAC,IAAI,CAAC,0CAA0C,CAAC,CAAC;gBAC1D,CAAC;YACH,CAAC;YACD,IAAI,CAAC,CAAC,SAAS,KAAK,SAAS,IAAI,CAAC,OAAO,CAAC,CAAC,SAAS,KAAK,QAAQ,IAAI,CAAC,CAAC,SAAS,KAAK,IAAI,CAAC,EAAE,CAAC;gBAC3F,MAAM,CAAC,IAAI,CAAC,6BAA6B,CAAC,CAAC;YAC7C,CAAC;YACD,IAAI,CAAC,CAAC,aAAa,KAAK,SAAS,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,aAAa,CAAC,EAAE,CAAC;gBACrE,MAAM,CAAC,IAAI,CAAC,gCAAgC,CAAC,CAAC;YAChD,CAAC;QACH,CAAC;QACD,OAAO,EAAE,KAAK,EAAE,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;IAChD,CAAC;IAED,KAAK,CAAC,KAAqB;QACzB,MAAM,MAAM,GAAiB;YAC3B,GAAG,cAAc;YACjB,GAAI,KAAK,CAAC,MAAgC;YAC1C,SAAS,EAAE;gBACT,GAAG,kBAAkB;gBACrB,GAAG,CAAE,KAAK,CAAC,MAAgC,CAAC,SAAS,IAAI,EAAE,CAAC;aAC7D;SACF,CAAC;QACF,MAAM,MAAM,GAAY,EAAE,CAAC;QAE3B,yBAAyB;QACzB,MAAM,QAAQ,GAAG,IAAI,GAAG,EAAkB,CAAC;QAC3C,KAAK,MAAM,CAAC,CAAC,EAAE,CAAC,CAAC,IAAI,MAAM,CAAC,OAAO,CAAC,MAAM,CAAC,SAAS,CAAC,EAAE,CAAC;YACtD,QAAQ,CAAC,GAAG,CAAC,CAAC,CAAC,WAAW,EAAE,EAAE,CAAC,CAAC,CAAC;QACnC,CAAC;QAED,kDAAkD;QAClD,IAAI,oBAAoB,GAAG,KAAK,CAAC;QACjC,IAAI,MAAM,CAAC,aAAa,CAAC,MAAM,GAAG,CAAC,IAAI,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,gBAAgB,CAAC,EAAE,CAAC;YACjF,wBAAwB;YACxB,MAAM,YAAY,GAAG,KAAK,CAAC,MAAM,CAAC,SAAS,CAAC,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,IAAI,KAAK,MAAM,CAAC,CAAC;YACpE,IAAI,YAAY,IAAI,CAAC,EAAE,CAAC;gBACtB,oBAAoB,GAAG,IAAI,CAAC;YAC9B,CAAC;QACH,CAAC;QAED,iBAAiB;QACjB,IAAI,OAAO,GAAG,IAAI,CAAC;QACnB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YAC7C,MAAM,KAAK,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAE,CAAC;YAE/B,wCAAwC;YACxC,IAAI,oBAAoB,IAAI,OAAO,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM,EAAE,CAAC;gBAC7D,MAAM,YAAY,GAAG,KAAK,CAAC,GAAG,CAAC,IAAI,CAAC,MAAM,CAAC,aAAa,CAAC,CAAC;gBAC1D,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,MAAM,EAAE,KAAK,EAAE,YAAY,EAAE,CAAC,CAAC;gBACnD,MAAM,CAAC,IAAI,CAAC,EAAE,IAAI,EAAE,YAAY,EAAE,KAAK,EAAE,GAAG,EAAE,CAAC,CAAC;gBAChD,qFAAqF;gBACrF,IAAI,MAAM,CAAC,YAAY,IAAI,KAAK,CAAC,KAAK,CAAC,CAAC,CAAE,IAAI,GAAG,IAAI,KAAK,CAAC,KAAK,CAAC,CAAC,CAAE,IAAI,GAAG,EAAE,CAAC;oBAC5E,MAAM,UAAU,GAAG,KAAK,CAAC,KAAK,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,GAAG,KAAK,CAAC,KAAK,CAAC,KAAK,CAAC,CAAC,CAAC,CAAC;oBACxE,MAAM,WAAW,GAAG,QAAQ,CAAC,GAAG,CAAC,UAAU,CAAC,WAAW,EAAE,CAAC,CAAC;oBAC3D,IAAI,WAAW,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;wBACvC,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,WAAW,EAAE,CAAC,CAAC;oBAChD,CAAC;yBAAM,CAAC;wBACN,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,UAAU,EAAE,CAAC,CAAC;oBAC/C,CAAC;oBACD,OAAO,GAAG,KAAK,CAAC;oBAChB,SAAS;gBACX,CAAC;YACH,CAAC;YAED,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;gBACjD,MAAM,KAAK,GAAG,KAAK,CAAC,KAAK,CAAC,WAAW,EAAE,CAAC;gBACxC,MAAM,WAAW,GAAG,QAAQ,CAAC,GAAG,CAAC,KAAK,CAAC,CAAC;gBACxC,IAAI,WAAW,EAAE,CAAC;oBAChB,MAAM,KAAK,GAAG,MAAM,CAAC,YAAY,CAAC,CAAC,CAAC,SAAS,CAAC,KAAK,CAAC,KAAK,EAAE,WAAW,CAAC,CAAC,CAAC,CAAC,WAAW,CAAC;oBACtF,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,KAAK,EAAE,CAAC,CAAC;gBAC1C,CAAC;qBAAM,CAAC;oBACN,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,CAAC,CAAC;gBAC5B,CAAC;YACH,CAAC;iBAAM,CAAC;gBACN,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,CAAC,CAAC;YAC5B,CAAC;YAED,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM;gBAAE,OAAO,GAAG,KAAK,CAAC;QAC7C,CAAC;QAED,OAAO,EAAE,MAAM,EAAE,CAAC;IACpB,CAAC;CACF,CAAC"}
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"redact.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/redact.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,gBAAgB,EAMjB,MAAM,aAAa,CAAC;AA8BrB,eAAO,MAAM,eAAe,EAAE,gBA+F7B,CAAC"}
|
|
@@ -0,0 +1,109 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Redaction Transform (id="redact")
|
|
3
|
+
* Redact certain tokens while keeping grammar readable.
|
|
4
|
+
*/
|
|
5
|
+
import { isProtected } from '../protection.js';
|
|
6
|
+
const DEFAULT_PARAMS = {
|
|
7
|
+
rate: 0.10,
|
|
8
|
+
targets: ['noun', 'properNoun'],
|
|
9
|
+
style: '[REDACTED]',
|
|
10
|
+
minTokenLength: 4,
|
|
11
|
+
preserveCase: false,
|
|
12
|
+
};
|
|
13
|
+
const STYLE_MAP = {
|
|
14
|
+
'[REDACTED]': '[REDACTED]',
|
|
15
|
+
'\u2588\u2588\u2588\u2588': '\u2588\u2588\u2588\u2588',
|
|
16
|
+
'blackBar': '\u2588\u2588\u2588\u2588',
|
|
17
|
+
};
|
|
18
|
+
/** Heuristic: title-case word not at sentence start might be a proper noun */
|
|
19
|
+
function isTitleCase(word) {
|
|
20
|
+
return word.length > 1 && word[0] >= 'A' && word[0] <= 'Z' && word[1] >= 'a' && word[1] <= 'z';
|
|
21
|
+
}
|
|
22
|
+
export const redactTransform = {
|
|
23
|
+
id: 'redact',
|
|
24
|
+
version: '1.0.0',
|
|
25
|
+
capabilities: {
|
|
26
|
+
requiresTrace: false,
|
|
27
|
+
posAware: false,
|
|
28
|
+
deterministic: true,
|
|
29
|
+
safeToStack: true,
|
|
30
|
+
preferredOrder: 60,
|
|
31
|
+
},
|
|
32
|
+
validateParams(params) {
|
|
33
|
+
const errors = [];
|
|
34
|
+
if (params && typeof params === 'object') {
|
|
35
|
+
const p = params;
|
|
36
|
+
if (p.rate !== undefined) {
|
|
37
|
+
const rate = p.rate;
|
|
38
|
+
if (typeof rate !== 'number' || rate < 0 || rate > 1) {
|
|
39
|
+
errors.push('rate must be between 0 and 1');
|
|
40
|
+
}
|
|
41
|
+
}
|
|
42
|
+
if (p.targets !== undefined && !Array.isArray(p.targets)) {
|
|
43
|
+
errors.push('targets must be an array');
|
|
44
|
+
}
|
|
45
|
+
if (p.style !== undefined) {
|
|
46
|
+
const valid = ['[REDACTED]', '\u2588\u2588\u2588\u2588', 'blackBar'];
|
|
47
|
+
if (!valid.includes(p.style)) {
|
|
48
|
+
errors.push('style must be "[REDACTED]", "████", or "blackBar"');
|
|
49
|
+
}
|
|
50
|
+
}
|
|
51
|
+
if (p.minTokenLength !== undefined && (typeof p.minTokenLength !== 'number' || p.minTokenLength < 0)) {
|
|
52
|
+
errors.push('minTokenLength must be a non-negative number');
|
|
53
|
+
}
|
|
54
|
+
}
|
|
55
|
+
return { valid: errors.length === 0, errors };
|
|
56
|
+
},
|
|
57
|
+
apply(input) {
|
|
58
|
+
const params = { ...DEFAULT_PARAMS, ...input.params };
|
|
59
|
+
const tokens = [];
|
|
60
|
+
const redactStyle = STYLE_MAP[params.style] ?? '[REDACTED]';
|
|
61
|
+
// Determine which tokens are at sentence start (for properNoun heuristic)
|
|
62
|
+
const sentenceStarts = new Set();
|
|
63
|
+
let afterPunct = true;
|
|
64
|
+
for (let i = 0; i < input.tokens.length; i++) {
|
|
65
|
+
const t = input.tokens[i];
|
|
66
|
+
if (t.type === 'word') {
|
|
67
|
+
if (afterPunct)
|
|
68
|
+
sentenceStarts.add(i);
|
|
69
|
+
afterPunct = false;
|
|
70
|
+
}
|
|
71
|
+
if (t.type === 'punct' && (t.value === '.' || t.value === '!' || t.value === '?')) {
|
|
72
|
+
afterPunct = true;
|
|
73
|
+
}
|
|
74
|
+
}
|
|
75
|
+
const targetsSet = new Set(params.targets);
|
|
76
|
+
for (let i = 0; i < input.tokens.length; i++) {
|
|
77
|
+
const token = input.tokens[i];
|
|
78
|
+
if (token.type === 'number' && targetsSet.has('number') && !isProtected(token)) {
|
|
79
|
+
if (input.rng.chance(params.rate)) {
|
|
80
|
+
tokens.push({ ...token, value: redactStyle, type: 'symbol' });
|
|
81
|
+
continue;
|
|
82
|
+
}
|
|
83
|
+
}
|
|
84
|
+
if (token.type === 'word' && !isProtected(token) && token.value.length >= params.minTokenLength) {
|
|
85
|
+
let shouldRedact = false;
|
|
86
|
+
if (targetsSet.has('any')) {
|
|
87
|
+
shouldRedact = input.rng.chance(params.rate);
|
|
88
|
+
}
|
|
89
|
+
else {
|
|
90
|
+
// Proper noun heuristic
|
|
91
|
+
if (targetsSet.has('properNoun') && isTitleCase(token.value) && !sentenceStarts.has(i)) {
|
|
92
|
+
shouldRedact = input.rng.chance(params.rate);
|
|
93
|
+
}
|
|
94
|
+
// Noun heuristic: use rate as probability for every eligible word
|
|
95
|
+
if (!shouldRedact && targetsSet.has('noun')) {
|
|
96
|
+
shouldRedact = input.rng.chance(params.rate);
|
|
97
|
+
}
|
|
98
|
+
}
|
|
99
|
+
if (shouldRedact) {
|
|
100
|
+
tokens.push({ ...token, value: redactStyle, type: 'symbol' });
|
|
101
|
+
continue;
|
|
102
|
+
}
|
|
103
|
+
}
|
|
104
|
+
tokens.push({ ...token });
|
|
105
|
+
}
|
|
106
|
+
return { tokens };
|
|
107
|
+
},
|
|
108
|
+
};
|
|
109
|
+
//# sourceMappingURL=redact.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"redact.js","sourceRoot":"","sources":["../../../src/transforms/transforms/redact.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAUH,OAAO,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAU/C,MAAM,cAAc,GAAiB;IACnC,IAAI,EAAE,IAAI;IACV,OAAO,EAAE,CAAC,MAAM,EAAE,YAAY,CAAC;IAC/B,KAAK,EAAE,YAAY;IACnB,cAAc,EAAE,CAAC;IACjB,YAAY,EAAE,KAAK;CACpB,CAAC;AAEF,MAAM,SAAS,GAA2B;IACxC,YAAY,EAAE,YAAY;IAC1B,0BAA0B,EAAE,0BAA0B;IACtD,UAAU,EAAE,0BAA0B;CACvC,CAAC;AAEF,8EAA8E;AAC9E,SAAS,WAAW,CAAC,IAAY;IAC/B,OAAO,IAAI,CAAC,MAAM,GAAG,CAAC,IAAI,IAAI,CAAC,CAAC,CAAE,IAAI,GAAG,IAAI,IAAI,CAAC,CAAC,CAAE,IAAI,GAAG,IAAI,IAAI,CAAC,CAAC,CAAE,IAAI,GAAG,IAAI,IAAI,CAAC,CAAC,CAAE,IAAI,GAAG,CAAC;AACrG,CAAC;AAED,MAAM,CAAC,MAAM,eAAe,GAAqB;IAC/C,EAAE,EAAE,QAAQ;IACZ,OAAO,EAAE,OAAO;IAChB,YAAY,EAAE;QACZ,aAAa,EAAE,KAAK;QACpB,QAAQ,EAAE,KAAK;QACf,aAAa,EAAE,IAAI;QACnB,WAAW,EAAE,IAAI;QACjB,cAAc,EAAE,EAAE;KACa;IAEjC,cAAc,CAAC,MAAe;QAC5B,MAAM,MAAM,GAAa,EAAE,CAAC;QAC5B,IAAI,MAAM,IAAI,OAAO,MAAM,KAAK,QAAQ,EAAE,CAAC;YACzC,MAAM,CAAC,GAAG,MAAiC,CAAC;YAC5C,IAAI,CAAC,CAAC,IAAI,KAAK,SAAS,EAAE,CAAC;gBACzB,MAAM,IAAI,GAAG,CAAC,CAAC,IAAc,CAAC;gBAC9B,IAAI,OAAO,IAAI,KAAK,QAAQ,IAAI,IAAI,GAAG,CAAC,IAAI,IAAI,GAAG,CAAC,EAAE,CAAC;oBACrD,MAAM,CAAC,IAAI,CAAC,8BAA8B,CAAC,CAAC;gBAC9C,CAAC;YACH,CAAC;YACD,IAAI,CAAC,CAAC,OAAO,KAAK,SAAS,IAAI,CAAC,KAAK,CAAC,OAAO,CAAC,CAAC,CAAC,OAAO,CAAC,EAAE,CAAC;gBACzD,MAAM,CAAC,IAAI,CAAC,0BAA0B,CAAC,CAAC;YAC1C,CAAC;YACD,IAAI,CAAC,CAAC,KAAK,KAAK,SAAS,EAAE,CAAC;gBAC1B,MAAM,KAAK,GAAG,CAAC,YAAY,EAAE,0BAA0B,EAAE,UAAU,CAAC,CAAC;gBACrE,IAAI,CAAC,KAAK,CAAC,QAAQ,CAAC,CAAC,CAAC,KAAe,CAAC,EAAE,CAAC;oBACvC,MAAM,CAAC,IAAI,CAAC,mDAAmD,CAAC,CAAC;gBACnE,CAAC;YACH,CAAC;YACD,IAAI,CAAC,CAAC,cAAc,KAAK,SAAS,IAAI,CAAC,OAAO,CAAC,CAAC,cAAc,KAAK,QAAQ,IAAI,CAAC,CAAC,cAAc,GAAG,CAAC,CAAC,EAAE,CAAC;gBACrG,MAAM,CAAC,IAAI,CAAC,8CAA8C,CAAC,CAAC;YAC9D,CAAC;QACH,CAAC;QACD,OAAO,EAAE,KAAK,EAAE,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;IAChD,CAAC;IAED,KAAK,CAAC,KAAqB;QACzB,MAAM,MAAM,GAAiB,EAAE,GAAG,cAAc,EAAE,GAAI,KAAK,CAAC,MAAgC,EAAE,CAAC;QAC/F,MAAM,MAAM,GAAY,EAAE,CAAC;QAC3B,MAAM,WAAW,GAAG,SAAS,CAAC,MAAM,CAAC,KAAK,CAAC,IAAI,YAAY,CAAC;QAE5D,0EAA0E;QAC1E,MAAM,cAAc,GAAG,IAAI,GAAG,EAAU,CAAC;QACzC,IAAI,UAAU,GAAG,IAAI,CAAC;QACtB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YAC7C,MAAM,CAAC,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAE,CAAC;YAC3B,IAAI,CAAC,CAAC,IAAI,KAAK,MAAM,EAAE,CAAC;gBACtB,IAAI,UAAU;oBAAE,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC;gBACtC,UAAU,GAAG,KAAK,CAAC;YACrB,CAAC;YACD,IAAI,CAAC,CAAC,IAAI,KAAK,OAAO,IAAI,CAAC,CAAC,CAAC,KAAK,KAAK,GAAG,IAAI,CAAC,CAAC,KAAK,KAAK,GAAG,IAAI,CAAC,CAAC,KAAK,KAAK,GAAG,CAAC,EAAE,CAAC;gBAClF,UAAU,GAAG,IAAI,CAAC;YACpB,CAAC;QACH,CAAC;QAED,MAAM,UAAU,GAAG,IAAI,GAAG,CAAC,MAAM,CAAC,OAAO,CAAC,CAAC;QAE3C,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,KAAK,CAAC,MAAM,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YAC7C,MAAM,KAAK,GAAG,KAAK,CAAC,MAAM,CAAC,CAAC,CAAE,CAAC;YAE/B,IAAI,KAAK,CAAC,IAAI,KAAK,QAAQ,IAAI,UAAU,CAAC,GAAG,CAAC,QAAQ,CAAC,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;gBAC/E,IAAI,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,EAAE,CAAC;oBAClC,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,WAAW,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,CAAC;oBAC9D,SAAS;gBACX,CAAC;YACH,CAAC;YAED,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,IAAI,KAAK,CAAC,KAAK,CAAC,MAAM,IAAI,MAAM,CAAC,cAAc,EAAE,CAAC;gBAChG,IAAI,YAAY,GAAG,KAAK,CAAC;gBAEzB,IAAI,UAAU,CAAC,GAAG,CAAC,KAAK,CAAC,EAAE,CAAC;oBAC1B,YAAY,GAAG,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;gBAC/C,CAAC;qBAAM,CAAC;oBACN,wBAAwB;oBACxB,IAAI,UAAU,CAAC,GAAG,CAAC,YAAY,CAAC,IAAI,WAAW,CAAC,KAAK,CAAC,KAAK,CAAC,IAAI,CAAC,cAAc,CAAC,GAAG,CAAC,CAAC,CAAC,EAAE,CAAC;wBACvF,YAAY,GAAG,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;oBAC/C,CAAC;oBACD,kEAAkE;oBAClE,IAAI,CAAC,YAAY,IAAI,UAAU,CAAC,GAAG,CAAC,MAAM,CAAC,EAAE,CAAC;wBAC5C,YAAY,GAAG,KAAK,CAAC,GAAG,CAAC,MAAM,CAAC,MAAM,CAAC,IAAI,CAAC,CAAC;oBAC/C,CAAC;gBACH,CAAC;gBAED,IAAI,YAAY,EAAE,CAAC;oBACjB,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,WAAW,EAAE,IAAI,EAAE,QAAQ,EAAE,CAAC,CAAC;oBAC9D,SAAS;gBACX,CAAC;YACH,CAAC;YAED,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,CAAC,CAAC;QAC5B,CAAC;QAED,OAAO,EAAE,MAAM,EAAE,CAAC;IACpB,CAAC;CACF,CAAC"}
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Word Reverse Transform (id="reverseWords")
|
|
3
|
+
* Reverse letters per word, keep punctuation.
|
|
4
|
+
*/
|
|
5
|
+
import type { IOutputTransform } from '../types.js';
|
|
6
|
+
export declare const reverseWordsTransform: IOutputTransform;
|
|
7
|
+
//# sourceMappingURL=reverse-words.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"reverse-words.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/reverse-words.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAEH,OAAO,KAAK,EACV,gBAAgB,EAMjB,MAAM,aAAa,CAAC;AA4DrB,eAAO,MAAM,qBAAqB,EAAE,gBAoCnC,CAAC"}
|
|
@@ -0,0 +1,88 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Word Reverse Transform (id="reverseWords")
|
|
3
|
+
* Reverse letters per word, keep punctuation.
|
|
4
|
+
*/
|
|
5
|
+
import { isProtected } from '../protection.js';
|
|
6
|
+
const DEFAULT_PARAMS = {
|
|
7
|
+
mode: 'full',
|
|
8
|
+
preserveCase: true,
|
|
9
|
+
};
|
|
10
|
+
function isUpperCase(ch) {
|
|
11
|
+
return ch >= 'A' && ch <= 'Z';
|
|
12
|
+
}
|
|
13
|
+
function reverseWord(word, params) {
|
|
14
|
+
if (word.length <= 1)
|
|
15
|
+
return word;
|
|
16
|
+
if (params.mode === 'full') {
|
|
17
|
+
const reversed = word.split('').reverse().join('');
|
|
18
|
+
if (params.preserveCase) {
|
|
19
|
+
// Transfer original casing pattern to reversed string
|
|
20
|
+
let result = '';
|
|
21
|
+
for (let i = 0; i < reversed.length; i++) {
|
|
22
|
+
if (i < word.length && isUpperCase(word[i])) {
|
|
23
|
+
result += reversed[i].toUpperCase();
|
|
24
|
+
}
|
|
25
|
+
else {
|
|
26
|
+
result += reversed[i].toLowerCase();
|
|
27
|
+
}
|
|
28
|
+
}
|
|
29
|
+
return result;
|
|
30
|
+
}
|
|
31
|
+
return reversed;
|
|
32
|
+
}
|
|
33
|
+
// innerOnly: keep first and last letter fixed, reverse inner
|
|
34
|
+
if (word.length <= 2)
|
|
35
|
+
return word;
|
|
36
|
+
const first = word[0];
|
|
37
|
+
const last = word[word.length - 1];
|
|
38
|
+
const inner = word.slice(1, -1).split('').reverse().join('');
|
|
39
|
+
if (params.preserveCase) {
|
|
40
|
+
let result = '';
|
|
41
|
+
const combined = first + inner + last;
|
|
42
|
+
for (let i = 0; i < combined.length; i++) {
|
|
43
|
+
if (i < word.length && isUpperCase(word[i])) {
|
|
44
|
+
result += combined[i].toUpperCase();
|
|
45
|
+
}
|
|
46
|
+
else {
|
|
47
|
+
result += combined[i].toLowerCase();
|
|
48
|
+
}
|
|
49
|
+
}
|
|
50
|
+
return result;
|
|
51
|
+
}
|
|
52
|
+
return first + inner + last;
|
|
53
|
+
}
|
|
54
|
+
export const reverseWordsTransform = {
|
|
55
|
+
id: 'reverseWords',
|
|
56
|
+
version: '1.0.0',
|
|
57
|
+
capabilities: {
|
|
58
|
+
requiresTrace: false,
|
|
59
|
+
posAware: false,
|
|
60
|
+
deterministic: true,
|
|
61
|
+
safeToStack: true,
|
|
62
|
+
preferredOrder: 60,
|
|
63
|
+
},
|
|
64
|
+
validateParams(params) {
|
|
65
|
+
const errors = [];
|
|
66
|
+
if (params && typeof params === 'object') {
|
|
67
|
+
const p = params;
|
|
68
|
+
if (p.mode && p.mode !== 'full' && p.mode !== 'innerOnly') {
|
|
69
|
+
errors.push('mode must be "full" or "innerOnly"');
|
|
70
|
+
}
|
|
71
|
+
}
|
|
72
|
+
return { valid: errors.length === 0, errors };
|
|
73
|
+
},
|
|
74
|
+
apply(input) {
|
|
75
|
+
const params = { ...DEFAULT_PARAMS, ...input.params };
|
|
76
|
+
const tokens = [];
|
|
77
|
+
for (const token of input.tokens) {
|
|
78
|
+
if (token.type === 'word' && !isProtected(token)) {
|
|
79
|
+
tokens.push({ ...token, value: reverseWord(token.value, params) });
|
|
80
|
+
}
|
|
81
|
+
else {
|
|
82
|
+
tokens.push({ ...token });
|
|
83
|
+
}
|
|
84
|
+
}
|
|
85
|
+
return { tokens };
|
|
86
|
+
},
|
|
87
|
+
};
|
|
88
|
+
//# sourceMappingURL=reverse-words.js.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"reverse-words.js","sourceRoot":"","sources":["../../../src/transforms/transforms/reverse-words.ts"],"names":[],"mappings":"AAAA;;;GAGG;AAUH,OAAO,EAAE,WAAW,EAAE,MAAM,kBAAkB,CAAC;AAO/C,MAAM,cAAc,GAAuB;IACzC,IAAI,EAAE,MAAM;IACZ,YAAY,EAAE,IAAI;CACnB,CAAC;AAEF,SAAS,WAAW,CAAC,EAAU;IAC7B,OAAO,EAAE,IAAI,GAAG,IAAI,EAAE,IAAI,GAAG,CAAC;AAChC,CAAC;AAED,SAAS,WAAW,CAAC,IAAY,EAAE,MAA0B;IAC3D,IAAI,IAAI,CAAC,MAAM,IAAI,CAAC;QAAE,OAAO,IAAI,CAAC;IAElC,IAAI,MAAM,CAAC,IAAI,KAAK,MAAM,EAAE,CAAC;QAC3B,MAAM,QAAQ,GAAG,IAAI,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC,OAAO,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC;QACnD,IAAI,MAAM,CAAC,YAAY,EAAE,CAAC;YACxB,sDAAsD;YACtD,IAAI,MAAM,GAAG,EAAE,CAAC;YAChB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,QAAQ,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;gBACzC,IAAI,CAAC,GAAG,IAAI,CAAC,MAAM,IAAI,WAAW,CAAC,IAAI,CAAC,CAAC,CAAE,CAAC,EAAE,CAAC;oBAC7C,MAAM,IAAI,QAAQ,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,CAAC;gBACvC,CAAC;qBAAM,CAAC;oBACN,MAAM,IAAI,QAAQ,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,CAAC;gBACvC,CAAC;YACH,CAAC;YACD,OAAO,MAAM,CAAC;QAChB,CAAC;QACD,OAAO,QAAQ,CAAC;IAClB,CAAC;IAED,6DAA6D;IAC7D,IAAI,IAAI,CAAC,MAAM,IAAI,CAAC;QAAE,OAAO,IAAI,CAAC;IAElC,MAAM,KAAK,GAAG,IAAI,CAAC,CAAC,CAAE,CAAC;IACvB,MAAM,IAAI,GAAG,IAAI,CAAC,IAAI,CAAC,MAAM,GAAG,CAAC,CAAE,CAAC;IACpC,MAAM,KAAK,GAAG,IAAI,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,CAAC,CAAC,CAAC,KAAK,CAAC,EAAE,CAAC,CAAC,OAAO,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC,CAAC;IAE7D,IAAI,MAAM,CAAC,YAAY,EAAE,CAAC;QACxB,IAAI,MAAM,GAAG,EAAE,CAAC;QAChB,MAAM,QAAQ,GAAG,KAAK,GAAG,KAAK,GAAG,IAAI,CAAC;QACtC,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,QAAQ,CAAC,MAAM,EAAE,CAAC,EAAE,EAAE,CAAC;YACzC,IAAI,CAAC,GAAG,IAAI,CAAC,MAAM,IAAI,WAAW,CAAC,IAAI,CAAC,CAAC,CAAE,CAAC,EAAE,CAAC;gBAC7C,MAAM,IAAI,QAAQ,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,CAAC;YACvC,CAAC;iBAAM,CAAC;gBACN,MAAM,IAAI,QAAQ,CAAC,CAAC,CAAE,CAAC,WAAW,EAAE,CAAC;YACvC,CAAC;QACH,CAAC;QACD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,OAAO,KAAK,GAAG,KAAK,GAAG,IAAI,CAAC;AAC9B,CAAC;AAED,MAAM,CAAC,MAAM,qBAAqB,GAAqB;IACrD,EAAE,EAAE,cAAc;IAClB,OAAO,EAAE,OAAO;IAChB,YAAY,EAAE;QACZ,aAAa,EAAE,KAAK;QACpB,QAAQ,EAAE,KAAK;QACf,aAAa,EAAE,IAAI;QACnB,WAAW,EAAE,IAAI;QACjB,cAAc,EAAE,EAAE;KACa;IAEjC,cAAc,CAAC,MAAe;QAC5B,MAAM,MAAM,GAAa,EAAE,CAAC;QAC5B,IAAI,MAAM,IAAI,OAAO,MAAM,KAAK,QAAQ,EAAE,CAAC;YACzC,MAAM,CAAC,GAAG,MAAiC,CAAC;YAC5C,IAAI,CAAC,CAAC,IAAI,IAAI,CAAC,CAAC,IAAI,KAAK,MAAM,IAAI,CAAC,CAAC,IAAI,KAAK,WAAW,EAAE,CAAC;gBAC1D,MAAM,CAAC,IAAI,CAAC,oCAAoC,CAAC,CAAC;YACpD,CAAC;QACH,CAAC;QACD,OAAO,EAAE,KAAK,EAAE,MAAM,CAAC,MAAM,KAAK,CAAC,EAAE,MAAM,EAAE,CAAC;IAChD,CAAC;IAED,KAAK,CAAC,KAAqB;QACzB,MAAM,MAAM,GAAuB,EAAE,GAAG,cAAc,EAAE,GAAI,KAAK,CAAC,MAAsC,EAAE,CAAC;QAC3G,MAAM,MAAM,GAAY,EAAE,CAAC;QAE3B,KAAK,MAAM,KAAK,IAAI,KAAK,CAAC,MAAM,EAAE,CAAC;YACjC,IAAI,KAAK,CAAC,IAAI,KAAK,MAAM,IAAI,CAAC,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;gBACjD,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,KAAK,EAAE,WAAW,CAAC,KAAK,CAAC,KAAK,EAAE,MAAM,CAAC,EAAE,CAAC,CAAC;YACrE,CAAC;iBAAM,CAAC;gBACN,MAAM,CAAC,IAAI,CAAC,EAAE,GAAG,KAAK,EAAE,CAAC,CAAC;YAC5B,CAAC;QACH,CAAC;QAED,OAAO,EAAE,MAAM,EAAE,CAAC;IACpB,CAAC;CACF,CAAC"}
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
/**
|
|
2
|
+
* Comprehensive tests for all V1 transforms.
|
|
3
|
+
* At least 10 tests per transform covering:
|
|
4
|
+
* - basic behavior
|
|
5
|
+
* - casing
|
|
6
|
+
* - punctuation preservation
|
|
7
|
+
* - protected token behavior
|
|
8
|
+
* - determinism with seed
|
|
9
|
+
*/
|
|
10
|
+
export {};
|
|
11
|
+
//# sourceMappingURL=transforms.test.d.ts.map
|
|
@@ -0,0 +1 @@
|
|
|
1
|
+
{"version":3,"file":"transforms.test.d.ts","sourceRoot":"","sources":["../../../src/transforms/transforms/transforms.test.ts"],"names":[],"mappings":"AAAA;;;;;;;;GAQG"}
|