npm - cspell-dictionary - Versions diffs - 6.9.0 - Mend

cspell-dictionary 6.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (77) hide show

package/LICENSE +21 -0
package/README.md +3 -0
package/dist/SpellingDictionary/Dictionaries.d.ts +9 -0
package/dist/SpellingDictionary/Dictionaries.js +61 -0
package/dist/SpellingDictionary/SpellingDictionary.d.ts +93 -0
package/dist/SpellingDictionary/SpellingDictionary.js +6 -0
package/dist/SpellingDictionary/SpellingDictionaryCollection.d.ts +34 -0
package/dist/SpellingDictionary/SpellingDictionaryCollection.js +111 -0
package/dist/SpellingDictionary/SpellingDictionaryError.d.ts +10 -0
package/dist/SpellingDictionary/SpellingDictionaryError.js +18 -0
package/dist/SpellingDictionary/SpellingDictionaryFromTrie.d.ts +36 -0
package/dist/SpellingDictionary/SpellingDictionaryFromTrie.js +148 -0
package/dist/SpellingDictionary/SpellingDictionaryMethods.d.ts +29 -0
package/dist/SpellingDictionary/SpellingDictionaryMethods.js +114 -0
package/dist/SpellingDictionary/charset.d.ts +3 -0
package/dist/SpellingDictionary/charset.js +16 -0
package/dist/SpellingDictionary/createSpellingDictionary.d.ts +17 -0
package/dist/SpellingDictionary/createSpellingDictionary.js +91 -0
package/dist/SpellingDictionary/index.d.ts +4 -0
package/dist/SpellingDictionary/index.js +9 -0
package/dist/index.d.ts +3 -0
package/dist/index.js +8 -0
package/dist/util/Comparable.d.ts +20 -0
package/dist/util/Comparable.js +55 -0
package/dist/util/FreqCounter.d.ts +16 -0
package/dist/util/FreqCounter.js +52 -0
package/dist/util/IterableLike.d.ts +4 -0
package/dist/util/IterableLike.js +3 -0
package/dist/util/Memorizer.d.ts +65 -0
package/dist/util/Memorizer.js +138 -0
package/dist/util/MinHeapQueue.d.ts +23 -0
package/dist/util/MinHeapQueue.js +97 -0
package/dist/util/PairingHeap.d.ts +32 -0
package/dist/util/PairingHeap.js +90 -0
package/dist/util/TextMap.d.ts +15 -0
package/dist/util/TextMap.js +62 -0
package/dist/util/TextRange.d.ts +28 -0
package/dist/util/TextRange.js +144 -0
package/dist/util/clean.d.ts +7 -0
package/dist/util/clean.js +18 -0
package/dist/util/debugPerf.d.ts +9 -0
package/dist/util/debugPerf.js +22 -0
package/dist/util/errors.d.ts +17 -0
package/dist/util/errors.js +52 -0
package/dist/util/fileReader.d.ts +4 -0
package/dist/util/fileReader.js +21 -0
package/dist/util/iterableIteratorLib.d.ts +4 -0
package/dist/util/iterableIteratorLib.js +14 -0
package/dist/util/logger.d.ts +33 -0
package/dist/util/logger.js +46 -0
package/dist/util/memorizerWeak.d.ts +6 -0
package/dist/util/memorizerWeak.js +42 -0
package/dist/util/regexHelper.d.ts +7 -0
package/dist/util/regexHelper.js +13 -0
package/dist/util/repMap.d.ts +4 -0
package/dist/util/repMap.js +38 -0
package/dist/util/resolveFile.d.ts +13 -0
package/dist/util/resolveFile.js +127 -0
package/dist/util/search.d.ts +6 -0
package/dist/util/search.js +23 -0
package/dist/util/simpleCache.d.ts +46 -0
package/dist/util/simpleCache.js +143 -0
package/dist/util/text.d.ts +9 -0
package/dist/util/text.js +55 -0
package/dist/util/textRegex.d.ts +1 -0
package/dist/util/textRegex.js +2 -0
package/dist/util/timer.d.ts +26 -0
package/dist/util/timer.js +58 -0
package/dist/util/types.d.ts +7 -0
package/dist/util/types.js +3 -0
package/dist/util/util.d.ts +2 -0
package/dist/util/util.js +8 -0
package/dist/util/util.test copy.d.ts +2 -0
package/dist/util/util.test copy.js +17 -0
package/dist/util/wordSplitter.d.ts +46 -0
package/dist/util/wordSplitter.js +326 -0
package/package.json +47 -0

package/dist/util/types.d.ts ADDED Viewed

@@ -0,0 +1,7 @@
+/**
+ * Like Required, but keeps the Optional.
+ * Every property type becomes `Exclude<T[P], undefined>`; the mapping itself
+ * neither adds nor removes the `?` modifier on any key.
+ */
+export declare type RemoveUndefined<T> = {
+    [P in keyof T]: Exclude<T[P], undefined>;
+};
+//# sourceMappingURL=types.d.ts.map

package/dist/util/types.js ADDED Viewed

@@ -0,0 +1,3 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+//# sourceMappingURL=types.js.map

package/dist/util/util.d.ts ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ export declare function isDefined<T>(v: T | undefined): v is T;
2	+ //# sourceMappingURL=util.d.ts.map

package/dist/util/util.js ADDED Viewed

@@ -0,0 +1,8 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.isDefined = void 0;
+function isDefined(v) { // Returns true for every value except `undefined`.
+    return v !== undefined; // strict comparison: null, 0, '' and false all count as defined
+}
+exports.isDefined = isDefined;
+//# sourceMappingURL=util.js.map

package/dist/util/util.test copy.d.ts ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ export {};
2	+ //# sourceMappingURL=util.test%20copy.d.ts.map

package/dist/util/util.test copy.js ADDED Viewed

@@ -0,0 +1,17 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+const clean_1 = require("./clean");
+describe('Validate util', () => { // `describe`, `test` and `expect` are not imported in this file, so they must be provided as globals
+    test('tests clean up obj', () => {
+        const obj = {
+            a: undefined,
+            b: 1,
+            c: true,
+            d: undefined,
+            e: 'str',
+        };
+        const cleanObj = (0, clean_1.clean)(obj); // `(0, fn)(...)` form calls clean without a `this` binding
+        expect([...Object.keys(cleanObj)]).toEqual(['b', 'c', 'e']); // the keys whose value was undefined (a, d) must be gone
+    });
+});
+//# sourceMappingURL=util.test%20copy.js.map

package/dist/util/wordSplitter.d.ts ADDED Viewed

@@ -0,0 +1,46 @@
+import type { TextOffset } from '@cspell/cspell-types';
+export declare type IsValidWordFn = (word: TextOffset) => boolean;
+export interface SplitResult {
+    /** Original line passed to the split function */
+    line: TextOffset;
+    /** Starting point of processing - Original offset passed to the split function */
+    offset: number;
+    /** The span of text that was split */
+    text: TextOffset;
+    /** The collection of words that `text` was split into */
+    words: TextOffsetWithValid[];
+    /** the offset at which the split stopped */
+    endOffset: number;
+}
+export interface LineSegment { // A span inside `line`, delimited by two relative offsets.
+    line: TextOffset;
+    relStart: number; // start of the span, relative to line.text
+    relEnd: number; // end of the span, relative to line.text
+}
+export interface TextOffsetWithValid extends TextOffset { // A TextOffset plus the outcome of its validity check.
+    isFound: boolean; // presumably the value the IsValidWordFn returned for this word — confirm against wordSplitter.js
+}
+export interface SplitOptions extends WordBreakOptions {
+}
+export declare function split(line: TextOffset, offset: number, isValidWord: IsValidWordFn, options?: SplitOptions): SplitResult;
+declare type BreakPairs = readonly number[];
+interface PossibleWordBreak {
+    /** offset from the start of the string */
+    offset: number;
+    /**
+     * break pairs (start, end)
+     * (the characters between the start and end are removed)
+     * With a pure break, start === end.
+     */
+    breaks: BreakPairs[];
+}
+export declare type SortedBreaks = PossibleWordBreak[];
+interface WordBreakOptions {
+    optionalWordBreakCharacters?: string;
+}
+declare function generateWordBreaks(line: LineSegment, options: WordBreakOptions): SortedBreaks;
+export declare const __testing__: {
+    generateWordBreaks: typeof generateWordBreaks;
+};
+export {};
+//# sourceMappingURL=wordSplitter.d.ts.map

package/dist/util/wordSplitter.js ADDED Viewed

@@ -0,0 +1,326 @@
+"use strict";
+Object.defineProperty(exports, "__esModule", { value: true });
+exports.__testing__ = exports.split = void 0;
+const PairingHeap_1 = require("./PairingHeap");
+const regexHelper_1 = require("./regexHelper");
+const textRegex_1 = require("./textRegex");
+const ignoreBreak = Object.freeze([]); // shared, frozen empty break pair; an empty pair is treated as "do not split here"
+function split(line, offset, isValidWord, options = {}) { // Split the next word-like span at or after `offset` into words, scoring candidates with `isValidWord`.
+    const relWordToSplit = findNextWordText({ text: line.text, offset: offset - line.offset }); // search offset is made relative to line.text
+    const lineOffset = line.offset;
+    const requested = new Map(); // cache of isValidWord results, keyed by the packed number built in has()
+    if (!relWordToSplit.text) { // no word text found: report an empty word list
+        const text = rebaseTextOffset(relWordToSplit);
+        return {
+            line,
+            offset,
+            text: text,
+            words: [],
+            endOffset: text.offset + text.text.length,
+        };
+    }
+    const lineSegment = {
+        line,
+        relStart: relWordToSplit.offset, // both bounds are relative to line.text
+        relEnd: relWordToSplit.offset + relWordToSplit.text.length,
+    };
+    const possibleBreaks = generateWordBreaks(lineSegment, options);
+    if (!possibleBreaks.length) { // nothing to split on: the whole span is checked as a single word
+        const text = rebaseTextOffset(relWordToSplit);
+        return {
+            line,
+            offset,
+            text: text,
+            words: [{ ...text, isFound: isValidWord(text) }],
+            endOffset: text.offset + text.text.length,
+        };
+    }
+    function rebaseTextOffset(relText) { // shift a line-relative offset back by line.offset
+        return {
+            ...relText,
+            offset: relText.offset + lineOffset,
+        };
+    }
+    function has(word) { // memoized isValidWord lookup for a line-relative word
+        const i = word.offset;
+        const j = word.text.length;
+        let v = i + (j << 20); // pack offset (low 20 bits) and length (bits 20 and up) into one numeric key
+        if (i < 1 << 20 && j < 1 << 11) { // cache is used only when both values fit their bit ranges
+            const b = requested.get(v);
+            if (b !== undefined)
+                return b;
+        }
+        else {
+            v = -1; // out of range: negative key means "do not cache"
+        }
+        const r = isValidWord(rebaseTextOffset(word));
+        if (v >= 0) {
+            requested.set(v, r);
+        }
+        return r;
+    }
+    // Add a dummy break at the end to avoid needing to check for last break.
+    possibleBreaks.push({
+        offset: lineSegment.relEnd,
+        breaks: [ignoreBreak],
+    });
+    const result = {
+        line,
+        offset,
+        text: rebaseTextOffset(relWordToSplit),
+        words: splitIntoWords(lineSegment, possibleBreaks, has).map(rebaseTextOffset), // words come back line-relative and are rebased here
+        endOffset: lineOffset + lineSegment.relEnd,
+    };
+    return result;
+}
+exports.split = split;
+function findNextWordText({ text, offset }) { // Return the first regExWordsAndDigits match in `text` (searching from `offset`) as { text, offset }.
+    const reg = new RegExp(textRegex_1.regExWordsAndDigits); // work on a copy; lastIndex is set on the copy, not on the imported regex
+    reg.lastIndex = offset; // NOTE(review): exec() only honours lastIndex when the pattern has the g or y flag — confirm in textRegex
+    const m = reg.exec(text);
+    if (!m) {
+        return {
+            text: '', // empty text signals "no word found" to split()
+            offset: offset + text.length, // NOTE(review): this is offset + text.length, not text.length — confirm intended
+        };
+    }
+    return {
+        text: m[0],
+        offset: m.index,
+    };
+}
+function generateWordBreaks(line, options) { // Gather all camel-case, symbol and optional break candidates for the segment, ordered by offset.
+    const camelBreaks = genWordBreakCamel(line); // each gen* helper returns an array of break lists, hence the spreads below
+    const symbolBreaks = genSymbolBreaks(line);
+    const optionalBreaks = genOptionalWordBreaks(line, options.optionalWordBreakCharacters);
+    return mergeSortedBreaks(...camelBreaks, ...symbolBreaks, ...optionalBreaks);
+}
+function offsetRegEx(reg, offset) { // Return a copy of `reg` whose lastIndex is set to `offset`.
+    const r = new RegExp(reg); // copy, so the caller's regex object is left untouched
+    r.lastIndex = offset;
+    return r;
+}
+function genWordBreakCamel(line) { // Build the two lists of case-change break candidates for the segment.
+    const breaksCamel1 = [];
+    const text = line.line.text.slice(0, line.relEnd); // text is truncated at relEnd, so nothing past the segment is scanned
+    // lower,Upper: camelCase -> camel|Case
+    for (const m of text.matchAll(offsetRegEx(textRegex_1.regExSplitWords, line.relStart))) {
+        if (m.index === undefined)
+            break;
+        const i = m.index + 1; // break position is one character after the start of the match
+        breaksCamel1.push({
+            offset: m.index,
+            breaks: [[i, i], ignoreBreak], // options: split at i, or leave unsplit
+        });
+    }
+    const breaksCamel2 = [];
+    // cspell:ignore ERRORC
+    // Upper,Upper,lower: ERRORCodes -> ERROR|Codes, ERRORC|odes
+    for (const m of text.matchAll(offsetRegEx(textRegex_1.regExSplitWords2, line.relStart))) {
+        if (m.index === undefined)
+            break;
+        const i = m.index + m[1].length; // position right after the first capture group
+        const j = i + 1;
+        breaksCamel2.push({
+            offset: m.index,
+            breaks: [[i, i], [j, j], ignoreBreak], // options: split at i, split one character later, or leave unsplit
+        });
+    }
+    return [breaksCamel1, breaksCamel2];
+}
+function calcBreaksForRegEx(line, reg, calcBreak) { // Run `reg` over the segment and collect the break entry `calcBreak` builds for each match.
+    const sb = [];
+    const text = line.line.text.slice(0, line.relEnd); // text is truncated at relEnd, so nothing past the segment is scanned
+    for (const m of text.matchAll(offsetRegEx(reg, line.relStart))) { // regex copy carries lastIndex = relStart
+        const b = calcBreak(m);
+        if (b) { // calcBreak may return undefined; such matches are skipped
+            sb.push(b);
+        }
+    }
+    return sb;
+}
+function genOptionalWordBreaks(line, optionalBreakCharacters) { // Break candidates for dangling quotes, trailing endings and, when given, caller-supplied break characters.
+    function calcBreaks(m) { // turn one regex match into a break entry
+        const i = m.index;
+        if (i === undefined)
+            return;
+        const j = i + m[0].length;
+        return {
+            offset: i,
+            breaks: [
+                [i, j], // split and drop the matched characters
+                ignoreBreak, // or leave the text unsplit
+            ],
+        };
+    }
+    const breaks = [
+        calcBreaksForRegEx(line, textRegex_1.regExDanglingQuote, calcBreaks),
+        calcBreaksForRegEx(line, textRegex_1.regExTrailingEndings, calcBreaks),
+    ];
+    if (optionalBreakCharacters) {
+        const regex = new RegExp(`[${(0, regexHelper_1.escapeRegEx)(optionalBreakCharacters)}]`, 'gu'); // character class built from the escaped option string
+        breaks.push(calcBreaksForRegEx(line, regex, calcBreaks));
+    }
+    return breaks;
+}
+function genSymbolBreaks(line) { // Break candidates around possible-word-break symbols, digit runs and escape characters.
+    function calcBreaks(m) { // turn one regex match into a break entry with four alternatives
+        const i = m.index;
+        if (i === undefined)
+            return;
+        const j = i + m[0].length;
+        return {
+            offset: i,
+            breaks: [
+                [i, j], // split and drop the matched characters
+                [i, i], // split just before the match
+                [j, j], // split just after the match
+                ignoreBreak, // or leave the text unsplit
+            ],
+        };
+    }
+    return [
+        calcBreaksForRegEx(line, textRegex_1.regExPossibleWordBreaks, calcBreaks),
+        calcBreaksForRegEx(line, /\d+/g, calcBreaks), // runs of digits
+        calcBreaksForRegEx(line, textRegex_1.regExEscapeCharacters, calcBreaks),
+    ];
+}
+function splitIntoWords(lineSeg, breaks, has) { // Search the break alternatives for the lowest-cost way to cut the segment into words; `has` tells whether a word is valid.
+    const maxIndex = lineSeg.relEnd;
+    const maxAttempts = 1000; // upper bound on iterations of the search loop below
+    const knownPathsByIndex = new Map(); // offset -> lowest-cost path node recorded so far for that offset
+    /**
+     * Create a set of possible candidates to consider
+     * @param p - prev candidate that led to this one
+     * @param i - offset within the string
+     * @param bi - current index into the set of breaks
+     * @param currentCost - current cost accrued
+     */
+    function makeCandidates(p, i, bi, currentCost) {
+        const len = maxIndex;
+        while (bi < breaks.length && breaks[bi].offset < i) { // skip break entries that lie before offset i
+            bi += 1;
+        }
+        if (bi >= breaks.length) {
+            return [];
+        }
+        const br = breaks[bi];
+        function c(bp) { // build one candidate for the break pair `bp`
+            const d = bp.length < 2 ? len - i : (bp[0] - i) * 0.5 + len - bp[1]; // estimate: no break -> all remaining text; else half the text before the break plus the text after it
+            const ec = currentCost + d;
+            return {
+                p,
+                i,
+                bi,
+                bp,
+                c: currentCost,
+                ec,
+                text: undefined,
+            };
+        }
+        return br.breaks.map(c);
+    }
+    function toTextOffset(text, offset) { // wrap text/offset together with the result of the `has` lookup
+        const valid = has({ text, offset });
+        return {
+            text,
+            offset,
+            isFound: valid,
+        };
+    }
+    function compare(a, b) { // order by estimated cost `ec`; on ties the candidate with the larger offset sorts first
+        return a.ec - b.ec || b.i - a.i;
+    }
+    function pathToWords(node) { // follow the `n` links and collect every node's text, skipping nodes without one
+        const results = [];
+        for (let p = node; p; p = p.n) {
+            if (p.text) {
+                results.push(p.text);
+            }
+        }
+        return results;
+    }
+    function addToKnownPaths(candidate, path) { // walk back through `candidate.p` links, prepending a node per candidate to `path`
+        for (let can = candidate; can !== undefined; can = can.p) {
+            const t = can.text;
+            const i = can.i;
+            const cost = (!t || t.isFound ? 0 : t.text.length) + (path?.c ?? 0); // text that was not found costs its length; add the cost of the path that follows
+            const exitingPath = knownPathsByIndex.get(i);
+            // Keep going only if this is a better candidate than the existing path
+            if (exitingPath && exitingPath.c <= cost) {
+                return undefined;
+            }
+            const node = {
+                n: path,
+                i,
+                c: cost,
+                text: t,
+            };
+            knownPathsByIndex.set(i, node);
+            path = node;
+        }
+        return path;
+    }
+    let maxCost = lineSeg.relEnd - lineSeg.relStart; // starting bound: the length of the whole segment
+    const candidates = new PairingHeap_1.PairingHeap(compare); // presumably dequeues the smallest element per `compare` — confirm in PairingHeap
+    const text = lineSeg.line.text;
+    candidates.concat(makeCandidates(undefined, lineSeg.relStart, 0, 0));
+    let attempts = 0;
+    let bestPath;
+    while (maxCost && candidates.length && attempts++ < maxAttempts) { // stops when the bound reaches 0, the queue is empty, or the attempt cap is hit
+        /** Best Candidate Index */
+        const best = candidates.dequeue();
+        if (!best || best.c >= maxCost) { // skip candidates whose accrued cost already reaches the bound
+            continue;
+        }
+        // Does it have a split?
+        if (best.bp.length) {
+            // yes
+            const i = best.bp[0];
+            const j = best.bp[1];
+            const t = i > best.i ? toTextOffset(text.slice(best.i, i), best.i) : undefined; // the word between the candidate start and the break, if any
+            const cost = !t || t.isFound ? 0 : t.text.length;
+            const mc = maxIndex - j; // length of the text remaining after the break
+            best.c += cost;
+            best.ec = best.c + mc;
+            best.text = t;
+            const possiblePath = knownPathsByIndex.get(j);
+            if (possiblePath) {
+                // A known path already starts at offset j; attach it to this candidate
+                const f = addToKnownPaths(best, possiblePath);
+                bestPath = !bestPath || (f && f.c < bestPath.c) ? f : bestPath;
+            }
+            else if (best.c < maxCost) {
+                const c = makeCandidates(t ? best : best.p, j, best.bi + 1, best.c); // continue from j; a candidate without text is left out of the chain
+                candidates.concat(c);
+            }
+        }
+        else {
+            // It is a pass through
+            const c = makeCandidates(best.p, best.i, best.bi + 1, best.c);
+            candidates.concat(c);
+            if (!c.length) { // no break entries left: the rest of the segment is the final word
+                const t = maxIndex > best.i ? toTextOffset(text.slice(best.i, maxIndex), best.i) : undefined;
+                const cost = !t || t.isFound ? 0 : t.text.length;
+                best.c += cost;
+                best.ec = best.c;
+                best.text = t;
+                const segText = t || best.p?.text || toTextOffset('', best.i);
+                const can = t ? { ...best, text: segText } : { ...best, ...best.p, text: segText }; // with no trailing text, the previous candidate's fields overwrite this one's
+                const f = addToKnownPaths(can, undefined);
+                bestPath = !bestPath || (f && f.c < bestPath.c) ? f : bestPath;
+            }
+        }
+        if (bestPath && bestPath.c < maxCost) { // tighten the bound to the best complete path found so far
+            maxCost = bestPath.c;
+        }
+    }
+    return pathToWords(bestPath);
+}
+function mergeSortedBreaks(...maps) { // Flatten all the given break lists into one new array ordered by ascending offset.
+    return [].concat(...maps).sort((a, b) => a.offset - b.offset); // sort runs on the freshly concatenated array, not on the inputs
+}
+exports.__testing__ = {
+    generateWordBreaks,
+};
+//# sourceMappingURL=wordSplitter.js.map

package/package.json ADDED Viewed

@@ -0,0 +1,47 @@
+{
+  "name": "cspell-dictionary",
+  "version": "6.9.0",
+  "description": "A spelling dictionary library useful for checking words and getting suggestions.",
+  "main": "dist/index.js",
+  "typings": "dist/index.d.ts",
+  "files": [
+    "dist",
+    "!**/__mocks__",
+    "!**/*.test.*",
+    "!**/*.spec.*",
+    "!**/*.map"
+  ],
+  "scripts": {
+    "build": "tsc -p .",
+    "build-dev": "tsc -p tsconfig.dev.json",
+    "watch": "tsc -p . -w",
+    "clean": "rimraf dist temp coverage .tsbuildinfo",
+    "clean-build": "pnpm run clean && pnpm run build",
+    "coverage": "jest --coverage",
+    "test-watch": "jest --watch",
+    "test": "jest"
+  },
+  "repository": {
+    "type": "git",
+    "url": "git+https://github.com/streetsidesoftware/cspell.git"
+  },
+  "keywords": [
+    "cspell"
+  ],
+  "author": "Jason Dent",
+  "license": "MIT",
+  "bugs": {
+    "url": "https://github.com/streetsidesoftware/cspell/labels/cspell-dictionary"
+  },
+  "homepage": "https://github.com/streetsidesoftware/cspell#readme",
+  "engines": {
+    "node": ">=14"
+  },
+  "dependencies": {
+    "@cspell/cspell-pipe": "workspace:^",
+    "@cspell/cspell-types": "workspace:^",
+    "cspell-trie-lib": "workspace:^",
+    "fast-equals": "^4.0.3",
+    "gensequence": "^4.0.2"
+  }
+}