npm - bekindprofanityfilter - Versions diffs - 0.0.5 → 0.0.7 - Mend

bekindprofanityfilter 0.0.5 → 0.0.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14)

package/dist/cjs/index.js +6 -6
package/dist/esm/index.d.ts +15 -0
package/dist/esm/languages/english-primary-all-languages.d.ts +0 -17
package/dist/esm.min.js +8 -0
package/package.json +5 -6
package/dist/esm/algos/aho-corasick.js +0 -238
package/dist/esm/algos/bloom-filter.js +0 -208
package/dist/esm/algos/context-patterns.js +0 -415
package/dist/esm/index.js +0 -2640
package/dist/esm/innocence-scoring.js +0 -118
package/dist/esm/language-detector.js +0 -952
package/dist/esm/language-dicts.js +0 -2718
package/dist/esm/languages/english-primary-all-languages.js +0 -36894
package/dist/esm/romanization-detector.js +0 -779

package/dist/esm/index.d.ts CHANGED

@@ -644,6 +644,21 @@ export declare class BeKind {
      * @param text - The input text.
      * @returns Normalized text.
      */
+    /**
+     * Regex matching numeric-punctuation clusters that should never be leet-decoded.
+     * Covers phone numbers "(206) 366-3311", prices "$8,575!", quantities "1,000",
+     * percentages "5%", times "7:30", and other numeric expressions.
+     * Matches any token that starts with or contains digits mixed with common
+     * numeric punctuation (,.!?:;$%#()/-) and has no adjacent letters.
+     */
+    /**
+     * Matches whitespace-delimited tokens that contain NO letters — only
+     * digits, punctuation, and symbols. These are pure numeric expressions
+     * (phone numbers, prices, years, quantities) and should never be
+     * leet-decoded. Tokens containing at least one letter (like "f0ck",
+     * "6006s", "b00bs") are left for leet-speak processing.
+     */
+    private static readonly PURE_NUMERIC_TOKEN_RE;
     private normalizeLeetSpeak;
     /**
      * Conservative leet normalization — only replaces non-letter characters

package/dist/esm/languages/english-primary-all-languages.d.ts CHANGED

@@ -1,20 +1,3 @@
-/**
- * Consolidated profanity words list across all supported languages.
- * Contains the full word lists from all individual language files.
- *
- * Cross-language false positives removed (normal English words that are profane elsewhere):
- *   bite (FR: dick), con (FR: cunt), gland (FR: idiot), laid (FR: ugly),
- *   pet (FR: fart), pine (FR: dick), sale (FR: dirty), beaver (EN: vulgar slang),
- *   Mist (DE: shit), mist (DE: crap), Sack (DE: scrotum), Pack (DE: scum),
- *   pica (BR: penis), pinto (BR: penis), peru (BR: penis + country name),
- *   bal (BN: pubic hair), paal (TA: contextually vulgar), memo (ES: dumb),
- *   laura (HI: penis variant), gay (BR: listed as profanity but isn't)
- *
- * Languages included: English, German, French, Spanish, Brazilian Portuguese,
- * Hindi/Hinglish, Tamil, Bengali, Telugu, Arabic, Chinese, Italian, Japanese, Korean, Russian
- *
- * ⚠️ Warning: This file contains explicit language in multiple languages
- */
 declare const allLanguagesBadWords: Record<string, {
     severity: number;
     certainty: number;