npm - allprofanity - Versions diffs - 1.0.4 → 2.0.0 - Mend

allprofanity 1.0.4 → 2.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

package/README.md +129 -85
package/dist/index.d.ts +100 -18
package/dist/index.js +546 -99
package/dist/index.js.map +1 -1
package/dist/languages/bengali-words.js +0 -1
package/dist/languages/bengali-words.js.map +1 -1
package/dist/languages/english-words.d.ts +2 -0
package/dist/languages/english-words.js +256 -0
package/dist/languages/english-words.js.map +1 -0
package/package.json +2 -5

package/dist/index.js CHANGED Viewed

@@ -1,22 +1,33 @@
-import leoProfanity from "leo-profanity";
-import hindiBadWords from "./languages/hindi-words";
-import frenchBadWords from "./languages/french-words";
-import germanBadWords from "./languages/german-words";
-import spanishBadWords from "./languages/spanish-words";
-import bengaliBadWords from "./languages/bengali-words";
-import tamilBadWords from "./languages/tamil-words";
-import teluguBadWords from "./languages/telugu-words";
+import englishBadWords from "./languages/english-words.js";
+import hindiBadWords from "./languages/hindi-words.js";
+import frenchBadWords from "./languages/french-words.js";
+import germanBadWords from "./languages/german-words.js";
+import spanishBadWords from "./languages/spanish-words.js";
+import bengaliBadWords from "./languages/bengali-words.js";
+import tamilBadWords from "./languages/tamil-words.js";
+import teluguBadWords from "./languages/telugu-words.js";
 // Export language dictionaries for direct access
-export { default as hindiBadWords } from "./languages/hindi-words";
-export { default as frenchBadWords } from "./languages/french-words";
-export { default as germanBadWords } from "./languages/german-words";
-export { default as spanishBadWords } from "./languages/spanish-words";
-export { default as bengaliBadWords } from "./languages/bengali-words";
-export { default as tamilBadWords } from "./languages/tamil-words";
-export { default as teluguBadWords } from "./languages/telugu-words";
+export { default as englishBadWords } from "./languages/english-words.js";
+export { default as hindiBadWords } from "./languages/hindi-words.js";
+export { default as frenchBadWords } from "./languages/french-words.js";
+export { default as germanBadWords } from "./languages/german-words.js";
+export { default as spanishBadWords } from "./languages/spanish-words.js";
+export { default as bengaliBadWords } from "./languages/bengali-words.js";
+export { default as tamilBadWords } from "./languages/tamil-words.js";
+export { default as teluguBadWords } from "./languages/telugu-words.js";
 /**
- * AllProfanity - Extended profanity filter with multi-language support
- * Based on leo-profanity with additional language capabilities
+ * Severity levels for profanity detection
+ */
+// Two-way lookup object: ProfanitySeverity.MILD === 1 and ProfanitySeverity[1] === "MILD".
+export var ProfanitySeverity;
+(function (severity) {
+    const levels = [
+        ["MILD", 1],
+        ["MODERATE", 2],
+        ["SEVERE", 3],
+        ["EXTREME", 4],
+    ];
+    for (const [label, rank] of levels) {
+        severity[label] = rank;
+        severity[rank] = label;
+    }
+})(ProfanitySeverity = ProfanitySeverity || (ProfanitySeverity = {}));
+/**
+ * Advanced AllProfanity - Custom profanity filter with multi-language support and leet speak detection
+ * No external dependencies - built from scratch for maximum performance and control
  */
 export class AllProfanity {
     /**
@@ -24,25 +35,92 @@ export class AllProfanity {
      * @param options - Configuration options
      */
     constructor(options) {
+        var _a, _b, _c, _d;
+        this.profanitySet = new Set();
+        this.normalizedProfanityMap = new Map();
         this.defaultPlaceholder = "*";
         this.loadedLanguages = new Set();
+        this.whitelistSet = new Set();
+        this.enableLeetSpeak = true;
+        this.caseSensitive = false;
+        this.strictMode = false;
+        this.detectPartialWords = true;
+        // Comprehensive leet speak mapping
+        this.leetMap = {
+            a: ["4", "@", "^", "aye", "λ", "ª"],
+            b: ["8", "6", "|3", "ß", "β", "13"],
+            c: ["(", "<", "©", "¢", "see", "sea"],
+            d: ["|)", "|]", "0", "ð"],
+            e: ["3", "€", "£", "ë", "é", "è"],
+            f: ["|=", "ph", "|#", "ƒ"],
+            g: ["9", "6", "&", "gee"],
+            h: ["#", "|-|", "[-]", "}{", "ħ"],
+            i: ["1", "!", "|", "eye", "ï", "í", "ì"],
+            j: ["_|", "_/", "¿", "ĵ"],
+            k: ["|<", "1<", "l<", "|{", "ķ"],
+            l: ["1", "|", "7", "£", "ł", "ĺ"],
+            m: ["|/|", "//\\", "em", "ɱ"],
+            n: ["||", "//", "and", "ñ", "ń"],
+            o: ["0", "()", "oh", "ø", "ó", "ò", "ô"],
+            p: ["|*", "|o", "|^", "|>", "9", "þ"],
+            q: ["(_,)", "()_", "kw", "ĸ"],
+            r: ["|2", "12", ".-", "are", "ř", "ŕ"],
+            s: ["5", "$", "z", "ş", "ś", "š"],
+            t: ["7", "+", "-|-", "†", "ť", "ţ"],
+            u: ["(_)", "|_|", "v", "you", "ü", "ú", "ù"],
+            v: ["\\/", "|/", "|", "vee"],
+            w: ["\\/\\/", "vv", "dubya", "ŵ"],
+            x: ["><", "}{", "ecks", "χ"],
+            y: ["`/", "j", "why", "ÿ", "ý"],
+            z: ["2", "7_", "-/_", "zee", "ž", "ź", "ż"],
+        };
+        // Word boundary patterns
+        this.wordBoundaryChars = /[\s\.,;:!?\-_+=\[\]{}()"'\/\\]/;
+        // Common word variations and suffixes
+        this.commonSuffixes = [
+            "ing",
+            "ed",
+            "s",
+            "er",
+            "ers",
+            "est",
+            "ly",
+            "tion",
+            "ness",
+        ];
+        this.commonPrefixes = [
+            "un",
+            "re",
+            "pre",
+            "dis",
+            "over",
+            "under",
+            "out",
+        ];
         this.availableLanguages = {
-            hindi: hindiBadWords,
-            french: frenchBadWords,
-            german: germanBadWords,
-            spanish: spanishBadWords,
-            bengali: bengaliBadWords,
-            tamil: tamilBadWords,
-            telugu: teluguBadWords,
-            // Add more built-in languages here in the future
+            english: englishBadWords || [],
+            hindi: hindiBadWords || [],
+            french: frenchBadWords || [],
+            german: germanBadWords || [],
+            spanish: spanishBadWords || [],
+            bengali: bengaliBadWords || [],
+            tamil: tamilBadWords || [],
+            telugu: teluguBadWords || [],
         };
-        this.filter = leoProfanity;
-        // Set custom placeholder if provided
+        // Set configuration options
         if (options === null || options === void 0 ? void 0 : options.defaultPlaceholder) {
             this.setPlaceholder(options.defaultPlaceholder);
         }
-        // Load the default English dictionary from leo-profanity
-        this.loadedLanguages.add("english");
+        this.enableLeetSpeak = (_a = options === null || options === void 0 ? void 0 : options.enableLeetSpeak) !== null && _a !== void 0 ? _a : true;
+        this.caseSensitive = (_b = options === null || options === void 0 ? void 0 : options.caseSensitive) !== null && _b !== void 0 ? _b : false;
+        this.strictMode = (_c = options === null || options === void 0 ? void 0 : options.strictMode) !== null && _c !== void 0 ? _c : false;
+        this.detectPartialWords = (_d = options === null || options === void 0 ? void 0 : options.detectPartialWords) !== null && _d !== void 0 ? _d : true;
+        // Load whitelist if provided
+        if (options === null || options === void 0 ? void 0 : options.whitelistWords) {
+            this.addToWhitelist(options.whitelistWords);
+        }
+        // Load the default English dictionary
+        this.loadLanguage("english");
         // Load Hindi by default for backward compatibility
         this.loadLanguage("hindi");
         // Load any additional languages specified in options
@@ -56,25 +134,166 @@ export class AllProfanity {
             });
         }
     }
+    /**
+     * Normalize text by converting leet speak to regular characters.
+     *
+     * The text is lower-cased, then every substitution below is applied in
+     * order across the whole string. Multi-character sequences run before
+     * single characters so that e.g. "|-|" becomes "h" before the bare "|"
+     * rule can turn its pipes into "i". Multi-character sequences collapse to
+     * a single letter, so the result can be shorter than the input.
+     *
+     * @param text - Text to normalize
+     * @returns Normalized text, or `text` unchanged when leet speak
+     *          detection is disabled
+     */
+    normalizeLeetSpeak(text) {
+        if (!this.enableLeetSpeak)
+            return text;
+        let normalized = text.toLowerCase();
+        // Ordered substitution table; earlier entries win over later ones
+        const leetMappings = [
+            // Multi-character first
+            { pattern: /\|-\|/g, replacement: "h" },
+            { pattern: /\[-\]/g, replacement: "h" },
+            // NOTE(review): this rule and the "><" rule also swallow trailing whitespace — confirm that is intended
+            { pattern: /\}{\s*/g, replacement: "h" },
+            { pattern: /\|\/\|/g, replacement: "m" },
+            { pattern: /\/\/\\/g, replacement: "m" },
+            { pattern: /\|\|/g, replacement: "n" },
+            { pattern: /\/\//g, replacement: "n" },
+            { pattern: /\|2/g, replacement: "r" },
+            { pattern: /12/g, replacement: "r" },
+            { pattern: /\\\/\\\//g, replacement: "w" },
+            { pattern: /vv/g, replacement: "w" },
+            { pattern: /><\s*/g, replacement: "x" },
+            { pattern: /\(_\)/g, replacement: "u" },
+            { pattern: /\|_\|/g, replacement: "u" },
+            { pattern: /\\\//g, replacement: "v" },
+            { pattern: /\|\//g, replacement: "v" },
+            // Single character mappings
+            { pattern: /@/g, replacement: "a" },
+            // "4" stands for "a" (it is listed under leetMap.a); it used to be
+            // mapped to "u", which normalized such spellings to the wrong letter
+            { pattern: /4/g, replacement: "a" },
+            { pattern: /\^/g, replacement: "a" },
+            { pattern: /8/g, replacement: "b" },
+            { pattern: /6/g, replacement: "b" },
+            { pattern: /\(/g, replacement: "c" },
+            { pattern: /</g, replacement: "c" },
+            { pattern: /©/g, replacement: "c" },
+            { pattern: /¢/g, replacement: "c" },
+            { pattern: /0/g, replacement: "o" },
+            { pattern: /3/g, replacement: "e" },
+            { pattern: /€/g, replacement: "e" },
+            { pattern: /£/g, replacement: "e" },
+            { pattern: /9/g, replacement: "g" },
+            { pattern: /&/g, replacement: "g" },
+            { pattern: /#/g, replacement: "h" },
+            { pattern: /1/g, replacement: "i" },
+            { pattern: /!/g, replacement: "i" },
+            { pattern: /\|/g, replacement: "i" },
+            { pattern: /7/g, replacement: "t" },
+            { pattern: /5/g, replacement: "s" },
+            { pattern: /\$/g, replacement: "s" },
+            { pattern: /\+/g, replacement: "t" },
+            { pattern: /2/g, replacement: "z" },
+        ];
+        // Apply all mappings, each over the output of the previous one
+        for (const mapping of leetMappings) {
+            normalized = normalized.replace(mapping.pattern, mapping.replacement);
+        }
+        return normalized;
+    }
+    /**
+     * Backslash-escape regular expression metacharacters in a string.
+     * @param str - Text to escape
+     * @returns The escaped text, or "" for empty or non-string input
+     */
+    escapeRegex(str) {
+        const isUsable = typeof str === "string" && str !== "";
+        return isUsable
+            ? str.replace(/[\\^$.*+?()[\]{}|\-]/g, (ch) => "\\" + ch)
+            : "";
+    }
+    /**
+     * Build the inflected forms of a word from the configured suffix and
+     * prefix lists. The word itself is always the first entry.
+     * @param word - Base word
+     * @returns Array of distinct forms in insertion order
+     */
+    generateWordVariations(word) {
+        const lastChar = word.slice(-1);
+        const stem = word.slice(0, -1);
+        const endsWithE = word.endsWith("e");
+        const doublesFinalConsonant = word.length > 2 && /[bcdfghjklmnpqrstvwxyz]/.test(lastChar);
+        const forms = new Set([word]);
+        this.commonSuffixes.forEach((ending) => {
+            forms.add(word + ending);
+            // Words ending in "e" also get the form with that "e" dropped
+            if (endsWithE && !ending.startsWith("e")) {
+                forms.add(stem + ending);
+            }
+            // Final consonant doubled before the suffix
+            if (doublesFinalConsonant) {
+                forms.add(word + lastChar + ending);
+            }
+        });
+        this.commonPrefixes.forEach((lead) => {
+            forms.add(lead + word);
+        });
+        return [...forms];
+    }
+    /**
+     * Tell whether the span [start, end) of text is delimited on both sides
+     * by a boundary character (or by the edge of the text). Outside strict
+     * mode every span is accepted.
+     */
+    hasWordBoundaries(text, start, end) {
+        if (this.strictMode) {
+            const isBoundary = (ch) => this.wordBoundaryChars.test(ch);
+            // The edges of the text count as a space
+            const left = start > 0 ? text[start - 1] : " ";
+            if (!isBoundary(left)) {
+                return false;
+            }
+            const right = end < text.length ? text[end] : " ";
+            return isBoundary(right);
+        }
+        return true;
+    }
+    /**
+     * Derive a severity level from how many matches were found and how many
+     * of them are distinct. No per-word weighting is applied.
+     */
+    calculateSeverity(detectedWords) {
+        const total = detectedWords.length;
+        if (total === 0) {
+            return ProfanitySeverity.MILD;
+        }
+        const distinct = new Set(detectedWords).size;
+        // Highest tier first; the first satisfied tier wins
+        const tiers = [
+            [ProfanitySeverity.EXTREME, total >= 5 || distinct >= 3],
+            [ProfanitySeverity.SEVERE, total >= 3 || distinct >= 2],
+            [ProfanitySeverity.MODERATE, total >= 2],
+        ];
+        const hit = tiers.find(([, reached]) => reached);
+        return hit ? hit[0] : ProfanitySeverity.MILD;
+    }
     /**
      * Load a built-in language dictionary
      * @param language - The language to load
      * @returns boolean - True if loaded successfully, false otherwise
      */
     loadLanguage(language) {
-        // Skip if already loaded
         if (this.loadedLanguages.has(language.toLowerCase())) {
             return true;
         }
         const langKey = language.toLowerCase();
-        if (this.availableLanguages[langKey]) {
-            this.filter.add(this.availableLanguages[langKey]);
+        if (this.availableLanguages[langKey] &&
+            this.availableLanguages[langKey].length > 0) { // an empty dictionary takes the warning branch below
+            const words = this.availableLanguages[langKey];
+            // Add words and their variations to the profanity set
+            for (const word of words) {
+                if (!word || typeof word !== "string")
+                    continue; // skip empty and non-string entries
+                const normalizedWord = this.caseSensitive ? word : word.toLowerCase(); // lower-cased unless caseSensitive is set
+                this.profanitySet.add(normalizedWord);
+                // Store normalized leet version mapping (only when normalization changes the word)
+                const leetNormalized = this.normalizeLeetSpeak(normalizedWord);
+                if (leetNormalized !== normalizedWord) {
+                    this.normalizedProfanityMap.set(leetNormalized, normalizedWord);
+                }
+                // Generate and add variations (the list starts with the word itself)
+                const variations = this.generateWordVariations(normalizedWord);
+                for (const variation of variations) {
+                    this.profanitySet.add(variation);
+                    const leetVariation = this.normalizeLeetSpeak(variation);
+                    if (leetVariation !== variation) {
+                        this.normalizedProfanityMap.set(leetVariation, variation);
+                    }
+                }
+            }
             this.loadedLanguages.add(langKey);
-            console.log(`AllProfanity: Added ${this.availableLanguages[langKey].length} ${language} words to the profanity list.`);
+            console.log(`AllProfanity: Added ${words.length} ${language} words to the profanity list.`); // reports dictionary entries, not generated variations
             return true;
         }
         else {
-            console.warn(`AllProfanity: Language '${language}' not found in available dictionaries.`);
+            console.warn(`AllProfanity: Language '${language}' not found or empty in available dictionaries.`); // unknown name or empty dictionary
             return false;
         }
     }
@@ -112,66 +331,224 @@ export class AllProfanity {
         }
         // Add to available languages for future reference
         this.availableLanguages[name.toLowerCase()] = words;
-        // Add to filter
-        this.filter.add(words);
+        // Process and add words
+        for (const word of words) {
+            if (!word || typeof word !== "string")
+                continue;
+            const normalizedWord = this.caseSensitive ? word : word.toLowerCase();
+            this.profanitySet.add(normalizedWord);
+            // Store normalized leet version mapping
+            const leetNormalized = this.normalizeLeetSpeak(normalizedWord);
+            if (leetNormalized !== normalizedWord) {
+                this.normalizedProfanityMap.set(leetNormalized, normalizedWord);
+            }
+            // Generate and add variations
+            const variations = this.generateWordVariations(normalizedWord);
+            for (const variation of variations) {
+                this.profanitySet.add(variation);
+                const leetVariation = this.normalizeLeetSpeak(variation);
+                if (leetVariation !== variation) {
+                    this.normalizedProfanityMap.set(leetVariation, variation);
+                }
+            }
+        }
         this.loadedLanguages.add(name.toLowerCase());
         console.log(`AllProfanity: Added ${words.length} words from custom '${name}' dictionary.`);
     }
     /**
-     * Get the list of currently loaded languages
-     * @returns string[] - Array of loaded language names
+     * Add words to whitelist (words that should never be flagged as profanity)
+     * @param words - Array of words to whitelist
      */
-    getLoadedLanguages() {
-        return Array.from(this.loadedLanguages);
+    addToWhitelist(words) {
+        // Empty and non-string entries are ignored; entries are lower-cased
+        // unless the filter is case sensitive.
+        for (const entry of words) {
+            if (typeof entry !== "string" || entry === "")
+                continue;
+            const key = this.caseSensitive ? entry : entry.toLowerCase();
+            this.whitelistSet.add(key);
+        }
     }
     /**
-     * Get the list of available language dictionaries
-     * @returns string[] - Array of available language names
+     * Remove words from whitelist
+     * @param words - Array of words to remove from whitelist
      */
-    getAvailableLanguages() {
-        return Object.keys(this.availableLanguages);
+    removeFromWhitelist(words) {
+        // Empty and non-string entries are ignored; entries are lower-cased
+        // unless the filter is case sensitive.
+        for (const entry of words) {
+            if (typeof entry !== "string" || entry === "")
+                continue;
+            const key = this.caseSensitive ? entry : entry.toLowerCase();
+            this.whitelistSet.delete(key);
+        }
     }
     /**
-     * Check if a string contains profanity
+     * Advanced profanity detection with detailed results
+     * @param text - The text to analyze
+     * @returns ProfanityDetectionResult - Detailed detection results
+     */
+    detect(text) { // runs up to three passes: whole-word, leet-normalized, partial; then masks the matches
+        if (!text || typeof text !== "string") { // empty or non-string input is reported as clean
+            return {
+                hasProfanity: false,
+                detectedWords: [],
+                cleanedText: text || "",
+                severity: ProfanitySeverity.MILD,
+                positions: [],
+            };
+        }
+        const normalizedText = this.caseSensitive ? text : text.toLowerCase();
+        const leetNormalizedText = this.normalizeLeetSpeak(normalizedText);
+        const detectedWords = [];
+        const positions = [];
+        // Pass 1: check for whole word matches first, one regex per dictionary entry
+        for (const profanity of this.profanitySet) {
+            if (this.whitelistSet.has(profanity))
+                continue;
+            try {
+                // Create regex for word boundary detection
+                const escapedWord = this.escapeRegex(profanity);
+                const wordRegex = new RegExp(`\\b${escapedWord}\\b`, this.caseSensitive ? "g" : "gi"); // NOTE(review): \b is defined via ASCII \w, so entries in non-Latin scripts may never match here — confirm
+                let match;
+                while ((match = wordRegex.exec(normalizedText)) !== null) {
+                    if (this.hasWordBoundaries(normalizedText, match.index, match.index + match[0].length)) { // always true unless strictMode is set
+                        detectedWords.push(match[0]);
+                        positions.push({
+                            word: match[0],
+                            start: match.index,
+                            end: match.index + match[0].length,
+                        });
+                    }
+                }
+            }
+            catch (error) {
+                // Fallback to simple string search if regex fails (records the first occurrence only; the error is discarded)
+                const index = normalizedText.indexOf(profanity);
+                if (index !== -1) {
+                    detectedWords.push(profanity);
+                    positions.push({
+                        word: profanity,
+                        start: index,
+                        end: index + profanity.length,
+                    });
+                }
+            }
+        }
+        // Pass 2: check leet speak normalized text (skipped when normalization changed nothing)
+        if (this.enableLeetSpeak && leetNormalizedText !== normalizedText) {
+            for (const profanity of this.profanitySet) {
+                if (this.whitelistSet.has(profanity))
+                    continue;
+                try {
+                    const escapedWord = this.escapeRegex(profanity);
+                    const wordRegex = new RegExp(`\\b${escapedWord}\\b`, this.caseSensitive ? "g" : "gi");
+                    let match;
+                    while ((match = wordRegex.exec(leetNormalizedText)) !== null) {
+                        if (this.hasWordBoundaries(leetNormalizedText, match.index, match.index + match[0].length)) {
+                            // Find the original text that corresponds to this match. NOTE(review): offsets come from leetNormalizedText, which can be shorter than normalizedText when a multi-character sequence was collapsed, so this slice may be misaligned — verify
+                            const originalMatch = normalizedText.substring(match.index, match.index + match[0].length);
+                            if (!detectedWords.includes(originalMatch)) { // NOTE(review): de-duplicates by surface string, so a repeated occurrence gets no position entry
+                                detectedWords.push(originalMatch);
+                                positions.push({
+                                    word: originalMatch,
+                                    start: match.index,
+                                    end: match.index + match[0].length,
+                                });
+                            }
+                        }
+                    }
+                }
+                catch (error) {
+                    // Fallback to simple string search (first occurrence only; the error is discarded)
+                    if (leetNormalizedText.includes(profanity)) {
+                        const index = leetNormalizedText.indexOf(profanity);
+                        const originalMatch = normalizedText.substring(index, index + profanity.length);
+                        if (!detectedWords.includes(originalMatch)) {
+                            detectedWords.push(originalMatch);
+                            positions.push({
+                                word: originalMatch,
+                                start: index,
+                                end: index + profanity.length,
+                            });
+                        }
+                    }
+                }
+            }
+        }
+        // Pass 3: partial word detection (if enabled) via plain substring search
+        if (this.detectPartialWords) {
+            for (const profanity of this.profanitySet) {
+                if (this.whitelistSet.has(profanity) || profanity.length < 4) // entries shorter than four characters are skipped in this pass
+                    continue;
+                if (normalizedText.includes(profanity) ||
+                    leetNormalizedText.includes(profanity)) {
+                    const index = normalizedText.indexOf(profanity); // first occurrence in the non-leet text only; -1 when the hit exists only in the leet-normalized text
+                    if (index !== -1 &&
+                        !detectedWords.some((w) => normalizedText.indexOf(w) === index)) { // skip when an already-detected word first occurs at the same offset
+                        detectedWords.push(profanity);
+                        positions.push({
+                            word: profanity,
+                            start: index,
+                            end: index + profanity.length,
+                        });
+                    }
+                }
+            }
+        }
+        // REMOVED: cleanedText = this.clean(text) - this was causing circular dependency
+        // We'll generate the cleaned text directly here instead
+        let cleanedText = text;
+        if (detectedWords.length > 0) {
+            // Sort positions by start index in descending order to avoid index shifting
+            const sortedPositions = positions.sort((a, b) => b.start - a.start); // sorts in place, so the returned positions array is in this descending order too
+            for (const pos of sortedPositions) {
+                const originalWord = text.substring(pos.start, pos.end);
+                const replacement = this.defaultPlaceholder.repeat(originalWord.length); // one placeholder per masked character
+                cleanedText =
+                    cleanedText.substring(0, pos.start) +
+                        replacement +
+                        cleanedText.substring(pos.end);
+            }
+        }
+        const severity = this.calculateSeverity(detectedWords); // computed before de-duplication, so repeats count
+        return {
+            hasProfanity: detectedWords.length > 0,
+            detectedWords: [...new Set(detectedWords)], // distinct matches only
+            cleanedText,
+            severity,
+            positions,
+        };
+    }
+    /**
+     * Check if a string contains profanity (simple boolean check)
      * @param string - The string to check
      * @returns boolean - True if profanity found, false otherwise
      */
     check(string) {
-        return this.filter.check(string);
+        // Delegates to detect() and keeps only the boolean verdict
+        const { hasProfanity } = this.detect(string);
+        return hasProfanity;
     }
     /**
      * Clean a string by replacing profanities with placeholders
      * @param string - The string to clean
-     * @param placeholder - Optional custom placeholder (defaults to '*')
+     * @param placeholder - Optional custom placeholder
      * @returns string - The cleaned string
      */
     clean(string, placeholder) {
-        // More general solution for handling variations like "fucking"
-        const badWords = this.list();
+        if (!string || typeof string !== "string")
+            return string || ""; // non-string truthy input is returned as-is; falsy input becomes ""
+        const placeholderChar = placeholder || this.defaultPlaceholder; // an empty-string placeholder falls back to the default
+        const detection = this.detect(string);
+        // If detect() already provided cleanedText and no custom placeholder, use it
+        if (!placeholder && detection.cleanedText !== string) {
+            return detection.cleanedText;
+        }
+        // Otherwise, build cleaned text with custom placeholder (also reached when nothing was masked)
         let result = string;
-        for (const word of badWords) {
-            // Check for variations with "ing", "ed", etc.
-            const variations = [
-                `${word}ing`,
-                `${word}ed`,
-                `${word}s`,
-                `${word}er`,
-                `${word}ers`,
-            ];
-            for (const variation of variations) {
-                if (result.toLowerCase().includes(variation.toLowerCase())) {
-                    const prefix = word;
-                    const suffix = variation.slice(word.length);
-                    const replacement = (placeholder || this.defaultPlaceholder).repeat(prefix.length) +
-                        suffix;
-                    // Use regex to replace while preserving case (though this simplifies it)
-                    const regex = new RegExp(variation, "gi");
-                    result = result.replace(regex, replacement);
-                }
-            }
+        const sortedPositions = detection.positions.sort((a, b) => b.start - a.start); // right-to-left, so earlier offsets stay valid after each splice
+        for (const pos of sortedPositions) {
+            const originalWord = string.substring(pos.start, pos.end);
+            const replacement = placeholderChar.repeat(originalWord.length); // placeholder repeated once per masked character
+            result =
+                result.substring(0, pos.start) +
+                    replacement +
+                    result.substring(pos.end);
         }
-        // Fall back to default leo-profanity implementation
-        return this.filter.clean(result, placeholder || this.defaultPlaceholder);
+        return result;
     }
     /**
      * Clean a string by replacing each profane word with a single placeholder
@@ -180,58 +557,77 @@ export class AllProfanity {
      * @returns string - The cleaned string
      */
     cleanWithWord(string, placeholder = "***") {
-        // Split by spaces but preserve punctuation
-        const regex = /([^\w\s])/g;
-        let tempString = string.replace(regex, " $1 ");
-        const words = tempString.split(" ").filter((w) => w !== "");
-        const result = words.map((word) => {
-            // Check if this word contains profanity, ignoring punctuation for the check
-            const wordWithoutPunctuation = word.replace(/[^\w\s]/g, "");
-            if (wordWithoutPunctuation && this.check(wordWithoutPunctuation)) {
-                return placeholder;
-            }
-            return word;
-        });
-        // Join and fix spaces before punctuation
-        let cleaned = result.join(" ");
-        cleaned = cleaned.replace(/ ([^\w\s]) /g, "$1 "); // Fix space before punctuation
-        cleaned = cleaned.replace(/ ([^\w\s])$/g, "$1"); // Fix trailing punctuation
-        return cleaned;
+        if (!string || typeof string !== "string")
+            return string || ""; // non-string truthy input is returned as-is; falsy input becomes ""
+        // Build a regex that matches any profane word with word boundaries, unicode-aware
+        const words = Array.from(this.profanitySet) // NOTE(review): whitelistSet is not consulted in this method — confirm that is intended
+            .map((w) => w.replace(/[.*+?^${}()|[\]\\]/g, "\\$&")) // escape regex
+            .sort((a, b) => b.length - a.length); // longer words first to avoid partial matches
+        if (words.length === 0)
+            return string;
+        // Unicode safe word boundary: (?<=^|[^\p{L}\p{N}_])WORD(?=[^\p{L}\p{N}_]|$)
+        // This ensures we only match whole words, not inside other words.
+        const regex = new RegExp(`(?<=^|[\\s\\.,;:!\\?\\-_+=\\[\\]{}()"'\\/\\\\])(` + // the built pattern uses an explicit delimiter list, not the \p{L} form sketched above
+            words.join("|") +
+            `)(?=[\\s\\.,;:!\\?\\-_+=\\[\\]{}()"'\\/\\\\]|$)`, this.caseSensitive ? "gu" : "giu"); // rebuilt from the whole dictionary on every call
+        // Replace all matches with the placeholder.
+        return string.replace(regex, placeholder);
     }
     /**
      * Get the current list of profanity words
      * @returns string[] - Array of all profanity words
      */
     list() {
-        return this.filter.list();
+        // Snapshot of the set; includes the generated variations
+        return [...this.profanitySet];
     }
     /**
      * Add word(s) to the profanity list
      * @param word - String or array of strings to add
      */
     add(word) {
-        this.filter.add(word);
+        // Accept a single word or an array of words
+        const words = Array.isArray(word) ? word : [word];
+        for (const w of words) {
+            // Skip empty and non-string entries
+            if (!w || typeof w !== "string")
+                continue;
+            const normalizedWord = this.caseSensitive ? w : w.toLowerCase();
+            // generateWordVariations() starts with the word itself, so one
+            // loop registers the word and every derived form.
+            for (const variation of this.generateWordVariations(normalizedWord)) {
+                this.profanitySet.add(variation);
+                // Record the leet-normalized form for every variation, as
+                // loadLanguage() does, not just for the base word.
+                const leetVariation = this.normalizeLeetSpeak(variation);
+                if (leetVariation !== variation) {
+                    this.normalizedProfanityMap.set(leetVariation, variation);
+                }
+            }
+        }
     }
     /**
      * Remove word(s) from the profanity list
      * @param word - String or array of strings to remove
      */
     remove(word) {
-        this.filter.remove(word);
+        // Accept a single word or an array of words
+        const words = Array.isArray(word) ? word : [word];
+        for (const w of words) {
+            // Skip empty and non-string entries
+            if (!w || typeof w !== "string")
+                continue;
+            const normalizedWord = this.caseSensitive ? w : w.toLowerCase();
+            // generateWordVariations() starts with the word itself, so one
+            // loop removes the word and every derived form.
+            for (const variation of this.generateWordVariations(normalizedWord)) {
+                this.profanitySet.delete(variation);
+                // Drop the leet mapping recorded for this form so
+                // normalizedProfanityMap does not keep pointing at removed words.
+                const leetVariation = this.normalizeLeetSpeak(variation);
+                if (this.normalizedProfanityMap.get(leetVariation) === variation) {
+                    this.normalizedProfanityMap.delete(leetVariation);
+                }
+            }
+        }
     }
     /**
      * Clear the filter list and reset to default
      */
     clearList() {
-        // Get all current words
-        const currentWords = this.filter.list();
-        // Remove all words
-        if (currentWords.length > 0) {
-            this.filter.remove(currentWords);
-        }
-        // Reset loaded languages tracking
+        this.profanitySet.clear(); // drops every word and generated variation
+        this.normalizedProfanityMap.clear(); // drops the recorded leet-normalized forms; whitelistSet is left untouched
         this.loadedLanguages.clear();
-        this.loadedLanguages.add("english"); // Default language remains
     }
     /**
      * Change the character used as placeholder
@@ -246,6 +642,57 @@ export class AllProfanity {
             this.defaultPlaceholder = placeholder;
         }
     }
+    /**
+     * List the languages whose dictionaries are currently loaded
+     * @returns string[] - A new array of loaded language names
+     */
+    getLoadedLanguages() {
+        return [...this.loadedLanguages];
+    }
+    /**
+     * List every dictionary name known to this instance
+     * @returns string[] - Keys of the available-language table
+     */
+    getAvailableLanguages() {
+        const { availableLanguages } = this;
+        return Object.keys(availableLanguages);
+    }
+    /**
+     * Snapshot the current settings, loaded languages and whitelist
+     * as a plain object
+     */
+    getConfig() {
+        const { defaultPlaceholder, enableLeetSpeak, caseSensitive, strictMode, detectPartialWords, } = this;
+        const languages = this.getLoadedLanguages();
+        const whitelistWords = [...this.whitelistSet];
+        return {
+            defaultPlaceholder,
+            enableLeetSpeak,
+            caseSensitive,
+            strictMode,
+            detectPartialWords,
+            languages,
+            whitelistWords,
+        };
+    }
+    /**
+     * Apply the settings present in `options`; settings left undefined
+     * keep their current value. Whitelist words are added, never replaced.
+     */
+    updateConfig(options) {
+        if (options.defaultPlaceholder !== undefined) {
+            this.setPlaceholder(options.defaultPlaceholder);
+        }
+        // Boolean switches are copied over verbatim when supplied
+        const switches = [
+            "enableLeetSpeak",
+            "caseSensitive",
+            "strictMode",
+            "detectPartialWords",
+        ];
+        for (const name of switches) {
+            if (options[name] !== undefined) {
+                this[name] = options[name];
+            }
+        }
+        if (options.whitelistWords) {
+            this.addToWhitelist(options.whitelistWords);
+        }
+    }
 }
 // Create and export a singleton instance with default settings
 const allProfanity = new AllProfanity();