npm - glin-profanity - Versions diffs - 3.1.5 → 3.2.2 - Mend

glin-profanity 3.1.5 → 3.2.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (66)

package/README.md +84 -566
package/dist/{types-CdDqSZY7.d.cts → Filter-BGcyIAvO.d.ts} +4 -162
package/dist/{types-CdDqSZY7.d.ts → Filter-D34Wsmrj.d.cts} +4 -162
package/dist/frameworks/index.cjs +5257 -0
package/dist/frameworks/index.d.cts +2 -0
package/dist/frameworks/index.d.ts +2 -0
package/dist/frameworks/index.js +5252 -0
package/dist/frameworks/nextjs.cjs +5257 -0
package/dist/frameworks/nextjs.d.cts +173 -0
package/dist/frameworks/nextjs.d.ts +173 -0
package/dist/frameworks/nextjs.js +5252 -0
package/dist/index.cjs +151 -85
package/dist/index.d.cts +5 -29
package/dist/index.d.ts +5 -29
package/dist/index.js +152 -85
package/dist/integrations/index.cjs +6110 -0
package/dist/integrations/index.d.cts +5 -0
package/dist/integrations/index.d.ts +5 -0
package/dist/integrations/index.js +6082 -0
package/dist/integrations/langchain.cjs +5252 -0
package/dist/integrations/langchain.d.cts +231 -0
package/dist/integrations/langchain.d.ts +231 -0
package/dist/integrations/langchain.js +5239 -0
package/dist/integrations/openai.cjs +5367 -0
package/dist/integrations/openai.d.cts +167 -0
package/dist/integrations/openai.d.ts +167 -0
package/dist/integrations/openai.js +5362 -0
package/dist/integrations/semantic.cjs +5314 -0
package/dist/integrations/semantic.d.cts +268 -0
package/dist/integrations/semantic.d.ts +268 -0
package/dist/integrations/semantic.js +5309 -0
package/dist/integrations/vercel-ai.cjs +5282 -0
package/dist/integrations/vercel-ai.d.cts +224 -0
package/dist/integrations/vercel-ai.d.ts +224 -0
package/dist/integrations/vercel-ai.js +5273 -0
package/dist/ml/index.cjs +358 -56
package/dist/ml/index.d.cts +5 -2
package/dist/ml/index.d.ts +5 -2
package/dist/ml/index.js +354 -57
package/dist/ml/transformers.cjs +5237 -0
package/dist/ml/transformers.d.cts +232 -0
package/dist/ml/transformers.d.ts +232 -0
package/dist/ml/transformers.js +5231 -0
package/dist/multimodal/audio.cjs +5269 -0
package/dist/multimodal/audio.d.cts +255 -0
package/dist/multimodal/audio.d.ts +255 -0
package/dist/multimodal/audio.js +5264 -0
package/dist/multimodal/index.cjs +5432 -0
package/dist/multimodal/index.d.cts +4 -0
package/dist/multimodal/index.d.ts +4 -0
package/dist/multimodal/index.js +5422 -0
package/dist/multimodal/ocr.cjs +5193 -0
package/dist/multimodal/ocr.d.cts +157 -0
package/dist/multimodal/ocr.d.ts +157 -0
package/dist/multimodal/ocr.js +5187 -0
package/dist/react.cjs +5133 -0
package/dist/react.d.cts +13 -0
package/dist/react.d.ts +13 -0
package/dist/react.js +5131 -0
package/dist/types-B9c_ik4k.d.cts +88 -0
package/dist/types-B9c_ik4k.d.ts +88 -0
package/dist/types-BuKh9tvV.d.ts +20 -0
package/dist/types-Ct_ueYqw.d.cts +76 -0
package/dist/types-Ct_ueYqw.d.ts +76 -0
package/dist/types-DI8nzwWc.d.cts +20 -0
package/package.json +170 -3

package/dist/{types-CdDqSZY7.d.cts → Filter-BGcyIAvO.d.ts} RENAMED

@@ -1,89 +1,4 @@
-/**
- * Type definitions for glin-profanity JavaScript/TypeScript package.
- * Unified API that mirrors the Python package structure.
- */
-/** Severity levels for profanity matches - unified with Python */
-declare enum SeverityLevel {
-    EXACT = 1,
-    FUZZY = 2
-}
-/** Supported languages - unified list with Python */
-type Language = 'arabic' | 'chinese' | 'czech' | 'danish' | 'dutch' | 'english' | 'esperanto' | 'finnish' | 'french' | 'german' | 'hindi' | 'hungarian' | 'italian' | 'japanese' | 'korean' | 'norwegian' | 'persian' | 'polish' | 'portuguese' | 'russian' | 'spanish' | 'swedish' | 'thai' | 'turkish';
-/** Represents a profanity match in text - unified with Python */
-interface Match {
-    word: string;
-    index: number;
-    severity: SeverityLevel;
-    contextScore?: number;
-    reason?: string;
-    isWhitelisted?: boolean;
-}
-/** Result of profanity check operation - unified field names */
-interface CheckProfanityResult {
-    containsProfanity: boolean;
-    profaneWords: string[];
-    processedText?: string;
-    severityMap?: Record<string, SeverityLevel>;
-    matches?: Match[];
-    contextScore?: number;
-    reason?: string;
-}
-/** Configuration for context-aware filtering - unified with Python */
-interface ContextAwareConfig {
-    enableContextAware?: boolean;
-    contextWindow?: number;
-    confidenceThreshold?: number;
-    domainWhitelists?: Record<string, string[]>;
-}
-/** Leetspeak detection intensity levels */
-type LeetspeakLevel = 'basic' | 'moderate' | 'aggressive';
-/** Main filter configuration options - unified with Python */
-interface FilterConfig extends ContextAwareConfig {
-    languages?: Language[];
-    allLanguages?: boolean;
-    caseSensitive?: boolean;
-    wordBoundaries?: boolean;
-    customWords?: string[];
-    replaceWith?: string;
-    severityLevels?: boolean;
-    ignoreWords?: string[];
-    logProfanity?: boolean;
-    allowObfuscatedMatch?: boolean;
-    fuzzyToleranceLevel?: number;
-    /**
-     * Enable leetspeak detection (e.g., "f4ck" → "fuck").
-     * @default false
-     */
-    detectLeetspeak?: boolean;
-    /**
-     * Leetspeak detection intensity level.
-     * - `basic`: Numbers only (0→o, 1→i, 3→e, 4→a, 5→s)
-     * - `moderate`: Basic + symbols (@→a, $→s, !→i)
-     * - `aggressive`: All known substitutions
-     * @default 'moderate'
-     */
-    leetspeakLevel?: LeetspeakLevel;
-    /**
-     * Enable Unicode normalization to detect homoglyphs and obfuscation.
-     * @default true
-     */
-    normalizeUnicode?: boolean;
-    /**
-     * Cache profanity check results for repeated strings.
-     * @default false
-     */
-    cacheResults?: boolean;
-    /**
-     * Maximum cache size when caching is enabled.
-     * @default 1000
-     */
-    maxCacheSize?: number;
-}
-/** Result with minimum severity filtering */
-interface FilteredProfanityResult {
-    result: CheckProfanityResult;
-    filteredWords: string[];
-}
+import { F as FilterConfig, C as CheckProfanityResult, S as SeverityLevel } from './types-B9c_ik4k.js';
 /**
  * Core profanity filter class.
@@ -123,6 +38,7 @@ declare class Filter {
     private cacheResults;
     private maxCacheSize;
     private cache;
+    private regexCache;
     /**
      * Creates a new Filter instance with the specified configuration.
      *
@@ -157,6 +73,7 @@ declare class Filter {
      * Applies Unicode normalization, leetspeak detection, and obfuscation handling.
      *
      * @param text - The input text to normalize
+     * @param aggressive - If true, collapses to single chars (for repeated char detection)
      * @returns The normalized text
      */
     private normalizeText;
@@ -272,79 +189,4 @@ declare class Filter {
     };
 }
-/**
- * Type definitions for ML-based profanity detection.
- */
-/**
- * Toxicity categories detected by the TensorFlow.js model.
- * These map to the civil comments dataset labels.
- */
-type ToxicityLabel = 'identity_attack' | 'insult' | 'obscene' | 'severe_toxicity' | 'sexual_explicit' | 'threat' | 'toxicity';
-/**
- * Result from a single toxicity prediction.
- */
-interface ToxicityPrediction {
-    /** The toxicity category */
-    label: ToxicityLabel;
-    /** Whether the text matches this category (null if below threshold) */
-    match: boolean | null;
-    /** Probability scores [non-toxic, toxic] */
-    probabilities: [number, number];
-}
-/**
- * Result from ML-based toxicity analysis.
- */
-interface MLAnalysisResult {
-    /** Whether any toxicity was detected */
-    isToxic: boolean;
-    /** Overall toxicity score (0-1) */
-    overallScore: number;
-    /** Predictions for each category */
-    predictions: ToxicityPrediction[];
-    /** Categories that matched */
-    matchedCategories: ToxicityLabel[];
-    /** Processing time in milliseconds */
-    processingTimeMs: number;
-}
-/**
- * Configuration for the ML toxicity detector.
- */
-interface MLDetectorConfig {
-    /**
-     * Minimum confidence threshold for predictions.
-     * Values below this threshold will return null for match.
-     * @default 0.85
-     */
-    threshold?: number;
-    /**
-     * Specific toxicity categories to check.
-     * If not specified, all categories are checked.
-     */
-    labels?: ToxicityLabel[];
-    /**
-     * Whether to load the model immediately on instantiation.
-     * If false, model will be loaded on first use.
-     * @default false
-     */
-    preloadModel?: boolean;
-}
-/**
- * Combined result from both rule-based and ML detection.
- */
-interface HybridAnalysisResult {
-    /** Rule-based detection result */
-    ruleBasedResult: {
-        containsProfanity: boolean;
-        profaneWords: string[];
-    };
-    /** ML-based detection result (null if ML not enabled) */
-    mlResult: MLAnalysisResult | null;
-    /** Combined decision */
-    isToxic: boolean;
-    /** Confidence score for the decision */
-    confidence: number;
-    /** Reason for the decision */
-    reason: string;
-}
-export { type CheckProfanityResult as C, type FilterConfig as F, type HybridAnalysisResult as H, type Language as L, type Match as M, SeverityLevel as S, type ToxicityLabel as T, Filter as a, type FilteredProfanityResult as b, type ContextAwareConfig as c, type ToxicityPrediction as d, type MLAnalysisResult as e, type MLDetectorConfig as f };
+export { Filter as F };

package/dist/{types-CdDqSZY7.d.ts → Filter-D34Wsmrj.d.cts} RENAMED

@@ -1,89 +1,4 @@
-/**
- * Type definitions for glin-profanity JavaScript/TypeScript package.
- * Unified API that mirrors the Python package structure.
- */
-/** Severity levels for profanity matches - unified with Python */
-declare enum SeverityLevel {
-    EXACT = 1,
-    FUZZY = 2
-}
-/** Supported languages - unified list with Python */
-type Language = 'arabic' | 'chinese' | 'czech' | 'danish' | 'dutch' | 'english' | 'esperanto' | 'finnish' | 'french' | 'german' | 'hindi' | 'hungarian' | 'italian' | 'japanese' | 'korean' | 'norwegian' | 'persian' | 'polish' | 'portuguese' | 'russian' | 'spanish' | 'swedish' | 'thai' | 'turkish';
-/** Represents a profanity match in text - unified with Python */
-interface Match {
-    word: string;
-    index: number;
-    severity: SeverityLevel;
-    contextScore?: number;
-    reason?: string;
-    isWhitelisted?: boolean;
-}
-/** Result of profanity check operation - unified field names */
-interface CheckProfanityResult {
-    containsProfanity: boolean;
-    profaneWords: string[];
-    processedText?: string;
-    severityMap?: Record<string, SeverityLevel>;
-    matches?: Match[];
-    contextScore?: number;
-    reason?: string;
-}
-/** Configuration for context-aware filtering - unified with Python */
-interface ContextAwareConfig {
-    enableContextAware?: boolean;
-    contextWindow?: number;
-    confidenceThreshold?: number;
-    domainWhitelists?: Record<string, string[]>;
-}
-/** Leetspeak detection intensity levels */
-type LeetspeakLevel = 'basic' | 'moderate' | 'aggressive';
-/** Main filter configuration options - unified with Python */
-interface FilterConfig extends ContextAwareConfig {
-    languages?: Language[];
-    allLanguages?: boolean;
-    caseSensitive?: boolean;
-    wordBoundaries?: boolean;
-    customWords?: string[];
-    replaceWith?: string;
-    severityLevels?: boolean;
-    ignoreWords?: string[];
-    logProfanity?: boolean;
-    allowObfuscatedMatch?: boolean;
-    fuzzyToleranceLevel?: number;
-    /**
-     * Enable leetspeak detection (e.g., "f4ck" → "fuck").
-     * @default false
-     */
-    detectLeetspeak?: boolean;
-    /**
-     * Leetspeak detection intensity level.
-     * - `basic`: Numbers only (0→o, 1→i, 3→e, 4→a, 5→s)
-     * - `moderate`: Basic + symbols (@→a, $→s, !→i)
-     * - `aggressive`: All known substitutions
-     * @default 'moderate'
-     */
-    leetspeakLevel?: LeetspeakLevel;
-    /**
-     * Enable Unicode normalization to detect homoglyphs and obfuscation.
-     * @default true
-     */
-    normalizeUnicode?: boolean;
-    /**
-     * Cache profanity check results for repeated strings.
-     * @default false
-     */
-    cacheResults?: boolean;
-    /**
-     * Maximum cache size when caching is enabled.
-     * @default 1000
-     */
-    maxCacheSize?: number;
-}
-/** Result with minimum severity filtering */
-interface FilteredProfanityResult {
-    result: CheckProfanityResult;
-    filteredWords: string[];
-}
+import { F as FilterConfig, C as CheckProfanityResult, S as SeverityLevel } from './types-B9c_ik4k.cjs';
 /**
  * Core profanity filter class.
@@ -123,6 +38,7 @@ declare class Filter {
     private cacheResults;
     private maxCacheSize;
     private cache;
+    private regexCache;
     /**
      * Creates a new Filter instance with the specified configuration.
      *
@@ -157,6 +73,7 @@ declare class Filter {
      * Applies Unicode normalization, leetspeak detection, and obfuscation handling.
      *
      * @param text - The input text to normalize
+     * @param aggressive - If true, collapses to single chars (for repeated char detection)
      * @returns The normalized text
      */
     private normalizeText;
@@ -272,79 +189,4 @@ declare class Filter {
     };
 }
-/**
- * Type definitions for ML-based profanity detection.
- */
-/**
- * Toxicity categories detected by the TensorFlow.js model.
- * These map to the civil comments dataset labels.
- */
-type ToxicityLabel = 'identity_attack' | 'insult' | 'obscene' | 'severe_toxicity' | 'sexual_explicit' | 'threat' | 'toxicity';
-/**
- * Result from a single toxicity prediction.
- */
-interface ToxicityPrediction {
-    /** The toxicity category */
-    label: ToxicityLabel;
-    /** Whether the text matches this category (null if below threshold) */
-    match: boolean | null;
-    /** Probability scores [non-toxic, toxic] */
-    probabilities: [number, number];
-}
-/**
- * Result from ML-based toxicity analysis.
- */
-interface MLAnalysisResult {
-    /** Whether any toxicity was detected */
-    isToxic: boolean;
-    /** Overall toxicity score (0-1) */
-    overallScore: number;
-    /** Predictions for each category */
-    predictions: ToxicityPrediction[];
-    /** Categories that matched */
-    matchedCategories: ToxicityLabel[];
-    /** Processing time in milliseconds */
-    processingTimeMs: number;
-}
-/**
- * Configuration for the ML toxicity detector.
- */
-interface MLDetectorConfig {
-    /**
-     * Minimum confidence threshold for predictions.
-     * Values below this threshold will return null for match.
-     * @default 0.85
-     */
-    threshold?: number;
-    /**
-     * Specific toxicity categories to check.
-     * If not specified, all categories are checked.
-     */
-    labels?: ToxicityLabel[];
-    /**
-     * Whether to load the model immediately on instantiation.
-     * If false, model will be loaded on first use.
-     * @default false
-     */
-    preloadModel?: boolean;
-}
-/**
- * Combined result from both rule-based and ML detection.
- */
-interface HybridAnalysisResult {
-    /** Rule-based detection result */
-    ruleBasedResult: {
-        containsProfanity: boolean;
-        profaneWords: string[];
-    };
-    /** ML-based detection result (null if ML not enabled) */
-    mlResult: MLAnalysisResult | null;
-    /** Combined decision */
-    isToxic: boolean;
-    /** Confidence score for the decision */
-    confidence: number;
-    /** Reason for the decision */
-    reason: string;
-}
-export { type CheckProfanityResult as C, type FilterConfig as F, type HybridAnalysisResult as H, type Language as L, type Match as M, SeverityLevel as S, type ToxicityLabel as T, Filter as a, type FilteredProfanityResult as b, type ContextAwareConfig as c, type ToxicityPrediction as d, type MLAnalysisResult as e, type MLDetectorConfig as f };
+export { Filter as F };