npm - @framers/agentos-ext-ml-classifiers - Versions diffs - 0.1.0 → 0.2.1 - Mend

@framers/agentos-ext-ml-classifiers 0.1.0 → 0.2.1

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (51)

package/CHANGELOG.md +18 -0
package/dist/MLClassifierGuardrail.d.ts +88 -117
package/dist/MLClassifierGuardrail.d.ts.map +1 -1
package/dist/MLClassifierGuardrail.js +255 -264
package/dist/MLClassifierGuardrail.js.map +1 -1
package/dist/classifiers/InjectionClassifier.d.ts +1 -1
package/dist/classifiers/InjectionClassifier.d.ts.map +1 -1
package/dist/classifiers/JailbreakClassifier.d.ts +1 -1
package/dist/classifiers/JailbreakClassifier.d.ts.map +1 -1
package/dist/classifiers/ToxicityClassifier.d.ts +1 -1
package/dist/classifiers/ToxicityClassifier.d.ts.map +1 -1
package/dist/classifiers/WorkerClassifierProxy.d.ts +1 -1
package/dist/classifiers/WorkerClassifierProxy.d.ts.map +1 -1
package/dist/index.d.ts +16 -90
package/dist/index.d.ts.map +1 -1
package/dist/index.js +33 -306
package/dist/index.js.map +1 -1
package/dist/keyword-classifier.d.ts +26 -0
package/dist/keyword-classifier.d.ts.map +1 -0
package/dist/keyword-classifier.js +113 -0
package/dist/keyword-classifier.js.map +1 -0
package/dist/llm-classifier.d.ts +27 -0
package/dist/llm-classifier.d.ts.map +1 -0
package/dist/llm-classifier.js +129 -0
package/dist/llm-classifier.js.map +1 -0
package/dist/tools/ClassifyContentTool.d.ts +53 -80
package/dist/tools/ClassifyContentTool.d.ts.map +1 -1
package/dist/tools/ClassifyContentTool.js +52 -103
package/dist/tools/ClassifyContentTool.js.map +1 -1
package/dist/types.d.ts +77 -277
package/dist/types.d.ts.map +1 -1
package/dist/types.js +9 -55
package/dist/types.js.map +1 -1
package/package.json +10 -16
package/src/MLClassifierGuardrail.ts +279 -316
package/src/index.ts +35 -339
package/src/keyword-classifier.ts +130 -0
package/src/llm-classifier.ts +163 -0
package/src/tools/ClassifyContentTool.ts +75 -132
package/src/types.ts +78 -325
package/test/ClassifierOrchestrator.spec.ts +365 -0
package/test/ClassifyContentTool.spec.ts +226 -0
package/test/InjectionClassifier.spec.ts +263 -0
package/test/JailbreakClassifier.spec.ts +295 -0
package/test/MLClassifierGuardrail.spec.ts +486 -0
package/test/SlidingWindowBuffer.spec.ts +391 -0
package/test/ToxicityClassifier.spec.ts +268 -0
package/test/WorkerClassifierProxy.spec.ts +303 -0
package/test/index.spec.ts +431 -0
package/tsconfig.json +20 -0
package/vitest.config.ts +24 -0

package/dist/types.js CHANGED Viewed

@@ -1,62 +1,16 @@
 /**
- * @fileoverview Core type definitions for the ML Classifier Guardrail Extension Pack.
+ * @file types.ts
+ * @description Core type definitions for the ML Classifiers extension pack.
  *
- * This file defines all configuration shapes, runtime result types, and
- * service-identifier constants used by the ML classifier pipeline. All
- * classifiers in this pack evaluate text content against learned models
- * (toxicity, prompt-injection, jailbreak) and emit structured results that
- * feed into the AgentOS guardrail decision tree.
+ * Defines the shared interfaces used across the ML classification system:
+ * classifier categories, confidence results, option shapes, and the LLM
+ * invoker callback signature.
  *
- * Import hierarchy
- * ----------------
- * ```
- * IUtilityAI  ──── ClassificationResult, ClassificationScore
- * IGuardrailService ── GuardrailAction
- *                   │
- *                   ▼
- *              types.ts  (this file)
- *                   │
- *                   ▼
- *           IContentClassifier.ts  /  SlidingWindowBuffer.ts  /  …
- * ```
- *
- * @module agentos/extensions/packs/ml-classifiers/types
- */
-/**
- * Sensible defaults for {@link ClassifierThresholds}.
- *
- * These values reflect a conservative-but-pragmatic policy:
- * - block at 90 % confidence → very high bar, minimises false positives
- * - flag at 70 % → surfaced for human review, not blocked
- * - warn at 40 % → low-confidence signal, handled with a light touch
+ * @module ml-classifiers/types
  */
-export const DEFAULT_THRESHOLDS = {
-    blockThreshold: 0.9,
-    flagThreshold: 0.7,
-    warnThreshold: 0.4,
-};
-// ---------------------------------------------------------------------------
-// Service identifiers
-// ---------------------------------------------------------------------------
 /**
- * Well-known service identifier strings for the three built-in ML classifier
- * pipelines.
- *
- * These IDs follow the `agentos:<domain>:<name>` naming convention used
- * throughout the AgentOS extension ecosystem.  Use them to retrieve specific
- * classifier services from the shared service registry.
- *
- * @example
- * ```typescript
- * const toxicity = serviceRegistry.get(ML_CLASSIFIER_SERVICE_IDS.TOXICITY_PIPELINE);
- * ```
+ * All supported classifier categories as a constant array, used for
+ * iteration and default configuration.
  */
-export const ML_CLASSIFIER_SERVICE_IDS = {
-    /** Classifier that detects toxic, hateful, or abusive language. */
-    TOXICITY_PIPELINE: 'agentos:ml-classifiers:toxicity-pipeline',
-    /** Classifier that detects prompt-injection attempts. */
-    INJECTION_PIPELINE: 'agentos:ml-classifiers:injection-pipeline',
-    /** Classifier that detects jailbreak / system-override attempts. */
-    JAILBREAK_PIPELINE: 'agentos:ml-classifiers:jailbreak-pipeline',
-};
+export const ALL_CATEGORIES = ['toxic', 'injection', 'nsfw', 'threat'];
 //# sourceMappingURL=types.js.map

package/dist/types.js.map CHANGED Viewed

	@@ -1 +1 @@
1	- {"version":3,"file":"types.js","sourceRoot":"","sources":["../src/types.ts"],"names":[],"mappings":"AAAA;;;;;;;;;;;;;;;;;;;;;;;GAuBG;AA2CH;;;;;;;GAOG;AACH,MAAM,CAAC,MAAM,kBAAkB,GAAyB;IACtD,cAAc,EAAE,GAAG;IACnB,aAAa,EAAE,GAAG;IAClB,aAAa,EAAE,GAAG;CACV,CAAC;AA6NX,8EAA8E;AAC9E,sBAAsB;AACtB,8EAA8E;AAE9E;;;;;;;;;;;;GAYG;AACH,MAAM,CAAC,MAAM,yBAAyB,GAAG;IACvC,mEAAmE;IACnE,iBAAiB,EAAE,0CAA0C;IAE7D,yDAAyD;IACzD,kBAAkB,EAAE,2CAA2C;IAE/D,oEAAoE;IACpE,kBAAkB,EAAE,2CAA2C;CACvD,CAAC"}
1	+ {"version":3,"file":"types.js","sourceRoot":"","sources":["../src/types.ts"],"names":[],"mappings":"AAAA;;;;;;;;;GASG;AAgBH;;;GAGG;AACH,MAAM,CAAC,MAAM,cAAc,GAAyB,CAAC,OAAO,EAAE,WAAW,EAAE,MAAM,EAAE,QAAQ,CAAC,CAAC"}

package/package.json CHANGED Viewed

@@ -1,7 +1,7 @@
 {
   "name": "@framers/agentos-ext-ml-classifiers",
-  "version": "0.1.0",
-  "description": "ML-based content classification guardrail (toxicity, injection, jailbreak) for AgentOS",
+  "version": "0.2.1",
+  "description": "ML-based content classifiers for AgentOS — toxicity, prompt injection, and NSFW detection via ONNX models or LLM fallback",
   "type": "module",
   "main": "./dist/index.js",
   "types": "./dist/index.d.ts",
@@ -11,23 +11,12 @@
       "types": "./dist/index.d.ts"
     }
   },
-  "files": [
-    "dist",
-    "src",
-    "SKILL.md",
-    "manifest.json"
-  ],
   "peerDependencies": {
-    "@framers/agentos": "^0.1.0"
+    "@framers/agentos": ">=0.1.0"
   },
   "optionalDependencies": {
     "@huggingface/transformers": "^3.0.0"
   },
-  "devDependencies": {
-    "typescript": "^5.5.0",
-    "vitest": "^1.6.0",
-    "@framers/agentos": "0.1.47"
-  },
   "license": "MIT",
   "author": "Frame.dev",
   "repository": {
@@ -38,8 +27,13 @@
   "publishConfig": {
     "access": "public"
   },
+  "devDependencies": {
+    "semantic-release": "^24.0.0",
+    "@semantic-release/github": "^11.0.0"
+  },
   "scripts": {
-    "build": "tsc -p tsconfig.json",
-    "test": "vitest run"
+    "build": "tsc",
+    "clean": "rm -rf dist",
+    "typecheck": "tsc --noEmit"
   }
 }