npm - @framers/agentos-ext-ml-classifiers - Versions diffs - 0.1.0 → 0.2.1 - Mend

@framers/agentos-ext-ml-classifiers 0.1.0 → 0.2.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (51) hide show

package/CHANGELOG.md +18 -0
package/dist/MLClassifierGuardrail.d.ts +88 -117
package/dist/MLClassifierGuardrail.d.ts.map +1 -1
package/dist/MLClassifierGuardrail.js +255 -264
package/dist/MLClassifierGuardrail.js.map +1 -1
package/dist/classifiers/InjectionClassifier.d.ts +1 -1
package/dist/classifiers/InjectionClassifier.d.ts.map +1 -1
package/dist/classifiers/JailbreakClassifier.d.ts +1 -1
package/dist/classifiers/JailbreakClassifier.d.ts.map +1 -1
package/dist/classifiers/ToxicityClassifier.d.ts +1 -1
package/dist/classifiers/ToxicityClassifier.d.ts.map +1 -1
package/dist/classifiers/WorkerClassifierProxy.d.ts +1 -1
package/dist/classifiers/WorkerClassifierProxy.d.ts.map +1 -1
package/dist/index.d.ts +16 -90
package/dist/index.d.ts.map +1 -1
package/dist/index.js +33 -306
package/dist/index.js.map +1 -1
package/dist/keyword-classifier.d.ts +26 -0
package/dist/keyword-classifier.d.ts.map +1 -0
package/dist/keyword-classifier.js +113 -0
package/dist/keyword-classifier.js.map +1 -0
package/dist/llm-classifier.d.ts +27 -0
package/dist/llm-classifier.d.ts.map +1 -0
package/dist/llm-classifier.js +129 -0
package/dist/llm-classifier.js.map +1 -0
package/dist/tools/ClassifyContentTool.d.ts +53 -80
package/dist/tools/ClassifyContentTool.d.ts.map +1 -1
package/dist/tools/ClassifyContentTool.js +52 -103
package/dist/tools/ClassifyContentTool.js.map +1 -1
package/dist/types.d.ts +77 -277
package/dist/types.d.ts.map +1 -1
package/dist/types.js +9 -55
package/dist/types.js.map +1 -1
package/package.json +10 -16
package/src/MLClassifierGuardrail.ts +279 -316
package/src/index.ts +35 -339
package/src/keyword-classifier.ts +130 -0
package/src/llm-classifier.ts +163 -0
package/src/tools/ClassifyContentTool.ts +75 -132
package/src/types.ts +78 -325
package/test/ClassifierOrchestrator.spec.ts +365 -0
package/test/ClassifyContentTool.spec.ts +226 -0
package/test/InjectionClassifier.spec.ts +263 -0
package/test/JailbreakClassifier.spec.ts +295 -0
package/test/MLClassifierGuardrail.spec.ts +486 -0
package/test/SlidingWindowBuffer.spec.ts +391 -0
package/test/ToxicityClassifier.spec.ts +268 -0
package/test/WorkerClassifierProxy.spec.ts +303 -0
package/test/index.spec.ts +431 -0
package/tsconfig.json +20 -0
package/vitest.config.ts +24 -0

package/test/index.spec.ts ADDED Viewed

@@ -0,0 +1,431 @@
+/**
+ * @file index.spec.ts
+ * @description Unit tests for the ML Classifier pack factory.
+ *
+ * Tests verify:
+ *  - createMLClassifierGuardrail returns an ExtensionPack with name 'ml-classifiers'
+ *    and version '1.0.0'
+ *  - The pack provides exactly 2 descriptors: 1 guardrail + 1 tool
+ *  - Guardrail descriptor has id 'ml-classifier-guardrail' and kind 'guardrail'
+ *  - Tool descriptor has id 'classify_content' and kind 'tool'
+ *  - createExtensionPack bridges context.options to createMLClassifierGuardrail
+ *  - Disabled / selective classifiers work correctly
+ *  - onActivate rebuilds components with the shared registry
+ *  - onDeactivate resolves without throwing (disposing the orchestrator and
+ *    clearing the buffer are not asserted in this file)
+ */
+import { describe, it, expect, vi, beforeEach } from 'vitest';
+import {
+  createMLClassifierGuardrail,
+  createExtensionPack,
+} from '../src/index';
+import { SharedServiceRegistry } from '@framers/agentos';
+import {
+  EXTENSION_KIND_GUARDRAIL,
+  EXTENSION_KIND_TOOL,
+} from '@framers/agentos';
+import type { ExtensionPackContext } from '@framers/agentos';
+// ---------------------------------------------------------------------------
+// Mocks — prevent real model downloads and ONNX/WASM loading
+// ---------------------------------------------------------------------------
+/**
+ * Mock ToxicityClassifier — lightweight stand-in that avoids the real
+ * `@huggingface/transformers` import during unit tests.
+ *
+ * The mocked constructor is a `vi.fn()`, so tests can count constructions.
+ * Every instance reports `isLoaded: false`; `classify` always resolves to a
+ * `bestClass: 'benign'` result with confidence 0, and `dispose` resolves to
+ * `undefined`.
+ */
+vi.mock(
+  '../src/classifiers/ToxicityClassifier',
+  () => ({
+    ToxicityClassifier: vi.fn().mockImplementation(() => ({
+      id: 'agentos:ml-classifiers:toxicity-pipeline',
+      displayName: 'Toxicity Classifier (mock)',
+      description: 'Mock toxicity classifier.',
+      modelId: 'unitary/toxic-bert',
+      isLoaded: false,
+      classify: vi.fn().mockResolvedValue({ bestClass: 'benign', confidence: 0, allScores: [] }),
+      dispose: vi.fn().mockResolvedValue(undefined),
+    })),
+  }),
+);
+/**
+ * Mock InjectionClassifier — replaces the real module for these unit tests.
+ *
+ * The mocked constructor is a `vi.fn()`, so tests can count constructions.
+ * Every instance reports `isLoaded: false`; `classify` always resolves to a
+ * `bestClass: 'SAFE'` result with confidence 0.1, and `dispose` resolves to
+ * `undefined`.
+ */
+vi.mock(
+  '../src/classifiers/InjectionClassifier',
+  () => ({
+    InjectionClassifier: vi.fn().mockImplementation(() => ({
+      id: 'agentos:ml-classifiers:injection-pipeline',
+      displayName: 'Injection Classifier (mock)',
+      description: 'Mock injection classifier.',
+      modelId: 'protectai/deberta-v3-small-prompt-injection-v2',
+      isLoaded: false,
+      classify: vi.fn().mockResolvedValue({ bestClass: 'SAFE', confidence: 0.1, allScores: [] }),
+      dispose: vi.fn().mockResolvedValue(undefined),
+    })),
+  }),
+);
+/**
+ * Mock JailbreakClassifier — replaces the real module for these unit tests.
+ *
+ * The mocked constructor is a `vi.fn()`, so tests can count constructions.
+ * Every instance reports `isLoaded: false`; `classify` always resolves to a
+ * `bestClass: 'benign'` result with confidence 0, and `dispose` resolves to
+ * `undefined`.
+ */
+vi.mock(
+  '../src/classifiers/JailbreakClassifier',
+  () => ({
+    JailbreakClassifier: vi.fn().mockImplementation(() => ({
+      id: 'agentos:ml-classifiers:jailbreak-pipeline',
+      displayName: 'Jailbreak Classifier (mock)',
+      description: 'Mock jailbreak classifier.',
+      modelId: 'meta-llama/PromptGuard-86M',
+      isLoaded: false,
+      classify: vi.fn().mockResolvedValue({ bestClass: 'benign', confidence: 0, allScores: [] }),
+      dispose: vi.fn().mockResolvedValue(undefined),
+    })),
+  }),
+);
+// Import the mocked constructors so tests can assert on them.
+import { ToxicityClassifier } from '../src/classifiers/ToxicityClassifier';
+import { InjectionClassifier } from '../src/classifiers/InjectionClassifier';
+import { JailbreakClassifier } from '../src/classifiers/JailbreakClassifier';
+// ---------------------------------------------------------------------------
+// Tests
+// ---------------------------------------------------------------------------
+describe('createMLClassifierGuardrail', () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+  });
+  // -------------------------------------------------------------------------
+  // 1. Pack identity — name and version reported by the pack
+  // -------------------------------------------------------------------------
+  describe('pack identity', () => {
+    it('returns an ExtensionPack with name "ml-classifiers"', () => {
+      const pack = createMLClassifierGuardrail();
+      expect(pack.name).toBe('ml-classifiers');
+    });
+    it('returns an ExtensionPack with version "1.0.0"', () => {
+      const pack = createMLClassifierGuardrail();
+      expect(pack.version).toBe('1.0.0');
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 2. Descriptors shape — ids, kinds, priorities and payload presence
+  // -------------------------------------------------------------------------
+  describe('descriptors', () => {
+    it('provides exactly 2 descriptors', () => {
+      const pack = createMLClassifierGuardrail();
+      expect(pack.descriptors).toHaveLength(2);
+    });
+    it('has a guardrail descriptor with id "ml-classifier-guardrail"', () => {
+      const pack = createMLClassifierGuardrail();
+      const guardrailDescriptor = pack.descriptors.find((d) => d.id === 'ml-classifier-guardrail');
+      expect(guardrailDescriptor).toBeDefined();
+    });
+    it('guardrail descriptor has kind "guardrail"', () => {
+      const pack = createMLClassifierGuardrail();
+      const guardrailDescriptor = pack.descriptors.find((d) => d.id === 'ml-classifier-guardrail');
+      expect(guardrailDescriptor?.kind).toBe(EXTENSION_KIND_GUARDRAIL);
+    });
+    it('guardrail descriptor has priority 5', () => {
+      const pack = createMLClassifierGuardrail();
+      const guardrailDescriptor = pack.descriptors.find((d) => d.id === 'ml-classifier-guardrail');
+      expect(guardrailDescriptor?.priority).toBe(5);
+    });
+    it('guardrail descriptor has a non-null payload', () => {
+      const pack = createMLClassifierGuardrail();
+      const guardrailDescriptor = pack.descriptors.find((d) => d.id === 'ml-classifier-guardrail');
+      expect(guardrailDescriptor?.payload).toBeDefined();
+      expect(guardrailDescriptor?.payload).not.toBeNull();
+    });
+    it('has a tool descriptor with id "classify_content"', () => {
+      const pack = createMLClassifierGuardrail();
+      const toolDescriptor = pack.descriptors.find((d) => d.id === 'classify_content');
+      expect(toolDescriptor).toBeDefined();
+    });
+    it('tool descriptor has kind "tool"', () => {
+      const pack = createMLClassifierGuardrail();
+      const toolDescriptor = pack.descriptors.find((d) => d.id === 'classify_content');
+      expect(toolDescriptor?.kind).toBe(EXTENSION_KIND_TOOL);
+    });
+    it('tool descriptor has priority 0', () => {
+      const pack = createMLClassifierGuardrail();
+      const toolDescriptor = pack.descriptors.find((d) => d.id === 'classify_content');
+      expect(toolDescriptor?.priority).toBe(0);
+    });
+    it('tool descriptor has a non-null payload', () => {
+      const pack = createMLClassifierGuardrail();
+      const toolDescriptor = pack.descriptors.find((d) => d.id === 'classify_content');
+      expect(toolDescriptor?.payload).toBeDefined();
+      expect(toolDescriptor?.payload).not.toBeNull();
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 3. Built-in classifier instantiation (zero-config)
+  // -------------------------------------------------------------------------
+  describe('zero-config classifier instantiation', () => {
+    it('instantiates all three built-in classifiers when no classifiers option is given', () => {
+      createMLClassifierGuardrail();
+      // Each built-in classifier should have been constructed once.
+      expect(ToxicityClassifier).toHaveBeenCalledOnce();
+      expect(InjectionClassifier).toHaveBeenCalledOnce();
+      expect(JailbreakClassifier).toHaveBeenCalledOnce();
+    });
+    it('instantiates all three built-in classifiers when classifiers is an empty array', () => {
+      createMLClassifierGuardrail({ classifiers: [] });
+      expect(ToxicityClassifier).toHaveBeenCalledOnce();
+      expect(InjectionClassifier).toHaveBeenCalledOnce();
+      expect(JailbreakClassifier).toHaveBeenCalledOnce();
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 4. Selective / disabled classifiers
+  // -------------------------------------------------------------------------
+  describe('selective classifiers', () => {
+    it('only instantiates ToxicityClassifier when classifiers: ["toxicity"]', () => {
+      createMLClassifierGuardrail({ classifiers: ['toxicity'] });
+      expect(ToxicityClassifier).toHaveBeenCalledOnce();
+      expect(InjectionClassifier).not.toHaveBeenCalled();
+      expect(JailbreakClassifier).not.toHaveBeenCalled();
+    });
+    it('only instantiates InjectionClassifier when classifiers: ["injection"]', () => {
+      createMLClassifierGuardrail({ classifiers: ['injection'] });
+      expect(ToxicityClassifier).not.toHaveBeenCalled();
+      expect(InjectionClassifier).toHaveBeenCalledOnce();
+      expect(JailbreakClassifier).not.toHaveBeenCalled();
+    });
+    it('only instantiates JailbreakClassifier when classifiers: ["jailbreak"]', () => {
+      createMLClassifierGuardrail({ classifiers: ['jailbreak'] });
+      expect(ToxicityClassifier).not.toHaveBeenCalled();
+      expect(InjectionClassifier).not.toHaveBeenCalled();
+      expect(JailbreakClassifier).toHaveBeenCalledOnce();
+    });
+    it('instantiates toxicity and jailbreak but not injection when specified', () => {
+      createMLClassifierGuardrail({ classifiers: ['toxicity', 'jailbreak'] });
+      expect(ToxicityClassifier).toHaveBeenCalledOnce();
+      expect(InjectionClassifier).not.toHaveBeenCalled();
+      expect(JailbreakClassifier).toHaveBeenCalledOnce();
+    });
+    it('still provides 2 descriptors when only 1 classifier is enabled', () => {
+      const pack = createMLClassifierGuardrail({ classifiers: ['toxicity'] });
+      // The guardrail and tool are always present regardless of classifier count.
+      expect(pack.descriptors).toHaveLength(2);
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 5. Custom classifiers — only the descriptor count is asserted here
+  // -------------------------------------------------------------------------
+  describe('customClassifiers option', () => {
+    it('includes custom classifiers alongside built-in ones', () => {
+      const customClassifier = {
+        id: 'custom:sarcasm',
+        displayName: 'Sarcasm Detector',
+        description: 'Detects sarcasm.',
+        modelId: 'my-org/sarcasm-bert',
+        isLoaded: false,
+        classify: vi.fn().mockResolvedValue({ bestClass: 'benign', confidence: 0, allScores: [] }),
+      };
+      // Should not throw when a custom classifier is provided.
+      const pack = createMLClassifierGuardrail({
+        classifiers: ['toxicity'],
+        customClassifiers: [customClassifier],
+      });
+      // Pack structure must remain consistent.
+      expect(pack.descriptors).toHaveLength(2);
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 6. onActivate lifecycle hook
+  // -------------------------------------------------------------------------
+  describe('onActivate lifecycle hook', () => {
+    it('rebuilds components when onActivate is called with a shared registry', () => {
+      const pack = createMLClassifierGuardrail();
+      // Record the number of classifier constructions at pack-creation time.
+      const constructsBefore =
+        (ToxicityClassifier as ReturnType<typeof vi.fn>).mock.calls.length +
+        (InjectionClassifier as ReturnType<typeof vi.fn>).mock.calls.length +
+        (JailbreakClassifier as ReturnType<typeof vi.fn>).mock.calls.length;
+      // Activate with a shared registry.
+      const sharedRegistry = new SharedServiceRegistry();
+      pack.onActivate!({ services: sharedRegistry });
+      const constructsAfter =
+        (ToxicityClassifier as ReturnType<typeof vi.fn>).mock.calls.length +
+        (InjectionClassifier as ReturnType<typeof vi.fn>).mock.calls.length +
+        (JailbreakClassifier as ReturnType<typeof vi.fn>).mock.calls.length;
+      // Activation must have rebuilt the classifiers (3 more constructions).
+      expect(constructsAfter).toBe(constructsBefore + 3);
+    });
+    it('descriptors still reflect the rebuilt components after onActivate', () => {
+      const pack = createMLClassifierGuardrail();
+      const sharedRegistry = new SharedServiceRegistry();
+      pack.onActivate!({ services: sharedRegistry });
+      // Only the descriptor count is asserted; reference freshness is not checked.
+      expect(pack.descriptors).toHaveLength(2);
+    });
+    it('does not throw when onActivate is called without services', () => {
+      const pack = createMLClassifierGuardrail();
+      // Context without a services field should be handled gracefully.
+      expect(() => pack.onActivate!({})).not.toThrow();
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 7. onDeactivate lifecycle hook — asserts only that it resolves to undefined
+  // -------------------------------------------------------------------------
+  describe('onDeactivate lifecycle hook', () => {
+    it('resolves without throwing', async () => {
+      const pack = createMLClassifierGuardrail();
+      await expect(pack.onDeactivate!()).resolves.toBeUndefined();
+    });
+  });
+  // -------------------------------------------------------------------------
+  // 8. Options passthrough — asserts only that construction does not throw
+  // -------------------------------------------------------------------------
+  describe('options passthrough', () => {
+    it('accepts and applies streaming mode options without throwing', () => {
+      expect(() =>
+        createMLClassifierGuardrail({
+          streamingMode: true,
+          chunkSize: 150,
+          contextSize: 30,
+          maxEvaluations: 50,
+          guardrailScope: 'output',
+        }),
+      ).not.toThrow();
+    });
+    it('accepts custom thresholds without throwing', () => {
+      expect(() =>
+        createMLClassifierGuardrail({
+          thresholds: {
+            blockThreshold: 0.95,
+            flagThreshold: 0.75,
+            warnThreshold: 0.5,
+          },
+        }),
+      ).not.toThrow();
+    });
+  });
+});
+// ---------------------------------------------------------------------------
+// createExtensionPack (manifest factory bridge)
+// ---------------------------------------------------------------------------
+describe('createExtensionPack', () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+  });
+  it('returns a pack with name "ml-classifiers"', () => {
+    const context: ExtensionPackContext = {};
+    const pack = createExtensionPack(context);
+    expect(pack.name).toBe('ml-classifiers');
+  });
+  it('returns a pack with version "1.0.0"', () => {
+    const context: ExtensionPackContext = {};
+    const pack = createExtensionPack(context);
+    expect(pack.version).toBe('1.0.0');
+  });
+  it('provides 2 descriptors with empty context', () => {
+    const pack = createExtensionPack({});
+    expect(pack.descriptors).toHaveLength(2);
+  });
+  it('bridges context.options to createMLClassifierGuardrail — classifiers subset', () => {
+    const context: ExtensionPackContext = {
+      options: {
+        classifiers: ['toxicity'],
+      },
+    };
+    createExtensionPack(context);
+    // Only ToxicityClassifier should have been instantiated.
+    expect(ToxicityClassifier).toHaveBeenCalledOnce();
+    expect(InjectionClassifier).not.toHaveBeenCalled();
+    expect(JailbreakClassifier).not.toHaveBeenCalled();
+  });
+  it('bridges context.options to createMLClassifierGuardrail — thresholds', () => {
+    const context: ExtensionPackContext = {
+      options: {
+        thresholds: { blockThreshold: 0.99 },
+      },
+    };
+    const pack = createExtensionPack(context);
+    // Only the descriptor count is asserted; the threshold itself is not inspected.
+    expect(pack.descriptors).toHaveLength(2);
+  });
+  it('works when context.options is undefined', () => {
+    const context: ExtensionPackContext = { options: undefined };
+    const pack = createExtensionPack(context);
+    expect(pack.name).toBe('ml-classifiers');
+    expect(pack.descriptors).toHaveLength(2);
+  });
+});

package/tsconfig.json ADDED Viewed

@@ -0,0 +1,20 @@
+{
+  "compilerOptions": {
+    "target": "ES2022",
+    "module": "ESNext",
+    "moduleResolution": "bundler",
+    "declaration": true,
+    "declarationMap": true,
+    "sourceMap": true,
+    "outDir": "./dist",
+    "rootDir": "./src",
+    "strict": true,
+    "esModuleInterop": true,
+    "skipLibCheck": true,
+    "forceConsistentCasingInFileNames": true,
+    "resolveJsonModule": true,
+    "isolatedModules": true
+  },
+  "include": ["src/**/*.ts"],
+  "exclude": ["node_modules", "dist", "test"]
+}

package/vitest.config.ts ADDED Viewed

@@ -0,0 +1,24 @@
+import { defineConfig } from 'vitest/config';
+import path from 'path';
+import fs from 'fs';
+// CI layout: agentos cloned into packages/agentos/ inside this repo (resolved four directories above this config)
+const ciPath = path.resolve(__dirname, '../../../../packages/agentos/src');
+// Monorepo layout: agentos is a sibling at packages/agentos/ (resolved five directories above this config — NOTE(review): confirm that directory is packages/)
+const monoPath = path.resolve(__dirname, '../../../../../agentos/src');
+const agentosPath = fs.existsSync(ciPath) ? ciPath : fs.existsSync(monoPath) ? monoPath : null; // CI path wins when both exist; null when neither exists
+export default defineConfig({
+  test: {
+    globals: true,
+    environment: 'node',
+    include: ['test/**/*.spec.ts'],
+    testTimeout: 10000,
+  },
+  resolve: agentosPath ? { // alias is configured only when a local agentos source directory was found
+    alias: {
+      '@framers/agentos': agentosPath,
+    },
+  } : {},
+});