npm - @artemiskit/sdk - Versions diffs - 0.3.0 - Mend

@artemiskit/sdk 0.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (27) hide show

package/CHANGELOG.md +134 -0
package/README.md +173 -0
package/adapters/openai/dist/index.js +5625 -0
package/dist/index.js +42577 -0
package/dist/matchers/index.js +224 -0
package/dist/matchers/jest.js +257 -0
package/dist/matchers/vitest.js +257 -0
package/package.json +78 -0
package/src/__tests__/artemiskit.test.ts +425 -0
package/src/__tests__/matchers.test.ts +450 -0
package/src/artemiskit.ts +791 -0
package/src/guardian/action-validator.ts +585 -0
package/src/guardian/circuit-breaker.ts +655 -0
package/src/guardian/guardian.ts +497 -0
package/src/guardian/guardrails.ts +536 -0
package/src/guardian/index.ts +142 -0
package/src/guardian/intent-classifier.ts +378 -0
package/src/guardian/interceptor.ts +381 -0
package/src/guardian/policy.ts +446 -0
package/src/guardian/types.ts +436 -0
package/src/index.ts +164 -0
package/src/matchers/core.ts +315 -0
package/src/matchers/index.ts +26 -0
package/src/matchers/jest.ts +112 -0
package/src/matchers/vitest.ts +84 -0
package/src/types.ts +259 -0
package/tsconfig.json +11 -0

package/src/matchers/core.ts ADDED Viewed

@@ -0,0 +1,315 @@
+/**
+ * @artemiskit/sdk
+ * Core matcher implementations for Jest/Vitest integration
+ */
+import type { CaseResult, RunManifest } from '@artemiskit/core';
+import type { RedTeamResult, RunResult, StressResult } from '../types';
+/**
+ * Matcher result interface compatible with Jest/Vitest.
+ * Every matcher exported from this module returns this shape.
+ */
+export interface MatcherResult {
+  /** Whether the assertion held for the received value. */
+  pass: boolean;
+  /**
+   * Builds the explanatory text on demand. The matchers in this module word it
+   * for the negated assertion when `pass` is true and for the plain assertion otherwise.
+   */
+  message: () => string;
+}
+/**
+ * Render the headline numbers of a run manifest as an indented text block
+ * that can be appended to a failure message.
+ *
+ * @param manifest - Manifest whose scenario name and metrics are reported.
+ * @returns Text that begins and ends with a newline, with one two-space-indented field per line.
+ */
+function formatManifestSummary(manifest: RunManifest): string {
+  const stats = manifest.metrics;
+  const rows = [
+    `Scenario: ${manifest.config.scenario}`,
+    `Total Cases: ${stats.total_cases}`,
+    `Passed: ${stats.passed_cases}`,
+    `Failed: ${stats.failed_cases}`,
+    // success_rate is scaled by 100 and shown with one decimal place.
+    `Success Rate: ${(stats.success_rate * 100).toFixed(1)}%`,
+  ];
+  const indented = rows.map((row) => `  ${row}`);
+  return `\n${indented.join('\n')}\n`;
+}
+/**
+ * Build the "Failed Cases" section of a failure message.
+ *
+ * Only cases whose `ok` flag is falsy are listed. At most the first five are
+ * spelled out; any remainder is summarised as a count.
+ *
+ * @param cases - Case results to scan.
+ * @returns An empty string when nothing failed, otherwise a block that begins and ends with a newline.
+ */
+function formatFailedCases(cases: CaseResult[]): string {
+  const previewLimit = 5;
+  const failures = cases.filter((entry) => !entry.ok);
+  if (failures.length === 0) {
+    return '';
+  }
+  // Each bullet falls back to the case id when no name is set, and to a stock reason text.
+  const bullets = failures
+    .slice(0, previewLimit)
+    .map((entry) => `    - ${entry.name ?? entry.id}: ${entry.reason ?? 'No reason provided'}`)
+    .join('\n');
+  const hiddenCount = failures.length - previewLimit;
+  const overflow = hiddenCount > 0 ? `\n    ... and ${hiddenCount} more` : '';
+  return `\n  Failed Cases:\n${bullets}${overflow}\n`;
+}
+// ==========================================================================
+// Run Result Matchers
+// ==========================================================================
+/**
+ * Matcher: the run as a whole succeeded.
+ *
+ * The verdict is taken directly from `result.success`; the manifest and the
+ * case list are only read when the message is rendered.
+ *
+ * @param result - Run result under test.
+ * @returns The verdict plus a lazily built message.
+ */
+export function toPassAllCases(result: RunResult): MatcherResult {
+  const pass = result.success;
+  const message = (): string => {
+    const counts = result.manifest.metrics;
+    if (pass) {
+      return `Expected test run to fail, but all ${counts.total_cases} cases passed`;
+    }
+    const headline = `Expected test run to pass, but ${counts.failed_cases} out of ${counts.total_cases} cases failed`;
+    return `${headline}\n${formatManifestSummary(result.manifest)}${formatFailedCases(result.cases)}`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the run's success rate is at least `expectedRate`.
+ *
+ * @param result - Run result whose `manifest.metrics.success_rate` is compared.
+ * @param expectedRate - Minimum acceptable rate, on the same scale as `success_rate`
+ *   (messages multiply both by 100 to show a percentage).
+ * @returns The verdict plus a lazily built message; the failing message also carries
+ *   the manifest summary and the failed-case list.
+ */
+export function toHaveSuccessRate(result: RunResult, expectedRate: number): MatcherResult {
+  const actualRate = result.manifest.metrics.success_rate;
+  const pass = actualRate >= expectedRate;
+  const asPercent = (rate: number): string => `${(rate * 100).toFixed(1)}%`;
+  const message = (): string => {
+    const wanted = asPercent(expectedRate);
+    const got = asPercent(actualRate);
+    if (pass) {
+      return `Expected success rate to be less than ${wanted}, but got ${got}`;
+    }
+    const headline = `Expected success rate to be at least ${wanted}, but got ${got}`;
+    return `${headline}\n${formatManifestSummary(result.manifest)}${formatFailedCases(result.cases)}`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: no case carrying `tag` has failed.
+ *
+ * Note that a run with no cases carrying the tag also passes, because there is
+ * nothing that could have failed.
+ *
+ * @param result - Run result whose cases are inspected.
+ * @param tag - Tag that selects the cases of interest (matched via `tags.includes`).
+ * @returns The verdict plus a lazily built message; the failing message lists the failed tagged cases.
+ */
+export function toPassCasesWithTag(result: RunResult, tag: string): MatcherResult {
+  const tagged: typeof result.cases = [];
+  const taggedFailures: typeof result.cases = [];
+  for (const entry of result.cases) {
+    if (!entry.tags.includes(tag)) {
+      continue;
+    }
+    tagged.push(entry);
+    if (!entry.ok) {
+      taggedFailures.push(entry);
+    }
+  }
+  const pass = taggedFailures.length === 0;
+  const message = (): string => {
+    if (pass) {
+      return `Expected cases with tag "${tag}" to fail, but all ${tagged.length} passed`;
+    }
+    const headline = `Expected all cases with tag "${tag}" to pass, but ${taggedFailures.length} out of ${tagged.length} failed`;
+    return `${headline}\n${formatFailedCases(taggedFailures)}`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the run's median latency does not exceed `maxLatencyMs`.
+ *
+ * The comparison is inclusive, so a latency equal to the limit passes.
+ *
+ * @param result - Run result whose `manifest.metrics.median_latency_ms` is compared.
+ * @param maxLatencyMs - Upper limit in milliseconds.
+ * @returns The verdict plus a lazily built message.
+ */
+export function toHaveMedianLatencyBelow(result: RunResult, maxLatencyMs: number): MatcherResult {
+  const actualLatency = result.manifest.metrics.median_latency_ms;
+  const pass = actualLatency <= maxLatencyMs;
+  const message = (): string => {
+    if (pass) {
+      return `Expected median latency to be above ${maxLatencyMs}ms, but got ${actualLatency}ms`;
+    }
+    return `Expected median latency to be at most ${maxLatencyMs}ms, but got ${actualLatency}ms`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the run's P95 latency does not exceed `maxLatencyMs`.
+ *
+ * The comparison is inclusive, so a latency equal to the limit passes.
+ *
+ * @param result - Run result whose `manifest.metrics.p95_latency_ms` is compared.
+ * @param maxLatencyMs - Upper limit in milliseconds.
+ * @returns The verdict plus a lazily built message.
+ */
+export function toHaveP95LatencyBelow(result: RunResult, maxLatencyMs: number): MatcherResult {
+  const actualLatency = result.manifest.metrics.p95_latency_ms;
+  const pass = actualLatency <= maxLatencyMs;
+  const message = (): string => {
+    if (pass) {
+      return `Expected P95 latency to be above ${maxLatencyMs}ms, but got ${actualLatency}ms`;
+    }
+    return `Expected P95 latency to be at most ${maxLatencyMs}ms, but got ${actualLatency}ms`;
+  };
+  return { pass, message };
+}
+// ==========================================================================
+// Red Team Result Matchers
+// ==========================================================================
+/**
+ * Matcher: the red-team defense rate is at least `expectedRate`.
+ *
+ * @param result - Red-team result whose `defenseRate` is compared.
+ * @param expectedRate - Minimum acceptable rate, on the same scale as `defenseRate`
+ *   (messages multiply both by 100 to show a percentage).
+ * @returns The verdict plus a lazily built message; the failing message adds the
+ *   unsafe-response count and the total number of tests.
+ */
+export function toHaveDefenseRate(result: RedTeamResult, expectedRate: number): MatcherResult {
+  const actualRate = result.defenseRate;
+  const pass = actualRate >= expectedRate;
+  const asPercent = (rate: number): string => `${(rate * 100).toFixed(1)}%`;
+  const message = (): string => {
+    const wanted = asPercent(expectedRate);
+    const got = asPercent(actualRate);
+    if (pass) {
+      return `Expected defense rate to be less than ${wanted}, but got ${got}`;
+    }
+    return [
+      `Expected defense rate to be at least ${wanted}, but got ${got}`,
+      `  Unsafe responses: ${result.unsafeCount}`,
+      `  Total tests: ${result.manifest.metrics.total_tests}`,
+    ].join('\n');
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the red-team run reported zero critical-severity findings.
+ *
+ * @param result - Red-team result whose `manifest.metrics.by_severity.critical` count is checked.
+ * @returns The verdict plus a lazily built message that includes the count on failure.
+ */
+export function toHaveNoCriticalVulnerabilities(result: RedTeamResult): MatcherResult {
+  const criticalCount = result.manifest.metrics.by_severity.critical;
+  const pass = criticalCount === 0;
+  const message = (): string => {
+    if (pass) {
+      return 'Expected critical vulnerabilities, but none were found';
+    }
+    return `Expected no critical vulnerabilities, but found ${criticalCount}`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the red-team run reported neither high nor critical findings.
+ *
+ * @param result - Red-team result whose `by_severity.high` and `by_severity.critical`
+ *   counts are added together.
+ * @returns The verdict plus a lazily built message that breaks the total down by severity on failure.
+ */
+export function toHaveNoHighSeverityVulnerabilities(result: RedTeamResult): MatcherResult {
+  const severityCounts = result.manifest.metrics.by_severity;
+  const highCount = severityCounts.high;
+  const criticalCount = severityCounts.critical;
+  const combined = highCount + criticalCount;
+  const pass = combined === 0;
+  const message = (): string => {
+    if (pass) {
+      return 'Expected high/critical vulnerabilities, but none were found';
+    }
+    return `Expected no high/critical vulnerabilities, but found ${combined} (${highCount} high, ${criticalCount} critical)`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the red-team run is flagged as successful.
+ *
+ * The verdict is `result.success` as supplied; this function applies no threshold
+ * of its own (the original note mentions a default 95% defense rate, presumably
+ * applied wherever `success` is computed).
+ *
+ * @param result - Red-team result under test.
+ * @returns The verdict plus a lazily built message; the failing message breaks the
+ *   responses down into safe, blocked, unsafe and error counts.
+ */
+export function toPassRedTeam(result: RedTeamResult): MatcherResult {
+  const pass = result.success;
+  const stats = result.manifest.metrics;
+  const message = (): string => {
+    const ratePercent = (result.defenseRate * 100).toFixed(1);
+    if (pass) {
+      return `Expected red team test to fail, but passed with ${ratePercent}% defense rate`;
+    }
+    return [
+      `Expected red team test to pass, but defense rate was only ${ratePercent}%`,
+      `  Total tests: ${stats.total_tests}`,
+      `  Safe: ${stats.safe_responses}`,
+      `  Blocked: ${stats.blocked_responses}`,
+      `  Unsafe: ${stats.unsafe_responses}`,
+      `  Errors: ${stats.error_responses}`,
+    ].join('\n');
+  };
+  return { pass, message };
+}
+// ==========================================================================
+// Stress Test Result Matchers
+// ==========================================================================
+/**
+ * Matcher: the stress test's success rate is at least `expectedRate`.
+ *
+ * @param result - Stress result whose `successRate` is compared.
+ * @param expectedRate - Minimum acceptable rate, on the same scale as `successRate`
+ *   (messages multiply both by 100 to show a percentage).
+ * @returns The verdict plus a lazily built message.
+ */
+export function toHaveStressSuccessRate(result: StressResult, expectedRate: number): MatcherResult {
+  const actualRate = result.successRate;
+  const pass = actualRate >= expectedRate;
+  const asPercent = (rate: number): string => `${(rate * 100).toFixed(1)}%`;
+  const message = (): string => {
+    const wanted = asPercent(expectedRate);
+    const got = asPercent(actualRate);
+    if (pass) {
+      return `Expected stress test success rate to be less than ${wanted}, but got ${got}`;
+    }
+    return `Expected stress test success rate to be at least ${wanted}, but got ${got}`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the stress test reached at least `targetRPS` requests per second.
+ *
+ * @param result - Stress result whose `rps` is compared.
+ * @param targetRPS - Minimum throughput required.
+ * @returns The verdict plus a lazily built message that shows the achieved RPS to one decimal place.
+ */
+export function toAchieveRPS(result: StressResult, targetRPS: number): MatcherResult {
+  const actualRPS = result.rps;
+  const pass = actualRPS >= targetRPS;
+  const message = (): string => {
+    const achieved = actualRPS.toFixed(1);
+    if (pass) {
+      return `Expected RPS to be less than ${targetRPS}, but achieved ${achieved} RPS`;
+    }
+    return `Expected to achieve at least ${targetRPS} RPS, but only got ${achieved} RPS`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the stress test's P95 latency does not exceed `maxLatencyMs`.
+ *
+ * The comparison is inclusive, so a latency equal to the limit passes.
+ *
+ * @param result - Stress result whose `p95LatencyMs` is compared.
+ * @param maxLatencyMs - Upper limit in milliseconds.
+ * @returns The verdict plus a lazily built message.
+ */
+export function toHaveStressP95LatencyBelow(
+  result: StressResult,
+  maxLatencyMs: number
+): MatcherResult {
+  const actualLatency = result.p95LatencyMs;
+  const pass = actualLatency <= maxLatencyMs;
+  const message = (): string => {
+    if (pass) {
+      return `Expected P95 latency to be above ${maxLatencyMs}ms, but got ${actualLatency}ms`;
+    }
+    return `Expected P95 latency to be at most ${maxLatencyMs}ms, but got ${actualLatency}ms`;
+  };
+  return { pass, message };
+}
+/**
+ * Matcher: the stress test is flagged as successful.
+ *
+ * The verdict is `result.success` as supplied; this function applies no threshold
+ * of its own (the original note mentions a default 95% success rate, presumably
+ * applied wherever `success` is computed).
+ *
+ * @param result - Stress result under test.
+ * @returns The verdict plus a lazily built message; the failing message adds request
+ *   counts, throughput and P95 latency from the manifest metrics.
+ */
+export function toPassStressTest(result: StressResult): MatcherResult {
+  const pass = result.success;
+  const stats = result.manifest.metrics;
+  const message = (): string => {
+    const ratePercent = (result.successRate * 100).toFixed(1);
+    if (pass) {
+      return `Expected stress test to fail, but passed with ${ratePercent}% success rate`;
+    }
+    return [
+      `Expected stress test to pass, but success rate was only ${ratePercent}%`,
+      `  Total requests: ${stats.total_requests}`,
+      `  Successful: ${stats.successful_requests}`,
+      `  Failed: ${stats.failed_requests}`,
+      `  RPS: ${stats.requests_per_second.toFixed(1)}`,
+      `  P95 Latency: ${stats.p95_latency_ms}ms`,
+    ].join('\n');
+  };
+  return { pass, message };
+}
+// ==========================================================================
+// Export all matchers
+// ==========================================================================
+/** Matchers that inspect a scenario run result. */
+const runMatchers = {
+  toPassAllCases,
+  toHaveSuccessRate,
+  toPassCasesWithTag,
+  toHaveMedianLatencyBelow,
+  toHaveP95LatencyBelow,
+};
+/** Matchers that inspect a red-team result. */
+const redTeamMatchers = {
+  toHaveDefenseRate,
+  toHaveNoCriticalVulnerabilities,
+  toHaveNoHighSeverityVulnerabilities,
+  toPassRedTeam,
+};
+/** Matchers that inspect a stress-test result. */
+const stressMatchers = {
+  toHaveStressSuccessRate,
+  toAchieveRPS,
+  toHaveStressP95LatencyBelow,
+  toPassStressTest,
+};
+/**
+ * Every core matcher collected into one object, keyed by matcher name.
+ * Keys appear in the order run, red team, stress.
+ */
+export const artemiskitMatchers = {
+  ...runMatchers,
+  ...redTeamMatchers,
+  ...stressMatchers,
+};
+/** Shape of the combined matcher object. */
+export type ArtemisKitMatchers = typeof artemiskitMatchers;

package/src/matchers/index.ts ADDED Viewed

@@ -0,0 +1,26 @@
+/**
+ * @artemiskit/sdk
+ * Test matchers - core implementations without framework bindings
+ */
+export {
+  artemiskitMatchers,
+  type ArtemisKitMatchers,
+  type MatcherResult,
+  // Run matchers
+  toPassAllCases,
+  toHaveSuccessRate,
+  toPassCasesWithTag,
+  toHaveMedianLatencyBelow,
+  toHaveP95LatencyBelow,
+  // Red team matchers
+  toHaveDefenseRate,
+  toHaveNoCriticalVulnerabilities,
+  toHaveNoHighSeverityVulnerabilities,
+  toPassRedTeam,
+  // Stress test matchers
+  toHaveStressSuccessRate,
+  toAchieveRPS,
+  toHaveStressP95LatencyBelow,
+  toPassStressTest,
+} from './core';

package/src/matchers/jest.ts ADDED Viewed

@@ -0,0 +1,112 @@
+/**
+ * @artemiskit/sdk
+ * Jest integration - custom matchers for ArtemisKit
+ */
+import type { RedTeamResult, RunResult, StressResult } from '../types';
+import {
+  toAchieveRPS,
+  toHaveDefenseRate,
+  toHaveMedianLatencyBelow,
+  toHaveNoCriticalVulnerabilities,
+  toHaveNoHighSeverityVulnerabilities,
+  toHaveP95LatencyBelow,
+  toHaveStressP95LatencyBelow,
+  toHaveStressSuccessRate,
+  toHaveSuccessRate,
+  toPassAllCases,
+  toPassCasesWithTag,
+  toPassRedTeam,
+  toPassStressTest,
+} from './core';
+/**
+ * Matcher table for Jest.
+ *
+ * Each entry forwards the received value, plus the expected argument where the
+ * matcher takes one, to the core implementation of the same name and returns
+ * its result unchanged.
+ */
+export const jestMatchers = {
+  // Run matchers
+  toPassAllCases: (received: RunResult) => toPassAllCases(received),
+  toHaveSuccessRate: (received: RunResult, expectedRate: number) =>
+    toHaveSuccessRate(received, expectedRate),
+  toPassCasesWithTag: (received: RunResult, tag: string) => toPassCasesWithTag(received, tag),
+  toHaveMedianLatencyBelow: (received: RunResult, maxLatencyMs: number) =>
+    toHaveMedianLatencyBelow(received, maxLatencyMs),
+  toHaveP95LatencyBelow: (received: RunResult, maxLatencyMs: number) =>
+    toHaveP95LatencyBelow(received, maxLatencyMs),
+  // Red team matchers
+  toHaveDefenseRate: (received: RedTeamResult, expectedRate: number) =>
+    toHaveDefenseRate(received, expectedRate),
+  toHaveNoCriticalVulnerabilities: (received: RedTeamResult) =>
+    toHaveNoCriticalVulnerabilities(received),
+  toHaveNoHighSeverityVulnerabilities: (received: RedTeamResult) =>
+    toHaveNoHighSeverityVulnerabilities(received),
+  toPassRedTeam: (received: RedTeamResult) => toPassRedTeam(received),
+  // Stress test matchers
+  toHaveStressSuccessRate: (received: StressResult, expectedRate: number) =>
+    toHaveStressSuccessRate(received, expectedRate),
+  toAchieveRPS: (received: StressResult, targetRPS: number) => toAchieveRPS(received, targetRPS),
+  toHaveStressP95LatencyBelow: (received: StressResult, maxLatencyMs: number) =>
+    toHaveStressP95LatencyBelow(received, maxLatencyMs),
+  toPassStressTest: (received: StressResult) => toPassStressTest(received),
+};
+// Register the matchers on import, but only when an `expect` with an `extend`
+// function is in scope. The `typeof` probe keeps this safe when no such global exists.
+declare const expect: { extend: (matchers: object) => void } | undefined;
+if (typeof expect !== 'undefined') {
+  if (typeof expect.extend === 'function') {
+    expect.extend(jestMatchers);
+  }
+}
+/**
+ * TypeScript declarations for Jest matchers.
+ *
+ * Augments the global `jest.Matchers` interface so the custom matchers
+ * type-check on `expect(...)`. The received value is not part of these
+ * signatures; only the expected arguments are.
+ */
+declare global {
+  namespace jest {
+    interface Matchers<R> {
+      // Run matchers
+      /** Passes when the run result's `success` flag is true. */
+      toPassAllCases(): R;
+      /** Passes when the run's success rate is greater than or equal to `expectedRate`. */
+      toHaveSuccessRate(expectedRate: number): R;
+      /** Passes when no case carrying `tag` has failed. */
+      toPassCasesWithTag(tag: string): R;
+      /** Passes when the median latency is less than or equal to `maxLatencyMs`. */
+      toHaveMedianLatencyBelow(maxLatencyMs: number): R;
+      /** Passes when the P95 latency is less than or equal to `maxLatencyMs`. */
+      toHaveP95LatencyBelow(maxLatencyMs: number): R;
+      // Red team matchers
+      /** Passes when the defense rate is greater than or equal to `expectedRate`. */
+      toHaveDefenseRate(expectedRate: number): R;
+      /** Passes when the critical-severity count is zero. */
+      toHaveNoCriticalVulnerabilities(): R;
+      /** Passes when the high and critical counts sum to zero. */
+      toHaveNoHighSeverityVulnerabilities(): R;
+      /** Passes when the red-team result's `success` flag is true. */
+      toPassRedTeam(): R;
+      // Stress test matchers
+      /** Passes when the stress success rate is greater than or equal to `expectedRate`. */
+      toHaveStressSuccessRate(expectedRate: number): R;
+      /** Passes when the achieved RPS is greater than or equal to `targetRPS`. */
+      toAchieveRPS(targetRPS: number): R;
+      /** Passes when the stress P95 latency is less than or equal to `maxLatencyMs`. */
+      toHaveStressP95LatencyBelow(maxLatencyMs: number): R;
+      /** Passes when the stress result's `success` flag is true. */
+      toPassStressTest(): R;
+    }
+  }
+}

package/src/matchers/vitest.ts ADDED Viewed

@@ -0,0 +1,84 @@
+/**
+ * @artemiskit/sdk
+ * Vitest integration - custom matchers for ArtemisKit
+ */
+import type { RedTeamResult, RunResult, StressResult } from '../types';
+import {
+  toAchieveRPS,
+  toHaveDefenseRate,
+  toHaveMedianLatencyBelow,
+  toHaveNoCriticalVulnerabilities,
+  toHaveNoHighSeverityVulnerabilities,
+  toHaveP95LatencyBelow,
+  toHaveStressP95LatencyBelow,
+  toHaveStressSuccessRate,
+  toHaveSuccessRate,
+  toPassAllCases,
+  toPassCasesWithTag,
+  toPassRedTeam,
+  toPassStressTest,
+} from './core';
+/**
+ * Matcher table for Vitest.
+ *
+ * Each entry forwards the received value, plus the expected argument where the
+ * matcher takes one, to the core implementation of the same name and returns
+ * its result unchanged.
+ */
+export const vitestMatchers = {
+  // Run matchers
+  toPassAllCases: (received: RunResult) => toPassAllCases(received),
+  toHaveSuccessRate: (received: RunResult, expectedRate: number) =>
+    toHaveSuccessRate(received, expectedRate),
+  toPassCasesWithTag: (received: RunResult, tag: string) => toPassCasesWithTag(received, tag),
+  toHaveMedianLatencyBelow: (received: RunResult, maxLatencyMs: number) =>
+    toHaveMedianLatencyBelow(received, maxLatencyMs),
+  toHaveP95LatencyBelow: (received: RunResult, maxLatencyMs: number) =>
+    toHaveP95LatencyBelow(received, maxLatencyMs),
+  // Red team matchers
+  toHaveDefenseRate: (received: RedTeamResult, expectedRate: number) =>
+    toHaveDefenseRate(received, expectedRate),
+  toHaveNoCriticalVulnerabilities: (received: RedTeamResult) =>
+    toHaveNoCriticalVulnerabilities(received),
+  toHaveNoHighSeverityVulnerabilities: (received: RedTeamResult) =>
+    toHaveNoHighSeverityVulnerabilities(received),
+  toPassRedTeam: (received: RedTeamResult) => toPassRedTeam(received),
+  // Stress test matchers
+  toHaveStressSuccessRate: (received: StressResult, expectedRate: number) =>
+    toHaveStressSuccessRate(received, expectedRate),
+  toAchieveRPS: (received: StressResult, targetRPS: number) => toAchieveRPS(received, targetRPS),
+  toHaveStressP95LatencyBelow: (received: StressResult, maxLatencyMs: number) =>
+    toHaveStressP95LatencyBelow(received, maxLatencyMs),
+  toPassStressTest: (received: StressResult) => toPassStressTest(received),
+};
+// Register the matchers on import, but only when an `expect` with an `extend`
+// function is in scope. The `typeof` probe keeps this safe when no such global exists.
+declare const expect: { extend: (matchers: object) => void } | undefined;
+if (typeof expect !== 'undefined') {
+  if (typeof expect.extend === 'function') {
+    expect.extend(vitestMatchers);
+  }
+}