ai-shield-core 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (68) hide show
  1. package/dist/audit/logger.d.ts.map +1 -1
  2. package/dist/audit/logger.js +13 -14
  3. package/dist/audit/types.js +1 -2
  4. package/dist/cache/lru.js +1 -5
  5. package/dist/canary/memory.d.ts +75 -0
  6. package/dist/canary/memory.d.ts.map +1 -0
  7. package/dist/canary/memory.js +194 -0
  8. package/dist/context/wrap-context.d.ts +105 -0
  9. package/dist/context/wrap-context.d.ts.map +1 -0
  10. package/dist/context/wrap-context.js +188 -0
  11. package/dist/cost/anomaly.js +1 -4
  12. package/dist/cost/pricing.d.ts.map +1 -1
  13. package/dist/cost/pricing.js +18 -19
  14. package/dist/cost/tracker.d.ts +19 -1
  15. package/dist/cost/tracker.d.ts.map +1 -1
  16. package/dist/cost/tracker.js +27 -10
  17. package/dist/index.d.ts +31 -2
  18. package/dist/index.d.ts.map +1 -1
  19. package/dist/index.js +51 -37
  20. package/dist/policy/circuit-breaker.d.ts +70 -0
  21. package/dist/policy/circuit-breaker.d.ts.map +1 -0
  22. package/dist/policy/circuit-breaker.js +376 -0
  23. package/dist/policy/engine.js +1 -5
  24. package/dist/policy/tools.js +4 -8
  25. package/dist/scanner/canary.js +4 -8
  26. package/dist/scanner/chain.js +1 -5
  27. package/dist/scanner/heuristic.d.ts +13 -0
  28. package/dist/scanner/heuristic.d.ts.map +1 -1
  29. package/dist/scanner/heuristic.js +50 -7
  30. package/dist/scanner/ingestion.d.ts +116 -0
  31. package/dist/scanner/ingestion.d.ts.map +1 -0
  32. package/dist/scanner/ingestion.js +452 -0
  33. package/dist/scanner/pii.d.ts.map +1 -1
  34. package/dist/scanner/pii.js +24 -12
  35. package/dist/shield.d.ts.map +1 -1
  36. package/dist/shield.js +34 -26
  37. package/dist/types.d.ts +140 -2
  38. package/dist/types.d.ts.map +1 -1
  39. package/dist/types.js +1 -2
  40. package/package.json +4 -3
  41. package/src/audit/logger.ts +6 -1
  42. package/src/canary/memory.ts +259 -0
  43. package/src/context/wrap-context.ts +304 -0
  44. package/src/cost/pricing.ts +13 -9
  45. package/src/cost/tracker.ts +35 -1
  46. package/src/index.ts +82 -1
  47. package/src/policy/circuit-breaker.ts +449 -0
  48. package/src/scanner/heuristic.ts +49 -2
  49. package/src/scanner/ingestion.ts +550 -0
  50. package/src/scanner/pii.ts +21 -7
  51. package/src/shield.ts +15 -2
  52. package/src/types.ts +175 -2
  53. package/tsconfig.json +2 -1
  54. package/dist/audit/logger.js.map +0 -1
  55. package/dist/audit/types.js.map +0 -1
  56. package/dist/cache/lru.js.map +0 -1
  57. package/dist/cost/anomaly.js.map +0 -1
  58. package/dist/cost/pricing.js.map +0 -1
  59. package/dist/cost/tracker.js.map +0 -1
  60. package/dist/index.js.map +0 -1
  61. package/dist/policy/engine.js.map +0 -1
  62. package/dist/policy/tools.js.map +0 -1
  63. package/dist/scanner/canary.js.map +0 -1
  64. package/dist/scanner/chain.js.map +0 -1
  65. package/dist/scanner/heuristic.js.map +0 -1
  66. package/dist/scanner/pii.js.map +0 -1
  67. package/dist/shield.js.map +0 -1
  68. package/dist/types.js.map +0 -1
@@ -0,0 +1,304 @@
1
+ import type {
2
+ ContextSegment,
3
+ IngestionSource,
4
+ TrustTier,
5
+ WrappedContext,
6
+ ScanContext,
7
+ ScanDecision,
8
+ Violation,
9
+ } from "../types.js";
10
+ import { createHash } from "node:crypto";
11
+ import { IngestionScanner } from "../scanner/ingestion.js";
12
+
13
+ // ============================================================
14
+ // wrapContext — Trust-Tier Context Streams
15
+ //
16
+ // The deepest finding of the 2026 prompt-injection literature
17
+ // (Parallax, IPI surveys, OWASP LLM01:2025) is that the LLM cannot
18
+ // reliably distinguish *instruction* from *data* once both share the
19
+ // same attention substrate. The only architecturally robust mitigation
20
+ // is privilege separation: tag every segment with its provenance + trust
21
+ // tier, scan untrusted segments aggressively, and let downstream code
22
+ // decide whether instruction-shaped content from a `web`/`rag`/`tool-desc`
23
+ // segment is allowed to influence behaviour.
24
+ //
25
+ // `wrapContext()` is the ergonomic entry point.
26
+ // ============================================================
27
+
28
/**
 * Input shape for `wrapContext()`. Each named field is conventional;
 * pass only what applies.
 *
 * Every array-valued group accepts either bare strings or
 * `{ content, label? }` objects. Items in those groups are `untrusted`
 * unless their `label` is promoted through `trustedLabels`.
 */
export interface WrapContextInput {
  /** Developer-controlled prompt. Always `trust: "system"`. */
  system?: string;
  /** Direct user message(s). `trust: "untrusted"`, `source: "user"`. */
  user?: string | string[];
  /** Retrieved documents. `source: "rag"`. */
  retrieved?: Array<{ content: string; label?: string } | string>;
  /** MCP / function tool descriptions about to be exposed to the model. `source: "tool-desc"`. */
  tools?: Array<{ content: string; label?: string } | string>;
  /** Stored memory facts. `source: "memory"`. */
  memory?: Array<{ content: string; label?: string } | string>;
  /** Scraped / fetched web content. `source: "web"`. */
  web?: Array<{ content: string; label?: string } | string>;
  /** Output from another agent (multi-agent pipelines). `source: "agent-output"`. */
  agentOutput?: Array<{ content: string; label?: string } | string>;
  /**
   * Promote specific named segments to `"trusted"` (e.g. an internal
   * knowledge base whose contents you control end-to-end).
   *
   * Matching is case-insensitive and anchored: a segment is promoted only
   * when its `label` equals an entry exactly, or starts with an entry
   * followed by `/` (e.g. entry `internal-kb` matches `internal-kb` and
   * `internal-kb/policies`). Plain substring matches are NOT honoured, so
   * a label that merely contains a trusted name cannot claim trust.
   * Unlabelled items (bare strings) are never promoted.
   */
  trustedLabels?: string[];
}
54
+
55
/**
 * Build a `WrappedContext` from typed inputs.
 *
 * Trust assignment:
 * - `system` -> system
 * - `retrieved`/`tools`/`memory`/`web`/`agent-output` -> untrusted
 * - `user` -> untrusted (a user is not trusted in this threat model — they
 *   can also inject; the `untrusted` label means "scan aggressively")
 * - any grouped segment whose `label` equals one of `trustedLabels`, or
 *   starts with one followed by `/` (case-insensitive) -> trusted
 *
 * Trust does NOT mean "skip scanning". It only governs how
 * `assemblePrompt()` and the per-segment policy decide whether to
 * include the segment in the final assembled prompt.
 *
 * Segments whose content is not a string, or is empty, are silently
 * skipped. Each emitted segment carries a `contentHash` of its content.
 *
 * @param input Typed context pieces; omit whatever does not apply.
 * @returns A `WrappedContext` holding the segments in insertion order:
 *   system, user, retrieved, tools, memory, web, agentOutput.
 */
export function wrapContext(input: WrapContextInput): WrappedContext {
  const segments: ContextSegment[] = [];

  // Blank entries are dropped. An empty trusted label would reduce the
  // path-anchored check below to `label.startsWith("/")`, silently
  // promoting every path-like label (e.g. "/docs/readme.md") to trusted.
  // This is easy to hit with `process.env.X?.split(",")` on an empty var.
  const trustedLabels = (input.trustedLabels ?? [])
    .filter((s) => typeof s === "string" && s.trim().length > 0)
    .map((s) => s.toLowerCase());

  // Critic H1 — substring match would let an attacker-supplied label
  // like "untrusted-doc-INTERNAL-kb-poisoned" claim trust because it
  // CONTAINS the trusted prefix. Match exact or path-anchored only.
  const isTrustedLabel = (label?: string): boolean => {
    if (!label) return false;
    const lc = label.toLowerCase();
    return trustedLabels.some((tl) => lc === tl || lc.startsWith(tl + "/"));
  };

  const push = (
    content: string,
    source: IngestionSource,
    trust: TrustTier,
    label?: string,
  ): void => {
    // Runtime guard: callers may bypass the type system (plain JS, JSON).
    if (typeof content !== "string" || content.length === 0) return;
    segments.push({
      source,
      trust,
      content,
      label,
      contentHash: hashContent(content),
    });
  };

  // System: always trust=system. The `source` field is unused for
  // system segments because `trust === "system"` is the authoritative
  // signal — Analyst A2 round 1 review. We keep `source: "user"` here
  // only because `ContextSegment.source` is non-optional; any code that
  // branches on `seg.source` MUST first check `seg.trust !== "system"`.
  if (input.system) {
    push(input.system, "user", "system", "system-prompt");
  }

  // User messages.
  if (input.user) {
    const userInputs = Array.isArray(input.user) ? input.user : [input.user];
    for (const u of userInputs) {
      push(u, "user", "untrusted", "user");
    }
  }

  // Helper for the array-of-{content,label} groups.
  const pushGroup = (
    items: Array<{ content: string; label?: string } | string> | undefined,
    source: IngestionSource,
  ): void => {
    if (!items) return;
    for (const item of items) {
      const content = typeof item === "string" ? item : item.content;
      const label = typeof item === "string" ? undefined : item.label;
      const trust: TrustTier = isTrustedLabel(label) ? "trusted" : "untrusted";
      push(content, source, trust, label);
    }
  };

  pushGroup(input.retrieved, "rag");
  pushGroup(input.tools, "tool-desc");
  pushGroup(input.memory, "memory");
  pushGroup(input.web, "web");
  pushGroup(input.agentOutput, "agent-output");

  return { segments };
}
137
+
138
/**
 * Run the ingestion scanner over every segment of `ctx`, using each
 * segment's own source and trust tier as scan context.
 *
 * Side effect: `ctx.scanResults` and `ctx.decision` are written on the
 * object passed in; that same object is returned so calls can be chained.
 * `ctx.decision` is the most severe per-segment decision
 * (`block` > `warn` > `allow`).
 *
 * @param ctx Wrapped context to scan (mutated in place).
 * @param options Optional scanner strictness; `"high"` when omitted.
 * @returns The same `ctx` instance, now carrying scan results.
 */
export async function scanWrappedContext(
  ctx: WrappedContext,
  options: { strictness?: "low" | "medium" | "high" } = {},
): Promise<WrappedContext> {
  const strictness = options.strictness ?? "high";
  const scanner = new IngestionScanner({ strictness });

  const perSegment: NonNullable<WrappedContext["scanResults"]> = [];
  let aggregate: ScanDecision = "allow";

  for (const [segmentIndex, segment] of ctx.segments.entries()) {
    if (segment.trust === "system") {
      // Developer-authored system prompts are instructions by definition;
      // scanning them would only generate false positives, so they are
      // recorded as an unconditional "allow".
      perSegment.push({ segmentIndex, decision: "allow", violations: [] });
      continue;
    }

    const scanContext: ScanContext = {
      source: segment.source,
      trustTier: segment.trust,
    };
    const outcome = await scanner.scan(segment.content, scanContext);

    perSegment.push({
      segmentIndex,
      decision: outcome.decision,
      violations: outcome.violations,
    });

    // Keep the most severe decision seen so far.
    if (priority(outcome.decision) > priority(aggregate)) {
      aggregate = outcome.decision;
    }
  }

  ctx.scanResults = perSegment;
  ctx.decision = aggregate;
  return ctx;
}
182
+
183
/**
 * Options accepted by `assemblePrompt()`.
 *
 * Background on what these options influence — `assemblePrompt()` builds a
 * prompt string respecting tier boundaries:
 *
 * Order: `system` → `trusted` retrieved/memory/tool-desc → `user`
 * → all remaining `untrusted` segments wrapped in fenced markers.
 *
 * Why `trusted` before `user`? Putting developer-marked trusted
 * context above the user message reduces the chance an untrusted user
 * prompt re-frames the trusted reference material below it.
 *
 * Untrusted segments are wrapped in an explicit fence so a downstream
 * model has a chance to attend to provenance. This is not a guarantee
 * (no in-band marker is) but it is the single highest-leverage
 * mitigation we can apply at the toolkit layer per Anthropic +
 * OpenAI Model Spec guidance.
 */
export interface AssembleOptions {
  /**
   * Pass `true` to OMIT blocked segments (scan decision `"block"`)
   * entirely. The default keeps them but wraps them in the `blocked`
   * fence so an auditor can see what was tried.
   */
  strictMode?: boolean;
  /**
   * Custom fence labels. Defaults are sensible
   * (`<UNTRUSTED_CONTENT source=` … `</UNTRUSTED_CONTENT>` and
   * `<BLOCKED_CONTENT source=` … `</BLOCKED_CONTENT>`).
   *
   * `open` is a prefix, not a complete tag: `assemblePrompt()` appends
   * `"<source>" label="<label>">` directly after it, then the content on
   * its own line, then `close` on its own line.
   */
  fences?: {
    /** Fence used for untrusted, non-user segments that were not blocked. */
    untrusted?: { open: string; close: string };
    /** Fence used for blocked segments when `strictMode` is off. */
    blocked?: { open: string; close: string };
  };
}
211
+
212
/**
 * Assemble a prompt string from a wrapped context, respecting trust tiers.
 *
 * Emission order: `system` segments, then `trusted` segments, then
 * untrusted `user` segments, then every remaining `untrusted` segment in
 * its original order. Parts are joined with a blank line.
 *
 * System, trusted and user segments are emitted verbatim. Other untrusted
 * segments are wrapped in the `untrusted` fence. A segment whose scan
 * result is `"block"` is wrapped in the `blocked` fence, or dropped
 * entirely when `options.strictMode` is set. Segments without a scan
 * result (e.g. the context was never scanned) are treated as not blocked.
 *
 * Fence hardening: `source` and `label` are escaped before being placed
 * in the fence header, and any occurrence of a closing fence marker inside
 * fenced content is defanged. Without this, attacker-controlled labels or
 * content could terminate the fence early and place text outside it.
 *
 * @param ctx Wrapped context, optionally carrying `scanResults`.
 * @param options Strict mode and custom fence markers.
 * @returns The assembled prompt; an empty string when nothing is emitted.
 */
export function assemblePrompt(
  ctx: WrappedContext,
  options: AssembleOptions = {},
): string {
  const fences = {
    untrusted: options.fences?.untrusted ?? {
      open: "<UNTRUSTED_CONTENT source=",
      close: "</UNTRUSTED_CONTENT>",
    },
    blocked: options.fences?.blocked ?? {
      open: "<BLOCKED_CONTENT source=",
      close: "</BLOCKED_CONTENT>",
    },
  };
  // Both closers are defanged in every fenced body so content cannot
  // impersonate the end of either kind of fence.
  const closers = [fences.untrusted.close, fences.blocked.close];

  // Pre-build a segment→index map ONCE. Avoids O(n²) `indexOf` inside the
  // assembly loop AND removes a TOCTOU on mutable `ctx.segments` (Critic
  // H2 + Analyst A4 round 1 review).
  const segmentIndexMap = new Map<ContextSegment, number>();
  ctx.segments.forEach((s, i) => segmentIndexMap.set(s, i));
  const segmentResultMap = new Map<
    number,
    NonNullable<WrappedContext["scanResults"]>[number]
  >();
  for (const r of ctx.scanResults ?? []) {
    segmentResultMap.set(r.segmentIndex, r);
  }

  const ordered: ContextSegment[] = [];
  // 1. system
  ordered.push(...ctx.segments.filter((s) => s.trust === "system"));
  // 2. trusted (retrieved/memory/tool-desc the dev marked as trusted)
  ordered.push(...ctx.segments.filter((s) => s.trust === "trusted"));
  // 3. user (untrusted, source="user")
  ordered.push(
    ...ctx.segments.filter(
      (s) => s.source === "user" && s.trust === "untrusted",
    ),
  );
  // 4. all remaining untrusted, preserve original order within group.
  for (const s of ctx.segments) {
    if (s.trust === "untrusted" && s.source !== "user") {
      ordered.push(s);
    }
  }

  // Render one fenced segment with escaped header and defanged body.
  const fenced = (
    fence: { open: string; close: string },
    seg: ContextSegment,
  ): string => {
    const source = escapeFenceAttribute(seg.source);
    const label = escapeFenceAttribute(seg.label ?? "");
    const body = defangFenceClosers(seg.content, closers);
    return `${fence.open}"${source}" label="${label}">\n${body}\n${fence.close}`;
  };

  const parts: string[] = [];
  for (const seg of ordered) {
    const segIdx = segmentIndexMap.get(seg) ?? -1;
    const segResult = segIdx >= 0 ? segmentResultMap.get(segIdx) : undefined;
    const blocked = segResult?.decision === "block";

    if (blocked) {
      // strictMode drops blocked segments; otherwise keep them visible
      // to auditors inside the blocked fence.
      if (!options.strictMode) {
        parts.push(fenced(fences.blocked, seg));
      }
      continue;
    }

    const verbatim =
      seg.trust === "system" ||
      seg.trust === "trusted" ||
      // User input keeps its natural shape — fencing every user message
      // creates more noise than signal.
      (seg.source === "user" && seg.trust === "untrusted");

    parts.push(verbatim ? seg.content : fenced(fences.untrusted, seg));
  }

  return parts.join("\n\n");
}

/**
 * Make a value safe to place inside the double-quoted attributes of a
 * fence header: quotes and angle brackets are entity-escaped and line
 * breaks are collapsed to a single space. `&` is left untouched so that
 * ordinary labels render unchanged.
 */
function escapeFenceAttribute(value: string): string {
  return String(value)
    .replace(/"/g, "&quot;")
    .replace(/</g, "&lt;")
    .replace(/>/g, "&gt;")
    .replace(/[\r\n]+/g, " ");
}

/**
 * Neutralise every (case-insensitive) occurrence of the given closing
 * fence markers inside `content`, so fenced text cannot end its own fence.
 * Markers starting with `<` have that character entity-escaped; any other
 * marker is replaced by a visible placeholder. Empty markers are ignored.
 */
function defangFenceClosers(
  content: string,
  closers: readonly string[],
): string {
  let result = content;
  for (const closer of closers) {
    if (closer.length === 0) continue;
    const pattern = new RegExp(
      closer.replace(/[.*+?^${}()|[\]\\]/g, "\\$&"),
      "gi",
    );
    result = result.replace(pattern, (match) =>
      match.startsWith("<")
        ? `&lt;${match.slice(1)}`
        : "[fence-marker-removed]",
    );
  }
  return result;
}
289
+
290
/** Return the hex-encoded SHA-256 digest of `content`. */
function hashContent(content: string): string {
  const hasher = createHash("sha256");
  hasher.update(content);
  return hasher.digest("hex");
}
293
+
294
/**
 * Rank a scan decision by severity so decisions can be compared:
 * `"block"` is 2, `"warn"` is 1, anything else is 0.
 */
function priority(d: ScanDecision): number {
  switch (d) {
    case "block":
      return 2;
    case "warn":
      return 1;
    default:
      return 0;
  }
}
297
+
298
/**
 * Collect the violations of every scanned segment into one flat list,
 * in scan-result order. Returns an empty list when the context has not
 * been scanned yet.
 */
export function flattenViolations(ctx: WrappedContext): Violation[] {
  const collected: Violation[] = [];
  for (const result of ctx.scanResults || []) {
    collected.push(...result.violations);
  }
  return collected;
}
@@ -1,8 +1,10 @@
1
1
  import type { ModelPricing } from "../types.js";
2
2
 
3
3
  // ============================================================
4
- // Model Pricing Table — Updated Feb 2026
5
- // Prices in USD per 1M tokens
4
+ // Model Pricing Table — Updated April 2026
5
+ // Prices in USD per 1M tokens.
6
+ // Includes `cachedInputPer1M` for providers that support prompt caching
7
+ // (Anthropic cache reads land at ~10% of standard input rate).
6
8
  // ============================================================
7
9
 
8
10
  export const MODEL_PRICING: Record<string, ModelPricing> = {
@@ -17,16 +19,18 @@ export const MODEL_PRICING: Record<string, ModelPricing> = {
17
19
  "o3-mini": { inputPer1M: 1.10, outputPer1M: 4.40 },
18
20
  "o4-mini": { inputPer1M: 1.10, outputPer1M: 4.40 },
19
21
 
20
- // Anthropic
21
- "claude-opus-4-6": { inputPer1M: 15.0, outputPer1M: 75.0 },
22
- "claude-sonnet-4-6": { inputPer1M: 3.0, outputPer1M: 15.0 },
23
- "claude-haiku-4-5": { inputPer1M: 0.80, outputPer1M: 4.0 },
22
+ // Anthropic — April 2026 line-up (Opus 4.7, Sonnet 4.6, Haiku 4.5)
23
+ "claude-opus-4-7": { inputPer1M: 15.0, outputPer1M: 75.0, cachedInputPer1M: 1.50 },
24
+ "claude-opus-4-6": { inputPer1M: 15.0, outputPer1M: 75.0, cachedInputPer1M: 1.50 },
25
+ "claude-sonnet-4-6": { inputPer1M: 3.0, outputPer1M: 15.0, cachedInputPer1M: 0.30 },
26
+ "claude-sonnet-4-5": { inputPer1M: 3.0, outputPer1M: 15.0, cachedInputPer1M: 0.30 },
27
+ "claude-haiku-4-5": { inputPer1M: 0.80, outputPer1M: 4.0, cachedInputPer1M: 0.08 },
24
28
 
25
29
  // Aliases
26
30
  "gpt-5.2-turbo": { inputPer1M: 2.50, outputPer1M: 10.0 },
27
- opus: { inputPer1M: 15.0, outputPer1M: 75.0 },
28
- sonnet: { inputPer1M: 3.0, outputPer1M: 15.0 },
29
- haiku: { inputPer1M: 0.80, outputPer1M: 4.0 },
31
+ opus: { inputPer1M: 15.0, outputPer1M: 75.0, cachedInputPer1M: 1.50 },
32
+ sonnet: { inputPer1M: 3.0, outputPer1M: 15.0, cachedInputPer1M: 0.30 },
33
+ haiku: { inputPer1M: 0.80, outputPer1M: 4.0, cachedInputPer1M: 0.08 },
30
34
  };
31
35
 
32
36
  /** Get pricing for a model, fallback to gpt-4o-mini rates */
@@ -49,17 +49,32 @@ class MemoryStore implements RedisLike {
49
49
  }
50
50
  }
51
51
 
52
/** Tuning knobs for `CostTracker`. */
export interface CostTrackerOptions {
  /**
   * Upper bound on the number of `CostRecord`s kept in memory; once the
   * bound is exceeded the oldest records are discarded first.
   *
   * - Default: 10_000.
   * - `0` turns record retention off altogether — useful for long-running
   *   processes that only need the budget counters and never read
   *   per-request records.
   * - When this option is omitted, the `AI_SHIELD_MAX_RECORDS` environment
   *   variable is consulted before falling back to the default.
   */
  maxRecords?: number;
}
62
+
52
63
  export class CostTracker {
53
64
  private store: RedisLike;
54
65
  private budgets: Map<string, BudgetConfig>;
55
66
  private records: CostRecord[] = [];
67
+ private maxRecords: number;
56
68
 
57
69
  constructor(
58
70
  budgets: Record<string, BudgetConfig> = {},
59
71
  redis?: RedisLike,
72
+ options: CostTrackerOptions = {},
60
73
  ) {
61
74
  this.store = redis ?? new MemoryStore();
62
75
  this.budgets = new Map(Object.entries(budgets));
76
+ const envCap = Number(process.env.AI_SHIELD_MAX_RECORDS);
77
+ this.maxRecords = options.maxRecords ?? (Number.isFinite(envCap) && envCap >= 0 ? envCap : 10_000);
63
78
  }
64
79
 
65
80
  /** Check if a request is within budget BEFORE sending to LLM */
@@ -133,10 +148,29 @@ export class CostTracker {
133
148
  await this.store.expire(globalKey, this.periodSeconds(globalBudget.period) * 2);
134
149
  }
135
150
 
136
- this.records.push(record);
151
+ this.appendRecord(record);
137
152
  return record;
138
153
  }
139
154
 
155
/**
 * Append a record while keeping at most `maxRecords` entries, so the
 * in-memory list cannot grow without bound. The oldest entries are
 * dropped first.
 *
 * Nothing is retained when `maxRecords` is 0, negative, or NaN.
 *
 * Cost note: trimming uses `splice(0, overflow)`, which shifts the
 * remaining elements. Once the list is at capacity each append is
 * therefore linear in `maxRecords`, not constant time.
 */
private appendRecord(record: CostRecord): void {
  // `!(x > 0)` is deliberate: unlike `x <= 0` it is also true for NaN.
  // A NaN cap would otherwise make the overflow check below always false
  // and let `records` grow forever.
  if (!(this.maxRecords > 0)) return;

  this.records.push(record);

  const overflow = this.records.length - this.maxRecords;
  if (overflow > 0) {
    // Drop the oldest entries from the front.
    this.records.splice(0, overflow);
  }
}
168
+
169
/**
 * Discard every retained in-memory record (e.g. after exporting them).
 * The backing array is emptied in place rather than replaced.
 */
clearRecords(): void {
  this.records.splice(0, this.records.length);
}
173
+
140
174
  /** Get current spend for an entity */
141
175
  async getCurrentSpend(entityId: string): Promise<number> {
142
176
  const budget = this.budgets.get(entityId);
package/src/index.ts CHANGED
@@ -10,10 +10,42 @@ export { HeuristicScanner, type HeuristicConfig } from "./scanner/heuristic.js";
10
10
  export { PIIScanner } from "./scanner/pii.js";
11
11
  export { ScannerChain, type ChainConfig } from "./scanner/chain.js";
12
12
  export { injectCanary, checkCanaryLeak } from "./scanner/canary.js";
13
+ export {
14
+ IngestionScanner,
15
+ scanIngested,
16
+ trustTierForSource,
17
+ type IngestionScannerConfig,
18
+ type IngestionScanResult,
19
+ } from "./scanner/ingestion.js";
20
+
21
+ // Context / Trust-Tier
22
+ export {
23
+ wrapContext,
24
+ scanWrappedContext,
25
+ assemblePrompt,
26
+ flattenViolations,
27
+ type WrapContextInput,
28
+ type AssembleOptions,
29
+ } from "./context/wrap-context.js";
30
+
31
+ // Memory Canary / Persistence-Poisoning
32
+ export {
33
+ mintMemoryCanary,
34
+ verifyMemoryCanary,
35
+ rotateMemoryCanary,
36
+ buildSentinelEntry,
37
+ bulkVerify,
38
+ type MintMemoryCanaryOptions,
39
+ } from "./canary/memory.js";
13
40
 
14
41
  // Policy
15
42
  export { PolicyEngine, type PolicyPreset } from "./policy/engine.js";
16
43
  export { ToolPolicyScanner } from "./policy/tools.js";
44
+ export {
45
+ CircuitBreakerRegistry,
46
+ makeBreakerScope,
47
+ type CircuitBreakerOptions,
48
+ } from "./policy/circuit-breaker.js";
17
49
 
18
50
  // Cost
19
51
  export { CostTracker, type RedisLike } from "./cost/tracker.js";
@@ -37,6 +69,19 @@ export type {
37
69
  ScanContext,
38
70
  Violation,
39
71
  ViolationType,
72
+ // Ingestion / Trust-Tier (v0.2)
73
+ IngestionSource,
74
+ TrustTier,
75
+ ContextSegment,
76
+ WrappedContext,
77
+ // Memory Canary (v0.2)
78
+ MemoryCanaryEntry,
79
+ MemoryCanaryVerification,
80
+ // Circuit Breaker (v0.2)
81
+ CircuitState,
82
+ CircuitBreakerConfig,
83
+ CircuitBreakerDecision,
84
+ CounterStoreLike,
40
85
  // PII
41
86
  PIIType,
42
87
  PIIAction,
@@ -71,7 +116,15 @@ export type {
71
116
  import { AIShield } from "./shield.js";
72
117
  import type { ShieldConfig, ScanResult, ScanContext } from "./types.js";
73
118
 
74
- /** Quick scan — one line, maximum protection */
119
+ /**
120
+ * Quick scan — one line, maximum protection.
121
+ *
122
+ * **Performance warning:** This creates a new AIShield instance on every call.
123
+ * For production use with multiple calls, create a single `new AIShield(config)`
124
+ * instance and reuse it — this avoids repeated scanner chain setup and teardown.
125
+ *
126
+ * Use `createShieldSingleton()` for a cached version that reuses a single instance.
127
+ */
75
128
  export async function shield(
76
129
  input: string,
77
130
  configOrContext?: ShieldConfig | ScanContext,
@@ -89,3 +142,31 @@ export async function shield(
89
142
  await instance.close();
90
143
  }
91
144
  }
145
+
146
/**
 * Build a scan function backed by ONE long-lived `AIShield` instance.
 *
 * Unlike `shield()`, the instance is created once, when this factory is
 * called, and reused by every call to the returned function. The returned
 * function also exposes `close()`, which closes that shared instance.
 *
 * @param config Shield configuration applied to the shared instance.
 * @returns A callable `(input, context?) => Promise<ScanResult>` with an
 *   attached `close()` method.
 *
 * @example
 * ```ts
 * const scan = createShieldSingleton({ injection: { strictness: "high" } });
 * const r1 = await scan("input 1");
 * const r2 = await scan("input 2");
 * // Call scan.close() when done (e.g., on process exit)
 * await scan.close();
 * ```
 */
export function createShieldSingleton(config: ShieldConfig = {}): {
  (input: string, context?: ScanContext): Promise<ScanResult>;
  close(): Promise<void>;
} {
  const shared = new AIShield(config);

  const scan = (input: string, context?: ScanContext): Promise<ScanResult> =>
    shared.scan(input, context);

  // Attach the lifecycle hook to the callable itself.
  return Object.assign(scan, {
    close: (): Promise<void> => shared.close(),
  });
}