@vantinelai/node-sdk 0.4.5
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +189 -0
- package/dist/client.d.ts +105 -0
- package/dist/client.js +431 -0
- package/dist/index.d.ts +5 -0
- package/dist/index.js +28 -0
- package/dist/integrations/anthropic.d.ts +64 -0
- package/dist/integrations/anthropic.js +138 -0
- package/dist/integrations/index.d.ts +5 -0
- package/dist/integrations/index.js +11 -0
- package/dist/integrations/openai-agents.d.ts +70 -0
- package/dist/integrations/openai-agents.js +108 -0
- package/dist/monitor.d.ts +41 -0
- package/dist/monitor.js +308 -0
- package/dist/security.d.ts +17 -0
- package/dist/security.js +82 -0
- package/package.json +49 -0
package/README.md
ADDED
|
@@ -0,0 +1,189 @@
|
|
|
1
|
+
# @vantinelai/node-sdk
|
|
2
|
+
|
|
3
|
+
Node.js / Server-side SDK for [Vantinel](https://vantinel.ai) — real-time AI agent observability & guardrails.
|
|
4
|
+
|
|
5
|
+
## Installation
|
|
6
|
+
|
|
7
|
+
```bash
|
|
8
|
+
npm install @vantinelai/node-sdk
|
|
9
|
+
# or
|
|
10
|
+
yarn add @vantinelai/node-sdk
|
|
11
|
+
# or
|
|
12
|
+
pnpm add @vantinelai/node-sdk
|
|
13
|
+
```
|
|
14
|
+
|
|
15
|
+
## Quick Start
|
|
16
|
+
|
|
17
|
+
```ts
|
|
18
|
+
import { VantinelMonitor } from '@vantinelai/node-sdk';
|
|
19
|
+
|
|
20
|
+
const monitor = new VantinelMonitor({
|
|
21
|
+
apiKey: process.env.VANTINEL_API_KEY,
|
|
22
|
+
clientId: 'my-company',
|
|
23
|
+
agentId: 'customer-support-bot',
|
|
24
|
+
});
|
|
25
|
+
|
|
26
|
+
// Wrap any tool function — one line
|
|
27
|
+
const search = monitor.monitor('search_database', async (query: string) => {
|
|
28
|
+
return db.query(query);
|
|
29
|
+
});
|
|
30
|
+
|
|
31
|
+
// Use as normal — monitoring is transparent
|
|
32
|
+
const results = await search('SELECT * FROM users');
|
|
33
|
+
```
|
|
34
|
+
|
|
35
|
+
## Configuration
|
|
36
|
+
|
|
37
|
+
| Option | Type | Default | Description |
|
|
38
|
+
|---|---|---|---|
|
|
39
|
+
| `apiKey` | `string` | `$VANTINEL_API_KEY` | Your Vantinel API key |
|
|
40
|
+
| `clientId` | `string` | `$VANTINEL_CLIENT_ID` | Your organization ID |
|
|
41
|
+
| `agentId` | `string` | `'default-agent'` | Identifier for this agent |
|
|
42
|
+
| `collectorUrl` | `string` | `http://localhost:8000` | Vantinel Collector endpoint |
|
|
43
|
+
| `dryRun` | `boolean` | `false` | Log events without sending (useful in CI) |
|
|
44
|
+
| `shadowMode` | `boolean` | `false` | Detect threats but never block; log what *would* have happened |
|
|
45
|
+
| `batchSize` | `number` | `1` | Buffer N events before sending (reduces HTTP overhead) |
|
|
46
|
+
| `flushInterval` | `number` | `0` | Auto-flush interval in milliseconds (0 = disabled) |
|
|
47
|
+
| `retry.maxRetries` | `number` | `0` | Retry on 5xx/network errors |
|
|
48
|
+
| `retry.backoffMs` | `number` | `100` | Base backoff between retries |
|
|
49
|
+
| `slackWebhookUrl` | `string` | — | Shadow Mode Slack alerts webhook |
|
|
50
|
+
|
|
51
|
+
All options also read from environment variables (`VANTINEL_API_KEY`, `VANTINEL_CLIENT_ID`, `VANTINEL_DRY_RUN`, `VANTINEL_SHADOW_MODE`, etc.).
|
|
52
|
+
|
|
53
|
+
## API
|
|
54
|
+
|
|
55
|
+
### `monitor.monitor(toolName, fn, options?)`
|
|
56
|
+
|
|
57
|
+
Wraps a function for monitoring. Returns the same function, transparently instrumented.
|
|
58
|
+
|
|
59
|
+
```ts
|
|
60
|
+
const wrappedFn = monitor.monitor('send_email', sendEmail, {
|
|
61
|
+
traceId: monitor.startTrace(), // correlate with browser events
|
|
62
|
+
skip: false, // set true to skip monitoring for this call
|
|
63
|
+
costCalculator: (result) => ({ // extract cost from AI API response
|
|
64
|
+
estimated_cost: result.usage.total_tokens * 0.00001,
|
|
65
|
+
metadata: { model: 'gpt-4', tokens: result.usage.total_tokens },
|
|
66
|
+
}),
|
|
67
|
+
});
|
|
68
|
+
```
|
|
69
|
+
|
|
70
|
+
**Decisions:** If the Collector returns `block`, an error is thrown. All other decisions allow execution.
|
|
71
|
+
|
|
72
|
+
### `monitor.wrapOpenAI(openaiClient)`
|
|
73
|
+
|
|
74
|
+
Zero-config monitoring for all OpenAI chat completions:
|
|
75
|
+
|
|
76
|
+
```ts
|
|
77
|
+
import OpenAI from 'openai';
|
|
78
|
+
|
|
79
|
+
const openai = monitor.wrapOpenAI(new OpenAI());
|
|
80
|
+
// All openai.chat.completions.create() calls are now monitored
|
|
81
|
+
const response = await openai.chat.completions.create({ model: 'gpt-4', messages: [...] });
|
|
82
|
+
```
|
|
83
|
+
|
|
84
|
+
### `monitor.wrapLangChain(chain)`
|
|
85
|
+
|
|
86
|
+
Zero-config monitoring for LangChain chains (invoke, call, run, stream):
|
|
87
|
+
|
|
88
|
+
```ts
|
|
89
|
+
const chain = prompt.pipe(llm).pipe(parser);
|
|
90
|
+
const monitored = monitor.wrapLangChain(chain);
|
|
91
|
+
const result = await monitored.invoke({ question: 'What is 2+2?' });
|
|
92
|
+
```
|
|
93
|
+
|
|
94
|
+
### `monitor.captureError(toolName, error, metadata?)`
|
|
95
|
+
|
|
96
|
+
Report a tool failure to the Collector:
|
|
97
|
+
|
|
98
|
+
```ts
|
|
99
|
+
try {
|
|
100
|
+
await myTool();
|
|
101
|
+
} catch (err) {
|
|
102
|
+
await monitor.captureError('my_tool', err, { retry: 1, context: 'user-flow' });
|
|
103
|
+
throw err;
|
|
104
|
+
}
|
|
105
|
+
```
|
|
106
|
+
|
|
107
|
+
### `monitor.setGlobalMetadata(metadata)`
|
|
108
|
+
|
|
109
|
+
Attach key-value metadata to every subsequent event (merge, not replace):
|
|
110
|
+
|
|
111
|
+
```ts
|
|
112
|
+
monitor.setGlobalMetadata({ userId: 'user_123', tenantId: 'acme-corp' });
|
|
113
|
+
monitor.setGlobalMetadata({ environment: 'production' }); // merged
|
|
114
|
+
```
|
|
115
|
+
|
|
116
|
+
### `monitor.startTrace()`
|
|
117
|
+
|
|
118
|
+
Generate a UUID trace ID to correlate frontend and backend events:
|
|
119
|
+
|
|
120
|
+
```ts
|
|
121
|
+
const traceId = monitor.startTrace();
|
|
122
|
+
// Pass traceId to browser SDK via X-Vantinel-Trace header
|
|
123
|
+
const fn = monitor.monitor('backend_call', myFn, { traceId });
|
|
124
|
+
```
|
|
125
|
+
|
|
126
|
+
### `monitor.ping()`
|
|
127
|
+
|
|
128
|
+
Check connectivity to the Collector:
|
|
129
|
+
|
|
130
|
+
```ts
|
|
131
|
+
const { ok, latencyMs } = await monitor.ping();
|
|
132
|
+
if (!ok) console.warn('Collector unreachable');
|
|
133
|
+
```
|
|
134
|
+
|
|
135
|
+
### `monitor.flush()`
|
|
136
|
+
|
|
137
|
+
Drain the event batch queue immediately (useful on graceful shutdown):
|
|
138
|
+
|
|
139
|
+
```ts
|
|
140
|
+
process.on('SIGTERM', async () => {
|
|
141
|
+
await monitor.flush();
|
|
142
|
+
process.exit(0);
|
|
143
|
+
});
|
|
144
|
+
```
|
|
145
|
+
|
|
146
|
+
### `VantinelMonitor.getSingleton(config?)`
|
|
147
|
+
|
|
148
|
+
Return a shared instance — safe for Next.js hot-reload and multi-import scenarios:
|
|
149
|
+
|
|
150
|
+
```ts
|
|
151
|
+
// lib/vantinel.ts
|
|
152
|
+
export const monitor = VantinelMonitor.getSingleton({
|
|
153
|
+
apiKey: process.env.VANTINEL_API_KEY,
|
|
154
|
+
});
|
|
155
|
+
```
|
|
156
|
+
|
|
157
|
+
## Shadow Mode
|
|
158
|
+
|
|
159
|
+
Shadow Mode observes without enforcing — ideal for proving value before enabling hard blocks:
|
|
160
|
+
|
|
161
|
+
```ts
|
|
162
|
+
const monitor = new VantinelMonitor({
|
|
163
|
+
shadowMode: true,
|
|
164
|
+
slackWebhookUrl: process.env.SLACK_WEBHOOK, // optional
|
|
165
|
+
});
|
|
166
|
+
// Blocked calls are allowed but logged: "[Vantinel Shadow] Would have blocked `delete_users`"
|
|
167
|
+
```
|
|
168
|
+
|
|
169
|
+
## Enforcement Decisions
|
|
170
|
+
|
|
171
|
+
| Decision | Behavior |
|
|
172
|
+
|---|---|
|
|
173
|
+
| `allow` | Tool executes normally |
|
|
174
|
+
| `block` | SDK throws `Error: [Vantinel] Tool blocked: ...` |
|
|
175
|
+
| `require_approval` | Warning logged, execution continues (approval UI in dashboard) |
|
|
176
|
+
| `warn` | Tool executes, warning logged |
|
|
177
|
+
|
|
178
|
+
If the Collector is unreachable, the SDK **fails open** by default (configurable via `failMode: 'open' | 'closed'`) — the tool executes normally. Collector downtime never breaks your agent.
|
|
179
|
+
|
|
180
|
+
## Security
|
|
181
|
+
|
|
182
|
+
- All requests signed with **HMAC-SHA256** (`timestamp.body` format)
|
|
183
|
+
- Per-request nonces prevent replay attacks
|
|
184
|
+
- Tool arguments are **never sent** — only a SHA-256 hash
|
|
185
|
+
- **Fail-open by default**: any network/5xx error returns `{ decision: 'allow' }`
|
|
186
|
+
|
|
187
|
+
## License
|
|
188
|
+
|
|
189
|
+
MIT © Vantinel AI
|
package/dist/client.d.ts
ADDED
|
@@ -0,0 +1,105 @@
|
|
|
1
|
+
export interface VantinelConfig {
|
|
2
|
+
apiKey?: string;
|
|
3
|
+
clientId?: string;
|
|
4
|
+
collectorUrl?: string;
|
|
5
|
+
agentId?: string;
|
|
6
|
+
dryRun?: boolean;
|
|
7
|
+
shadowMode?: boolean;
|
|
8
|
+
failMode?: 'open' | 'closed';
|
|
9
|
+
batchSize?: number;
|
|
10
|
+
flushInterval?: number;
|
|
11
|
+
retry?: {
|
|
12
|
+
maxRetries?: number;
|
|
13
|
+
backoffMs?: number;
|
|
14
|
+
};
|
|
15
|
+
slackWebhookUrl?: string;
|
|
16
|
+
}
|
|
17
|
+
export interface VantinelEvent {
|
|
18
|
+
client_id?: string;
|
|
19
|
+
session_id: string;
|
|
20
|
+
agent_id?: string;
|
|
21
|
+
tool_name: string;
|
|
22
|
+
tool_args_hash: string;
|
|
23
|
+
timestamp: number;
|
|
24
|
+
latency_ms?: number;
|
|
25
|
+
estimated_cost?: number;
|
|
26
|
+
event_type?: string;
|
|
27
|
+
trace_id?: string;
|
|
28
|
+
metadata?: Record<string, unknown>;
|
|
29
|
+
}
|
|
30
|
+
export interface VantinelDecision {
|
|
31
|
+
decision: 'allow' | 'block' | 'require_approval' | 'warn';
|
|
32
|
+
message?: string;
|
|
33
|
+
session_spend?: number;
|
|
34
|
+
violations?: string[];
|
|
35
|
+
}
|
|
36
|
+
/**
|
|
37
|
+
* Rough token estimation: ~4 characters per token.
|
|
38
|
+
*/
|
|
39
|
+
declare function estimateTokens(text: string): number;
|
|
40
|
+
/**
|
|
41
|
+
* Model pricing per 1k tokens (input, output, cache_read) in USD.
|
|
42
|
+
*/
|
|
43
|
+
declare const MODEL_PRICING: Record<string, {
|
|
44
|
+
input: number;
|
|
45
|
+
output: number;
|
|
46
|
+
cache_read?: number;
|
|
47
|
+
}>;
|
|
48
|
+
declare function estimateCostFromText(text: string): number;
|
|
49
|
+
declare function estimateCostFromTokens(model: string, inputTokens: number, outputTokens: number, cachedTokens?: number): number;
|
|
50
|
+
export declare class VantinelClient {
|
|
51
|
+
private client;
|
|
52
|
+
private config;
|
|
53
|
+
private batchQueue;
|
|
54
|
+
private flushTimer;
|
|
55
|
+
private globalMetadata;
|
|
56
|
+
constructor(config: VantinelConfig);
|
|
57
|
+
setGlobalMetadata(metadata: Record<string, unknown>): void;
|
|
58
|
+
private mergeGlobalMetadata;
|
|
59
|
+
private sendWithRetry;
|
|
60
|
+
/**
|
|
61
|
+
* Send an event to the collector.
|
|
62
|
+
* Cost is only included if explicitly set on the event.
|
|
63
|
+
*/
|
|
64
|
+
sendEvent(event: VantinelEvent): Promise<VantinelDecision>;
|
|
65
|
+
/**
|
|
66
|
+
* Wrap a tool function — automatically measures latency and tracks it.
|
|
67
|
+
* This is the recommended way to use Vantinel.
|
|
68
|
+
*
|
|
69
|
+
* Cost is only reported if you explicitly provide it (e.g., from your LLM provider's usage data).
|
|
70
|
+
* Latency is always automatically measured.
|
|
71
|
+
*
|
|
72
|
+
* @example
|
|
73
|
+
* const result = await client.wrap('search_db', '{"query":"test"}', async () => {
|
|
74
|
+
* return await searchDatabase('test');
|
|
75
|
+
* });
|
|
76
|
+
*/
|
|
77
|
+
wrap<T>(toolName: string, toolArgs: string, fn: () => T | Promise<T>, options?: {
|
|
78
|
+
sessionId?: string;
|
|
79
|
+
estimatedCost?: number;
|
|
80
|
+
traceId?: string;
|
|
81
|
+
}): Promise<T>;
|
|
82
|
+
/**
|
|
83
|
+
* Auto-instrument an OpenAI client.
|
|
84
|
+
* This monkey-patches `chat.completions.create` to automatically intercept calls,
|
|
85
|
+
* measure latency, extract exact token usage from the response, and calculate true cost.
|
|
86
|
+
*
|
|
87
|
+
* @param openaiClient - The instantiated OpenAI client (e.g., `new OpenAI()`)
|
|
88
|
+
* @param options - Optional configuration for the intercepted calls
|
|
89
|
+
* @returns The patched OpenAI client
|
|
90
|
+
*/
|
|
91
|
+
wrapOpenAI(openaiClient: any, options?: {
|
|
92
|
+
sessionId?: string;
|
|
93
|
+
traceId?: string;
|
|
94
|
+
}): any;
|
|
95
|
+
/**
|
|
96
|
+
* Gracefully shut down the client: flush pending events and clear timers.
|
|
97
|
+
*/
|
|
98
|
+
destroy(): Promise<void>;
|
|
99
|
+
flush(): Promise<void>;
|
|
100
|
+
ping(): Promise<{
|
|
101
|
+
ok: boolean;
|
|
102
|
+
latencyMs: number;
|
|
103
|
+
}>;
|
|
104
|
+
}
|
|
105
|
+
export { estimateCostFromTokens, estimateCostFromText, estimateTokens, MODEL_PRICING };
|