npm - @artemiskit/adapter-deepagents - Versions diffs - 0.2.0 - Mend

@artemiskit/adapter-deepagents 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

package/src/client.ts ADDED Viewed

@@ -0,0 +1,392 @@
+/**
+ * DeepAgents Adapter
+ * Wraps DeepAgents multi-agent systems for ArtemisKit testing
+ */
+import type {
+  AdapterConfig,
+  GenerateOptions,
+  GenerateResult,
+  ModelCapabilities,
+  ModelClient,
+} from '@artemiskit/core';
+import { nanoid } from 'nanoid';
+import type {
+  DeepAgentsAdapterConfig,
+  DeepAgentsCallbacks,
+  DeepAgentsExecutionMetadata,
+  DeepAgentsMessage,
+  DeepAgentsOutput,
+  DeepAgentsSystem,
+  DeepAgentsTrace,
+} from './types';
+/**
+ * Adapter for testing DeepAgents multi-agent systems with ArtemisKit
+ *
+ * @example
+ * ```typescript
+ * import { DeepAgentsAdapter } from '@artemiskit/adapter-deepagents';
+ * import { createTeam } from 'deepagents';
+ *
+ * // Create a DeepAgents team
+ * const team = createTeam({
+ *   agents: [researcher, writer, editor],
+ *   workflow: 'sequential',
+ * });
+ *
+ * // Wrap with ArtemisKit adapter
+ * const adapter = new DeepAgentsAdapter(
+ *   { provider: 'deepagents', name: 'content-team' },
+ *   team
+ * );
+ *
+ * // Use in ArtemisKit tests
+ * const result = await adapter.generate({
+ *   prompt: 'Write an article about AI testing',
+ * });
+ * ```
+ */
+export class DeepAgentsAdapter implements ModelClient {
+  /** Timeout (ms) forwarded to the wrapped system when `executionTimeout` is not configured. */
+  private static readonly DEFAULT_TIMEOUT_MS = 300000;
+  private system: DeepAgentsSystem;
+  private config: DeepAgentsAdapterConfig;
+  readonly provider = 'deepagents';
+  // Execution tracking. Both arrays are cleared at the start of every generate()/stream() call,
+  // so they only ever describe the most recent execution.
+  private traces: DeepAgentsTrace[] = [];
+  private messages: DeepAgentsMessage[] = [];
+  /**
+   * @param config - Adapter configuration; it is treated as a DeepAgentsAdapterConfig
+   * @param system - The multi-agent system to wrap
+   * @throws Error when `system` has none of invoke(), run() or execute()
+   */
+  constructor(config: AdapterConfig, system: DeepAgentsSystem) {
+    this.config = config as DeepAgentsAdapterConfig;
+    this.system = system;
+    this.validateSystem(system);
+  }
+  /**
+   * Validate that the system has a usable execution method
+   *
+   * @throws Error when none of invoke(), run() or execute() is a function
+   */
+  private validateSystem(system: DeepAgentsSystem): void {
+    const hasMethod =
+      typeof system.invoke === 'function' ||
+      typeof system.run === 'function' ||
+      typeof system.execute === 'function';
+    if (!hasMethod) {
+      throw new Error('DeepAgents system must have an invoke(), run(), or execute() method');
+    }
+  }
+  /**
+   * Run the wrapped system once and convert its output into a GenerateResult.
+   *
+   * `latencyMs` is the wall-clock time spent awaiting the system. Token counts are read from
+   * `response.tokenUsage`; a missing prompt/completion count is reported as 0 and a missing
+   * total falls back to prompt + completion. The untouched response and the derived execution
+   * metadata are returned under `raw`.
+   */
+  async generate(options: GenerateOptions): Promise<GenerateResult> {
+    const startTime = Date.now();
+    // Reset tracking for this execution
+    this.traces = [];
+    this.messages = [];
+    const input = this.prepareInput(options);
+    const execConfig = {
+      timeout: this.config.executionTimeout ?? DeepAgentsAdapter.DEFAULT_TIMEOUT_MS,
+      callbacks: this.createCallbacks(),
+    };
+    const response = await this.executeSystem(input, execConfig);
+    const latencyMs = Date.now() - startTime;
+    const text = this.extractOutput(response);
+    const metadata = this.extractMetadata(response);
+    const promptTokens = response.tokenUsage?.prompt ?? 0;
+    const completionTokens = response.tokenUsage?.completion ?? 0;
+    const tokens = {
+      prompt: promptTokens,
+      completion: completionTokens,
+      // Systems that report only the two parts should not produce a total of 0
+      total: response.tokenUsage?.total ?? promptTokens + completionTokens,
+    };
+    return {
+      id: nanoid(),
+      model: this.config.name || 'deepagents:system',
+      text,
+      tokens,
+      latencyMs,
+      finishReason: 'stop',
+      raw: {
+        response,
+        metadata,
+      },
+    };
+  }
+  /**
+   * Execute the DeepAgents system using the first available method,
+   * tried in the order invoke(), run(), execute().
+   *
+   * @throws Error when none of the three methods exists
+   */
+  private async executeSystem(
+    input: Record<string, unknown>,
+    config: Record<string, unknown>
+  ): Promise<DeepAgentsOutput> {
+    if (typeof this.system.invoke === 'function') {
+      return this.system.invoke(input, config);
+    }
+    if (typeof this.system.run === 'function') {
+      return this.system.run(input, config);
+    }
+    if (typeof this.system.execute === 'function') {
+      return this.system.execute(input, config);
+    }
+    throw new Error('No execution method available on DeepAgents system');
+  }
+  /**
+   * Stream text from the wrapped system.
+   *
+   * Every non-empty `token` event is passed to `onChunk` and then yielded. When the system has
+   * no stream() method the call falls back to generate() and emits the full text as one chunk.
+   * Agent start/end events and message events are recorded only while the matching
+   * `captureTraces` / `captureMessages` option is not set to false.
+   */
+  async *stream(options: GenerateOptions, onChunk: (chunk: string) => void): AsyncIterable<string> {
+    // Same test as capabilities() uses, so both always agree on whether streaming exists
+    if (typeof this.system.stream !== 'function') {
+      const result = await this.generate(options);
+      onChunk(result.text);
+      yield result.text;
+      return;
+    }
+    // Reset tracking
+    this.traces = [];
+    this.messages = [];
+    const captureTraces = this.config.captureTraces !== false;
+    const captureMessages = this.config.captureMessages !== false;
+    const input = this.prepareInput(options);
+    const events = this.system.stream(input, {
+      timeout: this.config.executionTimeout ?? DeepAgentsAdapter.DEFAULT_TIMEOUT_MS,
+    });
+    for await (const event of events) {
+      if (captureTraces && (event.type === 'agent_start' || event.type === 'agent_end')) {
+        this.traces.push({
+          agent: event.agent || 'unknown',
+          action: event.type,
+          output: event.data,
+          timestamp: event.timestamp ?? Date.now(),
+        });
+      }
+      if (captureMessages && event.type === 'message' && event.data) {
+        // NOTE(review): the payload is assumed to already have the DeepAgentsMessage shape
+        this.messages.push(event.data as DeepAgentsMessage);
+      }
+      // NOTE(review): 'tool_use', 'error' and 'done' events are not acted upon here
+      if (event.type === 'token' && event.content) {
+        onChunk(event.content);
+        yield event.content;
+      }
+    }
+  }
+  /**
+   * Report adapter capabilities. Only `streaming` is derived from the wrapped system;
+   * the remaining values are fixed.
+   */
+  async capabilities(): Promise<ModelCapabilities> {
+    return {
+      streaming: typeof this.system.stream === 'function',
+      functionCalling: true, // Multi-agent systems typically use tools
+      toolUse: true,
+      maxContext: 128000, // Varies by underlying models
+      vision: false, // Depends on underlying agents
+      jsonMode: false,
+    };
+  }
+  async close(): Promise<void> {
+    // No cleanup needed for most DeepAgents systems
+  }
+  /**
+   * Prepare input for the DeepAgents system.
+   *
+   * The prompt text is written to `task`, `query` and `input` alike. For a chat-message prompt
+   * the text is the content of the last `user` message (empty string when there is none), the
+   * first `system` message is exposed as `context.systemPrompt`, and the role/content of every
+   * message is copied to `messages`.
+   */
+  private prepareInput(options: GenerateOptions): Record<string, unknown> {
+    const { prompt } = options;
+    if (typeof prompt === 'string') {
+      return {
+        task: prompt,
+        query: prompt,
+        input: prompt,
+      };
+    }
+    // Searching a reversed copy avoids Array.prototype.findLast (ES2023), which older
+    // lib targets and runtimes lack
+    const lastUserMessage = [...prompt].reverse().find((m) => m.role === 'user');
+    const systemMessage = prompt.find((m) => m.role === 'system');
+    const userContent = lastUserMessage?.content || '';
+    const input: Record<string, unknown> = {
+      task: userContent,
+      query: userContent,
+      input: userContent,
+    };
+    if (systemMessage) {
+      input.context = { systemPrompt: systemMessage.content };
+    }
+    // Include full message history for context
+    input.messages = prompt.map((m) => ({
+      role: m.role,
+      content: m.content,
+    }));
+    return input;
+  }
+  /**
+   * Extract text output from a DeepAgents response.
+   *
+   * Resolution order: the first string found under `result`, `output`, `response`, `answer`
+   * or `content`; otherwise the truthy output of the last entry in `response.traces`
+   * (JSON-encoded unless it is already a string); otherwise the whole response as JSON.
+   */
+  private extractOutput(response: DeepAgentsOutput): string {
+    const possibleKeys = ['result', 'output', 'response', 'answer', 'content'];
+    for (const key of possibleKeys) {
+      const value = response[key];
+      if (typeof value === 'string') {
+        return value;
+      }
+    }
+    const traces = response.traces;
+    const lastTrace = traces?.[traces.length - 1];
+    if (lastTrace?.output) {
+      return typeof lastTrace.output === 'string'
+        ? lastTrace.output
+        : JSON.stringify(lastTrace.output);
+    }
+    // Fallback to JSON
+    return JSON.stringify(response);
+  }
+  /**
+   * Create callbacks for execution tracking.
+   *
+   * Agent start/end and tool-use handlers are installed unless `captureTraces` is false;
+   * the message handler is installed unless `captureMessages` is false.
+   */
+  private createCallbacks(): DeepAgentsCallbacks {
+    const callbacks: DeepAgentsCallbacks = {};
+    if (this.config.captureTraces !== false) {
+      callbacks.onAgentStart = (agent, input) => {
+        this.traces.push({
+          agent,
+          action: 'start',
+          input,
+          timestamp: Date.now(),
+        });
+      };
+      callbacks.onAgentEnd = (agent, output) => {
+        this.traces.push({
+          agent,
+          action: 'end',
+          output,
+          timestamp: Date.now(),
+        });
+      };
+      callbacks.onToolUse = (agent, tool, input) => {
+        this.traces.push({
+          agent,
+          action: 'tool_use',
+          input: { tool, toolInput: input },
+          toolsUsed: [tool],
+          timestamp: Date.now(),
+        });
+      };
+    }
+    if (this.config.captureMessages !== false) {
+      callbacks.onMessage = (from, to, message) => {
+        this.messages.push({
+          from,
+          to,
+          // Non-string payloads are stored as JSON because DeepAgentsMessage.content is a string
+          content: typeof message === 'string' ? message : JSON.stringify(message),
+          timestamp: Date.now(),
+        });
+      };
+    }
+    return callbacks;
+  }
+  /**
+   * Extract execution metadata.
+   *
+   * Traces and messages returned by the system are combined with those recorded through the
+   * adapter's callbacks. Agents are collected from trace owners, message senders/recipients
+   * and `response.agents`. Tool statistics are summed over every trace's `toolsUsed`.
+   */
+  private extractMetadata(response: DeepAgentsOutput): DeepAgentsExecutionMetadata {
+    // NOTE(review): a system that both returns traces and fires the callbacks would be
+    // represented twice here - confirm against the wrapped system's behavior
+    const allTraces = [...(response.traces || []), ...this.traces];
+    const allMessages = [...(response.messages || []), ...this.messages];
+    const agentsSet = new Set<string>();
+    const toolsSet = new Set<string>();
+    let toolCallCount = 0;
+    let startCount = 0;
+    let endCount = 0;
+    for (const trace of allTraces) {
+      agentsSet.add(trace.agent);
+      if (trace.action === 'start' || trace.action === 'agent_start') {
+        startCount += 1;
+      } else if (trace.action === 'end' || trace.action === 'agent_end') {
+        endCount += 1;
+      }
+      if (trace.toolsUsed) {
+        for (const tool of trace.toolsUsed) {
+          toolsSet.add(tool);
+        }
+        toolCallCount += trace.toolsUsed.length;
+      }
+    }
+    for (const msg of allMessages) {
+      agentsSet.add(msg.from);
+      agentsSet.add(msg.to);
+    }
+    if (response.agents) {
+      for (const agent of response.agents) {
+        agentsSet.add(agent);
+      }
+    }
+    return {
+      name: this.config.name,
+      agentsInvolved: Array.from(agentsSet),
+      // One invocation produces a start trace and an end trace; adding both would count every
+      // call twice. Taking the larger side still counts calls that logged only one of the two.
+      totalAgentCalls: Math.max(startCount, endCount),
+      totalMessages: allMessages.length,
+      totalToolCalls: toolCallCount,
+      toolsUsed: Array.from(toolsSet),
+      traces: this.config.captureTraces !== false ? allTraces : undefined,
+      messages: this.config.captureMessages !== false ? allMessages : undefined,
+      executionTimeMs: response.executionTimeMs,
+    };
+  }
+}
+/**
+ * Factory function to create a DeepAgents adapter
+ *
+ * The `provider` field of the resulting configuration is always 'deepagents',
+ * whatever `options` contains.
+ *
+ * @param system - The multi-agent system to wrap
+ * @param options - Optional adapter settings merged into the configuration
+ * @returns A DeepAgentsAdapter wrapping `system`
+ *
+ * @example
+ * ```typescript
+ * const adapter = createDeepAgentsAdapter(myTeam, {
+ *   name: 'research-team',
+ *   captureTraces: true,
+ * });
+ * ```
+ */
+export function createDeepAgentsAdapter(
+  system: DeepAgentsSystem,
+  options?: Partial<DeepAgentsAdapterConfig>
+): DeepAgentsAdapter {
+  const config: DeepAgentsAdapterConfig = {
+    ...options,
+    // Assigned after the spread so an explicit `provider: undefined` in options cannot erase it
+    provider: 'deepagents',
+  };
+  return new DeepAgentsAdapter(config, system);
+}

package/src/index.ts ADDED Viewed

@@ -0,0 +1,32 @@
+/**
+ * @artemiskit/adapter-deepagents
+ *
+ * DeepAgents.js adapter for ArtemisKit LLM evaluation toolkit.
+ * Enables testing of DeepAgents multi-agent systems.
+ *
+ * @example
+ * ```typescript
+ * import { createDeepAgentsAdapter } from '@artemiskit/adapter-deepagents';
+ * import { createTeam } from 'deepagents';
+ *
+ * const team = createTeam({ agents: [researcher, writer] });
+ * const adapter = createDeepAgentsAdapter(team, { name: 'content-team' });
+ *
+ * // Use with ArtemisKit
+ * const result = await adapter.generate({ prompt: 'Create content' });
+ * ```
+ */
+export { DeepAgentsAdapter, createDeepAgentsAdapter } from './client';
+export type {
+  DeepAgentsAdapterConfig,
+  DeepAgentsSystem,
+  DeepAgentsInput,
+  DeepAgentsOutput,
+  DeepAgentsConfig,
+  DeepAgentsTrace,
+  DeepAgentsMessage,
+  DeepAgentsStreamEvent,
+  DeepAgentsCallbacks,
+  DeepAgentsExecutionMetadata,
+} from './types';

package/src/types.ts ADDED Viewed

@@ -0,0 +1,195 @@
+/**
+ * Types for DeepAgents adapter
+ */
+import type { BaseAdapterConfig } from '@artemiskit/core';
+/**
+ * Configuration for DeepAgents adapter
+ *
+ * Extends the core BaseAdapterConfig with options that control what the adapter
+ * records about an execution and which timeout it hands to the wrapped system.
+ */
+export interface DeepAgentsAdapterConfig extends BaseAdapterConfig {
+  provider: 'deepagents';
+  /**
+   * Name identifier for the agent system (for logging/tracking).
+   * Reported as the `model` of generated results; 'deepagents:system' is used when it is empty.
+   */
+  name?: string;
+  /**
+   * Whether to capture agent traces and execution history.
+   * Capturing is only switched off by an explicit `false`.
+   * @default true
+   */
+  captureTraces?: boolean;
+  /**
+   * Whether to capture inter-agent messages.
+   * Capturing is only switched off by an explicit `false`.
+   * @default true
+   */
+  captureMessages?: boolean;
+  /**
+   * Maximum execution time in milliseconds.
+   * Forwarded to the wrapped system as its `timeout` option.
+   * NOTE(review): client.ts in this diff does not enforce the limit itself - confirm the
+   * wrapped system honours it.
+   * @default 300000 (5 minutes)
+   */
+  executionTimeout?: number;
+  /**
+   * Custom input transformer function name
+   * NOTE(review): not read anywhere in client.ts as shown in this diff
+   */
+  inputTransformer?: string;
+  /**
+   * Custom output transformer function name
+   * NOTE(review): not read anywhere in client.ts as shown in this diff
+   */
+  outputTransformer?: string;
+}
+/**
+ * Generic interface for DeepAgents systems
+ *
+ * Every member is optional. The adapter requires at least one of invoke(), run() or
+ * execute() and uses the first one present, in that order. stream() is optional; without
+ * it the adapter falls back to a single non-streamed execution.
+ */
+export interface DeepAgentsSystem {
+  invoke?(input: DeepAgentsInput, config?: DeepAgentsConfig): Promise<DeepAgentsOutput>;
+  run?(input: DeepAgentsInput, config?: DeepAgentsConfig): Promise<DeepAgentsOutput>;
+  execute?(input: DeepAgentsInput, config?: DeepAgentsConfig): Promise<DeepAgentsOutput>;
+  stream?(input: DeepAgentsInput, config?: DeepAgentsConfig): AsyncIterable<DeepAgentsStreamEvent>;
+}
+/**
+ * Input format for DeepAgents systems
+ *
+ * The adapter writes the same prompt text to `task`, `query` and `input`, so a wrapped
+ * system may read whichever of the three it expects. Additional keys are permitted.
+ */
+export interface DeepAgentsInput {
+  /** The main task/query to process */
+  task?: string;
+  query?: string;
+  input?: string;
+  /** NOTE(review): not populated by client.ts as shown in this diff */
+  message?: string;
+  /**
+   * Optional context/memory from previous interactions.
+   * For chat prompts the adapter stores the first system message here as `systemPrompt`.
+   */
+  context?: Record<string, unknown>;
+  /** Optional metadata */
+  metadata?: Record<string, unknown>;
+  /** Any further keys; for chat prompts the adapter adds a `messages` array of role/content pairs */
+  [key: string]: unknown;
+}
+/**
+ * Configuration for DeepAgents execution
+ *
+ * Passed as the second argument to the wrapped system's execution methods. The adapter
+ * supplies `timeout` and `callbacks` for non-streamed runs and only `timeout` for streamed runs.
+ */
+export interface DeepAgentsConfig {
+  /** Maximum iterations for agent loops */
+  maxIterations?: number;
+  /** Timeout in milliseconds */
+  timeout?: number;
+  /** Enable verbose logging */
+  verbose?: boolean;
+  /** Callback handlers */
+  callbacks?: DeepAgentsCallbacks;
+  /** Any further system-specific options */
+  [key: string]: unknown;
+}
+/**
+ * Callback handlers for DeepAgents execution
+ *
+ * The adapter installs onAgentStart, onAgentEnd and onToolUse when trace capture is enabled
+ * and onMessage when message capture is enabled. It does not install onError.
+ */
+export interface DeepAgentsCallbacks {
+  /** Called with the agent identifier and the input it is about to process */
+  onAgentStart?: (agent: string, input: unknown) => void;
+  /** Called with the agent identifier and the output it produced */
+  onAgentEnd?: (agent: string, output: unknown) => void;
+  /** Called with sender, recipient and the message payload */
+  onMessage?: (from: string, to: string, message: unknown) => void;
+  /** Called with the agent identifier, the tool name and the tool input */
+  onToolUse?: (agent: string, tool: string, input: unknown) => void;
+  /** Called with the agent identifier and the error it raised */
+  onError?: (agent: string, error: Error) => void;
+}
+/**
+ * Output from DeepAgents system execution
+ *
+ * The adapter takes its text from the first string found under `result`, `output`,
+ * `response`, `answer` or `content`, checked in that order. `content` is not declared
+ * below and is only reachable through the index signature.
+ */
+export interface DeepAgentsOutput {
+  /** Main result/output */
+  result?: string;
+  output?: string;
+  response?: string;
+  answer?: string;
+  /** Execution traces from agents */
+  traces?: DeepAgentsTrace[];
+  /** Messages exchanged between agents */
+  messages?: DeepAgentsMessage[];
+  /** Agents that participated in the execution */
+  agents?: string[];
+  /** Total execution time, in milliseconds as the property name indicates */
+  executionTimeMs?: number;
+  /** Token usage if available; counts the system omits are reported by the adapter as 0 */
+  tokenUsage?: {
+    prompt?: number;
+    completion?: number;
+    total?: number;
+  };
+  /** Raw response data */
+  [key: string]: unknown;
+}
+/**
+ * Trace of a single agent's execution
+ */
+export interface DeepAgentsTrace {
+  /** Agent identifier */
+  agent: string;
+  /**
+   * Action taken by the agent.
+   * Traces recorded by the adapter use 'start', 'end' and 'tool_use' (from callbacks) and
+   * 'agent_start' / 'agent_end' (from stream events); traces returned by a system may use
+   * other values.
+   */
+  action: string;
+  /** Input to the action */
+  input?: unknown;
+  /** Output/result of the action */
+  output?: unknown;
+  /** Timestamp; the adapter fills it with Date.now(), i.e. milliseconds since the Unix epoch */
+  timestamp?: number;
+  /** Duration in milliseconds */
+  durationMs?: number;
+  /** Tools used during this action; each entry counts as one tool call in the execution metadata */
+  toolsUsed?: string[];
+}
+/**
+ * Message exchanged between agents
+ */
+export interface DeepAgentsMessage {
+  /** Sender agent */
+  from: string;
+  /** Recipient agent */
+  to: string;
+  /** Message content; the adapter's message callback JSON-encodes payloads that are not strings */
+  content: string;
+  /** Message type */
+  type?: 'request' | 'response' | 'broadcast' | 'delegation';
+  /** Timestamp; the adapter fills it with Date.now(), i.e. milliseconds since the Unix epoch */
+  timestamp?: number;
+}
+/**
+ * Streaming event from DeepAgents
+ *
+ * The adapter reacts to 'agent_start', 'agent_end', 'message' and 'token' events;
+ * 'tool_use', 'error' and 'done' events are accepted but not acted upon by client.ts
+ * as shown in this diff.
+ */
+export interface DeepAgentsStreamEvent {
+  /** Event type */
+  type: 'agent_start' | 'agent_end' | 'message' | 'tool_use' | 'token' | 'error' | 'done';
+  /** Agent involved; the adapter records 'unknown' when it is missing */
+  agent?: string;
+  /** Event data; for 'message' events the adapter treats it as a DeepAgentsMessage */
+  data?: unknown;
+  /** Text content (for token events) */
+  content?: string;
+  /** Timestamp */
+  timestamp?: number;
+}
+/**
+ * Metadata extracted from DeepAgents execution
+ *
+ * Built by the adapter from the system's response together with the traces and messages
+ * it recorded through callbacks, and returned under `raw.metadata` of a generate() result.
+ */
+export interface DeepAgentsExecutionMetadata {
+  /** System/workflow name, copied from the adapter configuration */
+  name?: string;
+  /** Agents that participated: trace owners, message senders/recipients and the response's `agents` list */
+  agentsInvolved: string[];
+  /** Total agent invocations */
+  totalAgentCalls: number;
+  /** Total messages exchanged */
+  totalMessages: number;
+  /** Total tool calls across all agents (sum of the `toolsUsed` lengths of all traces) */
+  totalToolCalls: number;
+  /** Unique tools used */
+  toolsUsed: string[];
+  /** Execution traces; undefined when trace capture is disabled */
+  traces?: DeepAgentsTrace[];
+  /** Messages log; undefined when message capture is disabled */
+  messages?: DeepAgentsMessage[];
+  /** Total execution time as reported by the system's response */
+  executionTimeMs?: number;
+}

package/tsconfig.json ADDED Viewed

@@ -0,0 +1,13 @@
+{
+  "extends": "../../../tsconfig.json",
+  "compilerOptions": {
+    "outDir": "./dist",
+    "rootDir": "./src",
+    "declaration": true,
+    "declarationMap": true,
+    "noEmit": false,
+    "emitDeclarationOnly": true
+  },
+  "include": ["src/**/*"],
+  "exclude": ["node_modules", "dist", "**/*.test.ts"]
+}