npm - @strav/brain - Versions diffs - 0.4.31 → 1.0.0-alpha.9 - Mend

@strav/brain 0.4.31 → 1.0.0-alpha.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (39)

package/package.json +17 -20
package/src/agent.ts +42 -76
package/src/agent_result.ts +32 -0
package/src/agent_runner.ts +61 -0
package/src/brain_config.ts +72 -0
package/src/brain_error.ts +29 -0
package/src/brain_manager.ts +170 -123
package/src/brain_provider.ts +90 -6
package/src/define_tool.ts +42 -0
package/src/index.ts +40 -42
package/src/provider.ts +74 -0
package/src/providers/anthropic_provider.ts +347 -231
package/src/thread.ts +99 -0
package/src/tool.ts +28 -44
package/src/tool_execution_error.ts +26 -0
package/src/types.ts +129 -241
package/CHANGELOG.md +0 -44
package/README.md +0 -121
package/src/helpers.ts +0 -1082
package/src/mcp_toolbox.ts +0 -62
package/src/memory/context_budget.ts +0 -120
package/src/memory/index.ts +0 -17
package/src/memory/memory_manager.ts +0 -168
package/src/memory/semantic_memory.ts +0 -89
package/src/memory/strategies/sliding_window.ts +0 -20
package/src/memory/strategies/summarize.ts +0 -157
package/src/memory/thread_store.ts +0 -56
package/src/memory/token_counter.ts +0 -101
package/src/memory/types.ts +0 -68
package/src/providers/google_provider.ts +0 -496
package/src/providers/openai_provider.ts +0 -569
package/src/providers/openai_responses_provider.ts +0 -321
package/src/utils/error_scrub.ts +0 -5
package/src/utils/prompt.ts +0 -65
package/src/utils/retry.ts +0 -104
package/src/utils/schema.ts +0 -27
package/src/utils/sse_parser.ts +0 -62
package/src/workflow.ts +0 -199
package/tsconfig.json +0 -5

package/src/providers/anthropic_provider.ts CHANGED Viewed

@@ -1,281 +1,397 @@
-import { parseSSE } from '../utils/sse_parser.ts'
-import { retryableFetch, type RetryOptions } from '../utils/retry.ts'
-import { ExternalServiceError } from '@strav/kernel'
-import type {
-  AIProvider,
-  CompletionRequest,
-  CompletionResponse,
-  StreamChunk,
-  ProviderConfig,
-  Message,
-  ToolCall,
-  Usage,
-} from '../types.ts'
 /**
- * Anthropic Messages API provider.
+ * `AnthropicProvider` — implementation of `Provider` backed by the
+ * official `@anthropic-ai/sdk`.
+ *
+ * Responsibilities:
+ *   1. Hold one `Anthropic` client per provider instance (injected,
+ *      or built from the configured API key + base URL).
+ *   2. Translate the framework's `ChatOptions` / `Message` shapes
+ *      into Anthropic's `MessageCreateParams` (system as `TextBlock[]`
+ *      with `cache_control` when requested; messages with per-block
+ *      cache flags translated likewise; `thinking` mapped to
+ *      `ThinkingConfigParam`; `effort` placed under `output_config`).
+ *   3. Translate the response back to `ChatResult` — flatten the
+ *      content blocks into a single `text` string, surface usage with
+ *      cache-hit counters, and pass the raw `Message` through on `.raw`.
+ *   4. Stream via `client.messages.stream()` and yield the framework
+ *      `StreamEvent` union — `text` deltas plus a terminal `stop`
+ *      event with usage + stop reason.
  *
- * Translates the framework's normalized CompletionRequest/Response
- * to/from the Anthropic wire format. Uses raw `fetch()`.
+ * Errors from the SDK propagate; apps that want provider-specific
+ * recovery can check `instanceof Anthropic.RateLimitError` etc. The brain
+ * facade wraps the call site in `BrainError` only for invariants the
+ * facade owns (e.g. "no provider configured").
  */
-export class AnthropicProvider implements AIProvider {
-  readonly name: string
-  private apiKey: string
-  private baseUrl: string
-  private defaultModel: string
-  private defaultMaxTokens: number
-  private retryOptions: RetryOptions
-  constructor(config: ProviderConfig) {
-    this.name = 'anthropic'
-    this.apiKey = config.apiKey
-    this.baseUrl = (config.baseUrl ?? 'https://api.anthropic.com').replace(/\/$/, '')
-    this.defaultModel = config.model
-    this.defaultMaxTokens = config.maxTokens ?? 4096
-    this.retryOptions = {
-      maxRetries: config.maxRetries ?? 3,
-      baseDelay: config.retryBaseDelay ?? 1000,
-    }
-  }
+import Anthropic from '@anthropic-ai/sdk'
+import type { AgentResult } from '../agent_result.ts'
+import type { AnthropicProviderConfig } from '../brain_config.ts'
+import { DEFAULT_MODEL } from '../brain_config.ts'
+import type { Provider, RunWithToolsOptions } from '../provider.ts'
+import type { Tool } from '../tool.ts'
+import { ToolExecutionError } from '../tool_execution_error.ts'
+import type {
+  ChatOptions,
+  ChatResult,
+  ChatUsage,
+  ContentBlock,
+  Message,
+  StreamEvent,
+  SystemPrompt,
+  TextBlock,
+  ToolResultBlock,
+  ToolUseBlock,
+} from '../types.ts'
-  async complete(request: CompletionRequest): Promise<CompletionResponse> {
-    const body = this.buildRequestBody(request, false)
+const EPHEMERAL_CACHE = { type: 'ephemeral' } as const
-    const response = await retryableFetch(
-      'Anthropic',
-      `${this.baseUrl}/v1/messages`,
-      { method: 'POST', headers: this.buildHeaders(), body: JSON.stringify(body) },
-      this.retryOptions
-    )
+export class AnthropicProvider implements Provider {
+  readonly name: string
+  private readonly client: Anthropic
+  private readonly defaultModel: string
+  private readonly defaultMaxTokens: number
+  private readonly betas: readonly string[]
+  constructor(
+    name: string,
+    config: AnthropicProviderConfig,
+    options: { client?: Anthropic } = {},
+  ) {
+    this.name = name
+    this.defaultModel = config.defaultModel ?? DEFAULT_MODEL
+    this.defaultMaxTokens = config.defaultMaxTokens ?? 4096
+    this.betas = config.betas ?? []
+    // `client` injection point — tests pass a stub; apps that want a
+    // pre-configured SDK instance (custom retry, fetch transport, etc.)
+    // build their own and hand it over here.
+    this.client =
+      options.client ??
+      new Anthropic({
+        apiKey: config.apiKey,
+        ...(config.baseUrl !== undefined ? { baseURL: config.baseUrl } : {}),
+      })
+  }
-    const data: any = await response.json()
-    return this.parseResponse(data)
+  async chat(messages: readonly Message[], options: ChatOptions = {}): Promise<ChatResult> {
+    const params = this.buildParams(messages, options)
+    const response = await this.client.messages.create(params)
+    return this.toChatResult(response)
   }
-  async *stream(request: CompletionRequest): AsyncIterable<StreamChunk> {
-    const body = this.buildRequestBody(request, true)
+  async *stream(
+    messages: readonly Message[],
+    options: ChatOptions = {},
+  ): AsyncIterable<StreamEvent> {
+    const params = this.buildParams(messages, options)
+    const stream = this.client.messages.stream(params)
+    for await (const event of stream) {
+      if (
+        event.type === 'content_block_delta' &&
+        event.delta.type === 'text_delta'
+      ) {
+        yield { type: 'text', delta: event.delta.text }
+      }
+    }
+    const final = await stream.finalMessage()
+    yield {
+      type: 'stop',
+      stopReason: final.stop_reason,
+      usage: toUsage(final.usage),
+    }
+  }
-    const response = await retryableFetch(
-      'Anthropic',
-      `${this.baseUrl}/v1/messages`,
-      { method: 'POST', headers: this.buildHeaders(), body: JSON.stringify(body) },
-      this.retryOptions
-    )
+  async countTokens(
+    messages: readonly Message[],
+    options: ChatOptions = {},
+  ): Promise<number> {
+    const base = this.buildParams(messages, options)
+    // count_tokens only accepts a subset of MessageCreateParams; build
+    // a focused payload that matches what apps actually need to budget.
+    const result = await this.client.messages.countTokens({
+      model: base.model,
+      messages: base.messages,
+      ...(base.system !== undefined ? { system: base.system } : {}),
+      ...(base.thinking !== undefined ? { thinking: base.thinking } : {}),
+    })
+    return result.input_tokens
+  }
-    if (!response.body) {
-      throw new ExternalServiceError('Anthropic', undefined, 'No stream body returned')
+  /**
+   * Agentic loop. Send → detect tool_use blocks → execute → append
+   * tool_result → re-send, until the model returns `end_turn` or
+   * the iteration ceiling is hit.
+   *
+   * Tools are re-sent on every request — Anthropic doesn't carry
+   * tool state across requests; the model rediscovers them from the
+   * `tools` array each turn. Apps that care about cache hits keep
+   * the tool list stable across runs.
+   */
+  async runWithTools(
+    messages: readonly Message[],
+    tools: readonly Tool[],
+    options: RunWithToolsOptions = {},
+  ): Promise<AgentResult> {
+    const maxIterations = options.maxIterations ?? 10
+    const toolMap = new Map<string, Tool>(tools.map((t) => [t.name, t]))
+    const workingMessages: Message[] = [...messages]
+    const aggregated: ChatUsage = {
+      inputTokens: 0,
+      outputTokens: 0,
+      cacheReadTokens: 0,
+      cacheCreationTokens: 0,
     }
+    let iterations = 0
+    let lastStopReason: string | null = null
-    let currentBlockIndex = -1
-    for await (const sse of parseSSE(response.body)) {
-      if (sse.data === '[DONE]') break
+    while (true) {
+      const params = this.buildParams(workingMessages, options)
+      params.tools = tools.map((t) => ({
+        name: t.name,
+        description: t.description,
+        input_schema: t.inputSchema as Anthropic.Tool.InputSchema,
+      }))
-      let parsed: any
-      try {
-        parsed = JSON.parse(sse.data)
-      } catch {
-        continue
+      const response = await this.client.messages.create(params)
+      addUsage(aggregated, response.usage)
+      lastStopReason = response.stop_reason ?? null
+      // Append the assistant turn (text + tool_use blocks only) so
+      // tool_use blocks survive to the next request unchanged.
+      workingMessages.push({
+        role: 'assistant',
+        content: fromAnthropicContent(response.content),
+      })
+      if (response.stop_reason !== 'tool_use') {
+        return {
+          text: collectText(response.content),
+          messages: workingMessages,
+          iterations,
+          stopReason: lastStopReason ?? 'end_turn',
+          usage: aggregated,
+        }
       }
-      const type = parsed.type ?? sse.event
-      if (type === 'content_block_start') {
-        currentBlockIndex = parsed.index ?? currentBlockIndex + 1
-        const block = parsed.content_block
-        if (block?.type === 'tool_use') {
-          yield {
-            type: 'tool_start',
-            toolCall: { id: block.id, name: block.name },
-            toolIndex: currentBlockIndex,
-          }
+      // Execute every tool_use block in the response and append the
+      // results in a single user-role turn. The SDK's API expects all
+      // tool_result blocks for a given assistant turn to land in the
+      // same user message.
+      const toolUseBlocks = response.content.filter(
+        (b): b is Anthropic.ToolUseBlock => b.type === 'tool_use',
+      )
+      const resultBlocks: ContentBlock[] = []
+      for (const block of toolUseBlocks) {
+        const tool = toolMap.get(block.name)
+        if (!tool) {
+          throw new ToolExecutionError(
+            block.name,
+            block.id,
+            new Error(`Tool "${block.name}" is not registered.`),
+          )
         }
-      } else if (type === 'content_block_delta') {
-        const delta = parsed.delta
-        if (delta?.type === 'text_delta') {
-          yield { type: 'text', text: delta.text }
-        } else if (delta?.type === 'input_json_delta') {
-          yield {
-            type: 'tool_delta',
-            text: delta.partial_json,
-            toolIndex: parsed.index ?? currentBlockIndex,
-          }
+        let output: unknown
+        try {
+          output = await tool.execute(block.input, {
+            callId: block.id,
+            context: options.context ?? {},
+          })
+        } catch (cause) {
+          throw new ToolExecutionError(block.name, block.id, cause)
         }
-      } else if (type === 'content_block_stop') {
-        // If we were accumulating a tool call, signal end
-        if (currentBlockIndex >= 0) {
-          yield { type: 'tool_end', toolIndex: parsed.index ?? currentBlockIndex }
+        const resultBlock: ToolResultBlock = {
+          type: 'tool_result',
+          toolUseId: block.id,
+          content: typeof output === 'string' ? output : JSON.stringify(output),
         }
-      } else if (type === 'message_delta') {
-        const usage = parsed.usage
-        if (usage) {
-          yield {
-            type: 'usage',
-            usage: {
-              inputTokens: usage.input_tokens ?? 0,
-              outputTokens: usage.output_tokens ?? 0,
-              totalTokens: (usage.input_tokens ?? 0) + (usage.output_tokens ?? 0),
-            },
-          }
+        resultBlocks.push(resultBlock)
+      }
+      workingMessages.push({ role: 'user', content: resultBlocks })
+      iterations++
+      if (iterations >= maxIterations) {
+        return {
+          text: collectText(response.content),
+          messages: workingMessages,
+          iterations,
+          stopReason: 'max_iterations',
+          usage: aggregated,
         }
-      } else if (type === 'message_stop') {
-        yield { type: 'done' }
       }
     }
   }
-  // ── Private helpers ──────────────────────────────────────────────────────
-  private buildHeaders(): Record<string, string> {
-    return {
-      'content-type': 'application/json',
-      'x-api-key': this.apiKey,
-      'anthropic-version': '2023-06-01',
+  // ─── Param translation ──────────────────────────────────────────────────
+  private buildParams(
+    messages: readonly Message[],
+    options: ChatOptions,
+  ): Anthropic.MessageCreateParamsNonStreaming {
+    const model = options.model ?? this.defaultModel
+    const params: Anthropic.MessageCreateParamsNonStreaming = {
+      model,
+      max_tokens: options.maxTokens ?? this.defaultMaxTokens,
+      messages: messages.map(toMessageParam),
     }
-  }
-  private buildRequestBody(request: CompletionRequest, stream: boolean): Record<string, unknown> {
-    const body: Record<string, unknown> = {
-      model: request.model ?? this.defaultModel,
-      max_tokens: request.maxTokens ?? this.defaultMaxTokens,
-      messages: this.mapMessages(request.messages),
-    }
+    const system = toSystemParam(options.system)
+    if (system !== undefined) params.system = system
-    if (stream) body.stream = true
-    if (request.system) body.system = request.system
-    if (request.temperature !== undefined) body.temperature = request.temperature
-    if (request.stopSequences?.length) body.stop_sequences = request.stopSequences
+    if (options.thinking === 'adaptive') {
+      params.thinking = { type: 'adaptive' }
+    } else if (options.thinking === 'disabled') {
+      params.thinking = { type: 'disabled' }
+    }
-    // Tools
-    if (request.tools?.length) {
-      body.tools = request.tools.map(t => ({
-        name: t.name,
-        description: t.description,
-        input_schema: t.parameters,
-      }))
+    if (options.effort !== undefined) {
+      params.output_config = { effort: options.effort }
     }
-    // Tool choice
-    if (request.toolChoice) {
-      if (request.toolChoice === 'auto') {
-        body.tool_choice = { type: 'auto' }
-      } else if (request.toolChoice === 'required') {
-        body.tool_choice = { type: 'any' }
-      } else {
-        body.tool_choice = { type: 'tool', name: request.toolChoice.name }
-      }
+    if (options.cache === true) {
+      // Top-level auto-cache the last cacheable block. Maps to the
+      // SDK's `cache_control` shorthand on the request body.
+      ;(params as { cache_control?: { type: 'ephemeral' } }).cache_control = EPHEMERAL_CACHE
     }
-    // Structured output (using GA API with output_config)
-    if (request.schema) {
-      body.output_config = {
-        format: {
-          type: 'json_schema',
-          schema: request.schema
-        }
-      }
+    const betas = mergeBetas(this.betas, options.betas)
+    if (betas.length > 0) {
+      ;(params as { betas?: readonly string[] }).betas = betas
     }
-    return body
+    return params
   }
-  private mapMessages(messages: Message[]): any[] {
-    const result: any[] = []
+  private toChatResult(message: Anthropic.Message): ChatResult<Anthropic.Message> {
+    const text = message.content
+      .filter((b): b is Anthropic.TextBlock => b.type === 'text')
+      .map((b) => b.text)
+      .join('')
+    return {
+      text,
+      model: message.model,
+      stopReason: message.stop_reason,
+      usage: toUsage(message.usage),
+      raw: message,
+    }
+  }
+}
-    for (const msg of messages) {
-      if (msg.role === 'tool') {
-        // Tool results go as user messages with tool_result content blocks
-        result.push({
-          role: 'user',
-          content: [
-            {
-              type: 'tool_result',
-              tool_use_id: msg.toolCallId,
-              content: typeof msg.content === 'string' ? msg.content : JSON.stringify(msg.content),
-            },
-          ],
-        })
-      } else if (msg.role === 'assistant') {
-        const content: any[] = []
+// ─── Shape converters ─────────────────────────────────────────────────────
-        // Add text content if present
-        const text = typeof msg.content === 'string' ? msg.content : ''
-        if (text) {
-          content.push({ type: 'text', text })
-        }
+function toUsage(u: Anthropic.Usage): ChatUsage {
+  return {
+    inputTokens: u.input_tokens,
+    outputTokens: u.output_tokens,
+    cacheReadTokens: u.cache_read_input_tokens ?? 0,
+    cacheCreationTokens: u.cache_creation_input_tokens ?? 0,
+  }
+}
-        // Add tool use blocks
-        if (msg.toolCalls?.length) {
-          for (const tc of msg.toolCalls) {
-            content.push({
-              type: 'tool_use',
-              id: tc.id,
-              name: tc.name,
-              input: tc.arguments,
-            })
-          }
+function toMessageParam(message: Message): Anthropic.MessageParam {
+  if (typeof message.content === 'string') {
+    return { role: message.role, content: message.content }
+  }
+  return {
+    role: message.role,
+    content: message.content.map((block): Anthropic.ContentBlockParam => {
+      if (block.type === 'tool_use') {
+        return {
+          type: 'tool_use',
+          id: block.id,
+          name: block.name,
+          input: block.input as Record<string, unknown>,
         }
-        result.push({
-          role: 'assistant',
-          content: content.length === 1 && content[0].type === 'text' ? content[0].text : content,
-        })
-      } else {
-        // User messages
-        result.push({
-          role: 'user',
-          content: typeof msg.content === 'string' ? msg.content : msg.content,
-        })
       }
-    }
-    return result
+      if (block.type === 'tool_result') {
+        const param: Anthropic.ToolResultBlockParam = {
+          type: 'tool_result',
+          tool_use_id: block.toolUseId,
+          content:
+            typeof block.content === 'string'
+              ? block.content
+              : block.content.map((b) => ({ type: 'text', text: b.text }) as Anthropic.TextBlockParam),
+        }
+        if (block.isError) param.is_error = true
+        return param
+      }
+      const text: Anthropic.TextBlockParam = { type: 'text', text: block.text }
+      if (block.cache) text.cache_control = EPHEMERAL_CACHE
+      return text
+    }),
   }
+}
-  private parseResponse(data: any): CompletionResponse {
-    let content = ''
-    const toolCalls: ToolCall[] = []
+function toSystemParam(
+  system: SystemPrompt | undefined,
+): string | Anthropic.TextBlockParam[] | undefined {
+  if (system === undefined) return undefined
+  if (typeof system === 'string') return system
+  if (Array.isArray(system)) {
+    return system.map((block) => {
+      const param: Anthropic.TextBlockParam = { type: 'text', text: block.text }
+      if (block.cache) param.cache_control = EPHEMERAL_CACHE
+      return param
+    })
+  }
+  const param: Anthropic.TextBlockParam = { type: 'text', text: system.text }
+  if (system.cache) param.cache_control = EPHEMERAL_CACHE
+  return [param]
+}
-    if (Array.isArray(data.content)) {
-      for (const block of data.content) {
-        if (block.type === 'text') {
-          content += block.text
-        } else if (block.type === 'tool_use') {
-          toolCalls.push({
-            id: block.id,
-            name: block.name,
-            arguments: block.input ?? {},
-          })
-        }
-      }
-    }
+function mergeBetas(
+  providerBetas: readonly string[],
+  callBetas: readonly string[] | undefined,
+): readonly string[] {
+  if (!callBetas || callBetas.length === 0) return providerBetas
+  const seen = new Set<string>()
+  const out: string[] = []
+  for (const b of providerBetas) {
+    if (seen.has(b)) continue
+    seen.add(b)
+    out.push(b)
+  }
+  for (const b of callBetas) {
+    if (seen.has(b)) continue
+    seen.add(b)
+    out.push(b)
+  }
+  return out
+}
-    const usage: Usage = {
-      inputTokens: data.usage?.input_tokens ?? 0,
-      outputTokens: data.usage?.output_tokens ?? 0,
-      totalTokens: (data.usage?.input_tokens ?? 0) + (data.usage?.output_tokens ?? 0),
-    }
+function addUsage(acc: ChatUsage, u: Anthropic.Usage): void {
+  acc.inputTokens += u.input_tokens
+  acc.outputTokens += u.output_tokens
+  acc.cacheReadTokens += u.cache_read_input_tokens ?? 0
+  acc.cacheCreationTokens += u.cache_creation_input_tokens ?? 0
+}
-    let stopReason: CompletionResponse['stopReason'] = 'end'
-    switch (data.stop_reason) {
-      case 'tool_use':
-        stopReason = 'tool_use'
-        break
-      case 'max_tokens':
-        stopReason = 'max_tokens'
-        break
-      case 'stop_sequence':
-        stopReason = 'stop_sequence'
-        break
-    }
+function collectText(content: Anthropic.ContentBlock[]): string {
+  return content
+    .filter((b): b is Anthropic.TextBlock => b.type === 'text')
+    .map((b) => b.text)
+    .join('')
+}
-    return {
-      id: data.id ?? '',
-      content,
-      toolCalls,
-      stopReason,
-      usage,
-      raw: data,
+/**
+ * Translate the SDK's response content blocks back into framework
+ * `ContentBlock`s for storage in `workingMessages`. We preserve
+ * `text` and `tool_use` blocks verbatim; other server-side block
+ * types (thinking, server tool blocks) are dropped — V1 doesn't
+ * surface them, and re-sending them as part of the assistant turn
+ * could confuse the model.
+ */
+function fromAnthropicContent(content: Anthropic.ContentBlock[]): ContentBlock[] {
+  const out: ContentBlock[] = []
+  for (const block of content) {
+    if (block.type === 'text') {
+      out.push({ type: 'text', text: block.text } satisfies TextBlock)
+    } else if (block.type === 'tool_use') {
+      out.push({
+        type: 'tool_use',
+        id: block.id,
+        name: block.name,
+        input: block.input,
+      } satisfies ToolUseBlock)
     }
   }
+  return out
 }