npm - @hevmind/ask - Versions diffs - 0.1.0 → 0.2.0 - Mend

@hevmind/ask 0.1.0 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18) hide show

package/README.md +33 -13
package/bin/ask-launcher.mjs +19 -2
package/openapi.yaml +53 -7
package/package.json +6 -6
package/skills/build-digest/SKILL.md +7 -7
package/src/digest/build.ts +54 -16
package/src/digest/cli.ts +19 -7
package/src/digest/frontmatter.ts +7 -0
package/src/digest/schema.ts +3 -0
package/src/digest/tree.ts +259 -0
package/src/digest/verify.ts +2 -11
package/src/endpoint.ts +121 -5
package/src/index.ts +1 -1
package/src/integration.ts +16 -14
package/src/llm-openai.ts +330 -0
package/src/observability.ts +3 -1
package/src/providers.ts +81 -0
package/src/types.ts +34 -6

package/src/llm-openai.ts ADDED Viewed

@@ -0,0 +1,330 @@
+// OpenAI-compatible Chat Completions client over fetch. One translation layer
+// covers OpenAI, OpenRouter, and any Chat Completions-compatible endpoint: the
+// rest of the package keeps speaking the internal (Anthropic-shaped) block
+// types, and this module converts both ways. Like `llm.ts`, it stays free of
+// runtime dependencies and edge-runtime friendly.
+import type {
+  AnthropicResponse,
+  AnthropicTextBlock,
+  AnthropicUsage,
+  CallClaudeOptions,
+  StreamEvent,
+} from './llm.ts';
+/**
+ * Per-provider settings for a Chat Completions-compatible API: where requests
+ * are sent, which request field carries the output-token limit, and the name
+ * shown in error messages.
+ */
+export interface OpenAiEndpoint {
+  /** API base, e.g. `https://api.openai.com/v1` or `https://openrouter.ai/api/v1`. */
+  baseUrl: string;
+  /**
+   * OpenAI's reasoning models reject `max_tokens` and want
+   * `max_completion_tokens`; OpenRouter normalizes `max_tokens` for every
+   * underlying provider.
+   */
+  tokenParam: 'max_tokens' | 'max_completion_tokens';
+  /** Human label used in error messages, e.g. `OpenAI` or `OpenRouter`. */
+  label: string;
+}
+/** A function tool call in the shape Chat Completions uses on assistant messages. */
+interface OpenAiToolCall {
+  /** Identifier of the call. */
+  id: string;
+  /** Only function calls are modeled here. */
+  type: 'function';
+  /** Function name and its arguments; `arguments` is a JSON-encoded string, not an object. */
+  function: { name: string; arguments: string };
+}
+/** One entry of the `messages` array in a Chat Completions request. */
+interface OpenAiMessage {
+  role: 'system' | 'user' | 'assistant' | 'tool';
+  /** Message text; `null` is used for assistant turns that carry no text. */
+  content: string | null;
+  /** Tool calls issued by an assistant turn, when it issued any. */
+  tool_calls?: OpenAiToolCall[];
+  /** Set on `tool` messages to name the call the result belongs to. */
+  tool_call_id?: string;
+}
+/**
+ * Flattens the system prompt to a single string. A plain string is returned
+ * unchanged; a list of text blocks is joined with a blank line between blocks.
+ */
+function systemText(system: string | AnthropicTextBlock[]): string {
+  if (typeof system === 'string') return system;
+  // cache_control is Anthropic-specific; OpenAI-compatible APIs cache on their own.
+  const pieces = system.map(({ text }) => text);
+  return pieces.join('\n\n');
+}
+/**
+ * Converts the internal (Anthropic-shaped) conversation into Chat Completions messages.
+ *
+ * The system prompt becomes the leading `system` message. Assistant turns fold
+ * their `text` blocks into `content` and their `tool_use` blocks into
+ * `tool_calls`. User turns emit one `tool` message per `tool_result` block,
+ * followed by a `user` message carrying any text. Messages whose content is
+ * neither a string nor an array are skipped.
+ *
+ * @param opts - The `system` prompt and `messages` of the internal call options.
+ * @returns Messages for the `messages` field of a Chat Completions request.
+ */
+export function toOpenAiMessages(opts: Pick<CallClaudeOptions, 'system' | 'messages'>): OpenAiMessage[] {
+  type Block = Record<string, unknown>;
+  // Concatenates every `text` block of a turn, in order.
+  const joinText = (blocks: Block[]): string =>
+    blocks
+      .filter((block) => block.type === 'text')
+      .map((block) => String(block.text ?? ''))
+      .join('');
+  // Renders a tool_result payload as the string a `tool` message requires.
+  const toolResultText = (content: unknown): string => {
+    if (typeof content === 'string') return content;
+    // A missing payload is an empty result, not the two-character JSON string `""`.
+    if (content === undefined || content === null) return '';
+    if (Array.isArray(content)) {
+      const parts = content as Array<Block | null | undefined>;
+      // Text-only block arrays are flattened so the model reads the text
+      // itself rather than its JSON envelope.
+      if (parts.every((part) => part?.type === 'text' && typeof part.text === 'string')) {
+        return parts.map((part) => String(part?.text ?? '')).join('\n');
+      }
+    }
+    return JSON.stringify(content);
+  };
+  const out: OpenAiMessage[] = [{ role: 'system', content: systemText(opts.system) }];
+  for (const message of opts.messages) {
+    if (typeof message.content === 'string') {
+      out.push({ role: message.role, content: message.content });
+      continue;
+    }
+    if (!Array.isArray(message.content)) continue;
+    const blocks = message.content as Block[];
+    if (message.role === 'assistant') {
+      const text = joinText(blocks);
+      const toolCalls: OpenAiToolCall[] = blocks
+        .filter((block) => block.type === 'tool_use')
+        .map((block) => ({
+          id: String(block.id ?? ''),
+          type: 'function',
+          function: { name: String(block.name ?? ''), arguments: JSON.stringify(block.input ?? {}) },
+        }));
+      out.push({
+        role: 'assistant',
+        // `content` may only be null when tool_calls accompany the message;
+        // an empty turn is sent as an empty string instead.
+        content: text || (toolCalls.length ? null : ''),
+        ...(toolCalls.length ? { tool_calls: toolCalls } : {}),
+      });
+      continue;
+    }
+    // User turns: tool_result blocks must become role:"tool" messages directly
+    // after the assistant turn that issued the calls; any text follows as a
+    // plain user message.
+    for (const block of blocks) {
+      if (block.type !== 'tool_result') continue;
+      out.push({
+        role: 'tool',
+        tool_call_id: String(block.tool_use_id ?? ''),
+        content: toolResultText(block.content),
+      });
+    }
+    const text = joinText(blocks);
+    if (text) out.push({ role: 'user', content: text });
+  }
+  return out;
+}
+/**
+ * Builds the full Chat Completions request body from internal call options.
+ *
+ * @param opts - Internal call options (model, token limit, conversation, tools).
+ * @param endpoint - Supplies the name of the token-limit field for this provider.
+ * @param stream - When true, requests a streamed response that includes usage.
+ * @returns A JSON-serializable request body.
+ */
+export function toOpenAiRequest(
+  opts: CallClaudeOptions,
+  endpoint: OpenAiEndpoint,
+  stream: boolean,
+): Record<string, unknown> {
+  const hasTools = Boolean(opts.tools?.length);
+  // Translate the Anthropic-style choice into its Chat Completions equivalent:
+  // a named tool -> that function, `any` -> `required`, `none` -> `none`,
+  // everything else -> `auto`.
+  let toolChoice: unknown;
+  const choice = opts.toolChoice;
+  if (choice) {
+    // Widened so the comparisons below compile whichever variants the
+    // internal union declares.
+    const kind: string = choice.type;
+    if (choice.type === 'tool') {
+      toolChoice = { type: 'function', function: { name: choice.name } };
+    } else if (kind === 'any') {
+      toolChoice = 'required';
+    } else if (kind === 'none') {
+      toolChoice = 'none';
+    } else {
+      toolChoice = 'auto';
+    }
+  }
+  return {
+    model: opts.model,
+    [endpoint.tokenParam]: opts.maxTokens ?? 2048,
+    messages: toOpenAiMessages(opts),
+    ...(hasTools
+      ? {
+          tools: (opts.tools ?? []).map((tool) => ({
+            type: 'function',
+            function: { name: tool.name, description: tool.description, parameters: tool.input_schema },
+          })),
+        }
+      : {}),
+    // `tool_choice` is only accepted alongside `tools`, so it is omitted otherwise.
+    ...(hasTools && toolChoice !== undefined ? { tool_choice: toolChoice } : {}),
+    ...(stream ? { stream: true, stream_options: { include_usage: true } } : {}),
+  };
+}
+/**
+ * Translates a Chat Completions `finish_reason` into the internal stop reason.
+ * Unrecognized reasons pass through unchanged; a missing reason becomes `null`.
+ */
+function mapStopReason(finishReason: string | null | undefined): string | null {
+  switch (finishReason) {
+    case 'tool_calls':
+      return 'tool_use';
+    case 'stop':
+      return 'end_turn';
+    case 'length':
+      return 'max_tokens';
+    default:
+      return finishReason ?? null;
+  }
+}
+/**
+ * Parses the JSON argument string of a tool call into a tool input.
+ *
+ * Best-effort by design: an empty string, malformed JSON, or JSON that is not
+ * an object (e.g. `null`, a number, a string, an array) all yield `{}`, so
+ * consumers always receive an object.
+ */
+function parseToolInput(args: string): unknown {
+  let parsed: unknown;
+  try {
+    parsed = JSON.parse(args || '{}');
+  } catch {
+    return {};
+  }
+  const isPlainObject = typeof parsed === 'object' && parsed !== null && !Array.isArray(parsed);
+  return isPlainObject ? parsed : {};
+}
+/**
+ * Converts a Chat Completions `usage` object into the internal usage shape.
+ * Returns `undefined` when neither token count is present as a number; a
+ * single missing count defaults to 0.
+ */
+function mapUsage(usage: unknown): AnthropicUsage | undefined {
+  const u = usage as { prompt_tokens?: number; completion_tokens?: number } | null | undefined;
+  const hasPrompt = typeof u?.prompt_tokens === 'number';
+  const hasCompletion = typeof u?.completion_tokens === 'number';
+  if (!hasPrompt && !hasCompletion) return undefined;
+  const inputTokens = u?.prompt_tokens ?? 0;
+  const outputTokens = u?.completion_tokens ?? 0;
+  return { input_tokens: inputTokens, output_tokens: outputTokens };
+}
+/**
+ * Assembles the `fetch` options for a Chat Completions POST: JSON body,
+ * bearer authorization from `opts.apiKey`, and the caller's abort signal.
+ */
+function requestInit(opts: CallClaudeOptions, endpoint: OpenAiEndpoint, stream: boolean): RequestInit {
+  const headers = {
+    'content-type': 'application/json',
+    authorization: `Bearer ${opts.apiKey}`,
+  };
+  const body = JSON.stringify(toOpenAiRequest(opts, endpoint, stream));
+  return { method: 'POST', headers, body, signal: opts.signal };
+}
+/** Returns the chat-completions URL for an endpoint, ignoring trailing slashes on its base. */
+function completionsUrl(endpoint: OpenAiEndpoint): string {
+  const base = endpoint.baseUrl.replace(/\/+$/, '');
+  return base + '/chat/completions';
+}
+/**
+ * Performs one non-streaming Chat Completions call and returns the first
+ * choice translated into the internal response shape: optional text block,
+ * then one `tool_use` block per tool call.
+ *
+ * @throws Error carrying the endpoint label, HTTP status, and up to 500
+ *   characters of the response body when the response is not OK.
+ */
+export async function callOpenAi(opts: CallClaudeOptions, endpoint: OpenAiEndpoint): Promise<AnthropicResponse> {
+  const res = await fetch(completionsUrl(endpoint), requestInit(opts, endpoint, false));
+  if (!res.ok) {
+    const detail = await res.text().catch(() => '');
+    throw new Error(`${endpoint.label} API ${res.status}: ${detail.slice(0, 500)}`);
+  }
+  const payload = (await res.json()) as {
+    choices?: Array<{ message?: { content?: string | null; tool_calls?: OpenAiToolCall[] }; finish_reason?: string | null }>;
+    usage?: unknown;
+  };
+  // Only the first choice is consulted.
+  const first = payload.choices?.[0];
+  const message = first?.message;
+  const content: AnthropicResponse['content'] = [];
+  if (message?.content) {
+    content.push({ type: 'text', text: message.content });
+  }
+  const calls = message?.tool_calls ?? [];
+  for (const { id, function: fn } of calls) {
+    content.push({ type: 'tool_use', id, name: fn.name, input: parseToolInput(fn.arguments) });
+  }
+  const usage = mapUsage(payload.usage);
+  return {
+    content,
+    stop_reason: mapStopReason(first?.finish_reason),
+    ...(usage ? { usage } : {}),
+  };
+}
+/**
+ * Streams a Chat Completions response, yielding text deltas as they arrive and
+ * fully-reconstructed tool_use blocks (plus one `stop` event) at the end.
+ *
+ * The response reader is always released; if the consumer stops iterating
+ * early or an error interrupts the loop, the underlying stream is cancelled so
+ * the connection is not left open.
+ *
+ * @throws Error carrying the endpoint label, HTTP status, and up to 500
+ *   characters of detail when the response is not OK or has no body.
+ */
+export async function* streamOpenAi(opts: CallClaudeOptions, endpoint: OpenAiEndpoint): AsyncGenerator<StreamEvent> {
+  const res = await fetch(completionsUrl(endpoint), requestInit(opts, endpoint, true));
+  if (!res.ok || !res.body) {
+    const detail = res.ok ? 'no response body' : await res.text().catch(() => '');
+    throw new Error(`${endpoint.label} API ${res.status}: ${detail.slice(0, 500)}`);
+  }
+  const reader = res.body.getReader();
+  const decoder = new TextDecoder('utf-8');
+  let state = newOpenAiSseState();
+  let drained = false;
+  try {
+    while (true) {
+      const { done, value } = await reader.read();
+      if (done) break;
+      const out = parseOpenAiSseChunk(decoder.decode(value, { stream: true }), state);
+      state = out.state;
+      for (const event of out.events) yield event;
+    }
+    drained = true;
+    // Flush bytes the decoder was still holding and terminate a final frame
+    // that arrived without its trailing blank line, so it is not dropped.
+    const tail = parseOpenAiSseChunk(`${decoder.decode()}\n\n`, state);
+    state = tail.state;
+    for (const event of tail.events) yield event;
+    // Streams normally end with `data: [DONE]`; flush here in case one doesn't.
+    for (const event of flushOpenAiSse(state)) yield event;
+  } finally {
+    // Early exit (consumer `break`/`return`, or a thrown error): stop the
+    // transfer. Cancellation failures are ignored; there is nothing to recover.
+    if (!drained) await reader.cancel().catch(() => undefined);
+    reader.releaseLock();
+  }
+}
+/** A tool call being assembled from streamed deltas. */
+interface SseToolCall {
+  /** Call identifier taken from the stream. */
+  id: string;
+  /** Function name, concatenated from the name fragments received so far. */
+  name: string;
+  /** Raw JSON argument text, concatenated from the fragments received so far. */
+  args: string;
+}
+/** Parser state carried from one SSE chunk to the next. */
+export interface OpenAiSseState {
+  /** Bytes not yet terminated by a blank line. */
+  buffer: string;
+  /** Tool calls accumulated by their stream index. */
+  toolCalls: Record<number, SseToolCall>;
+  /** Most recent usage reported by the stream; both counts start at 0. */
+  usage: AnthropicUsage;
+  /** Last `finish_reason` seen on a choice, or `null` if none was seen. */
+  finishReason: string | null;
+  /** Tool-use and stop events were already emitted (on `[DONE]`). */
+  flushed: boolean;
+}
+/** Creates the empty parser state used at the start of a stream. */
+export function newOpenAiSseState(): OpenAiSseState {
+  const initial: OpenAiSseState = {
+    buffer: '',
+    toolCalls: {},
+    usage: { input_tokens: 0, output_tokens: 0 },
+    finishReason: null,
+    flushed: false,
+  };
+  return initial;
+}
+/**
+ * Pure, network-free Chat Completions SSE parser. Text deltas surface
+ * immediately; tool calls and usage accumulate until `[DONE]` flushes them.
+ *
+ * `prev` is not modified: the returned state owns its own tool-call map.
+ * Frames may be delimited by LF or CRLF line endings. Frames whose data is
+ * not valid JSON are skipped.
+ *
+ * @param chunk - Newly decoded text from the response body.
+ * @param prev - State returned by the previous call (or a fresh state).
+ * @returns The events completed by this chunk and the state for the next call.
+ */
+export function parseOpenAiSseChunk(
+  chunk: string,
+  prev: OpenAiSseState,
+): { events: StreamEvent[]; state: OpenAiSseState } {
+  const events: StreamEvent[] = [];
+  // Copy the tool-call map so accumulating into it leaves `prev` untouched.
+  const state: OpenAiSseState = { ...prev, toolCalls: { ...prev.toolCalls } };
+  // Normalize CRLF so `\r\n\r\n` frame boundaries are found. A lone trailing
+  // `\r` (chunk split mid-CRLF) stays buffered and is normalized next call.
+  state.buffer = (prev.buffer + chunk).replace(/\r\n/g, '\n');
+  let sep: number;
+  while ((sep = state.buffer.indexOf('\n\n')) !== -1) {
+    const frame = state.buffer.slice(0, sep);
+    state.buffer = state.buffer.slice(sep + 2);
+    // Non-`data:` lines (OpenRouter emits `: PROCESSING` comments) are dropped.
+    const data = frame
+      .split('\n')
+      .filter((line) => line.startsWith('data:'))
+      .map((line) => line.slice(5).trim())
+      .join('');
+    if (!data) continue;
+    if (data === '[DONE]') {
+      events.push(...flushOpenAiSse(state));
+      continue;
+    }
+    let payload: Record<string, unknown>;
+    try {
+      payload = JSON.parse(data) as Record<string, unknown>;
+    } catch {
+      continue;
+    }
+    const mappedUsage = mapUsage(payload.usage);
+    if (mappedUsage) state.usage = mappedUsage;
+    const choice = (payload.choices as Array<Record<string, unknown>> | undefined)?.[0];
+    if (!choice) continue;
+    if (typeof choice.finish_reason === 'string') state.finishReason = choice.finish_reason;
+    const delta = choice.delta as
+      | { content?: string | null; tool_calls?: Array<{ index?: number; id?: string; function?: { name?: string; arguments?: string } }> }
+      | undefined;
+    if (typeof delta?.content === 'string' && delta.content) {
+      events.push({ type: 'text', text: delta.content });
+    }
+    for (const call of delta?.tool_calls ?? []) {
+      const index = call.index ?? 0;
+      const existing = state.toolCalls[index] ?? { id: '', name: '', args: '' };
+      state.toolCalls[index] = {
+        // `||` rather than `??`: an empty id on a continuation delta must not
+        // erase the id delivered with the first fragment.
+        id: call.id || existing.id,
+        name: existing.name + (call.function?.name ?? ''),
+        args: existing.args + (call.function?.arguments ?? ''),
+      };
+    }
+  }
+  return { events, state };
+}
+/**
+ * Emits accumulated tool_use blocks and the final stop event, exactly once.
+ * Marks `state` as flushed; later calls with the same state return nothing.
+ * Tool calls are emitted in ascending stream-index order, and usage is
+ * attached to the stop event only when a non-zero count was recorded.
+ */
+export function flushOpenAiSse(state: OpenAiSseState): StreamEvent[] {
+  if (state.flushed) return [];
+  state.flushed = true;
+  const ordered = Object.entries(state.toolCalls)
+    .map(([key, call]) => ({ position: Number(key), call }))
+    .sort((left, right) => left.position - right.position);
+  const events: StreamEvent[] = ordered.map(({ call }) => ({
+    type: 'tool_use',
+    id: call.id,
+    name: call.name,
+    input: parseToolInput(call.args),
+  }));
+  const stopReason = mapStopReason(state.finishReason);
+  const hasUsage = state.usage.input_tokens > 0 || state.usage.output_tokens > 0;
+  events.push({
+    type: 'stop',
+    stopReason,
+    ...(hasUsage ? { usage: { ...state.usage } } : {}),
+  });
+  return events;
+}

package/src/observability.ts CHANGED Viewed

@@ -66,6 +66,8 @@ export interface TelemetryOptions {
   distinctId?: string;
   /** Optional label attached to every event as `agent_scope`. */
   scope?: string;
+  /** Inference provider reported as `$ai_provider`; defaults to `anthropic`. */
+  provider?: string;
   /** Reuse an existing trace id; one is generated otherwise. */
   traceId?: string;
   /** Cloudflare-style keep-alive so in-flight captures survive response end. */
@@ -113,7 +115,7 @@ export function makeTelemetry(options: TelemetryOptions = {}): Telemetry {
       distinct_id: distinctId,
       properties: {
         $ai_trace_id: traceId,
-        $ai_provider: 'anthropic',
+        $ai_provider: options.provider ?? 'anthropic',
         $process_person_profile: false, // anonymous — no person profile
         ...(scope ? { agent_scope: scope } : {}),
         ...properties,

package/src/providers.ts ADDED Viewed

@@ -0,0 +1,81 @@
+// Inference provider registry. Anthropic keeps its native Messages client;
+// OpenAI and OpenRouter share the Chat Completions client in `llm-openai.ts`,
+// differing only in base URL, key env var, token param, and default models.
+import { callClaude, streamClaude } from './llm.ts';
+import { callOpenAi, streamOpenAi, type OpenAiEndpoint } from './llm-openai.ts';
+import type { ProviderName } from './types.ts';
+export type { ProviderName };
+/** Static description of one inference provider: identity, key source, and defaults. */
+export interface ProviderInfo {
+  /** Registry key of the provider. */
+  name: ProviderName;
+  /** Human label for log and error messages. */
+  label: string;
+  /** Environment variable the API key is read from. */
+  envKey: string;
+  /** Default API base URL (OpenAI-compatible providers only). */
+  baseUrl?: string;
+  /** Default model for the agentic search loop. */
+  defaultModel: string;
+  /** Default model for the offline digest builder. */
+  defaultDigestModel: string;
+}
+/**
+ * Registry of supported providers, keyed by provider name. The `anthropic`
+ * entry has no `baseUrl`; the OpenAI-compatible entries each define one.
+ */
+export const PROVIDERS: Record<ProviderName, ProviderInfo> = {
+  anthropic: {
+    name: 'anthropic',
+    label: 'Anthropic',
+    envKey: 'ANTHROPIC_API_KEY',
+    defaultModel: 'claude-haiku-4-5',
+    defaultDigestModel: 'claude-opus-4-8',
+  },
+  openai: {
+    name: 'openai',
+    label: 'OpenAI',
+    envKey: 'OPENAI_API_KEY',
+    baseUrl: 'https://api.openai.com/v1',
+    defaultModel: 'gpt-4.1-mini',
+    defaultDigestModel: 'gpt-5.1',
+  },
+  openrouter: {
+    name: 'openrouter',
+    label: 'OpenRouter',
+    envKey: 'OPENROUTER_API_KEY',
+    baseUrl: 'https://openrouter.ai/api/v1',
+    defaultModel: 'anthropic/claude-haiku-4.5',
+    defaultDigestModel: 'anthropic/claude-opus-4.8',
+  },
+};
+/**
+ * Validates a configured provider name, defaulting to `anthropic`.
+ *
+ * @param value - Provider name from configuration; empty or missing selects the default.
+ * @returns The validated provider name.
+ * @throws Error listing the accepted names when `value` is not a registered provider.
+ */
+export function resolveProviderName(value?: string): ProviderName {
+  if (!value) return 'anthropic';
+  // Own-property check: the `in` operator would also accept inherited names
+  // such as "toString" or "constructor".
+  if (Object.prototype.hasOwnProperty.call(PROVIDERS, value)) return value as ProviderName;
+  throw new Error(`Unknown provider "${value}". Expected one of: ${Object.keys(PROVIDERS).join(', ')}.`);
+}
+/** A provider-bound pair of functions sharing the signatures of the Anthropic client. */
+export interface LlmClient {
+  /** One-shot call; same signature as `callClaude`. */
+  call: typeof callClaude;
+  /** Streaming call; same signature as `streamClaude`. */
+  stream: typeof streamClaude;
+}
+/**
+ * Returns the call/stream pair for a provider. `baseUrl` overrides the
+ * provider's API base, so any Chat Completions-compatible endpoint works.
+ *
+ * @param provider - Which provider to build a client for.
+ * @param baseUrl - Optional API base override; ignored for `anthropic`, and an
+ *   empty string falls back to the provider default.
+ * @throws Error when an OpenAI-compatible provider ends up with no base URL.
+ */
+export function clientFor(provider: ProviderName, baseUrl?: string): LlmClient {
+  if (provider === 'anthropic') return { call: callClaude, stream: streamClaude };
+  const info = PROVIDERS[provider];
+  // `||` so an empty override (e.g. an unset variable read as '') uses the default.
+  const resolvedBaseUrl = baseUrl || info.baseUrl;
+  if (!resolvedBaseUrl) {
+    throw new Error(`No API base URL configured for provider "${provider}".`);
+  }
+  const endpoint: OpenAiEndpoint = {
+    baseUrl: resolvedBaseUrl,
+    // OpenAI's reasoning models reject `max_tokens`; OpenRouter normalizes it.
+    tokenParam: provider === 'openai' ? 'max_completion_tokens' : 'max_tokens',
+    label: info.label,
+  };
+  return {
+    call: (opts) => callOpenAi(opts, endpoint),
+    stream: (opts) => streamOpenAi(opts, endpoint),
+  };
+}

package/src/types.ts CHANGED Viewed

@@ -1,3 +1,6 @@
+/** Inference providers the search loop and digest builder can run against. */
+export type ProviderName = 'anthropic' | 'openai' | 'openrouter';
 export interface HevAskOptions {
   /**
    * Content collection name(s) to index and search over.
@@ -6,8 +9,24 @@ export interface HevAskOptions {
   collections?: string[];
   /**
-   * Claude model used by the bounded search loop.
-   * @default 'claude-haiku-4-5'
+   * Inference provider for the agentic loop and the digest builder. Each
+   * provider reads its own key from the environment: `ANTHROPIC_API_KEY`,
+   * `OPENAI_API_KEY`, or `OPENROUTER_API_KEY`.
+   * @default 'anthropic'
+   */
+  provider?: ProviderName;
+  /**
+   * Override the provider's API base URL. Applies to the OpenAI-compatible
+   * providers only, so any Chat Completions-compatible endpoint works
+   * (e.g. a proxy or a self-hosted gateway).
+   */
+  providerBaseUrl?: string;
+  /**
+   * Model used by the bounded search loop. Defaults per provider:
+   * `claude-haiku-4-5` (anthropic), `gpt-4.1-mini` (openai),
+   * `anthropic/claude-haiku-4.5` (openrouter).
    */
   model?: string;
@@ -38,8 +57,9 @@ export interface HevAskOptions {
   answerMaxTokens?: number;
   /**
-   * Model used by the offline digest builder.
-   * @default 'claude-opus-4-8'
+   * Model used by the offline digest builder. Defaults per provider:
+   * `claude-opus-4-8` (anthropic), `gpt-5.1` (openai),
+   * `anthropic/claude-opus-4.8` (openrouter).
    */
   digestModel?: string;
@@ -69,8 +89,14 @@ export interface HevAskOptions {
   perDocCap?: number;
   /**
-   * Path to the committed ask digest artifact, relative to the site root.
-   * @default '.hev-ask/digest.json'
+   * Path to the committed ask digest tree, relative to the site root.
+   * @default '.hev-ask'
+   */
+  digestDir?: string;
+  /**
+   * Deprecated alias for `digestDir`.
+   * @default '.hev-ask'
    */
   digestPath?: string;
@@ -84,6 +110,8 @@ export interface HevAskOptions {
 /** The shape the integration serializes into `virtual:hev-ask/config`. */
 export interface ResolvedConfig {
   collections: string[] | null;
+  provider: ProviderName;
+  providerBaseUrl?: string;
   model: string;
   digestModel: string;
   endpoint: string;