npm - typeclaw - Versions diffs - 0.36.7 → 0.37.0 - Mend

typeclaw 0.36.7 → 0.37.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (112) hide show

package/README.md +2 -2
package/package.json +3 -2
package/src/agent/index.ts +31 -11
package/src/agent/live-sessions.ts +12 -0
package/src/agent/model-fallback.ts +17 -15
package/src/agent/model-overrides.ts +2 -2
package/src/agent/session-meta.ts +10 -0
package/src/agent/subagents.ts +11 -2
package/src/agent/system-prompt.ts +9 -3
package/src/agent/todo/continuation-policy.ts +6 -3
package/src/agent/todo/continuation-wiring.ts +4 -2
package/src/agent/todo/continuation.ts +3 -3
package/src/agent/tools/todo/index.ts +27 -4
package/src/bundled-plugins/agent-browser/index.ts +33 -108
package/src/bundled-plugins/agent-browser/shim.ts +3 -94
package/src/bundled-plugins/agent-browser/skills/agent-browser/SKILL.md +8 -33
package/src/bundled-plugins/doc-render/skills/typeclaw-render-pdf/SKILL.md +2 -2
package/src/bundled-plugins/guard/policies/memory-retrieval-cache-write.ts +7 -1
package/src/bundled-plugins/memory/README.md +80 -23
package/src/bundled-plugins/memory/append-tool.ts +74 -53
package/src/bundled-plugins/memory/citation-superset.ts +4 -0
package/src/bundled-plugins/memory/citations.ts +54 -0
package/src/bundled-plugins/memory/dreaming-metrics.ts +30 -0
package/src/bundled-plugins/memory/dreaming.ts +444 -21
package/src/bundled-plugins/memory/index.ts +544 -400
package/src/bundled-plugins/memory/load-memory.ts +87 -10
package/src/bundled-plugins/memory/load-shards.ts +48 -22
package/src/bundled-plugins/memory/memory-logger.ts +95 -106
package/src/bundled-plugins/memory/memory-retrieval.ts +3 -3
package/src/bundled-plugins/memory/parent-link.ts +33 -0
package/src/bundled-plugins/memory/paths.ts +12 -0
package/src/bundled-plugins/memory/references/frontmatter.ts +197 -0
package/src/bundled-plugins/memory/references/load-references.ts +212 -0
package/src/bundled-plugins/memory/references/store-reference-tool.ts +59 -0
package/src/bundled-plugins/memory/search-tool.ts +282 -45
package/src/bundled-plugins/memory/stream-events.ts +1 -0
package/src/bundled-plugins/memory/stream-io.ts +28 -3
package/src/bundled-plugins/memory/turn-dedup.ts +40 -0
package/src/bundled-plugins/memory/vector/cache-write.ts +19 -0
package/src/bundled-plugins/memory/vector/config.ts +28 -0
package/src/bundled-plugins/memory/vector/doctor.ts +124 -0
package/src/bundled-plugins/memory/vector/embedder.ts +246 -0
package/src/bundled-plugins/memory/vector/hybrid.ts +439 -0
package/src/bundled-plugins/memory/vector/index-on-write.ts +34 -0
package/src/bundled-plugins/memory/vector/inspect.ts +111 -0
package/src/bundled-plugins/memory/vector/passages.ts +125 -0
package/src/bundled-plugins/memory/vector/reference-index-on-write.ts +50 -0
package/src/bundled-plugins/memory/vector/relevance-gate.ts +93 -0
package/src/bundled-plugins/memory/vector/startup.ts +71 -0
package/src/bundled-plugins/memory/vector/store.ts +203 -0
package/src/bundled-plugins/memory/vector/truncation.ts +124 -0
package/src/bundled-plugins/security/policies/outbound-secret-scan.ts +2 -0
package/src/channels/router.ts +239 -40
package/src/cli/incomplete-init.ts +57 -0
package/src/cli/init.ts +143 -12
package/src/cli/inspect.ts +11 -5
package/src/cli/model.ts +112 -34
package/src/cli/restart.ts +24 -0
package/src/cli/start.ts +24 -0
package/src/cli/tunnel.ts +53 -8
package/src/config/config.ts +110 -19
package/src/config/index.ts +5 -1
package/src/config/models-mutation.ts +29 -11
package/src/config/providers-mutation.ts +2 -2
package/src/config/providers.ts +146 -12
package/src/container/shared.ts +9 -0
package/src/container/start.ts +87 -4
package/src/cron/consumer.ts +13 -7
package/src/hostd/models.ts +64 -0
package/src/hostd/paths.ts +6 -0
package/src/hostd/portbroker-manager.ts +2 -2
package/src/init/checkpoint.ts +201 -0
package/src/init/dockerfile.ts +164 -51
package/src/init/gitignore.ts +7 -7
package/src/init/index.ts +41 -9
package/src/init/line-auth.ts +50 -21
package/src/init/models-dev.ts +96 -21
package/src/init/oauth-login.ts +3 -3
package/src/init/progress.ts +29 -0
package/src/init/validate-api-key.ts +4 -0
package/src/inspect/index.ts +13 -6
package/src/inspect/item-list.ts +11 -2
package/src/inspect/live-list.ts +65 -0
package/src/inspect/open-item.ts +22 -1
package/src/inspect/session-list.ts +29 -0
package/src/models/embedding-model.ts +114 -0
package/src/models/transformers-version.ts +55 -0
package/src/plugin/types.ts +3 -0
package/src/portbroker/container-server.ts +23 -0
package/src/portbroker/forward-request-bus.ts +35 -0
package/src/portbroker/forward-result-bus.ts +2 -3
package/src/portbroker/hostd-client.ts +182 -36
package/src/portbroker/index.ts +6 -1
package/src/portbroker/protocol.ts +9 -2
package/src/run/channel-session-factory.ts +11 -1
package/src/run/index.ts +41 -7
package/src/server/command-runner.ts +24 -1
package/src/server/index.ts +42 -8
package/src/shared/index.ts +2 -0
package/src/shared/protocol.ts +31 -0
package/src/skills/typeclaw-channels/SKILL.md +4 -4
package/src/skills/typeclaw-config/SKILL.md +2 -2
package/src/skills/typeclaw-memory/SKILL.md +3 -1
package/src/skills/typeclaw-permissions/SKILL.md +3 -3
package/src/skills/typeclaw-skills/SKILL.md +1 -1
package/src/skills/typeclaw-tunnels/SKILL.md +22 -1
package/src/tunnels/providers/cloudflare-quick.ts +65 -7
package/src/tunnels/upstream-probe.ts +25 -0
package/typeclaw.schema.json +156 -67
package/src/bundled-plugins/agent-browser/dashboard-discovery.ts +0 -170
package/src/bundled-plugins/agent-browser/dashboard-proxy.ts +0 -421
package/src/portbroker/bind-with-forward.ts +0 -102

package/src/bundled-plugins/memory/vector/hybrid.ts ADDED Viewed

@@ -0,0 +1,439 @@
+import { createHash } from 'node:crypto'
+import { loadAllShards, type TopicShard } from '../load-shards'
+import { buildParentLinks } from '../parent-link'
+import { loadAllReferences, type Reference } from '../references/load-references'
+import {
+  buildMatcher,
+  distinctTokens,
+  hasNonAscii,
+  searchAll,
+  searchAllRanked,
+  type MemorySearchMatch,
+  type StreamMatch,
+} from '../search-tool'
+import type { StreamEvent } from '../stream-events'
+import { readAllUndreamedStreamDays, type UndreamedStreamDay } from '../stream-io'
+import { embed, EMBEDDING_MODEL_ID, type EmbedType } from './embedder'
+import type { Passage } from './passages'
+import { clearsBaseline, gateRelevance, streamAdmissionBaseline } from './relevance-gate'
+import { VectorStore, type VectorRow } from './store'
+export { collectPassages, findMissingPassages, type Passage } from './passages'
+// Reciprocal-rank smoothing constant: a lane hit at 0-based position i
+// contributes 1 / (RRF_K + i + 1) to its parent's score (see fuseLanes).
+const RRF_K = 60
+/** One fused result returned by `hybridSearch`. */
+export type HybridSearchResult = {
+  /** Corpus the result was resolved to. */
+  source: 'topic' | 'stream' | 'reference'
+  /** Topic/reference slug, or `<date>#<id>` for a stream entry. */
+  key: string
+  heading: string
+  /** Leading lines of the body, or the heading when the body is blank. */
+  excerpt: string
+  /** Sum of the per-lane reciprocal-rank scores; results are sorted descending on it. */
+  rrfScore: number
+}
+/** Embeds `texts` as either queries or passages and resolves to the resulting vectors. */
+export type EmbedFn = (texts: string[], type: EmbedType) => Promise<Float32Array[]>
+/**
+ * Runs a hybrid (vector + keyword) memory search and returns at most `topK`
+ * fused results, best first.
+ *
+ * Shards, undreamed stream days, references and the query embedding are loaded
+ * concurrently; a rejection from any one of them rejects the whole search.
+ *
+ * @param query    Raw query text, used for both the embedding and the keyword lane.
+ * @param store    Vector store queried for scored rows.
+ * @param agentDir Directory handed to the shard/stream/reference loaders.
+ * @param topK     Maximum number of results; values <= 0 short-circuit to `[]`.
+ * @param embedFn  Embedding function; defaults to this module's `embed`.
+ * @returns Fused results sorted by descending `rrfScore`.
+ */
+export async function hybridSearch(
+  query: string,
+  store: VectorStore,
+  agentDir: string,
+  topK: number,
+  embedFn: EmbedFn = embed,
+): Promise<HybridSearchResult[]> {
+  if (topK <= 0) return []
+  const [shards, streamDays, references, queryEmbeddings] = await Promise.all([
+    loadAllShards(agentDir),
+    readAllUndreamedStreamDays(agentDir),
+    loadAllReferences(agentDir),
+    embedFn([query], 'query'),
+  ])
+  const { parentSlugsByFragmentId, supersededFragmentIds } = buildParentLinks(shards)
+  const index = buildContentIndex(shards, streamDays, references, supersededFragmentIds)
+  // A missing query embedding leaves the vector lane empty instead of failing.
+  const vectorRows = queryEmbeddings[0] === undefined ? [] : gatedVectorLane(queryEmbeddings[0], store, topK)
+  // The keyword lane is over-fetched (2x topK) before fusion; the final slice trims to topK.
+  const keywordMatches = keywordLane(query, shards, streamDays, references, topK * 2)
+  return fuseLanes(vectorRows, keywordMatches, index, parentSlugsByFragmentId).slice(0, topK)
+}
+// The vector lane, gated by per-query relevance. Both row kinds are judged
+// against ONE query-local no-match band, derived from the score distribution
+// of the band-defining rows alone — topic AND reference rows, per the filter
+// below (sparse streams consume the band but never define it, so a
+// nearest-neighbour cluster of fragments can't move the bar).
+//
+// NOTE(review): the remainder of this comment says "topic" throughout, but the
+// code treats reference rows exactly like topic rows for gating — confirm that
+// is intended.
+//
+//   - Topic rows: the gate keeps the knee above the band, or empties the topic
+//     partition entirely when no topic clears it.
+//   - Stream rows: admitted one-by-one only when they clear the SAME band by
+//     the shared margin. A genuine fresh fragment (well above the band) survives
+//     the freshness window; an irrelevant in-band neighbour is dropped, so a
+//     no-match query can't leak closest-neighbours-regardless through streams.
+//
+// Topic suppression uses the floor-gated verdict (gateRelevance): below the
+// floor topics pass ungated, since a tiny index can't form a reliable band and
+// a false negative is cheaper than suppressing the only memory. Stream
+// admission uses streamAdmissionBaseline, which tolerates a below-floor topic
+// set — even a few topics give the contrast a vector-only fragment match needs,
+// and it returns null (dropping uncorroborated streams) only when NO topics
+// exist at all. A lexically-corroborated fragment still reaches RRF via the
+// separate keyword lane. An empty merged lane composes with RRF exactly like a
+// lane that found nothing, so a genuine keyword hit survives a full no-match.
+function gatedVectorLane(queryEmbedding: Float32Array, store: VectorStore, topK: number): VectorRow[] {
+  const scored = store.queryScored(queryEmbedding, EMBEDDING_MODEL_ID)
+  // Partition: topic + reference rows define the band; stream rows only consume it.
+  const bandDefiningRows = scored.filter(({ row }) => row.source === 'topic' || row.source === 'reference')
+  const streamRows = scored.filter(({ row }) => row.source === 'stream')
+  const bandScores = bandDefiningRows.map(({ score }) => score)
+  // gateRelevance's return value is used as a prefix length here.
+  // NOTE(review): assumes queryScored yields rows best-first — TODO confirm.
+  const keptBandDefiningRows = bandDefiningRows.slice(0, gateRelevance(bandScores, topK * 2))
+  const streamBaseline = streamAdmissionBaseline(bandScores)
+  // Streams are filtered individually against the baseline, then capped at 2x topK.
+  const keptStreams = streamRows.filter(({ score }) => clearsBaseline(score, streamBaseline)).slice(0, topK * 2)
+  // Merge both partitions and re-rank by score so lane position reflects similarity.
+  return [...keptBandDefiningRows, ...keptStreams].sort((a, b) => b.score - a.score).map(({ row }) => row)
+}
+// Phrase-first, then token-OR fallback (mirrors `memory_search`). `hybridSearch`'s
+// query is always the whole user prompt, which never appears verbatim in a shard,
+// so a phrase-only lane returns nothing every real turn and RRF degenerates to the
+// vector lane alone. The `searchAllRanked` fallback also gives RRF a
+// matched-token-count rank (truncated after ranking) instead of alphabetical order.
+function keywordLane(
+  query: string,
+  shards: TopicShard[],
+  streamDays: UndreamedStreamDay[],
+  references: Reference[],
+  maxResults: number,
+): MemorySearchMatch[] {
+  // Pass 1: whole-query phrase match. A string result from buildMatcher means
+  // no matcher could be built, so the lane is empty.
+  const phraseMatcher = buildMatcher(query, false)
+  if (typeof phraseMatcher === 'string') return []
+  const phraseResult = searchAll(shards, streamDays, phraseMatcher, { full: false, maxResults, references })
+  if ('matches' in phraseResult && phraseResult.matches.length > 0) return phraseResult.matches
+
+  // Pass 2: token-OR fallback over the query's content tokens.
+  const contentTokens = distinctHybridContentTokens(query)
+  if (contentTokens.length === 0) return []
+  // A lone token equal to the normalized query would only repeat pass 1.
+  const normalizedQuery = query.trim().toLowerCase()
+  if (contentTokens.length === 1 && contentTokens[0] === normalizedQuery) return []
+  const rankedResult = searchAllRanked(shards, streamDays, contentTokens, {
+    full: false,
+    maxResults,
+    references,
+    tokenMatchMode: 'ascii-boundary',
+  })
+  if (!('matches' in rankedResult)) return []
+  return rankedResult.matches
+}
+// Stopwords are judged ONLY against a token's ASCII-alpha core (below), so this
+// set is intentionally English-only — non-ASCII tokens never reach it.
+const HYBRID_PROMPT_STOPWORDS = new Set([
+  // articles and conjunctions
+  'a', 'an', 'the', 'and', 'or', 'but',
+  // pronouns and possessives
+  'i', 'me', 'my', 'mine', 'you', 'your', 'yours', 'he', 'him', 'his', 'she', 'her', 'hers',
+  'it', 'its', 'we', 'us', 'our', 'ours', 'they', 'them', 'their', 'theirs',
+  // demonstratives and interrogatives
+  'this', 'that', 'these', 'those', 'here', 'there',
+  'what', 'when', 'where', 'who', 'whom', 'whose', 'why', 'how', 'which',
+  // auxiliaries and modals
+  'is', 'am', 'are', 'was', 'were', 'be', 'been', 'being', 'do', 'does', 'did', 'doing',
+  'have', 'has', 'had', 'having', 'can', 'could', 'should', 'would', 'will', 'may', 'might', 'must',
+  // prepositions and particles
+  'about', 'as', 'at', 'by', 'for', 'from', 'in', 'into', 'of', 'on', 'onto', 'to', 'with', 'without',
+  'over', 'under', 'after', 'before', 'between', 'up', 'down', 'out', 'off',
+  // filler words
+  'say', 'said', 'thing', 'things', 'stuff',
+])
+// The hybrid lane's query is a whole user prompt, so its tokens include
+// function words ('what', 'we', 'the', 'about'). Token-OR matching on those
+// alone would make the keyword lane non-empty for a low-information prompt and,
+// when the vector lane is gated out, inject arbitrary memory instead of no
+// result. The tool path's `distinctTokens` stays untouched — there the query is
+// a deliberate agent search, not a sentence. Stopwords are judged ONLY on a
+// token's ASCII-alpha core, so non-ASCII tokens ('홍길동'), numerics ('#651'),
+// and short content words ('pr', 'ci', 'go') all survive; no length filter,
+// which would wrongly drop CJK and short content.
+function distinctHybridContentTokens(query: string): string[] {
+  const contentTokens: string[] = []
+  for (const token of distinctTokens(query)) {
+    // Core = the token with leading/trailing characters outside [a-z0-9] removed.
+    const core = token.replace(/^[^a-z0-9]+|[^a-z0-9]+$/g, '')
+    let keep: boolean
+    if (core.length === 0) {
+      // Nothing ASCII-alphanumeric left: keep only tokens carrying non-ASCII text.
+      keep = hasNonAscii(token)
+    } else if (/^[a-z]+$/.test(core)) {
+      // Purely alphabetic core: the only case judged against the stopword set.
+      keep = !HYBRID_PROMPT_STOPWORDS.has(core)
+    } else {
+      // Digits or interior punctuation: always content.
+      keep = true
+    }
+    if (keep) contentTokens.push(token)
+  }
+  return contentTokens
+}
+// Reciprocal Rank Fusion across two rankers (vector + keyword). Each lane is
+// collapsed to per-parent scores INDEPENDENTLY (MAX over a parent's children
+// within that lane), then the two lanes' per-parent scores are SUMMED. The two
+// reductions are different on purpose:
+//
+//   - WITHIN a lane, a topic's children (the fragments citing it) collapse by
+//     MAX — summing would over-rank often-revised topics purely for having more
+//     historical citations to match (PARADE: max beats sum for concentrated
+//     relevance).
+//   - ACROSS lanes, the per-parent contributions SUM — cross-ranker agreement
+//     is the entire signal RRF exists to capture. A topic found by BOTH the
+//     vector and the keyword lane must outrank one found by a single lane, so
+//     its score is 1/(k+rankVector) + 1/(k+rankKeyword). Collapsing both lanes
+//     into one map and taking MAX (the previous behavior) discarded that
+//     agreement, leaving every result carrying a single lane's reciprocal rank.
+function fuseLanes(
+  vectorRows: VectorRow[],
+  keywordMatches: MemorySearchMatch[],
+  index: Map<string, Omit<HybridSearchResult, 'rrfScore'>>,
+  parentSlugsByFragmentId: Map<string, Set<string>>,
+): HybridSearchResult[] {
+  // 0-based position within a lane -> reciprocal-rank contribution.
+  const reciprocalRank = (position: number): number => 1 / (RRF_K + position + 1)
+  const vectorHits: LaneHit[] = vectorRows.map((row, position) => ({
+    source: row.source,
+    key: row.key,
+    score: reciprocalRank(position),
+  }))
+  const keywordHits: LaneHit[] = keywordMatches.map((match, position) => ({
+    source: match.source,
+    key: matchKey(match),
+    score: reciprocalRank(position),
+  }))
+  // Each lane collapses to per-parent scores on its own (MAX within a lane)...
+  const collapsedLanes = [
+    collapseLane(vectorHits, index, parentSlugsByFragmentId),
+    collapseLane(keywordHits, index, parentSlugsByFragmentId),
+  ]
+  // ...and the lanes are then SUMMED per parent.
+  const fused = new Map<string, HybridSearchResult>()
+  for (const lane of collapsedLanes) {
+    lane.forEach(({ content, score }, fusedKey) => {
+      const seen = fused.get(fusedKey)
+      if (seen === undefined) fused.set(fusedKey, { ...content, rrfScore: score })
+      else seen.rrfScore += score
+    })
+  }
+  // Best score first; ties fall back to key order for a stable result.
+  return Array.from(fused.values()).sort((left, right) => {
+    const byScore = right.rrfScore - left.rrfScore
+    if (byScore) return byScore
+    return left.key.localeCompare(right.key)
+  })
+}
+// One ranked hit from a single lane, before it is resolved to its parent(s).
+type LaneHit = { source: 'topic' | 'stream' | 'reference'; key: string; score: number }
+// One parent's entry within a single lane: its display content plus the best
+// (MAX) score among the hits that resolved to it.
+type LaneEntry = { content: Omit<HybridSearchResult, 'rrfScore'>; score: number }
+// Returns one lane's per-parent scores so the caller can SUM across lanes;
+// folding straight into a shared map would force a cross-lane MAX instead.
+function collapseLane(
+  hits: LaneHit[],
+  index: Map<string, Omit<HybridSearchResult, 'rrfScore'>>,
+  parentSlugsByFragmentId: Map<string, Set<string>>,
+): Map<string, LaneEntry> {
+  const perParent = new Map<string, LaneEntry>()
+  for (const { source, key, score } of hits) {
+    const parents = resolveToParents(source, key, index, parentSlugsByFragmentId)
+    for (const parent of parents) {
+      const entry = perParent.get(parent.fusedKey)
+      if (entry === undefined) {
+        // First hit for this parent in this lane.
+        perParent.set(parent.fusedKey, { content: parent.content, score })
+        continue
+      }
+      // Later hits only ever raise the parent's score (MAX, never SUM).
+      entry.score = Math.max(entry.score, score)
+    }
+  }
+  return perParent
+}
+// A matched fragment collapses to EVERY topic that cites it (a fragment can back
+// more than one belief), so it contributes its score to each parent. An
+// undreamed fragment with no citing topic resolves to itself.
+function resolveToParents(
+  source: 'topic' | 'stream' | 'reference',
+  nodeKey: string,
+  index: Map<string, Omit<HybridSearchResult, 'rrfScore'>>,
+  parentSlugsByFragmentId: Map<string, Set<string>>,
+): Array<{ fusedKey: string; content: Omit<HybridSearchResult, 'rrfScore'> }> {
+  // References: drop any '#...' suffix so every hit on the same reference
+  // resolves to one slug-level entry. A slug absent from the index (e.g. a
+  // demoted reference, which buildContentIndex skips) resolves to nothing.
+  if (source === 'reference') {
+    const slug = referenceSlugFromKey(nodeKey)
+    const content = index.get(laneKey('reference', slug))
+    return content === undefined ? [] : [{ fusedKey: laneKey('reference', slug), content }]
+  }
+  if (source === 'stream') {
+    // fragmentId is null for legacy or '#'-less keys, which skips the parent lookup.
+    const fragmentId = fragmentIdFromKey(nodeKey)
+    const parentSlugs = fragmentId === null ? undefined : parentSlugsByFragmentId.get(fragmentId)
+    if (parentSlugs !== undefined && parentSlugs.size > 0) {
+      const parents: Array<{ fusedKey: string; content: Omit<HybridSearchResult, 'rrfScore'> }> = []
+      for (const parentSlug of parentSlugs) {
+        // Only parents that are actually present in the index count.
+        const topic = index.get(laneKey('topic', parentSlug))
+        if (topic !== undefined) parents.push({ fusedKey: laneKey('topic', parentSlug), content: topic })
+      }
+      // No indexed parent: fall through to the standalone lookup below.
+      if (parents.length > 0) return parents
+    }
+  }
+  // Topics, and stream entries without an indexed parent, resolve to themselves.
+  // A key missing from the index (e.g. a superseded fragment) yields no result.
+  const content = index.get(laneKey(source, nodeKey))
+  return content === undefined ? [] : [{ fusedKey: laneKey(source, nodeKey), content }]
+}
+// Returns the part of a reference key before its first '#', or the whole key
+// when it contains no '#'.
+function referenceSlugFromKey(referenceKey: string): string {
+  const cut = referenceKey.indexOf('#')
+  if (cut < 0) return referenceKey
+  return referenceKey.substring(0, cut)
+}
+// Extracts the fragment id that follows the first '#' in a stream key. Returns
+// null when the key has no '#' or the id carries the 'legacy-' prefix.
+function fragmentIdFromKey(streamKey: string): string | null {
+  const separatorAt = streamKey.indexOf('#')
+  if (separatorAt < 0) return null
+  const fragmentId = streamKey.substring(separatorAt + 1)
+  if (fragmentId.startsWith('legacy-')) return null
+  return fragmentId
+}
+// Superseded fragments are kept out of the content index entirely, so both
+// lanes drop them: the keyword lane can match a superseded body, but resolving
+// it finds no active parent link and then no `stream` fallback here, so the
+// stale fragment never surfaces as a standalone result (mirrors the passage-set
+// exclusion that keeps superseded fragments out of the vector lane).
+function buildContentIndex(
+  shards: TopicShard[],
+  streamDays: UndreamedStreamDay[],
+  references: Reference[],
+  supersededFragmentIds: Set<string>,
+): Map<string, Omit<HybridSearchResult, 'rrfScore'>> {
+  type IndexedContent = Omit<HybridSearchResult, 'rrfScore'>
+  const index = new Map<string, IndexedContent>()
+
+  // Topics: one entry per shard, keyed by slug.
+  for (const { slug, body, frontmatter } of shards) {
+    const { heading } = frontmatter
+    const entry: IndexedContent = { source: 'topic', key: slug, heading, excerpt: excerpt(body, heading) }
+    index.set(laneKey('topic', slug), entry)
+  }
+
+  // Streams: every event that streamIndexItem accepts (it returns null for
+  // watermarks and superseded fragments).
+  for (const day of streamDays) {
+    for (const event of day.events) {
+      const entry = streamIndexItem(day, event, supersededFragmentIds)
+      if (entry === null) continue
+      index.set(laneKey('stream', entry.key), entry)
+    }
+  }
+
+  // References: demoted ones are left out of the index.
+  for (const { slug, body, frontmatter } of references) {
+    if (frontmatter.demoted) continue
+    const { title } = frontmatter
+    const entry: IndexedContent = { source: 'reference', key: slug, heading: title, excerpt: excerpt(body, title) }
+    index.set(laneKey('reference', slug), entry)
+  }
+  return index
+}
+// Builds the content-index entry for one stream event, or null when the event
+// must not be indexed (watermarks and superseded fragments).
+function streamIndexItem(
+  day: UndreamedStreamDay,
+  event: StreamEvent,
+  supersededFragmentIds: Set<string>,
+): Omit<HybridSearchResult, 'rrfScore'> | null {
+  if (event.type === 'watermark') return null
+  if (event.type === 'fragment') {
+    if (supersededFragmentIds.has(event.id)) return null
+    return {
+      source: 'stream',
+      key: `${day.date}#${event.id}`,
+      heading: event.topic,
+      excerpt: excerpt(event.body, event.topic),
+    }
+  }
+  // Any remaining event type is treated as legacy prose. It has no id, so the
+  // key is synthesized from the first 12 hex chars of a SHA-256 of its text.
+  // NOTE(review): streamMatchKey hashes `match.excerpt` for the same purpose;
+  // the two keys only agree if that excerpt equals the full `event.text` —
+  // confirm against search-tool.
+  return {
+    source: 'stream',
+    key: `${day.date}#legacy-${hashContent(event.text).slice(0, 12)}`,
+    heading: '[legacy prose from pre-shard migration]',
+    excerpt: excerpt(event.text, '[legacy prose from pre-shard migration]'),
+  }
+}
+// Maps a keyword match to the key used by the content index: the slug for
+// topic and reference matches, the stream key otherwise.
+function matchKey(match: MemorySearchMatch): string {
+  switch (match.source) {
+    case 'topic':
+    case 'reference':
+      return match.slug
+    default:
+      return streamMatchKey(match)
+  }
+}
+// Derives the content-index key for a stream keyword match.
+function streamMatchKey(match: StreamMatch): string {
+  // Matches with an event id: the id minus a leading 'streams/' prefix is the key.
+  if (match.eventId !== undefined) return match.eventId.replace(/^streams\//, '')
+  // No event id: synthesize a legacy key from a hash of the excerpt.
+  // NOTE(review): streamIndexItem hashes the full legacy `event.text`; this key
+  // only resolves in the index if `match.excerpt` is that same text — confirm.
+  return `${match.date}#legacy-${hashContent(match.excerpt).slice(0, 12)}`
+}
+// Namespaces a key by its source so slugs and stream keys cannot collide in
+// the shared index/fusion maps.
+function laneKey(source: 'topic' | 'stream' | 'reference', key: string): string {
+  return source + ':' + key
+}
+// Returns the first seven lines of the trimmed body, or `fallback` when the
+// body is empty or whitespace-only.
+function excerpt(body: string, fallback: string): string {
+  const text = body.trim()
+  if (text === '') return fallback
+  // split's limit keeps only the leading seven pieces.
+  return text.split('\n', 7).join('\n')
+}
+// Hex-encoded SHA-256 digest of `content`.
+function hashContent(content: string): string {
+  const hasher = createHash('sha256')
+  hasher.update(content)
+  return hasher.digest('hex')
+}

package/src/bundled-plugins/memory/vector/index-on-write.ts ADDED Viewed

@@ -0,0 +1,34 @@
+import { fragmentContentHash } from '../fragment-parser'
+import type { FragmentEvent } from '../stream-events'
+import type { FragmentsAppendedContext } from '../stream-io'
+import { embed, EMBEDDING_MODEL_ID } from './embedder'
+import type { EmbedFn } from './hybrid'
+import type { VectorStore } from './store'
+/**
+ * Builds the hook that embeds newly appended stream fragments and upserts
+ * them into the vector store.
+ *
+ * Fragments are handled one at a time, with one `embedFn` call per fragment
+ * that needs (re-)embedding.
+ *
+ * @param store   Vector store that receives the rows.
+ * @param embedFn Embedding function; defaults to this module's `embed`.
+ * @returns An async hook taking the appended fragments and their append context.
+ */
+export function makeAppendHook(
+  store: VectorStore,
+  embedFn: EmbedFn = embed,
+): (fragments: FragmentEvent[], context: FragmentsAppendedContext) => Promise<void> {
+  return async (fragments, context) => {
+    for (const fragment of fragments) {
+      // Key is `<date>#<fragment id>`; without a context date, the first 10
+      // characters of the fragment timestamp are used (presumably the
+      // YYYY-MM-DD part of an ISO timestamp — confirm).
+      const key = `${context.date ?? fragment.ts.slice(0, 10)}#${fragment.id}`
+      const id = `stream:${key}`
+      const contentHash = fragmentContentHash(fragment)
+      const existing = store.getByIds([id])[0]
+      // Already embedded with identical content under the current model: skip.
+      if (existing?.contentHash === contentHash && existing.model === EMBEDDING_MODEL_ID) continue
+      const text = `${fragment.topic}\n${fragment.body}`
+      const [embedding] = await embedFn([text], 'passage')
+      // No vector came back for this fragment: leave it unindexed.
+      if (embedding === undefined) continue
+      store.upsert({
+        id,
+        source: 'stream',
+        key,
+        model: EMBEDDING_MODEL_ID,
+        dims: embedding.length,
+        embedding,
+        contentHash,
+      })
+    }
+  }
+}

package/src/bundled-plugins/memory/vector/inspect.ts ADDED Viewed

@@ -0,0 +1,111 @@
+import { Database } from 'bun:sqlite'
+import { DIMS, EMBEDDING_MODEL_ID } from './embedder'
+// Read-only health probe for the vector index DB. Deliberately does NOT go
+// through `VectorStore.open`: that path runs `CREATE TABLE IF NOT EXISTS`,
+// which would silently "heal" a DB whose `vectors` table is missing — turning
+// a corruption signal into a no-op. The doctor must observe state, not mutate
+// it, so we open raw, validate the schema ourselves, and never write.
+// Columns the `vectors` table must expose for the index to count as well-formed.
+const EXPECTED_COLUMNS = ['id', 'source', 'key', 'model', 'dims', 'embedding', 'content_hash', 'updated_at'] as const
+// Failure outcomes: the file could not be opened, the integrity probe or a
+// later read failed, or the expected table/columns are absent.
+export type VectorIndexProblem =
+  | { kind: 'unreadable'; detail: string }
+  | { kind: 'corrupt'; detail: string[] }
+  | { kind: 'schema-missing'; detail: string }
+// Full probe outcome. `ok` means the schema is intact; individual rows may
+// still be listed in `modelMismatch` or `malformed`.
+export type VectorIndexFinding =
+  | VectorIndexProblem
+  | { kind: 'ok'; rowCount: number; rowIds: string[]; modelMismatch: string[]; malformed: string[] }
+// Row shapes returned by the probe's queries.
+type IntegrityRow = { result: string }
+type SchemaRow = { name: string }
+type RowMeta = { id: string; model: string; dims: number; embeddingBytes: number }
+/**
+ * Opens the vector index at `dbPath` read-only and reports its health.
+ *
+ * Checks run in order: open, quick_check, `vectors` table present, expected
+ * columns present, then per-row classification. The first failing check
+ * determines the returned finding. The handle is always closed before returning.
+ *
+ * @param dbPath Path of the SQLite file to inspect.
+ * @returns `unreadable`, `corrupt`, `schema-missing`, or `ok` with row details.
+ */
+export function inspectVectorIndex(dbPath: string): VectorIndexFinding {
+  let db: Database
+  try {
+    db = new Database(dbPath, { readonly: true })
+  } catch (err) {
+    return { kind: 'unreadable', detail: messageOf(err) }
+  }
+  try {
+    const corruption = runQuickCheck(db)
+    if (corruption !== null) return { kind: 'corrupt', detail: corruption }
+    if (!hasVectorsTable(db)) {
+      return { kind: 'schema-missing', detail: 'vectors table is absent' }
+    }
+    const missingColumns = missingVectorColumns(db)
+    if (missingColumns.length > 0) {
+      return { kind: 'schema-missing', detail: `vectors table missing columns: ${missingColumns.join(', ')}` }
+    }
+    return classifyRows(db)
+  } catch (err) {
+    // A read that throws after the DB opened (e.g. a malformed page surfaced
+    // mid-scan that quick_check's reduced set of checks did not catch) is
+    // corruption, not an unreadable file — the file opened fine.
+    return { kind: 'corrupt', detail: [messageOf(err)] }
+  } finally {
+    db.close()
+  }
+}
+// Runs SQLite's quick_check. Returns null for a healthy DB, otherwise the
+// reported problem lines.
+function runQuickCheck(db: Database): string[] | null {
+  // quick_check over integrity_check: per the SQLite docs, quick_check skips
+  // UNIQUE-constraint verification and the index-vs-table content comparison,
+  // so it runs in O(N) where integrity_check needs O(N log N) — the latter can
+  // blow the 5s doctor budget on a large index — while still catching
+  // page-level corruption. A healthy DB returns exactly one row: "ok". SQLite
+  // names the result column after the pragma, hence `quick_check`, aliased to
+  // `result`.
+  const rows = db.query<IntegrityRow, []>('SELECT quick_check AS result FROM pragma_quick_check').all()
+  if (rows.length === 1 && rows[0]?.result === 'ok') return null
+  return rows.map((row) => row.result)
+}
+// True when sqlite_master lists a table named `vectors`.
+function hasVectorsTable(db: Database): boolean {
+  const lookup = db.query<SchemaRow, [string]>("SELECT name FROM sqlite_master WHERE type = 'table' AND name = ?")
+  const found = lookup.get('vectors')
+  return found !== null
+}
+// Lists the expected columns that `PRAGMA table_info(vectors)` does not
+// report, in EXPECTED_COLUMNS order.
+function missingVectorColumns(db: Database): string[] {
+  const columnRows = db.query<SchemaRow, []>('PRAGMA table_info(vectors)').all()
+  const present = new Set<string>()
+  for (const { name } of columnRows) present.add(name)
+  return EXPECTED_COLUMNS.filter((column) => !present.has(column))
+}
+// Scans every row's metadata (ordered by id) and sorts problem rows into two
+// buckets: rows stored under a different model/dimension, and rows whose BLOB
+// size cannot hold `dims` Float32 values.
+function classifyRows(db: Database): VectorIndexFinding {
+  const sql = 'SELECT id, model, dims, length(embedding) AS embeddingBytes FROM vectors ORDER BY id'
+  const rows = db.query<RowMeta, []>(sql).all()
+  // Float32 → 4 bytes per dimension.
+  const BYTES_PER_FLOAT32 = 4
+  const modelMismatch: string[] = []
+  const malformed: string[] = []
+  for (const { id, model, dims, embeddingBytes } of rows) {
+    const matchesCurrentModel = model === EMBEDDING_MODEL_ID && dims === DIMS
+    if (!matchesCurrentModel) {
+      // Mismatched rows are not size-checked.
+      modelMismatch.push(id)
+    } else if (embeddingBytes !== dims * BYTES_PER_FLOAT32) {
+      // The BLOB cannot decode to a valid embedding of `dims` floats.
+      malformed.push(id)
+    }
+  }
+  return { kind: 'ok', rowCount: rows.length, rowIds: rows.map((row) => row.id), modelMismatch, malformed }
+}
+// Human-readable text for a caught value: an Error's message, otherwise the
+// value's string conversion.
+function messageOf(err: unknown): string {
+  if (err instanceof Error) return err.message
+  return String(err)
+}