npm - @kitlangton/motel - Versions diffs - 0.1.2 → 0.2.0 - Mend

@kitlangton/motel 0.1.2 → 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (22) hide show

package/AGENTS.md +6 -1
package/package.json +1 -1
package/src/App.tsx +6 -0
package/src/domain.ts +46 -4
package/src/httpApi.ts +4 -1
package/src/localServer.ts +1 -0
package/src/services/TelemetryStore.ts +209 -10
package/src/services/TraceQueryService.ts +1 -1
package/src/telemetry.test.ts +33 -0
package/src/ui/TraceDetailsPane.tsx +33 -2
package/src/ui/Waterfall.tsx +56 -29
package/src/ui/app/TraceWorkspace.tsx +9 -5
package/src/ui/app/useTraceScreenData.ts +31 -9
package/src/ui/filterParser.test.ts +56 -0
package/src/ui/filterParser.ts +45 -0
package/src/ui/primitives.tsx +20 -8
package/src/ui/state.ts +32 -2
package/src/ui/useKeyboardNav.ts +191 -10
package/src/ui/waterfallFilter.test.ts +84 -0
package/src/ui/waterfallFilter.ts +59 -0
package/web/dist/assets/{index-DKinj-OE.js → index-DnyVo03x.js} +1 -1
package/web/dist/index.html +1 -1

package/AGENTS.md CHANGED Viewed

@@ -146,7 +146,12 @@
 - `[` / `]`: switch services
 - `s`: cycle sort mode (recent → slowest → errors)
 - `t`: cycle theme (motel-default → tokyo-night → catppuccin)
-- `/`: enter filter mode (type to match on root operation name; `:error` restricts to failing traces)
+- `/`: enter filter mode.
+  - **In the trace list (L0)** the input matches against the root operation name. Composable modifiers:
+    - `:error` — restrict to traces with at least one failed span (client-side)
+    - `:ai <query>` — FTS5-backed search against LLM prompt/response/tool content (`AI_FTS_KEYS`) across every span in the trace. Tokens are prefix-matched and implicitly AND'd. Debounced 250ms.
+    - Modifiers compose: `/ :ai rate limit :error`
+  - **In the waterfall (L1/L2)** the input runs a client-side substring match against each span's operation name and tag values. Non-matching spans are dimmed; the filter bar shows the live match count. `enter` commits (dim persists while you navigate); `esc` clears.
 - `f`: open attribute filter picker (browse span-attribute keys → values for the current service; `backspace` walks back to keys; `esc` in the trace list clears the active filter)
 - `a`: pause or resume auto-refresh
 - `r`: refresh now

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@kitlangton/motel",
-  "version": "0.1.2",
+  "version": "0.2.0",
   "description": "A local OpenTelemetry ingest + TUI viewer for development, backed by SQLite.",
   "type": "module",
   "license": "MIT",

package/src/App.tsx CHANGED Viewed

@@ -15,6 +15,8 @@ import {
 	noticeAtom,
 	persistSelectedTheme,
 	selectedThemeAtom,
+	waterfallFilterModeAtom,
+	waterfallFilterTextAtom,
 } from "./ui/state.ts"
 import { applyTheme, colors, SEPARATOR, themeLabel } from "./ui/theme.ts"
 import { getVisibleSpans } from "./ui/Waterfall.tsx"
@@ -57,6 +59,8 @@ export const App = () => {
 	const [pickerInput] = useAtom(attrPickerInputAtom)
 	const [pickerIndex] = useAtom(attrPickerIndexAtom)
 	const [attrFacets] = useAtom(attrFacetStateAtom)
+	const [waterfallFilterMode] = useAtom(waterfallFilterModeAtom)
+	const [waterfallFilterText] = useAtom(waterfallFilterTextAtom)
 	useAttrFilterPicker(activeAttrKey)
 	const layout = useAppLayout({ width, height, notice, detailView, selectedSpanIndex })
@@ -179,6 +183,8 @@ export const App = () => {
 				detailView={detailView}
 				filterMode={filterMode}
 				filterText={filterText}
+				waterfallFilterMode={waterfallFilterMode}
+				waterfallFilterText={waterfallFilterText}
 				traceListProps={traceListProps}
 				selectedTraceService={selectedTraceService}
 				serviceLogState={serviceLogState}

package/src/domain.ts CHANGED Viewed

@@ -145,14 +145,56 @@ export const AI_ATTR_MAP = {
 	responseTimestamp: "ai.response.timestamp",
 } as const
-/** Attribute keys to search across when using the `text` filter */
-export const AI_TEXT_SEARCH_KEYS = [
-	"ai.prompt.messages",
+/**
+ * Attribute keys that carry LLM prompt/response content and should be
+ * indexed in the span-attribute FTS table. These are the keys emitted by
+ * well-known LLM instrumentation conventions:
+ *
+ * - **Vercel AI SDK** (`ai.*`): rich, SDK-specific attributes captured by
+ *   `experimental_telemetry` on `generateText` / `streamText` / `generateObject`.
+ * - **OpenTelemetry GenAI semantic conventions** (`gen_ai.*`): the
+ *   cross-vendor standard. The singular `prompt`/`completion` attrs are
+ *   deprecated in favor of event-based capture but are still emitted by
+ *   most instrumentations, so we keep them.
+ * - **OpenInference** (`input.value` / `output.value`): Arize Phoenix /
+ *   LangChain-style normalized input/output.
+ *
+ * Keys here trigger FTS indexing on insert via a trigger in TelemetryStore.
+ * Adding a key requires a one-time backfill; removing one leaves orphan
+ * FTS entries that get cleaned up on next retention pass.
+ */
+export const AI_FTS_KEYS = [
+	// Vercel AI SDK
 	"ai.prompt",
-	"ai.response.text",
+	"ai.prompt.messages",
 	"ai.prompt.tools",
+	"ai.prompt.toolChoice",
+	"ai.response.text",
+	"ai.response.toolCalls",
+	"ai.response.reasoning",
+	"ai.response.object",
+	"ai.toolCall.args",
+	"ai.toolCall.result",
+	// OpenTelemetry GenAI semantic conventions
+	"gen_ai.prompt",
+	"gen_ai.completion",
+	"gen_ai.input.messages",
+	"gen_ai.output.messages",
+	"gen_ai.system_instructions",
+	"gen_ai.tool.definitions",
+	"gen_ai.tool.message.content",
+	// OpenInference (Phoenix, LangChain, etc.)
+	"input.value",
+	"output.value",
 ] as const
+/**
+ * Back-compat alias. The `text` filter on `/api/ai/calls` historically
+ * LIKE-searched these four keys; now FTS indexes the broader AI_FTS_KEYS
+ * set so the filter transparently covers more content.
+ */
+export const AI_TEXT_SEARCH_KEYS = AI_FTS_KEYS
 const PREVIEW_LENGTH = 200
 export const truncatePreview = (value: string | null | undefined): string | null => {

package/src/httpApi.ts CHANGED Viewed

@@ -121,6 +121,9 @@ export const MotelHttpApi = HttpApi.make("MotelTelemetry")
 						minDurationMs: Schema.optionalKey(Schema.Number).pipe(
 							Schema.annotateKey({ description: "Only return traces slower than this threshold (milliseconds)" }),
 						),
+						aiText: Schema.optionalKey(Schema.String).pipe(
+							Schema.annotateKey({ description: "FTS match against AI prompt/response/tool content across all spans in the trace. Tokens are prefix-matched and implicitly AND'd." }),
+						),
 						lookback: LookbackParam,
 						limit: LimitParam,
 						cursor: CursorParam,
@@ -128,7 +131,7 @@ export const MotelHttpApi = HttpApi.make("MotelTelemetry")
 					success: TraceSummaryList,
 				})
 					.annotate(OpenApi.Summary, "Search traces with filters")
-					.annotate(OpenApi.Description, "Search compact trace summaries with filters. Use /api/traces/{traceId} for full details. Supports cursor pagination and attr.<key> filters in the query string."),
+					.annotate(OpenApi.Description, "Search compact trace summaries with filters. Use /api/traces/{traceId} for full details. Supports cursor pagination, attr.<key> filters in the query string, and aiText for full-text search across LLM prompt/response content."),
 				HttpApiEndpoint.get("traceStats", "/api/traces/stats", {
 					query: {

package/src/localServer.ts CHANGED Viewed

@@ -335,6 +335,7 @@ const TelemetryGroupLive = HttpApiBuilder.group(
 							status: (url.searchParams.get("status") as "ok" | "error" | null) ?? null,
 							minDurationMs: url.searchParams.get("minDurationMs") ? Number.parseFloat(url.searchParams.get("minDurationMs") ?? "") : null,
 							attributeFilters,
+							aiText: url.searchParams.get("aiText"),
 							limit: limit + 1,
 							lookbackMinutes,
 							cursorStartedAtMs: cursor?.kind === "trace" ? cursor.startedAt : undefined,

package/src/services/TelemetryStore.ts CHANGED Viewed

@@ -4,7 +4,7 @@ import { dirname } from "node:path"
 import { Clock, Effect, Layer, Schedule, Context } from "effect"
 import { config } from "../config.js"
 import type { AiCallDetail, AiCallSummary, FacetItem, LogItem, SpanItem, StatsItem, TraceItem, TraceSummaryItem, TraceSpanEvent, TraceSpanItem } from "../domain.js"
-import { AI_ATTR_MAP, AI_TEXT_SEARCH_KEYS, truncatePreview } from "../domain.js"
+import { AI_ATTR_MAP, AI_FTS_KEYS, AI_TEXT_SEARCH_KEYS, truncatePreview } from "../domain.js"
 import { attributeMap, nanosToMilliseconds, parseAnyValue, spanKindLabel, spanStatusLabel, stringifyValue, type OtlpLogExportRequest, type OtlpTraceExportRequest } from "../otlp.js"
 interface SpanRow {
@@ -57,6 +57,13 @@ interface TraceSearch {
 	readonly status?: "ok" | "error" | null
 	readonly minDurationMs?: number | null
 	readonly attributeFilters?: Readonly<Record<string, string>>
+	/**
+	 * Full-text match against the AI prompt/response/tool attribute values
+	 * on any span in the trace (see AI_FTS_KEYS). When set, traces are
+	 * filtered to those containing at least one span whose indexed LLM
+	 * content matches. Powered by span_attr_fts (FTS5).
+	 */
+	readonly aiText?: string | null
 	readonly lookbackMinutes?: number
 	readonly limit?: number
 	readonly cursorStartedAtMs?: number
@@ -163,6 +170,15 @@ const parseSummaryRow = (row: TraceSummaryRow): TraceSummaryItem => ({
 	warnings: [],
 })
+// Skip attribute facet rows whose value blob is longer than this. Prevents
+// multi-MB text attrs (ai.prompt, ai.prompt.messages, etc.) from dominating
+// picker-open time — SQLite skips reading those pages from disk when the
+// length predicate is evaluated against the page header, taking queries over
+// a 2GB database from ~1.2s down to ~370ms. Keys whose values are ALL fat
+// simply don't appear in the picker, which is the desired behaviour: you'd
+// never want to filter traces by exact-match on a 1MB prompt blob anyway.
+const FACET_VALUE_MAX_LEN = 512
 const TRACE_SUMMARY_SELECT_SQL = `
 	SELECT
 		trace_id,
@@ -437,13 +453,30 @@ export const TelemetryStoreLive = Layer.effect(
 		mkdirSync(dirname(config.otel.databasePath), { recursive: true })
 		const db = yield* Effect.acquireRelease(
 			Effect.sync(() => new Database(config.otel.databasePath, { create: true })),
-			(db) => Effect.sync(() => db.close()),
+			(db) => Effect.sync(() => {
+				// `PRAGMA optimize` at close persists any stats SQLite gathered
+				// during the session, so the next process start gets an accurate
+				// query planner on the first query instead of a 3-second cold
+				// run. Cheap: it skips work unless stats have drifted.
+				try { db.exec(`PRAGMA optimize;`) } catch { /* nothing */ }
+				db.close()
+			}),
 		)
 		db.exec(`
 			PRAGMA journal_mode = WAL;
 			PRAGMA synchronous = NORMAL;
 			PRAGMA temp_store = MEMORY;
 			PRAGMA busy_timeout = 5000;
+			-- Bump cache above the 2MB default. 64MB fits most hot index pages
+			-- (trace_summaries, spans, span_attributes indexes) in RAM even on
+			-- multi-GB databases, cutting cold-read latency meaningfully on
+			-- picker / search queries that sweep the index.
+			PRAGMA cache_size = -65536;
+			-- Let SQLite memory-map the first 256MB of the file. This is a
+			-- cheap way to avoid read() syscalls on hot pages and lets the OS
+			-- page cache serve index lookups directly. Safe on macOS and Linux;
+			-- SQLite silently caps at actual file size for smaller DBs.
+			PRAGMA mmap_size = 268435456;
 			CREATE TABLE IF NOT EXISTS spans (
 				trace_id TEXT NOT NULL,
@@ -545,12 +578,90 @@ export const TelemetryStoreLive = Layer.effect(
 			// FTS is optional; queries will fall back to LIKE if unavailable.
 		}
+		// External-content FTS5 over the subset of span_attributes.value rows
+		// whose key is in AI_FTS_KEYS (LLM prompts, responses, tool calls,
+		// etc.). External content means the inverted index is the only
+		// FTS storage — the value text itself continues to live once in
+		// span_attributes, not duplicated into the FTS table. On a 2 GB DB
+		// with 270 MB of prompt JSON this typically adds ~50-120 MB of
+		// index, turning a 500-800ms LIKE scan into a <50ms MATCH.
+		//
+		// Keys are inlined into the trigger DDL rather than looked up in a
+		// side table so the `WHEN` guard stays constant-cost (a subquery
+		// would run on every span_attributes insert — ~60/span).
+		let hasAttrFts = hasFts
+		if (hasFts) {
+			try {
+				const keyList = AI_FTS_KEYS.map((k) => `'${k.replace(/'/g, "''")}'`).join(", ")
+				db.exec(`
+					CREATE VIRTUAL TABLE IF NOT EXISTS span_attr_fts USING fts5(
+						value,
+						content='span_attributes',
+						content_rowid='rowid',
+						tokenize='unicode61 remove_diacritics 2'
+					);
+					-- Mirror inserts into FTS when the key carries LLM content.
+					-- NOTE: triggers MUST use fully-qualified name (new.rowid,
+					-- new.value) and emit rowid so external-content FTS can
+					-- fetch the value back via span_attributes.rowid.
+					CREATE TRIGGER IF NOT EXISTS span_attr_fts_ai AFTER INSERT ON span_attributes
+					WHEN new.key IN (${keyList})
+					BEGIN
+						INSERT INTO span_attr_fts(rowid, value) VALUES (new.rowid, new.value);
+					END;
+					-- Delete with the same guard so retention & re-ingest stay
+					-- in sync. External-content 'delete' command needs the
+					-- original value to remove from the inverted index.
+					CREATE TRIGGER IF NOT EXISTS span_attr_fts_ad AFTER DELETE ON span_attributes
+					WHEN old.key IN (${keyList})
+					BEGIN
+						INSERT INTO span_attr_fts(span_attr_fts, rowid, value)
+						VALUES ('delete', old.rowid, old.value);
+					END;
+					-- Handle in-place updates (rare; re-ingest usually goes
+					-- DELETE then INSERT but belt-and-braces).
+					CREATE TRIGGER IF NOT EXISTS span_attr_fts_au AFTER UPDATE ON span_attributes
+					WHEN old.key IN (${keyList}) OR new.key IN (${keyList})
+					BEGIN
+						INSERT INTO span_attr_fts(span_attr_fts, rowid, value)
+						VALUES ('delete', old.rowid, old.value);
+						INSERT INTO span_attr_fts(rowid, value)
+						SELECT new.rowid, new.value
+						WHERE new.key IN (${keyList});
+					END;
+				`)
+			} catch {
+				hasAttrFts = false
+			}
+		}
 		try {
 			db.exec(`ALTER TABLE trace_summaries ADD COLUMN active_span_count INTEGER NOT NULL DEFAULT 0`)
 		} catch {
 			// Existing databases may already have the column.
 		}
+		// Prime the query planner. `PRAGMA optimize` is SQLite's modern,
+		// lightweight stats refresh: it only re-ANALYZEs indexes whose row
+		// counts have drifted significantly since the last run, capped at
+		// `analysis_limit` iterations per index so it finishes in a
+		// bounded time even on large databases. Without this, queries like
+		// the attribute picker facet run with guessed row estimates and
+		// pay 3-4s on cold open instead of 400ms.
+		try {
+			db.exec(`PRAGMA analysis_limit = 1000; PRAGMA optimize;`)
+			// First-time databases won't have sqlite_stat1 until we run a
+			// real ANALYZE. Force it once if stats haven't been collected.
+			const hasStats = db.query(`SELECT 1 FROM sqlite_master WHERE name = 'sqlite_stat1' LIMIT 1`).get() !== null
+			if (!hasStats) db.exec(`ANALYZE;`)
+		} catch {
+			// ANALYZE / optimize failures are never fatal — queries still work,
+			// they just run with default row estimates.
+		}
 		const insertSpan = db.query(`
 			INSERT INTO spans (
 				trace_id, span_id, parent_span_id, service_name, scope_name, operation_name, kind,
@@ -687,6 +798,47 @@ export const TelemetryStoreLive = Layer.effect(
 		// Run cleanup every 60 seconds in the background, tied to the layer's scope
 		yield* Effect.forkScoped(Effect.repeat(cleanupExpired(), Schedule.spaced("60 seconds")))
+		// Periodically refresh query planner stats. `PRAGMA optimize` is a
+		// no-op when nothing has changed, so this is essentially free on idle
+		// servers and keeps facet/search planner estimates accurate as data
+		// grows. 15 minutes is slower than ingestion rates we care about but
+		// frequent enough that the attribute picker stays snappy.
+		const refreshPlannerStats = Effect.sync(() => {
+			try { db.exec(`PRAGMA optimize;`) } catch { /* ignore */ }
+		})
+		yield* Effect.forkScoped(Effect.repeat(refreshPlannerStats, Schedule.spaced("15 minutes")))
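+		// One-time backfill for existing DBs: if span_attr_fts is empty but
+		// span_attributes has rows with AI_FTS_KEYS, populate the index.
+		// Runs forked so server startup isn't blocked; queries hitting the
+		// FTS will just return empty until the fill lands. On a 2 GB DB with
+		// ~400 matching rows this takes ~3-8 seconds.
+		// NOTE(review): span_attr_fts is an external-content table, so a
+		// plain `SELECT COUNT(*)` on it may be answered from span_attributes
+		// rather than from the index — confirm the emptiness check below
+		// really detects an unpopulated index.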
+		if (hasAttrFts) {
+			const backfillAttrFts = Effect.sync(() => {
+				try {
+					const ftsCount = (db.query(`SELECT COUNT(*) AS c FROM span_attr_fts`).get() as { c: number }).c
+					if (ftsCount > 0) return
+					const keyList = AI_FTS_KEYS.map((k) => `'${k.replace(/'/g, "''")}'`).join(", ")
+					const attrCount = (db.query(
+						`SELECT COUNT(*) AS c FROM span_attributes WHERE key IN (${keyList})`,
+					).get() as { c: number }).c
+					if (attrCount === 0) return
+					// Single INSERT..SELECT is atomic and fast; FTS5 batches
+					// its internal segment writes. No transaction wrapper
+					// needed — it runs as one statement.
+					db.exec(`
+						INSERT INTO span_attr_fts(rowid, value)
+						SELECT rowid, value FROM span_attributes WHERE key IN (${keyList})
+					`)
+				} catch {
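+					// Backfill failure is never fatal — new ingests still
+					// populate FTS via the trigger. Rows that predate the
+					// index stay unsearchable through FTS, though: the LIKE
+					// fallback is only used when FTS is unavailable or the
+					// query tokenizes empty, not when MATCH returns no rows.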
+				}
+			})
+			yield* Effect.forkScoped(backfillAttrFts)
+		}
 		const ingestTraces = Effect.fn("motel/TelemetryStore.ingestTraces")(function* (payload: OtlpTraceExportRequest) {
 			return yield* Effect.sync(() => {
 				let insertedSpans = 0
@@ -911,6 +1063,25 @@ export const TelemetryStoreLive = Layer.effect(
 					params.push(...exactAttrMatch.params)
 				}
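+				// `:ai <query>` — FTS match against LLM content keys. Joins
+				// span_attr_fts back to span_attributes to collect trace_ids
+				// whose spans carry matching prompt/response content. Falls
+				// through to no-op when the query tokenizes empty (e.g. only
+				// stopwords or operator-chars) so users don't get a silently
+				// empty list.
+				// Also a no-op when the attribute FTS index is unavailable
+				// (hasAttrFts is false): there is no LIKE fallback here, so
+				// the filter is ignored rather than approximated.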
+				if (input.aiText) {
+					const aiFtsQuery = toFtsMatchQuery(input.aiText)
+					if (hasAttrFts && aiFtsQuery) {
+						clauses.push(`trace_id IN (
+							SELECT DISTINCT sa.trace_id
+							FROM span_attr_fts fts
+							JOIN span_attributes sa ON sa.rowid = fts.rowid
+							WHERE fts.value MATCH ?
+						)`)
+						params.push(aiFtsQuery)
+					}
+				}
 				const rows = db.query(`
 					SELECT trace_id, service_name, root_operation_name, started_at_ms, ended_at_ms, active_span_count, duration_ms, span_count, error_count
 					FROM trace_summaries
@@ -1463,7 +1634,14 @@ export const TelemetryStoreLive = Layer.effect(
 						// user id, model) rank higher than keys that are constant across every
 						// trace (service.name, telemetry.sdk.*) — the latter can't discriminate
 						// between traces so they're useless as filters.
-						const params: Array<string | number> = [cutoff]
+						//
+						// Performance note: we skip rows whose value blob is larger than
+						// FACET_VALUE_MAX_LEN. For opencode this hides `ai.prompt`,
+						// `ai.prompt.messages`, and `ai.prompt.tools` — which are 1-6MB text
+						// blobs that you'd never want to filter by exact match anyway. The
+						// WHERE clause lets SQLite skip reading those pages from disk, taking
+						// the picker open time from ~1.2s to ~370ms on a 2GB database.
+						const params: Array<string | number> = [FACET_VALUE_MAX_LEN, cutoff]
 						if (input.serviceName) params.push(input.serviceName)
 						params.push(limit)
 						const rows = db.query(`
@@ -1472,7 +1650,8 @@ export const TelemetryStoreLive = Layer.effect(
 							       COUNT(DISTINCT sa.value) AS distinct_values
 							FROM span_attributes sa
 							JOIN spans s ON s.trace_id = sa.trace_id AND s.span_id = sa.span_id
-							WHERE s.start_time_ms >= ?
+							WHERE LENGTH(sa.value) < ?
+							  AND s.start_time_ms >= ?
 							${input.serviceName ? "AND s.service_name = ?" : ""}
 							GROUP BY sa.key
 							ORDER BY (CASE WHEN distinct_values = 1 THEN 1 ELSE 0 END) ASC,
@@ -1485,14 +1664,18 @@ export const TelemetryStoreLive = Layer.effect(
 					}
 					if (input.field === "attribute_values") {
 						if (!input.key) return [] as FacetItem[]
-						const params: Array<string | number> = [input.key, cutoff]
+						// Skip multi-KB values here too — they blow up GROUP BY on big text.
+						// Matches the attribute_keys pre-filter so the picker stays responsive
+						// if someone hand-crafts a URL that targets a fat key.
+						const params: Array<string | number> = [input.key, FACET_VALUE_MAX_LEN, cutoff]
 						if (input.serviceName) params.push(input.serviceName)
 						params.push(limit)
 						const rows = db.query(`
 							SELECT sa.value AS value, COUNT(DISTINCT sa.trace_id) AS count
 							FROM span_attributes sa
 							JOIN spans s ON s.trace_id = sa.trace_id AND s.span_id = sa.span_id
-							WHERE sa.key = ? AND s.start_time_ms >= ?
+							WHERE sa.key = ? AND LENGTH(sa.value) < ?
+							  AND s.start_time_ms >= ?
 							${input.serviceName ? "AND s.service_name = ?" : ""}
 							GROUP BY sa.value
 							ORDER BY count DESC, value ASC
@@ -1558,11 +1741,27 @@ export const TelemetryStoreLive = Layer.effect(
 				params.push(key, value)
 			}
-			// Text search across prompt/response/tool attribute values
+			// Text search across prompt/response/tool attribute values via
+			// FTS5. Prefers the external-content span_attr_fts index when
+			// available, falls back to case-insensitive LIKE so old DBs
+			// without FTS still work. FTS turns ~500ms full scans of 3 MB
+			// prompt JSON into <50ms MATCH lookups.
 			if ("text" in input && input.text) {
-				const textKeys = AI_TEXT_SEARCH_KEYS.map(() => "?").join(", ")
-				clauses.push(`EXISTS (SELECT 1 FROM span_attributes WHERE span_attributes.trace_id = s.trace_id AND span_attributes.span_id = s.span_id AND key IN (${textKeys}) AND value LIKE ? COLLATE NOCASE)`)
-				params.push(...AI_TEXT_SEARCH_KEYS, `%${input.text}%`)
+				const ftsQuery = toFtsMatchQuery(input.text)
+				if (hasAttrFts && ftsQuery) {
+					clauses.push(`EXISTS (
+						SELECT 1 FROM span_attr_fts fts
+						JOIN span_attributes sa ON sa.rowid = fts.rowid
+						WHERE sa.trace_id = s.trace_id
+						AND sa.span_id = s.span_id
+						AND fts.value MATCH ?
+					)`)
+					params.push(ftsQuery)
+				} else {
+					const textKeys = AI_TEXT_SEARCH_KEYS.map(() => "?").join(", ")
+					clauses.push(`EXISTS (SELECT 1 FROM span_attributes WHERE span_attributes.trace_id = s.trace_id AND span_attributes.span_id = s.span_id AND key IN (${textKeys}) AND value LIKE ? COLLATE NOCASE)`)
+					params.push(...AI_TEXT_SEARCH_KEYS, `%${input.text}%`)
+				}
 			}
 			return { clauses, params }

package/src/services/TraceQueryService.ts CHANGED Viewed

@@ -8,7 +8,7 @@ export class TraceQueryService extends Context.Service<
 		readonly listServices: Effect.Effect<readonly string[], Error>
 		readonly listRecentTraces: (serviceName: string, options?: { readonly lookbackMinutes?: number; readonly limit?: number }) => Effect.Effect<readonly TraceItem[], Error>
 		readonly listTraceSummaries: (serviceName: string, options?: { readonly lookbackMinutes?: number; readonly limit?: number }) => Effect.Effect<readonly TraceSummaryItem[], Error>
-		readonly searchTraceSummaries: (input: { readonly serviceName?: string | null; readonly operation?: string | null; readonly status?: "ok" | "error" | null; readonly minDurationMs?: number | null; readonly lookbackMinutes?: number; readonly limit?: number; readonly attributeFilters?: Readonly<Record<string, string>> }) => Effect.Effect<readonly TraceSummaryItem[], Error>
+		readonly searchTraceSummaries: (input: { readonly serviceName?: string | null; readonly operation?: string | null; readonly status?: "ok" | "error" | null; readonly minDurationMs?: number | null; readonly lookbackMinutes?: number; readonly limit?: number; readonly attributeFilters?: Readonly<Record<string, string>>; readonly aiText?: string | null }) => Effect.Effect<readonly TraceSummaryItem[], Error>
 		readonly listFacets: (input: { readonly type: "traces" | "logs"; readonly field: string; readonly serviceName?: string | null; readonly key?: string | null; readonly lookbackMinutes?: number; readonly limit?: number }) => Effect.Effect<readonly { readonly value: string; readonly count: number }[], Error>
 		readonly searchTraces: (input: { readonly serviceName?: string | null; readonly operation?: string | null; readonly status?: "ok" | "error" | null; readonly minDurationMs?: number | null; readonly lookbackMinutes?: number; readonly limit?: number; readonly attributeFilters?: Readonly<Record<string, string>> }) => Effect.Effect<readonly TraceItem[], Error>
 		readonly traceStats: (input: { readonly groupBy: string; readonly agg: "count" | "avg_duration" | "p95_duration" | "error_rate"; readonly serviceName?: string | null; readonly operation?: string | null; readonly status?: "ok" | "error" | null; readonly minDurationMs?: number | null; readonly lookbackMinutes?: number; readonly limit?: number; readonly attributeFilters?: Readonly<Record<string, string>> }) => Effect.Effect<readonly { readonly group: string; readonly value: number; readonly count: number }[], Error>

package/src/telemetry.test.ts CHANGED Viewed

@@ -651,6 +651,39 @@ describe("motel telemetry store", () => {
 		expect(result[0]?.spanId).toBe("ai-stream-1")
 	})
+	it("matches AI calls via words in the response text", async () => {
+		// Verifies FTS indexes ai.response.text, not just ai.prompt*. The
+		// seeded ai-stream-2 has response "Error: rate limited".
+		const result = await storeRuntime.runPromise(
+			Effect.flatMap(TelemetryStore.asEffect(), (store) =>
+				store.searchAiCalls({ text: "rate limited" }),
+			).pipe(Effect.provideService(References.MinimumLogLevel, "None")),
+		)
+		expect(result.map((r) => r.spanId)).toContain("ai-stream-2")
+	})
+	it("matches AI calls case-insensitively and with partial words", async () => {
+		// unicode61 tokenizer is case-insensitive by default; prefix `*`
+		// handles partial terms like `"PROG"` matching `"programming"`.
+		const result = await storeRuntime.runPromise(
+			Effect.flatMap(TelemetryStore.asEffect(), (store) =>
+				store.searchAiCalls({ text: "PROG" }),
+			).pipe(Effect.provideService(References.MinimumLogLevel, "None")),
+		)
+		expect(result.map((r) => r.spanId)).toContain("ai-stream-1")
+	})
+	it("ignores FTS special characters without syntax errors", async () => {
+		// FTS5 treats `"`, `*`, `-`, `:` as operators; toFtsMatchQuery must
+		// strip them so raw user input never crashes the query.
+		const result = await storeRuntime.runPromise(
+			Effect.flatMap(TelemetryStore.asEffect(), (store) =>
+				store.searchAiCalls({ text: `"joke" - about:programming*` }),
+			).pipe(Effect.provideService(References.MinimumLogLevel, "None")),
+		)
+		expect(result.map((r) => r.spanId)).toContain("ai-stream-1")
+	})
 	it("filters AI calls by operation type", async () => {
 		const result = await storeRuntime.runPromise(
 			Effect.flatMap(TelemetryStore.asEffect(), (store) =>

package/src/ui/TraceDetailsPane.tsx CHANGED Viewed

@@ -1,8 +1,9 @@
 import { useMemo } from "react"
 import type { TraceItem, TraceSummaryItem } from "../domain.ts"
 import { formatDuration, formatShortDate, formatTimestamp } from "./format.ts"
-import { AlignedHeaderLine, Divider, PlainLine, TextLine } from "./primitives.tsx"
+import { AlignedHeaderLine, Divider, FilterBar, PlainLine, TextLine } from "./primitives.tsx"
 import { getVisibleSpans, WaterfallTimeline } from "./Waterfall.tsx"
+import { computeMatchingSpanIds } from "./waterfallFilter.ts"
 import type { LoadStatus, LogState } from "./state.ts"
 import { colors, SEPARATOR } from "./theme.ts"
@@ -30,6 +31,8 @@ export const TraceDetailsPane = ({
 	collapsedSpanIds,
 	focused = false,
 	onSelectSpan,
+	waterfallFilterMode,
+	waterfallFilterText,
 }: {
 	trace: TraceItem | null
 	traceSummary: TraceSummaryItem | null
@@ -43,6 +46,8 @@ export const TraceDetailsPane = ({
 	collapsedSpanIds: ReadonlySet<string>
 	focused?: boolean
 	onSelectSpan: (index: number) => void
+	waterfallFilterMode: boolean
+	waterfallFilterText: string
 }) => {
 	const filteredSpans = useMemo(
 		() => trace ? getVisibleSpans(trace.spans, collapsedSpanIds) : [],
@@ -62,6 +67,15 @@ export const TraceDetailsPane = ({
 		() => selectedSpan ? traceLogsState.data.filter((log) => log.spanId === selectedSpan.spanId) : [],
 		[selectedSpan, traceLogsState.data],
 	)
+	const matchingSpanIds = useMemo(
+		() => trace ? computeMatchingSpanIds(trace.spans, waterfallFilterText) : null,
+		[trace, waterfallFilterText],
+	)
+	const matchCount = matchingSpanIds?.size ?? 0
+	// Reserve 1 row for the filter bar when it's being shown so the
+	// waterfall doesn't spill into the footer.
+	const showFilterBar = waterfallFilterMode || waterfallFilterText.length > 0
+	const waterfallBodyLines = showFilterBar ? Math.max(1, bodyLines - 1) : bodyLines
 	const traceMeta = trace ?? traceSummary
 	const hasTraceSelection = traceSummary !== null
@@ -112,6 +126,22 @@ export const TraceDetailsPane = ({
 						</TextLine>
 					</box>
 					<Divider width={paneWidth} />
+					{showFilterBar ? (
+						<box paddingLeft={1} paddingRight={1}>
+							{waterfallFilterMode ? (
+								<FilterBar text={waterfallFilterText} width={contentWidth} />
+							) : (
+								<TextLine>
+									<span fg={colors.muted}>{"/"}</span>
+									<span fg={colors.text}>{waterfallFilterText}</span>
+									<span fg={colors.separator}>{SEPARATOR}</span>
+									<span fg={colors.count}>{matchCount} match{matchCount === 1 ? "" : "es"}</span>
+									<span fg={colors.separator}>{SEPARATOR}</span>
+									<span fg={colors.muted}>esc clear</span>
+								</TextLine>
+							)}
+						</box>
+					) : null}
 					<box flexDirection="column" paddingLeft={1} paddingRight={1}>
 						<WaterfallTimeline
 							trace={trace}
@@ -119,9 +149,10 @@ export const TraceDetailsPane = ({
 							spanLogCounts={spanLogCounts}
 							selectedSpanLogs={selectedSpanLogs}
 							contentWidth={contentWidth}
-							bodyLines={bodyLines}
+							bodyLines={waterfallBodyLines}
 							selectedSpanIndex={selectedSpanIndex}
 							collapsedSpanIds={collapsedSpanIds}
+							matchingSpanIds={matchingSpanIds}
 							onSelectSpan={onSelectSpan}
 						/>
 					</box>