npm - @cephalization/phoenix-insight - Versions diffs - 0.3.0 → 1.0.0 - Mend

@cephalization/phoenix-insight 0.3.0 → 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (57) hide show

package/README.md +195 -1
package/dist/agent/index.js +9 -4
package/dist/cli.js +172 -0
package/dist/commands/index.js +1 -0
package/dist/commands/report-tool.js +239 -0
package/dist/config/schema.js +2 -2
package/dist/modes/local.js +7 -0
package/dist/modes/sandbox.js +8 -0
package/dist/prompts/index.js +1 -1
package/dist/prompts/system.js +10 -3
package/dist/server/session.js +357 -0
package/dist/server/ui.js +232 -0
package/dist/server/websocket.js +212 -0
package/dist/snapshot/spans.js +28 -4
package/dist/tsconfig.esm.tsbuildinfo +1 -1
package/dist/ui/assets/code-block-F6WJLWQG-BTdTzfvl.js +154 -0
package/dist/ui/assets/code-block-F6WJLWQG-BTdTzfvl.js.map +1 -0
package/dist/ui/assets/index-CX8aDatf.css +1 -0
package/dist/ui/assets/index-DjZuAW6Y.js +63 -0
package/dist/ui/assets/index-DjZuAW6Y.js.map +1 -0
package/dist/ui/assets/vendor-data-r1ZEkUds.js +40 -0
package/dist/ui/assets/vendor-data-r1ZEkUds.js.map +1 -0
package/dist/ui/assets/vendor-react-Cgg2GOmP.js +2 -0
package/dist/ui/assets/vendor-react-Cgg2GOmP.js.map +1 -0
package/dist/ui/assets/vendor-render-DoMl5bum.js +381 -0
package/dist/ui/assets/vendor-render-DoMl5bum.js.map +1 -0
package/dist/ui/assets/vendor-ui-Cg-YC4hK.js +46 -0
package/dist/ui/assets/vendor-ui-Cg-YC4hK.js.map +1 -0
package/dist/ui/index.html +18 -0
package/dist/ui/vite.svg +1 -0
package/package.json +13 -14
package/src/agent/index.ts +0 -323
package/src/cli.ts +0 -854
package/src/commands/index.ts +0 -8
package/src/commands/px-fetch-more-spans.ts +0 -174
package/src/commands/px-fetch-more-trace.ts +0 -183
package/src/config/index.ts +0 -225
package/src/config/loader.ts +0 -173
package/src/config/schema.ts +0 -66
package/src/index.ts +0 -1
package/src/modes/index.ts +0 -21
package/src/modes/local.ts +0 -163
package/src/modes/sandbox.ts +0 -144
package/src/modes/types.ts +0 -31
package/src/observability/index.ts +0 -90
package/src/progress.ts +0 -239
package/src/prompts/index.ts +0 -1
package/src/prompts/system.ts +0 -31
package/src/snapshot/client.ts +0 -129
package/src/snapshot/context.ts +0 -587
package/src/snapshot/datasets.ts +0 -132
package/src/snapshot/experiments.ts +0 -246
package/src/snapshot/index.ts +0 -403
package/src/snapshot/projects.ts +0 -58
package/src/snapshot/prompts.ts +0 -267
package/src/snapshot/spans.ts +0 -142
package/src/snapshot/utils.ts +0 -140

package/src/snapshot/context.ts DELETED Viewed

@@ -1,587 +0,0 @@
-import type { ExecutionMode } from "../modes/types.js";
-/**
- * Snapshot-level facts handed to generateContext.
- * `phoenixUrl` and `snapshotTime` are rendered into the "Snapshot" bullet of the
- * "What's Here" section.
- */
-interface ContextMetadata {
-  phoenixUrl: string;
-  snapshotTime: Date;
-  // NOTE(review): not read anywhere in the visible part of this file
-  spansPerProject?: number;
-}
-/**
- * Per-project summary collected by collectSnapshotStats.
- */
-interface ProjectStats {
-  // Taken from the `name` field of a line in /phoenix/projects/index.jsonl
-  name: string;
-  // Taken from `spanCount` in the project's spans/metadata.json; 0 when unavailable
-  spanCount: number;
-  // NOTE(review): hasErrors and recentSpans are never assigned in the visible code
-  hasErrors?: boolean;
-  recentSpans?: number;
-}
-/**
- * Per-dataset summary collected by collectSnapshotStats.
- */
-interface DatasetInfo {
-  name: string;
-  // Line count of the dataset's examples.jsonl file
-  exampleCount: number;
-  // Copied from the index entry's `updated_at` field; parsed with `new Date(...)` by getRecentActivity
-  updatedAt?: string;
-}
-/**
- * Per-experiment summary collected by collectSnapshotStats from
- * /phoenix/experiments/index.jsonl.
- */
-interface ExperimentInfo {
-  id: string;
-  // Falls back to "unknown" when the index entry has no `datasetName`
-  datasetName: string;
-  projectName?: string;
-  // Derived from the run counts by determineExperimentStatus, not read from the index
-  status: "completed" | "in_progress" | "failed";
-  // Copied from the `*_run_count` fields of the index entry, defaulting to 0
-  runCounts: {
-    successful: number;
-    failed: number;
-    missing: number;
-  };
-  updatedAt?: string;
-}
-/**
- * Per-prompt summary collected by collectSnapshotStats.
- */
-interface PromptInfo {
-  name: string;
-  // Line count of the prompt's versions/index.jsonl file
-  versionCount: number;
-  // NOTE(review): never assigned in the visible code
-  latestVersion?: string;
-  updatedAt?: string;
-}
-// =============================================================================
-// Static Section Templates
-// =============================================================================
-/**
- * Quick Start section for external agents - appears at the top for discoverability.
- *
- * Static markdown that generateContext places directly under the document title.
- * Backticks are escaped because the whole section is a single template literal.
- */
-const QUICK_START_SECTION = `## Quick Start for External Agents
-This is a **read-only snapshot** of Phoenix observability data. You cannot modify this data.
-### Key Files to Start With
-| File | Description |
-|------|-------------|
-| \`/phoenix/projects/index.jsonl\` | List of all projects with traces |
-| \`/phoenix/datasets/index.jsonl\` | List of all datasets |
-| \`/phoenix/experiments/index.jsonl\` | List of all experiments |
-| \`/phoenix/prompts/index.jsonl\` | List of all prompts |
-### How to Parse Each File Format
-**JSONL files** (\`.jsonl\`): One JSON object per line
-\`\`\`bash
-# Read all lines as a JSON array
-cat /phoenix/projects/index.jsonl | jq -s '.'
-# Process each line individually
-while read -r line; do echo "$line" | jq '.name'; done < /phoenix/projects/index.jsonl
-# Get first N items
-head -n 5 /phoenix/projects/index.jsonl | jq -s '.'
-\`\`\`
-**JSON files** (\`.json\`): Standard JSON format
-\`\`\`bash
-# Read and pretty-print
-cat /phoenix/projects/my-project/metadata.json | jq '.'
-# Extract specific field
-cat /phoenix/projects/my-project/metadata.json | jq '.name'
-\`\`\`
-**Markdown files** (\`.md\`): Plain text prompt templates
-\`\`\`bash
-# Read prompt template
-cat /phoenix/prompts/my-prompt/versions/v1.md
-\`\`\`
-### Common Operations
-\`\`\`bash
-# List all project names
-cat /phoenix/projects/index.jsonl | jq -r '.name'
-# Count spans in a project
-wc -l < /phoenix/projects/my-project/spans/index.jsonl
-# Find spans with errors
-cat /phoenix/projects/my-project/spans/index.jsonl | jq 'select(.status_code == "ERROR")'
-# Get dataset examples
-cat /phoenix/datasets/my-dataset/examples.jsonl | jq -s '.' | head -n 100
-# Search across all files
-grep -r "error" /phoenix/
-\`\`\``;
-/**
- * Directory Structure section showing the snapshot layout.
- *
- * Static markdown; generateContext emits it after the dynamic summary sections.
- * NOTE(review): fetchDatasets also writes /datasets/{dataset_name}/info.json,
- * which this listing does not mention - confirm whether it should be added.
- */
-const DIRECTORY_STRUCTURE_SECTION = `## Directory Structure
-\`\`\`
-/phoenix/
-  _context.md                    # This file - start here!
-  /projects/
-    index.jsonl                  # List of all projects
-    /{project_name}/
-      metadata.json              # Project details
-      /spans/
-        index.jsonl              # Span data (may be sampled)
-        metadata.json            # Span snapshot metadata
-  /datasets/
-    index.jsonl                  # List of all datasets
-    /{dataset_name}/
-      metadata.json              # Dataset details
-      examples.jsonl             # Dataset examples
-  /experiments/
-    index.jsonl                  # List of all experiments
-    /{experiment_id}/
-      metadata.json              # Experiment details
-      runs.jsonl                 # Experiment runs
-  /prompts/
-    index.jsonl                  # List of all prompts
-    /{prompt_name}/
-      metadata.json              # Prompt details
-      /versions/
-        index.jsonl              # Version list
-        /{version_id}.md         # Version template
-  /_meta/
-    snapshot.json                # Snapshot metadata
-\`\`\``;
-/**
- * What You Can Do section describing available operations.
- *
- * Static markdown listing shell tools and the commands for fetching more data.
- * NOTE(review): the package's command sources are named px-fetch-more-spans and
- * px-fetch-more-trace - confirm the invocations shown here match the real commands.
- */
-const WHAT_YOU_CAN_DO_SECTION = `## What You Can Do
-- **Explore**: ls, cat, grep, find, jq, awk, sed
-- **Fetch more data**: \`px-fetch-more spans --project <name> --limit 500\`
-- **Fetch specific trace**: \`px-fetch-more trace --trace-id <id>\``;
-/**
- * Data Freshness section with refresh instructions.
- *
- * Static markdown; generateContext emits it as the final section of the document.
- */
-const DATA_FRESHNESS_SECTION = `## Data Freshness
-This is a **read-only snapshot**. Data may have changed since capture.
-Run with \`--refresh\` to get latest data.`;
-// =============================================================================
-// Main Context Generation
-// =============================================================================
-/**
- * Writes the `/phoenix/_context.md` overview for a Phoenix snapshot.
- *
- * The document is assembled from the static section templates plus two dynamic
- * sections ("What's Here" and "Recent Activity") built from statistics gathered
- * out of the snapshot filesystem.
- *
- * @param mode - Execution mode used to read the snapshot and write the file
- * @param metadata - Snapshot origin and capture time shown in the summary
- */
-export async function generateContext(
-  mode: ExecutionMode,
-  metadata: ContextMetadata
-): Promise<void> {
-  const snapshotStats = await collectSnapshotStats(mode);
-  // Order is significant: title, quick start, dynamic summaries, then the
-  // remaining static reference sections. The recent-activity entry may be an
-  // empty string when nothing changed recently.
-  const sections: string[] = [
-    "# Phoenix Snapshot Context",
-    "",
-    QUICK_START_SECTION,
-    "",
-    buildWhatsHereSection(snapshotStats, metadata),
-    buildRecentActivitySection(snapshotStats),
-    DIRECTORY_STRUCTURE_SECTION,
-    "",
-    WHAT_YOU_CAN_DO_SECTION,
-    "",
-    DATA_FRESHNESS_SECTION,
-  ];
-  await mode.writeFile("/phoenix/_context.md", sections.join("\n"));
-}
-// =============================================================================
-// Dynamic Section Builders
-// =============================================================================
-/**
- * Renders the "What's Here" markdown section: one bullet each for projects,
- * datasets, experiments and prompts, followed by a bullet describing when and
- * from where the snapshot was taken. The result ends with a trailing newline.
- */
-function buildWhatsHereSection(
-  stats: {
-    projects: ProjectStats[];
-    datasets: DatasetInfo[];
-    experiments: ExperimentInfo[];
-    prompts: PromptInfo[];
-  },
-  metadata: ContextMetadata
-): string {
-  const { projects, datasets, experiments, prompts } = stats;
-  const bullets: string[] = [];
-  // Projects, each with its span count
-  if (projects.length === 0) {
-    bullets.push("- **No projects found**");
-  } else {
-    const described = projects.map(
-      (project) => `${project.name} (${project.spanCount} spans)`
-    );
-    bullets.push(`- **${projects.length} projects**: ${described.join(", ")}`);
-  }
-  // Datasets by name
-  if (datasets.length === 0) {
-    bullets.push("- **No datasets found**");
-  } else {
-    const names = datasets.map((dataset) => dataset.name);
-    bullets.push(`- **${datasets.length} datasets**: ${names.join(", ")}`);
-  }
-  // Experiments broken down by status; statuses with no experiments are omitted
-  if (experiments.length === 0) {
-    bullets.push("- **No experiments found**");
-  } else {
-    const countWithStatus = (status: ExperimentInfo["status"]): number =>
-      experiments.filter((experiment) => experiment.status === status).length;
-    const breakdown: Array<[number, string]> = [
-      [countWithStatus("completed"), "completed"],
-      [countWithStatus("in_progress"), "in progress"],
-      [countWithStatus("failed"), "failed"],
-    ];
-    const statusSummary = breakdown
-      .filter(([count]) => count > 0)
-      .map(([count, label]) => `${count} ${label}`)
-      .join(", ");
-    bullets.push(`- **${experiments.length} experiments**: ${statusSummary}`);
-  }
-  // Prompts by name
-  if (prompts.length === 0) {
-    bullets.push("- **No prompts found**");
-  } else {
-    const names = prompts.map((prompt) => prompt.name);
-    bullets.push(`- **${prompts.length} prompts**: ${names.join(", ")}`);
-  }
-  // Where and when the snapshot was captured
-  const capturedAgo = formatRelativeTime(metadata.snapshotTime);
-  bullets.push(
-    `- **Snapshot**: Created ${capturedAgo} from ${metadata.phoenixUrl}`
-  );
-  return ["## What's Here", "", ...bullets, ""].join("\n");
-}
-/**
- * Renders the "Recent Activity" markdown section as a bullet list.
- * Yields an empty string when there is nothing recent to report, so the
- * section is omitted from the document entirely.
- */
-function buildRecentActivitySection(stats: {
-  projects: ProjectStats[];
-  datasets: DatasetInfo[];
-  experiments: ExperimentInfo[];
-  prompts: PromptInfo[];
-}): string {
-  const highlights = getRecentActivity(stats);
-  if (highlights.length === 0) {
-    return "";
-  }
-  const bullets = highlights.map((highlight) => `- ${highlight}`);
-  // The trailing empty entry leaves a newline after the last bullet
-  return ["## Recent Activity", "", ...bullets, ""].join("\n");
-}
-// =============================================================================
-// Data Collection
-// =============================================================================
-/**
- * Quotes a value so the shell treats it as a single literal word.
- * The value is wrapped in single quotes and embedded single quotes become '\''.
- */
-function shellQuote(value: string): string {
-  const escaped = String(value).replace(/'/g, "'\\''");
-  return `'${escaped}'`;
-}
-/**
- * Reads a snapshot file through the execution mode and returns its non-empty lines.
- * A missing or empty file yields an empty array.
- */
-async function readSnapshotLines(
-  mode: ExecutionMode,
-  path: string
-): Promise<string[]> {
-  const execResult = await mode.exec(
-    `cat ${shellQuote(path)} 2>/dev/null || true`
-  );
-  if (!execResult.stdout) {
-    return [];
-  }
-  return execResult.stdout
-    .trim()
-    .split("\n")
-    .filter((line) => line.length > 0);
-}
-/**
- * Collects statistics from the snapshot filesystem.
- *
- * Reads the four index files (projects, datasets, experiments, prompts) and,
- * per entry, the extra file needed for its count. Collection is best-effort:
- * an unreadable index leaves that category empty and an unparsable line is
- * skipped, so this function does not throw for missing or malformed data.
- *
- * Entity names come from the Phoenix server and are interpolated into shell
- * commands, so every path is shell-quoted before use.
- *
- * @param mode - Execution mode used to run read commands against the snapshot
- * @returns Per-category summaries; each array is empty when nothing was found
- */
-async function collectSnapshotStats(mode: ExecutionMode): Promise<{
-  projects: ProjectStats[];
-  datasets: DatasetInfo[];
-  experiments: ExperimentInfo[];
-  prompts: PromptInfo[];
-}> {
-  const result = {
-    projects: [] as ProjectStats[],
-    datasets: [] as DatasetInfo[],
-    experiments: [] as ExperimentInfo[],
-    prompts: [] as PromptInfo[],
-  };
-  // Collect project stats
-  try {
-    const projectLines = await readSnapshotLines(
-      mode,
-      "/phoenix/projects/index.jsonl"
-    );
-    for (const line of projectLines) {
-      try {
-        const project = JSON.parse(line);
-        const stats: ProjectStats = {
-          name: project.name,
-          spanCount: 0,
-        };
-        // Get span count for this project
-        const spansMetaPath = `/phoenix/projects/${project.name}/spans/metadata.json`;
-        const spansMetaExec = await mode.exec(
-          `cat ${shellQuote(spansMetaPath)} 2>/dev/null || echo "{}"`
-        );
-        if (spansMetaExec.stdout) {
-          try {
-            const spansMeta = JSON.parse(spansMetaExec.stdout);
-            stats.spanCount = spansMeta.spanCount || 0;
-          } catch (e) {
-            // Unparsable span metadata: keep the span count at 0
-          }
-        }
-        result.projects.push(stats);
-      } catch (e) {
-        // Skip invalid project lines
-      }
-    }
-  } catch (e) {
-    // No projects file
-  }
-  // Collect dataset stats
-  try {
-    const datasetLines = await readSnapshotLines(
-      mode,
-      "/phoenix/datasets/index.jsonl"
-    );
-    for (const line of datasetLines) {
-      try {
-        const dataset = JSON.parse(line);
-        // Count lines here rather than with `wc -l`: wc counts newline
-        // characters, so a file whose last line has no trailing newline
-        // would be reported one short.
-        const exampleLines = await readSnapshotLines(
-          mode,
-          `/phoenix/datasets/${dataset.name}/examples.jsonl`
-        );
-        result.datasets.push({
-          name: dataset.name,
-          exampleCount: exampleLines.length,
-          updatedAt: dataset.updated_at,
-        });
-      } catch (e) {
-        // Skip invalid dataset lines
-      }
-    }
-  } catch (e) {
-    // No datasets file
-  }
-  // Collect experiment stats
-  try {
-    const experimentLines = await readSnapshotLines(
-      mode,
-      "/phoenix/experiments/index.jsonl"
-    );
-    for (const line of experimentLines) {
-      try {
-        const experiment = JSON.parse(line);
-        const status = determineExperimentStatus(experiment);
-        result.experiments.push({
-          id: experiment.id,
-          datasetName: experiment.datasetName || "unknown",
-          projectName: experiment.project_name,
-          status,
-          runCounts: {
-            successful: experiment.successful_run_count || 0,
-            failed: experiment.failed_run_count || 0,
-            missing: experiment.missing_run_count || 0,
-          },
-          updatedAt: experiment.updated_at,
-        });
-      } catch (e) {
-        // Skip invalid experiment lines
-      }
-    }
-  } catch (e) {
-    // No experiments file
-  }
-  // Collect prompt stats
-  try {
-    const promptLines = await readSnapshotLines(
-      mode,
-      "/phoenix/prompts/index.jsonl"
-    );
-    for (const line of promptLines) {
-      try {
-        const prompt = JSON.parse(line);
-        // Count versions (same line-counting approach as dataset examples)
-        const versionLines = await readSnapshotLines(
-          mode,
-          `/phoenix/prompts/${prompt.name}/versions/index.jsonl`
-        );
-        result.prompts.push({
-          name: prompt.name,
-          versionCount: versionLines.length,
-          updatedAt: prompt.updated_at,
-        });
-      } catch (e) {
-        // Skip invalid prompt lines
-      }
-    }
-  } catch (e) {
-    // No prompts file
-  }
-  return result;
-}
-// =============================================================================
-// Helper Functions
-// =============================================================================
-/**
- * Determines the status of an experiment based on its run counts.
- *
- * - No successful or failed runs yet: "in_progress"
- * - More failed than successful runs: "failed" (checked before completion)
- * - Successful + failed runs reach example_count * repetitions: "completed"
- * - Otherwise: "in_progress"
- *
- * A missing `repetitions` is treated as 1 so the expected total does not become
- * NaN, which would make "completed" unreachable. A missing `example_count`
- * still leaves the expected total unknown, so the result stays "in_progress".
- *
- * @param experiment - Raw experiment record parsed from the experiments index
- */
-function determineExperimentStatus(
-  experiment: any
-): "completed" | "in_progress" | "failed" {
-  const successfulRuns = experiment.successful_run_count || 0;
-  const failedRuns = experiment.failed_run_count || 0;
-  const totalRuns = successfulRuns + failedRuns;
-  if (totalRuns === 0) {
-    return "in_progress";
-  }
-  // If most runs are failed, consider it failed
-  if (failedRuns > successfulRuns) {
-    return "failed";
-  }
-  const repetitions =
-    experiment.repetitions == null ? 1 : experiment.repetitions;
-  const totalExpected = experiment.example_count * repetitions;
-  // Comparisons against NaN are false, so an unknown example_count falls
-  // through to "in_progress"
-  if (totalRuns >= totalExpected) {
-    return "completed";
-  }
-  return "in_progress";
-}
-/**
- * Produces up to three one-line highlights about items updated in the last
- * 24 hours: at most two experiments first, then at most two datasets, each
- * group ordered newest first.
- */
-function getRecentActivity(stats: {
-  projects: ProjectStats[];
-  datasets: DatasetInfo[];
-  experiments: ExperimentInfo[];
-  prompts: PromptInfo[];
-}): string[] {
-  // Keeps only items that carry a timestamp falling inside the last day
-  const updatedInLastDay = (item: { updatedAt?: string }) =>
-    item.updatedAt && isRecent(new Date(item.updatedAt), 24);
-  // Comparator placing the most recently updated item first
-  const newestFirst = (
-    left: { updatedAt?: string },
-    right: { updatedAt?: string }
-  ) =>
-    new Date(right.updatedAt!).getTime() - new Date(left.updatedAt!).getTime();
-  const experimentHighlights = stats.experiments
-    .filter(updatedInLastDay)
-    .sort(newestFirst)
-    .slice(0, 2)
-    .map((experiment) => {
-      const when = formatRelativeTime(new Date(experiment.updatedAt!));
-      const owner = experiment.projectName || experiment.datasetName;
-      return `${owner}: experiment "${experiment.id.slice(0, 8)}..." ${experiment.status} ${when}`;
-    });
-  const datasetHighlights = stats.datasets
-    .filter(updatedInLastDay)
-    .sort(newestFirst)
-    .slice(0, 2)
-    .map((dataset) => {
-      const when = formatRelativeTime(new Date(dataset.updatedAt!));
-      return `${dataset.name}: dataset updated ${when} (${dataset.exampleCount} examples)`;
-    });
-  // Limit to 3 activities overall
-  return [...experimentHighlights, ...datasetHighlights].slice(0, 3);
-}
-/**
- * Reports whether `date` lies less than `hoursAgo` hours before the current time.
- * Dates in the future also count as recent because their elapsed time is negative.
- */
-function isRecent(date: Date, hoursAgo: number): boolean {
-  const windowMs = hoursAgo * 60 * 60 * 1000;
-  const elapsedMs = Date.now() - date.getTime();
-  return elapsedMs < windowMs;
-}
-/**
- * Describes how long ago `date` was, relative to now, using the largest unit
- * that applies: "just now", minutes, hours or days (e.g. "2 hours ago").
- */
-function formatRelativeTime(date: Date): string {
-  const elapsedMs = Date.now() - date.getTime();
-  // Adds the plural "s" for every count except exactly 1
-  const describe = (count: number, unit: string): string =>
-    `${count} ${unit}${count !== 1 ? "s" : ""} ago`;
-  const minutes = Math.floor(elapsedMs / (1000 * 60));
-  if (minutes < 1) {
-    return "just now";
-  }
-  if (minutes < 60) {
-    return describe(minutes, "minute");
-  }
-  const hours = Math.floor(elapsedMs / (1000 * 60 * 60));
-  if (hours < 24) {
-    return describe(hours, "hour");
-  }
-  const days = Math.floor(elapsedMs / (1000 * 60 * 60 * 24));
-  return describe(days, "day");
-}

package/src/snapshot/datasets.ts DELETED Viewed

@@ -1,132 +0,0 @@
-import type { PhoenixClient } from "@arizeai/phoenix-client";
-import type { ExecutionMode } from "../modes/types.js";
-import { withErrorHandling, extractData } from "./client.js";
-/**
- * Dataset record as collected from the `/v1/datasets` listing.
- * fetchDatasets writes these to the datasets index and copies the fields into
- * each dataset's metadata.json.
- */
-interface Dataset {
-  id: string;
-  // Also used as the directory name under /phoenix/datasets/
-  name: string;
-  description: string | null;
-  metadata: Record<string, unknown>;
-  created_at: string;
-  updated_at: string;
-}
-/**
- * Shape of a single dataset example.
- * NOTE(review): not referenced in the visible code - the examples written by
- * fetchDatasets take their type from the client response instead.
- */
-interface DatasetExample {
-  id: string;
-  input: Record<string, unknown>;
-  output: Record<string, unknown>;
-  metadata: Record<string, unknown>;
-  updated_at: string;
-}
-/**
- * Options accepted by fetchDatasets.
- */
-interface FetchDatasetsOptions {
-  // Maximum number of datasets to fetch; fetchDatasets defaults this to 100
-  limit?: number;
-}
-/**
- * Serializes each item as JSON and joins the results with newlines.
- * An empty array produces an empty string; no trailing newline is added.
- */
-function toJSONL(items: unknown[]): string {
-  const serialized: string[] = [];
-  for (const item of items) {
-    serialized.push(JSON.stringify(item));
-  }
-  // Joining an empty list already gives "", so no special case is needed
-  return serialized.join("\n");
-}
-/**
- * Snapshots Phoenix datasets into the execution mode's filesystem.
- *
- * Pages through `/v1/datasets` until `options.limit` datasets (default 100)
- * have been collected or the server returns no further cursor, writes the
- * dataset index, and then for every dataset writes `metadata.json`,
- * `examples.jsonl` and `info.json` under `/phoenix/datasets/{name}/`.
- *
- * @param client - Phoenix API client used for the dataset and example requests
- * @param mode - Execution mode whose `writeFile` receives the snapshot files
- * @param options - Optional cap on the number of datasets fetched
- */
-export async function fetchDatasets(
-  client: PhoenixClient,
-  mode: ExecutionMode,
-  options: FetchDatasetsOptions = {}
-): Promise<void> {
-  const { limit: maxDatasets = 100 } = options;
-  const collected: Dataset[] = [];
-  let nextCursor: string | null = null;
-  // Page through the dataset list, requesting at most 100 entries per call
-  while (collected.length < maxDatasets) {
-    const pageSize = Math.min(maxDatasets - collected.length, 100);
-    const query: Record<string, unknown> = { limit: pageSize };
-    if (nextCursor) {
-      query.cursor = nextCursor;
-    }
-    const listResponse = await withErrorHandling(
-      () => client.GET("/v1/datasets", { params: { query } }),
-      "fetching datasets"
-    );
-    const page = extractData(listResponse);
-    collected.push(...page.data);
-    nextCursor = page.next_cursor;
-    // Stop once the server has nothing further to hand out
-    const exhausted = !nextCursor || page.data.length === 0;
-    if (exhausted) {
-      break;
-    }
-  }
-  // Index of every dataset, one JSON object per line
-  await mode.writeFile("/phoenix/datasets/index.jsonl", toJSONL(collected));
-  for (const dataset of collected) {
-    const datasetDir = `/phoenix/datasets/${dataset.name}`;
-    // Dataset metadata, stamped with the time this snapshot entry was written
-    const metadataDocument = {
-      id: dataset.id,
-      name: dataset.name,
-      description: dataset.description,
-      metadata: dataset.metadata,
-      created_at: dataset.created_at,
-      updated_at: dataset.updated_at,
-      snapshot_timestamp: new Date().toISOString(),
-    };
-    await mode.writeFile(
-      `${datasetDir}/metadata.json`,
-      JSON.stringify(metadataDocument, null, 2)
-    );
-    // Examples belonging to this dataset
-    const examplesResponse = await withErrorHandling(
-      () =>
-        client.GET("/v1/datasets/{id}/examples", {
-          params: {
-            path: { id: dataset.id },
-          },
-        }),
-      `fetching examples for dataset ${dataset.name}`
-    );
-    const examplesPayload = extractData(examplesResponse).data;
-    const examples = examplesPayload.examples;
-    await mode.writeFile(`${datasetDir}/examples.jsonl`, toJSONL(examples));
-    // Summary record carrying the example count and version details
-    const infoDocument = {
-      dataset_id: dataset.id,
-      dataset_name: dataset.name,
-      example_count: examples.length,
-      version_id: examplesPayload.version_id,
-      filtered_splits: examplesPayload.filtered_splits,
-    };
-    await mode.writeFile(
-      `${datasetDir}/info.json`,
-      JSON.stringify(infoDocument, null, 2)
-    );
-  }
-}