npm - kimi-agent-swarm-cli - Versions diffs - 0.7.0 - Mend

kimi-agent-swarm-cli 0.7.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (36) hide show

package/README.md +49 -0
package/fixtures/asset-mgmt-roles.json +1543 -0
package/fixtures/basic-sources.json +58 -0
package/fixtures/github-repo-landscape.json +308 -0
package/fixtures/golden-answers.ts +56 -0
package/fixtures/jsonl-provider.ts +41 -0
package/fixtures/market-scan.json +246 -0
package/fixtures/paul-graham-corpus.json +272 -0
package/fixtures/sellside-research-roles.json +1709 -0
package/fixtures/youtube-niche.json +262 -0
package/package.json +45 -0
package/src/benchmark.ts +151 -0
package/src/cache.ts +86 -0
package/src/cli.ts +377 -0
package/src/command-provider.ts +99 -0
package/src/config.ts +134 -0
package/src/costs.ts +134 -0
package/src/distributed/memory-adapter.ts +152 -0
package/src/distributed/queue-adapter.ts +29 -0
package/src/distributed/redis-adapter.ts +185 -0
package/src/distributed/runner.ts +325 -0
package/src/distributed/task-splitter.ts +78 -0
package/src/export.ts +70 -0
package/src/init.ts +138 -0
package/src/leaderboard.ts +201 -0
package/src/providers/brave-provider.ts +161 -0
package/src/providers/github-provider.ts +151 -0
package/src/providers/index.ts +49 -0
package/src/providers/mock-search-provider.ts +45 -0
package/src/providers/search-provider.ts +12 -0
package/src/providers/serper-provider.ts +154 -0
package/src/providers/tavily-provider.ts +158 -0
package/src/runtime.ts +349 -0
package/src/scorer.ts +103 -0
package/src/types.ts +246 -0
package/src/verifier.ts +369 -0

package/fixtures/basic-sources.json ADDED Viewed

@@ -0,0 +1,58 @@
+{
+  "sources": [
+    {
+      "id": "S001",
+      "url": "https://example.com/official-agent-report",
+      "title": "Official Agent Research Report",
+      "sourceClass": "official",
+      "publishedAt": "2026-05-20",
+      "discoveredBy": "fixture:agent research",
+      "scores": {
+        "relevance": 4,
+        "authority": 4,
+        "freshness": 4,
+        "diversity": 3,
+        "extractionValue": 4
+      },
+      "claims": [
+        "Evidence-backed research workflows need source and claim traceability."
+      ]
+    },
+    {
+      "id": "S002",
+      "url": "https://example.com/community-thread",
+      "title": "Community Thread",
+      "sourceClass": "community",
+      "publishedAt": "2026-05-15",
+      "discoveredBy": "fixture:agent research",
+      "scores": {
+        "relevance": 3,
+        "authority": 2,
+        "freshness": 3,
+        "diversity": 4,
+        "extractionValue": 3
+      },
+      "claims": [
+        "Users prefer readable synthesis before audit files."
+      ]
+    },
+    {
+      "id": "S003",
+      "url": "https://example.com/duplicate-summary",
+      "title": "Duplicate Summary",
+      "sourceClass": "secondary",
+      "publishedAt": "2025-01-10",
+      "discoveredBy": "fixture:agent research",
+      "scores": {
+        "relevance": 1,
+        "authority": 1,
+        "freshness": 1,
+        "diversity": 0,
+        "extractionValue": 1
+      },
+      "claims": [
+        "Weak duplicate source should not be accepted."
+      ]
+    }
+  ]
+}

package/fixtures/github-repo-landscape.json ADDED Viewed

@@ -0,0 +1,308 @@
+{
+  "sources": [
+    {
+      "id": "GH-001",
+      "url": "https://github.com/browser-use/browser-use",
+      "title": "browser-use/browser-use",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 5, "authority": 5, "freshness": 5, "diversity": 3, "extractionValue": 5 },
+      "claims": [
+        "Browser-use connects AI agents directly to browser UI elements for task automation.",
+        "It is one of the most starred AI browser agent repositories."
+      ]
+    },
+    {
+      "id": "GH-002",
+      "url": "https://github.com/browserbase/stagehand",
+      "title": "browserbase/stagehand",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 5, "authority": 4, "freshness": 5, "diversity": 3, "extractionValue": 5 },
+      "claims": [
+        "Stagehand provides an AI-driven browser automation framework with act/extract/observe primitives.",
+        "It is built on top of Playwright."
+      ]
+    },
+    {
+      "id": "GH-003",
+      "url": "https://github.com/antiwork/shortest",
+      "title": "antiwork/shortest",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 5, "authority": 3, "freshness": 5, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "Shortest is a natural-language AI testing framework that converts prompts into browser tests."
+      ]
+    },
+    {
+      "id": "GH-004",
+      "url": "https://github.com/nanobrowser/nanobrowser",
+      "title": "nanobrowser/nanobrowser",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 5, "authority": 3, "freshness": 5, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "Nanobrowser is an open-source AI web agent that runs directly in the browser as an extension."
+      ]
+    },
+    {
+      "id": "GH-005",
+      "url": "https://github.com/Significant-Gravitas/AutoGPT",
+      "title": "Significant-Gravitas/AutoGPT",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 5, "freshness": 4, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "AutoGPT was one of the first open-source projects to popularize autonomous AI agents.",
+        "It focuses on goal-oriented autonomous task execution."
+      ]
+    },
+    {
+      "id": "GH-006",
+      "url": "https://github.com/langchain-ai/langchain",
+      "title": "langchain-ai/langchain",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 5, "freshness": 4, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "LangChain provides abstractions for chaining LLM calls, tools, and memory.",
+        "It is widely used as a foundation for agent frameworks."
+      ]
+    },
+    {
+      "id": "GH-007",
+      "url": "https://github.com/crewAIInc/crewAI",
+      "title": "crewAIInc/crewAI",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 4, "freshness": 4, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "CrewAI structures agents into role-based crews that collaborate on tasks."
+      ]
+    },
+    {
+      "id": "GH-008",
+      "url": "https://github.com/microsoft/autogen",
+      "title": "microsoft/autogen",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 5, "freshness": 4, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "AutoGen from Microsoft enables multi-agent conversations and tool use."
+      ]
+    },
+    {
+      "id": "GH-009",
+      "url": "https://github.com/pydantic/pydantic-ai",
+      "title": "pydantic/pydantic-ai",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 4, "freshness": 5, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "Pydantic AI is an agent framework built around type-safe structured outputs."
+      ]
+    },
+    {
+      "id": "GH-010",
+      "url": "https://github.com/huggingface/smolagents",
+      "title": "huggingface/smolagents",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 4, "freshness": 5, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "Smolagents from Hugging Face emphasizes small, efficient agent code execution."
+      ]
+    },
+    {
+      "id": "GH-011",
+      "url": "https://github.com/run-llama/llama_index",
+      "title": "run-llama/llama_index",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 5, "freshness": 4, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "LlamaIndex focuses on data ingestion and retrieval for LLM applications."
+      ]
+    },
+    {
+      "id": "GH-012",
+      "url": "https://github.com/deepset-ai/haystack",
+      "title": "deepset-ai/haystack",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 4, "freshness": 4, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "Haystack is an end-to-end NLP framework for building search and question-answering systems."
+      ]
+    },
+    {
+      "id": "GH-013",
+      "url": "https://github.com/ScrapeGraphAI/Scrapegraph-ai",
+      "title": "ScrapeGraphAI/Scrapegraph-ai",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 3, "freshness": 5, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "ScrapeGraphAI uses LLMs to generate scraping pipelines from natural language prompts."
+      ]
+    },
+    {
+      "id": "GH-014",
+      "url": "https://github.com/scrapy/scrapy",
+      "title": "scrapy/scrapy",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 5, "freshness": 4, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "Scrapy is a mature Python framework for large-scale web scraping."
+      ]
+    },
+    {
+      "id": "GH-015",
+      "url": "https://github.com/microsoft/playwright",
+      "title": "microsoft/playwright",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 5, "freshness": 4, "diversity": 3, "extractionValue": 4 },
+      "claims": [
+        "Playwright is a cross-browser automation library widely used by AI agent projects."
+      ]
+    },
+    {
+      "id": "GH-016",
+      "url": "https://github.com/SeleniumHQ/selenium",
+      "title": "SeleniumHQ/selenium",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 5, "freshness": 4, "diversity": 3, "extractionValue": 3 },
+      "claims": [
+        "Selenium is the legacy standard for browser automation."
+      ]
+    },
+    {
+      "id": "GH-017",
+      "url": "https://github.com/OpenInterpreter/open-interpreter",
+      "title": "OpenInterpreter/open-interpreter",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 4, "freshness": 4, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "Open Interpreter lets LLMs run code locally to accomplish tasks."
+      ]
+    },
+    {
+      "id": "GH-018",
+      "url": "https://github.com/OpenAI-Swarm/community",
+      "title": "OpenAI-Swarm/community",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 3, "freshness": 4, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "OpenAI Swarm demonstrated lightweight multi-agent orchestration patterns."
+      ]
+    },
+    {
+      "id": "GH-019",
+      "url": "https://github.com/reworkd/AgentGPT",
+      "title": "reworkd/AgentGPT",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 3, "freshness": 3, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "AgentGPT provided a browser-based interface for running autonomous agents."
+      ]
+    },
+    {
+      "id": "GH-020",
+      "url": "https://github.com/TransformerOptimus/SuperAGI",
+      "title": "TransformerOptimus/SuperAGI",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 3, "freshness": 3, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "SuperAGI aimed to be a production-ready autonomous agent framework with tools and memory."
+      ]
+    },
+    {
+      "id": "GH-021",
+      "url": "https://github.com/langchain-ai/langgraph",
+      "title": "langchain-ai/langgraph",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 4, "authority": 4, "freshness": 5, "diversity": 4, "extractionValue": 4 },
+      "claims": [
+        "LangGraph enables building stateful, multi-actor agent workflows as graphs."
+      ]
+    },
+    {
+      "id": "GH-022",
+      "url": "https://github.com/e2b-dev/E2B",
+      "title": "e2b-dev/E2B",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 3, "authority": 4, "freshness": 5, "diversity": 4, "extractionValue": 3 },
+      "claims": [
+        "E2B provides sandboxed cloud environments for running AI-generated code."
+      ]
+    },
+    {
+      "id": "GH-023",
+      "url": "https://github.com/vectara/py-vectara",
+      "title": "vectara/py-vectara",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 2, "authority": 3, "freshness": 4, "diversity": 4, "extractionValue": 2 },
+      "claims": [
+        "Vectara offers RAG-as-a-service with retrieval and summarization APIs."
+      ]
+    },
+    {
+      "id": "GH-024",
+      "url": "https://github.com/jina-ai/jina",
+      "title": "jina-ai/jina",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 2, "authority": 4, "freshness": 4, "diversity": 4, "extractionValue": 2 },
+      "claims": [
+        "Jina is a neural search framework for building multimodal AI applications."
+      ]
+    },
+    {
+      "id": "GH-025",
+      "url": "https://github.com/weaviate/weaviate",
+      "title": "weaviate/weaviate",
+      "sourceClass": "primary",
+      "publishedAt": "2026-01-01",
+      "discoveredBy": "github-repo-landscape",
+      "scores": { "relevance": 2, "authority": 4, "freshness": 4, "diversity": 4, "extractionValue": 2 },
+      "claims": [
+        "Weaviate is an open-source vector database for AI-native applications."
+      ]
+    }
+  ]
+}

package/fixtures/golden-answers.ts ADDED Viewed

@@ -0,0 +1,56 @@
+import type { GoldenAnswer } from "../src/types";
+export const goldenAnswers: Record<string, GoldenAnswer> = { // Golden (expected) answers keyed by a "fixture-*" string; each entry lists expected claims and expected source URLs.
+  "fixture-paul-graham-corpus": { // NOTE(review): presumably pairs with fixtures/paul-graham-corpus.json — confirm against the code that looks up this key.
+    expectedClaims: [ // Claim sentences as plain strings. NOTE(review): exact vs. fuzzy matching is decided by the consumer — not visible here.
+      "Startups should initially do things that don't scale.",
+      "The maker's schedule requires long uninterrupted blocks of time.",
+      "The best startup ideas often come from the founders' own problems.",
+      "Wealth is created by doing what people want, not by moving it around.",
+      "Startups die more often from denial than from competition.",
+      "Mean people rarely win in the long run.",
+    ],
+    expectedSourceUrls: [ // Six URLs for six claims. NOTE(review): order appears to mirror expectedClaims — confirm whether any consumer relies on index alignment.
+      "http://www.paulgraham.com/ds.html",
+      "http://www.paulgraham.com/makersschedule.html",
+      "http://www.paulgraham.com/startupideas.html",
+      "http://www.paulgraham.com/wealth.html",
+      "http://www.paulgraham.com/really.html",
+      "http://www.paulgraham.com/mean.html",
+    ],
+  },
+  "fixture-github-repo-landscape": { // Each claim and URL below also appears verbatim in fixtures/github-repo-landscape.json (GH-001, GH-002, GH-005 through GH-008).
+    expectedClaims: [ // Only the first claim of multi-claim sources (e.g. GH-001, GH-005) is listed here.
+      "Browser-use connects AI agents directly to browser UI elements for task automation.",
+      "Stagehand provides an AI-driven browser automation framework with act/extract/observe primitives.",
+      "AutoGPT was one of the first open-source projects to popularize autonomous AI agents.",
+      "LangChain provides abstractions for chaining LLM calls, tools, and memory.",
+      "CrewAI structures agents into role-based crews that collaborate on tasks.",
+      "AutoGen from Microsoft enables multi-agent conversations and tool use.",
+    ],
+    expectedSourceUrls: [ // Repository URLs of the six sources whose claims are listed above, in the same order.
+      "https://github.com/browser-use/browser-use",
+      "https://github.com/browserbase/stagehand",
+      "https://github.com/Significant-Gravitas/AutoGPT",
+      "https://github.com/langchain-ai/langchain",
+      "https://github.com/crewAIInc/crewAI",
+      "https://github.com/microsoft/autogen",
+    ],
+  },
+  "fixture-market-scan": { // NOTE(review): presumably pairs with fixtures/market-scan.json — confirm against the code that looks up this key.
+    expectedClaims: [ // Five claims here, versus six in the other two entries.
+      "GitHub Copilot is the most widely adopted AI coding assistant by installed base.",
+      "Cursor is an AI-first code editor built on top of VS Code.",
+      "Claude Code is a terminal-based agentic coding assistant.",
+      "Amazon Q Developer provides code generation, transformation, and operational assistance.",
+      "Enterprise adoption of AI coding assistants is accelerating in regulated industries.",
+    ],
+    expectedSourceUrls: [ // Five URLs for five claims.
+      "https://github.com/features/copilot",
+      "https://www.cursor.com/",
+      "https://www.anthropic.com/claude-code",
+      "https://aws.amazon.com/q/developer/",
+      "https://www.gartner.com/en/newsroom/example", // NOTE(review): the "/example" path looks like a placeholder — confirm it matches the fixture's URL exactly.
+    ],
+  },
+};

package/fixtures/jsonl-provider.ts ADDED Viewed

@@ -0,0 +1,41 @@
+#!/usr/bin/env bun
+import type { Source } from "../src/types";
+const sources: Source[] = [ // Hard-coded source candidates that this script prints; nothing is read from disk or the network.
+  { // Candidate 1: high-scoring entry — every score is 4 except diversity (3).
+    id: "L001",
+    url: "https://example.com/local-command-primary",
+    title: "Local Command Primary Source",
+    sourceClass: "primary-data",
+    publishedAt: "2026-05-22",
+    discoveredBy: "local-command fixture",
+    scores: { // NOTE(review): score scale and acceptance thresholds are defined by the consumer — not visible here.
+      relevance: 4,
+      authority: 4,
+      freshness: 4,
+      diversity: 3,
+      extractionValue: 4,
+    },
+    claims: ["Local command providers can feed replayable source candidates into the runtime."],
+  },
+  { // Candidate 2: low-scoring entry — every score is 1 and the publish date is older (2024-01-01).
+    id: "L002",
+    url: "https://example.com/local-command-low-quality",
+    title: "Local Command Low Quality Source",
+    sourceClass: "secondary",
+    publishedAt: "2024-01-01",
+    discoveredBy: "local-command fixture",
+    scores: {
+      relevance: 1,
+      authority: 1,
+      freshness: 1,
+      diversity: 1,
+      extractionValue: 1,
+    },
+    claims: ["Low quality command output should be rejected."], // The claim text states the intent; the rejection itself would happen in the consumer (assumption — verify).
+  },
+];
+for (const source of sources) { // Emit the candidates in array order, one console.log call (one output line) each.
+  console.log(JSON.stringify({ type: "source_candidate", source })); // Compact JSON envelope: { type: "source_candidate", source: <candidate> }.
+}