npm - @maintainabilityai/research-runner - Versions diffs - 0.1.3 → 0.1.5 - Mend

@maintainabilityai/research-runner 0.1.3 → 0.1.5

This diff shows the differences between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (3)

package/dist/llm/llm-router.js +12 -3
package/dist/runner/archeologist.js +25 -0
package/package.json +1 -1

package/dist/llm/llm-router.js CHANGED Viewed

@@ -10,7 +10,16 @@ const MODEL_BY_TIER = {
 };
 async function callLlm(opts) {
     const tierModels = MODEL_BY_TIER[opts.tier];
-    if (opts.provider === 'anthropic') {
+    // Hybrid routing: GitHub Models free tier caps requests at ~8K input
+    // tokens — too small for the synthesis step (full brief + every search
+    // result + mesh context routinely exceeds that). When the brief asks
+    // for github-models AND an Anthropic key is available, route synth →
+    // Anthropic and keep plan (small prompt) on github-models. Caller can
+    // force pure github-models by not setting anthropicApiKey.
+    const effectiveProvider = opts.provider === 'github-models' && opts.tier === 'synth' && opts.anthropicApiKey
+        ? 'anthropic'
+        : opts.provider;
+    if (effectiveProvider === 'anthropic') {
         if (!opts.anthropicApiKey) {
             throw new Error(`callLlm: provider=anthropic requires anthropicApiKey (set ANTHROPIC_API_KEY).`);
         }
@@ -33,7 +42,7 @@ async function callLlm(opts) {
             httpStatus: r.httpStatus,
         };
     }
-    if (opts.provider === 'github-models') {
+    if (effectiveProvider === 'github-models') {
         if (!opts.githubToken) {
             throw new Error(`callLlm: provider=github-models requires githubToken (set GITHUB_TOKEN; workflow needs \`permissions: models: read\`).`);
         }
@@ -56,5 +65,5 @@ async function callLlm(opts) {
             httpStatus: r.httpStatus,
         };
     }
-    throw new Error(`callLlm: provider "${opts.provider}" not yet implemented (phase 2c.1 ships anthropic + github-models; openai + azure-openai land later).`);
+    throw new Error(`callLlm: provider "${effectiveProvider}" not yet implemented (phase 2c.1 ships anthropic + github-models; openai + azure-openai land later).`);
 }

package/dist/runner/archeologist.js CHANGED Viewed

@@ -76,6 +76,18 @@ const synthesize_report_1 = require("./nodes/synthesize-report");
 const clone_and_index_1 = require("./nodes/clone-and-index");
 const analyze_architecture_1 = require("./nodes/analyze-architecture");
 const identify_gaps_1 = require("./nodes/identify-gaps");
+/**
+ * Progress log → stderr. Goes to GitHub Actions job output without
+ * polluting stdout (which carries the JSON result the workflow parses).
+ * Disabled when RESEARCH_RUNNER_QUIET=1 so unit tests stay clean.
+ */
+function progress(msg) {
+    if (process.env.RESEARCH_RUNNER_QUIET === '1') {
+        return;
+    }
+    const ts = new Date().toISOString().slice(11, 19); // HH:MM:SS
+    process.stderr.write(`[research-runner ${ts}] ${msg}\n`);
+}
 async function runArcheologist(opts) {
     // ----- validate_brief (pure) -----
     const briefParsed = schemas_1.ResearchBrief.safeParse(opts.brief);
@@ -89,6 +101,7 @@ async function runArcheologist(opts) {
     const githubToken = opts.githubToken ?? process.env.GITHUB_TOKEN ?? '';
     const tavilyApiKey = opts.tavilyApiKey ?? process.env.TAVILY_API_KEY ?? '';
     const usptoApiKey = opts.usptoApiKey ?? process.env.USPTO_API_KEY ?? '';
+    progress(`▶ run ${runId} | scope=${brief.scope.level}(${brief.scope.id}) | path=${brief.path} | llm_provider=${brief.llm_provider ?? 'anthropic'} | keys: anthropic=${!!anthropicApiKey} github=${!!githubToken} tavily=${!!tavilyApiKey} uspto=${!!usptoApiKey}`);
     const absoluteAuditDir = path.resolve(opts.meshDir, opts.auditDir);
     const absoluteOutputDir = path.resolve(opts.meshDir, opts.outputDir);
     fs.mkdirSync(absoluteOutputDir, { recursive: true });
@@ -240,6 +253,7 @@ async function runArcheologist(opts) {
         // ============================================================================
         // RESEARCH PATH (existing): plan_queries → 4 providers → dedupe → gap-analysis
         // ============================================================================
+        progress(`◐ plan_queries — calling LLM to generate query plan…`);
         const planStart = Date.now();
         const plan = await (0, plan_queries_1.planQueries)({
             meshDir: opts.meshDir,
@@ -251,6 +265,7 @@ async function runArcheologist(opts) {
             fetchImpl: opts.fetchImpl,
         });
         researchQueryPlan = plan.queryPlan;
+        progress(`✓ plan_queries (${plan.llm.provider} ${plan.llm.model}) in ${Date.now() - planStart}ms — ${plan.llm.inputTokens} in / ${plan.llm.outputTokens} out tokens, ${plan.llm.attempts} attempt${plan.llm.attempts !== 1 ? 's' : ''} → web=${plan.queryPlan.web.length} arxiv=${plan.queryPlan.arxiv.length} patent=${plan.queryPlan.patent.length} community=${plan.queryPlan.community.length}`);
         totalInputTokens += plan.llm.inputTokens;
         totalOutputTokens += plan.llm.outputTokens;
         totalCostUsd += plan.llm.costUsd;
@@ -271,6 +286,7 @@ async function runArcheologist(opts) {
         // ----- four-provider search (pure_api each, parallel across providers) -----
         // We run all four providers concurrently with Promise.allSettled so a
         // provider-level failure (e.g. PatentsView outage) doesn't block the rest.
+        progress(`◐ search — tavily(${plan.queryPlan.web.length}) + arxiv(${plan.queryPlan.arxiv.length}) + hackernews(${plan.queryPlan.community.length}) + uspto(${usptoApiKey ? plan.queryPlan.patent.length : 'skipped'}) in parallel…`);
         const searchStart = Date.now();
         const [tavily, arxiv, hn, uspto] = await Promise.allSettled([
             (0, tavily_search_1.runTavilySearch)({ apiKey: tavilyApiKey, queries: plan.queryPlan.web, fetchImpl: opts.fetchImpl }),
@@ -330,9 +346,12 @@ async function runArcheologist(opts) {
         handleProvider(arxiv, 'arxiv_search', 'arxiv', 'GET /api/query');
         handleProvider(hn, 'hackernews_search', 'hackernews', 'GET /api/v1/search');
         handleProvider(uspto, 'uspto_search', 'uspto', 'POST /api/v1/patent/');
+        const fmtSettled = (s) => s.status === 'fulfilled' ? 'OK' : `FAIL(${s.reason instanceof Error ? s.reason.message.slice(0, 60) : String(s.reason).slice(0, 60)})`;
+        progress(`✓ search done in ${searchDuration}ms — tavily=${providerResultCounts.tavily}/${fmtSettled(tavily)} arxiv=${providerResultCounts.arxiv}/${fmtSettled(arxiv)} hn=${providerResultCounts.hackernews}/${fmtSettled(hn)} uspto=${providerResultCounts.uspto}/${fmtSettled(uspto)} (raw=${allProviderResults.length})`);
         // ----- dedupe_and_rank (pure) — first pass -----
         let dedupeStart = Date.now();
         rankedSources = (0, dedupe_and_rank_1.dedupeAndRank)({ results: allProviderResults, topN: 20 });
+        progress(`✓ dedupe_and_rank — ${rankedSources.length} ranked sources (top score=${rankedSources[0]?.salience_score?.toFixed(2) ?? 'n/a'})`);
         emitter.emit({
             node_kind: 'pure',
             node_name: 'dedupe_and_rank',
@@ -354,6 +373,7 @@ async function runArcheologist(opts) {
                     outputs_summary: `signals=${gapSignals.map(s => s.kind).join(',')}`,
                 },
             });
+            progress(`◐ gap_analysis — ${gapSignals.length} signal(s): ${gapSignals.map(s => s.kind).join(',')}`);
             const gapStart = Date.now();
             const gap = await (0, gap_analysis_1.runGapAnalysis)({
                 meshDir: opts.meshDir,
@@ -365,6 +385,7 @@ async function runArcheologist(opts) {
                 githubToken,
                 fetchImpl: opts.fetchImpl,
             });
+            progress(`✓ gap_analysis (${gap.llm.provider} ${gap.llm.model}) in ${Date.now() - gapStart}ms — ${gap.llm.inputTokens} in / ${gap.llm.outputTokens} out tokens → ${gap.followUpQueries.length} follow-up queries`);
             totalInputTokens += gap.llm.inputTokens;
             totalOutputTokens += gap.llm.outputTokens;
             totalCostUsd += gap.llm.costUsd;
@@ -436,6 +457,7 @@ async function runArcheologist(opts) {
         }
     } // end research-path else branch
     // ----- synthesize_report (LLM) -----
+    progress(`◐ synthesize_report — calling LLM (provider hint=${brief.llm_provider ?? 'anthropic'}, sources=${rankedSources.length}); hybrid routing will pick anthropic for synth if anthropic key is set…`);
     const synthStart = Date.now();
     const synthesis = await (0, synthesize_report_1.synthesizeReport)({
         meshDir: opts.meshDir,
@@ -454,6 +476,7 @@ async function runArcheologist(opts) {
     totalInputTokens += synthesis.llm.inputTokens;
     totalOutputTokens += synthesis.llm.outputTokens;
     totalCostUsd += synthesis.llm.costUsd;
+    progress(`✓ synthesize_report (${synthesis.llm.provider} ${synthesis.llm.model}) in ${Date.now() - synthStart}ms — ${synthesis.llm.inputTokens} in / ${synthesis.llm.outputTokens} out tokens, ${synthesis.llm.attempts} attempt${synthesis.llm.attempts !== 1 ? 's' : ''}`);
     emitter.emit({
         node_kind: 'llm',
         node_name: 'synthesize_report',
@@ -554,6 +577,8 @@ async function runArcheologist(opts) {
         }
         catch { /* leave on disk — non-fatal, just a tmpdir entry */ }
     }
+    const totalDurationMs = Date.now() - startedAt.getTime();
+    progress(`◆ done ${runId} in ${(totalDurationMs / 1000).toFixed(1)}s — ${totalInputTokens} in / ${totalOutputTokens} out tokens, $${roundUsd(totalCostUsd)} | sources=${rankedSources.length} conclusions=${synthesis.citation_stats.conclusion_count} recs=${synthesis.citation_stats.recommendation_count} | artifact=${artifactPath}`);
     return {
         run_id: runId,
         topic: brief.topic,

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@maintainabilityai/research-runner",
-  "version": "0.1.3",
+  "version": "0.1.5",
   "description": "Research + PRD agent runner — orchestrates the Archeologist and PRD pipelines for the MaintainabilityAI governance mesh",
   "license": "MIT",
   "author": "MaintainabilityAI",