npm - @m8i-51/shoal - Versions diffs - 0.1.13 → 0.1.15 - Mend

@m8i-51/shoal 0.1.13 → 0.1.15

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (21)

package/.env.example +6 -0
package/framework/__tests__/coverage.test.ts +1 -0
package/framework/__tests__/report.test.ts +1 -0
package/framework/account-manager.ts +10 -5
package/framework/coverage.ts +11 -0
package/framework/persona-pack.ts +137 -0
package/framework/product-discovery.ts +4 -2
package/framework/trackers/asana.ts +13 -0
package/framework/trackers/backlog.ts +14 -0
package/framework/trackers/github.ts +18 -0
package/framework/trackers/index.ts +9 -0
package/framework/trackers/jira.ts +19 -0
package/framework/trackers/notion.ts +16 -0
package/framework/trackers/types.ts +1 -0
package/framework/triage.ts +15 -5
package/framework/types.ts +1 -0
package/package.json +3 -2
package/run.ts +62 -9
package/web/dist/assets/index-riAs4l9D.js +85 -0
package/web/dist/index.html +1 -1
package/web/dist/assets/index-BgIAUEzL.js +0 -68

package/run.ts (changed)

@@ -17,7 +17,8 @@ import type { Tool } from "./framework/llm-client";
 import { createMessageWithRetry, runAgentLoop, sleep, rateLimitRetries } from "./framework/agent-loop";
 import { collectedFindings, initRunLog, saveRunLog, saveFinding, runLog } from "./framework/findings";
 import { loadAgents, addAgent, retireAgent } from "./framework/agent-store";
-import { updateCoverage, computeWeightedSummary } from "./framework/coverage";
+import { updateCoverage, computeWeightedSummary, getLastRunPaths } from "./framework/coverage";
+import { loadPersonaPack, formatPackForPrompt, type PersonaPack } from "./framework/persona-pack";
 import { buildTrackers } from "./framework/trackers/index";
 import {
   setupObservation,
@@ -231,6 +232,10 @@ function makeExecutor(agentLog: AgentLog, scenarioOutcomes: ScenarioOutcome[], s
             `**Regression:** #${original_issue_number} "${original_issue_title}" has reappeared.\n\n${body}\n\n---\n*This issue was auto-generated by an AI regression agent*`,
             ["regression", "feedback-agent"]
           );
+          await trackers.commentOnIssue(
+            original_issue_number,
+            `⚠️ **Regression detected** by AI agent on ${new Date().toISOString().slice(0, 10)}\n\n${body}${url ? `\n\nNew issue: ${url}` : ""}`
+          );
           const check: RegressionCheck = {
             issueNumber: Number(original_issue_number),
             issueTitle: String(original_issue_title),
@@ -248,6 +253,10 @@ function makeExecutor(agentLog: AgentLog, scenarioOutcomes: ScenarioOutcome[], s
           const { original_issue_number, original_issue_title, note } = input as {
             original_issue_number: number; original_issue_title: string; note: string;
           };
+          await trackers.commentOnIssue(
+            original_issue_number,
+            `✅ **Verified as fixed** by AI agent on ${new Date().toISOString().slice(0, 10)}\n\n${note}`
+          );
           agentLog.regressionChecks.push({
             issueNumber: Number(original_issue_number),
             issueTitle: String(original_issue_title),
@@ -304,6 +313,7 @@ async function runExplorer(
     status: "completed",
     iterations: 0,
     actions: [],
+    visitedPaths: [],
     issuesPosted: [],
     regressionChecks: [],
     error: null,
@@ -357,6 +367,7 @@ async function runRegressionAgent(
     status: "completed",
     iterations: 0,
     actions: [],
+    visitedPaths: [],
     issuesPosted: [],
     regressionChecks: [],
     error: null,
@@ -405,6 +416,16 @@ const PERSONA_DESIGNER_TOOLS: Anthropic.Tool[] = [
     description: "Get a weighted summary of what has been explored across past runs. Use this to identify underrepresented lenses and perspectives before deciding whom to hire. / 過去のrunで何がどれだけ探索されたかの重み付きサマリーを取得する。採用方針の決定前に確認すること",
     input_schema: { type: "object", properties: {}, required: [] },
   },
+  {
+    name: "get_path_coverage",
+    description: "Get the list of URL paths visited in the previous run. Use this to identify unexplored areas of the app and recruit agents likely to visit NEW paths. / 前回のrunで訪れたURLパス一覧を取得する。未探索エリアを特定し、新しいパスを訪れる可能性の高いペルソナを採用するために使う",
+    input_schema: { type: "object", properties: {}, required: [] },
+  },
+  {
+    name: "get_persona_templates",
+    description: "Get the persona template pack defined for this project. Prefer these archetypes when adding agents — adapt names/details to fit the app context but keep the role intact. / このプロジェクト用に定義されたペルソナテンプレート一覧を取得する。エージェントを追加する際はまずこのテンプレートから選ぶこと",
+    input_schema: { type: "object", properties: {}, required: [] },
+  },
   {
     name: "get_open_issues",
     description: "Get the titles and labels of currently open GitHub Issues (known problems). Use this to understand what is already known and recruit agents who are likely to explore DIFFERENT areas. / 現在オープンなGitHub Issueのタイトルとラベルを取得する。既知の問題を把握し、未探索領域を掘れるペルソナを採用するために使う",
@@ -448,6 +469,8 @@ async function runPersonaDesigner(
   openIssues: { number: number | string; title: string; labels: string[] }[],
   scenarios: Scenario[],
   testAccounts: TestAccount[] = [],
+  lastRunPaths: { visitedPaths: string[]; runId: string } | null = null,
+  personaPack: PersonaPack | null = null,
 ): Promise<void> {
   console.log("\n[persona-designer] starting...");
   const messages: Anthropic.MessageParam[] = [
@@ -458,6 +481,14 @@ async function runPersonaDesigner(
     ? `\n[Available Test Accounts (one per role)]\n${testAccounts.map((a) => `- ${a.role}: ${a.email}`).join("\n")}\nWhen recruiting agents, match each persona's role to one of these accounts so they can operate with appropriate permissions.`
     : "";
+  const pathCoverageStep = lastRunPaths
+    ? "3. Call get_path_coverage to see which URL paths were visited last run — recruit agents whose role would naturally take them to DIFFERENT or unexplored paths"
+    : "3. (No previous run data yet — skip get_path_coverage)";
+  const personaTemplateStep = personaPack
+    ? "2. Call get_persona_templates to get project-specific persona archetypes — prefer these over inventing new personas from scratch"
+    : "2. (No persona templates configured — invent personas that fit the app context)";
   const systemPrompt = `You are the persona designer for "${productSpec.appName}".
 You create and manage test agents that simulate real users of the app.
@@ -466,11 +497,13 @@ ${orgGuidance}${accountContext}
 [Steps]
 1. Call get_coverage to review which lenses and categories are underrepresented in past runs
-2. Call get_open_issues to understand what problems are already known — recruit agents likely to find DIFFERENT issues in unexplored areas
-3. Call get_scenarios to see the user test scenarios generated for this run — about 70% of agents will be assigned a scenario, so recruit personas whose background fits those scenarios
-4. Call get_agents to check the current agent roster
-5. Add 2–3 agents with add_agent — balance between scenario-fit personas (step 3), underrepresented lenses (step 1), and unexplored areas (step 2)${testAccounts.length > 0 ? "\n   — assign each agent a role that matches one of the available test accounts" : ""}
-6. If there are agents with old createdAt dates (oldest 1–2), retire them with retire_agent`;
+${personaTemplateStep}
+${pathCoverageStep}
+4. Call get_open_issues to understand what problems are already known — recruit agents likely to find DIFFERENT issues in unexplored areas
+5. Call get_scenarios to see the user test scenarios generated for this run — about 70% of agents will be assigned a scenario, so recruit personas whose background fits those scenarios
+6. Call get_agents to check the current agent roster
+7. Add 2–3 agents with add_agent — balance between scenario-fit personas (step 5), underrepresented lenses (step 1), unexplored paths (step 3), and unexplored areas (step 4)${testAccounts.length > 0 ? "\n   — assign each agent a role that matches one of the available test accounts" : ""}
+8. If there are agents with old createdAt dates (oldest 1–2), retire them with retire_agent`;
   try {
     let iterations = 0;
@@ -494,6 +527,20 @@ ${orgGuidance}${accountContext}
         if (toolUse.name === "get_coverage") {
           result = computeWeightedSummary().formatted;
           console.log("  [persona-designer] coverage summary fetched");
+        } else if (toolUse.name === "get_persona_templates") {
+          if (!personaPack) {
+            result = "(no persona templates configured — set SHOAL_PERSONAS env var or add personas.yaml to your project)";
+          } else {
+            result = formatPackForPrompt(personaPack);
+          }
+          console.log(`  [persona-designer] persona templates fetched (${personaPack?.personas.length ?? 0})`);
+        } else if (toolUse.name === "get_path_coverage") {
+          if (!lastRunPaths || lastRunPaths.visitedPaths.length === 0) {
+            result = "(no path coverage data yet — this is the first run or no paths were recorded)";
+          } else {
+            result = `Paths visited in last run (${lastRunPaths.runId}):\n${lastRunPaths.visitedPaths.map((p) => `- ${p}`).join("\n")}\n\nRecruit agents whose role naturally takes them to paths NOT in this list.`;
+          }
+          console.log(`  [persona-designer] path coverage fetched (${lastRunPaths?.visitedPaths.length ?? 0} paths)`);
         } else if (toolUse.name === "get_open_issues") {
           if (openIssues.length === 0) {
             result = "(no open issues — either GitHub is not configured or there are no known issues yet)";
@@ -555,6 +602,7 @@ interface BrowserAgentLog {
   status: "completed" | "error" | "iteration_limit";
   iterations: number;
   actions: BrowserAction[];
+  visitedPaths: string[];
   feedbacksSaved: { title: string; category: string; findingId: string }[];
   error: string | null;
 }
@@ -690,6 +738,7 @@ async function executeBrowserTool(
         await page.goto(`${BASE_URL}${navPath}`, { waitUntil: "networkidle" });
         await page.waitForTimeout(3000);
         screenshot = await takeScreenshot(page, `navigate_${navPath.replace(/\//g, "_")}`);
+        agentLog.visitedPaths.push(navPath);
         resultText = `Navigated to ${navPath}`;
         break;
       }
@@ -870,6 +919,7 @@ async function runBrowserAgent(
     status: "completed",
     iterations: 0,
     actions: [],
+    visitedPaths: [],
     feedbacksSaved: [],
     error: null,
   };
@@ -1102,7 +1152,9 @@ async function main() {
     }
     // 4. HR agent
-    await runPersonaDesigner(productSpec, orgDesign.personaGuidance, openIssues, scenarios, testAccounts);
+    const lastRunPaths = getLastRunPaths();
+    const personaPack = await loadPersonaPack();
+    await runPersonaDesigner(productSpec, orgDesign.personaGuidance, openIssues, scenarios, testAccounts, lastRunPaths, personaPack);
     // 5. load agents + closed issues
     const allAgents = loadAgents();
@@ -1159,7 +1211,7 @@ async function main() {
     browserAgents.forEach((a) => console.log(`  - ${a.name} (${a.role})`));
     await sleep(2000);
-    await Promise.all(
+    const browserLogs = await Promise.all(
       browserAgents.map(async (agent) => {
         const assignment = pickAssignment(dispatchIdx++, scenarios);
         agentAssignments.set(agent.id, assignment);
@@ -1182,6 +1234,7 @@ async function main() {
         }
       })
     );
+    const allVisitedPaths = browserLogs.flatMap((log) => log.visitedPaths);
     // 8. triage (API + browser findings)
     await sleep(2000);
@@ -1199,7 +1252,7 @@ async function main() {
     console.log(`\n[report] ${reportPath}`);
     // 10. update coverage
-    updateCoverage(runLog.runId, collectedFindings, agentAssignments);
+    updateCoverage(runLog.runId, collectedFindings, agentAssignments, allVisitedPaths);
   } finally {
     await browser.close();