npm - agent-scenario-loop - Versions diffs - 0.1.1 → 0.1.3 - Mend

agent-scenario-loop 0.1.1 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (69) hide show

package/README.md +15 -9
package/app/profile-session.ts +98 -4
package/dist/core/agent-summary.d.ts +3 -2
package/dist/core/agent-summary.js +44 -2
package/dist/core/artifact-contract.d.ts +22 -4
package/dist/core/artifact-contract.js +512 -11
package/dist/core/comparison.d.ts +57 -3
package/dist/core/comparison.js +113 -1
package/dist/core/planner.d.ts +32 -1
package/dist/core/planner.js +144 -0
package/dist/core/run-index.d.ts +4 -0
package/dist/core/run-index.js +55 -1
package/dist/core/schema-validator.d.ts +1 -0
package/dist/core/schema-validator.js +1 -0
package/dist/runner/compare-latest.d.ts +8 -4
package/dist/runner/compare-latest.js +24 -5
package/dist/runner/example-android-live.d.ts +10 -1
package/dist/runner/example-android-live.js +55 -0
package/dist/runner/example-ios-live.d.ts +10 -1
package/dist/runner/example-ios-live.js +55 -0
package/dist/runner/init-project.d.ts +4 -1
package/dist/runner/init-project.js +26 -4
package/dist/runner/ios-simctl.d.ts +5 -0
package/dist/runner/ios-simctl.js +6 -0
package/dist/runner/live-comparison.d.ts +2 -2
package/dist/runner/live-comparison.js +2 -1
package/dist/runner/live-proof-summary.d.ts +5 -4
package/dist/runner/live-proof-summary.js +12 -2
package/dist/runner/live-proof.d.ts +3 -2
package/dist/runner/live-proof.js +9 -2
package/dist/runner/profile-android.d.ts +5 -0
package/dist/runner/profile-android.js +148 -24
package/dist/runner/profile-ios.d.ts +11 -1
package/dist/runner/profile-ios.js +128 -9
package/dist/runner/profile-mobile.d.ts +8 -0
package/dist/runner/profile-mobile.js +267 -28
package/docs/adapters.md +4 -0
package/docs/api.md +1 -1
package/docs/architecture.md +90 -0
package/docs/authoring.md +7 -1
package/docs/concepts.md +3 -24
package/docs/consumer-rehearsal.md +4 -0
package/docs/contracts.md +30 -100
package/docs/external-adapter-protocol.md +219 -0
package/docs/live-proofs.md +83 -2
package/docs/principles.md +9 -15
package/examples/mobile-app/README.md +12 -0
package/examples/mobile-app/runner-manifests/primary-runner.json +1 -0
package/examples/runners/README.md +1 -0
package/examples/runners/adb-android.json +1 -0
package/examples/runners/agent-device-android.json +1 -0
package/examples/runners/agent-device-ios.json +1 -0
package/examples/runners/argent-android.json +1 -0
package/examples/runners/argent-ios.json +1 -0
package/examples/runners/xcodebuildmcp-ios.json +1 -0
package/package.json +2 -1
package/schemas/causal-run.schema.json +85 -2
package/schemas/comparison.schema.json +130 -2
package/schemas/external-adapter-message.schema.json +693 -0
package/schemas/health.schema.json +72 -0
package/schemas/live-proof-set.schema.json +1 -1
package/schemas/live-proof.schema.json +14 -6
package/schemas/manifest.schema.json +442 -1
package/schemas/runner-capabilities.schema.json +20 -0
package/schemas/scenario.schema.json +16 -0
package/templates/primary-runner.json +1 -0
package/templates/skills/agent-scenario-loop/SKILL.md +93 -0
package/templates/skills/agent-scenario-loop/references/adoption-checklist.md +17 -0
package/templates/skills/agent-scenario-loop/references/artifact-interpretation.md +26 -0

package/README.md CHANGED Viewed

@@ -14,12 +14,14 @@ Execution tools can change. The scenario and evidence contract should not.
 | --- | --- |
 | Understand the idea in plain language | [Concepts](docs/concepts.md) |
 | Understand the project doctrine | [Principles](docs/principles.md) |
-| Write your first scenario | [Scenario Authoring](docs/authoring.md) |
-| Rehearse adoption in an existing app | [Consumer App Rehearsal](docs/consumer-rehearsal.md) |
+| Understand why ASL is a protocol, not a TypeScript-only library | [Architecture](docs/architecture.md) |
+| Implement or evaluate an out-of-process adapter in any language | [External Adapter Protocol](docs/external-adapter-protocol.md) |
 | Inspect artifacts, schemas, and supported surfaces | [Contracts](docs/contracts.md) |
-| Use the package from code | [Public API](docs/api.md) |
+| Write your first scenario | [Scenario Authoring](docs/authoring.md) |
 | Add a runner or evidence provider | [Adapter Onboarding](docs/adapters.md) |
+| Rehearse adoption in an existing app | [Consumer App Rehearsal](docs/consumer-rehearsal.md) |
 | Run fixture, Android, or iOS proofs | [Live Proofs](docs/live-proofs.md) |
+| Use the package from code | [Public API](docs/api.md) |
 | Inspect runner behavior and limits | [Runner docs](runner/README.md) |
 | Explore the neutral dogfood app | [examples/mobile-app](examples/mobile-app/README.md) |
 | See runner and provider fixtures | [examples/runners](examples/runners/README.md) |
@@ -43,6 +45,12 @@ Install or use the package, then scaffold a first scenario inside an app:
 asl-init --out . --scenario first-journey
 ```
+Add the optional repository-scoped agent skill when you want Codex to load ASL operating guidance from the consuming app:
+```bash
+asl-init --out . --scenario first-journey --with-agent-skill
+```
 Wire the generated app helper, emit truth events around one real journey, merge the generated `asl:*` scripts intentionally, then validate the project:
 ```bash
@@ -67,12 +75,6 @@ No simulator or device available yet? Run the fixture loop:
 pnpm demo:loop -- --out artifacts/demo-loop
 ```
-Read next:
-- [Scenario Authoring](docs/authoring.md) for scenario shape and truth events
-- [Consumer App Rehearsal](docs/consumer-rehearsal.md) for adoption in an existing app
-- [Live Proofs](docs/live-proofs.md) for Android, iOS, comparison, and release-proof paths
 ## Package Surface
 The root package exports stable core contracts:
@@ -117,3 +119,7 @@ pnpm release:check
 ```
 The package should remain product-neutral. Product-specific selectors, routes, auth assumptions, accounts, and scenario data belong in the consuming app, not in this repository.
+## Read next
+- [Concepts](docs/concepts.md) for the plain-language model

package/app/profile-session.ts CHANGED Viewed

@@ -12,11 +12,16 @@ export type ProfileSessionState = {
 export type ProfileSessionCommand = {
   id: string;
+  commandId?: string;
   scenario?: string;
   runId?: string;
   command: string;
+  queueId?: string;
+  sequence?: number;
   source?: 'deeplink' | 'storage';
   timestamp: number;
+  waitForMilestone?: string;
+  waitTimeoutMs?: number;
 };
 export type ProfileSignalKind = 'js' | 'memory' | 'network';
@@ -65,7 +70,16 @@ type StoredProfileSessionEntry = {
   startedAt?: number;
   stoppedAt?: number;
   command?: string;
+  commandId?: string;
   id?: string;
+  queueId?: string;
+  reason?: string;
+  result?: string;
+  sequence?: number;
+  source?: 'deeplink' | 'storage';
+  status?: 'received' | 'queued' | 'delivered' | 'completed' | 'skipped';
+  waitForMilestone?: string;
+  waitTimeoutMs?: number;
 };
 type StoredProfileSignals = Record<ProfileSignalKind, Record<string, unknown>>;
@@ -316,6 +330,41 @@ function logProfileSession(kind: 'start' | 'stop' | 'command', payload: Record<s
     if (typeof payload.id === 'string') {
       entry.id = payload.id;
     }
+    if (typeof payload.commandId === 'string') {
+      entry.commandId = payload.commandId;
+    } else if (typeof payload.id === 'string') {
+      entry.commandId = payload.id;
+    }
+    if (typeof payload.queueId === 'string') {
+      entry.queueId = payload.queueId;
+    }
+    if (typeof payload.sequence === 'number') {
+      entry.sequence = payload.sequence;
+    }
+    if (payload.source === 'deeplink' || payload.source === 'storage') {
+      entry.source = payload.source;
+    }
+    if (
+      payload.status === 'received' ||
+      payload.status === 'queued' ||
+      payload.status === 'delivered' ||
+      payload.status === 'completed' ||
+      payload.status === 'skipped'
+    ) {
+      entry.status = payload.status;
+    }
+    if (typeof payload.reason === 'string') {
+      entry.reason = payload.reason;
+    }
+    if (typeof payload.result === 'string') {
+      entry.result = payload.result;
+    }
+    if (typeof payload.waitForMilestone === 'string') {
+      entry.waitForMilestone = payload.waitForMilestone;
+    }
+    if (typeof payload.waitTimeoutMs === 'number') {
+      entry.waitTimeoutMs = payload.waitTimeoutMs;
+    }
   }
   appendStoredProfileSessionEntry(entry);
@@ -326,6 +375,11 @@ function getProfileSessionRoute(url: string): {
   scenario?: string;
   runId?: string;
   command?: string;
+  commandId?: string;
+  queueId?: string;
+  sequence?: number;
+  waitForMilestone?: string;
+  waitTimeoutMs?: number;
 } | null {
   const parsed = ExpoLinking.parse(url);
   const segments = [parsed.hostname, parsed.path]
@@ -347,8 +401,22 @@ function getProfileSessionRoute(url: string): {
     typeof parsed.queryParams?.runId === 'string' ? parsed.queryParams.runId : undefined;
   const command =
     typeof parsed.queryParams?.command === 'string' ? parsed.queryParams.command : undefined;
-  return { action, scenario, runId, command };
+  const commandId =
+    typeof parsed.queryParams?.commandId === 'string' ? parsed.queryParams.commandId : undefined;
+  const sequence =
+    typeof parsed.queryParams?.sequence === 'string' && Number.isInteger(Number(parsed.queryParams.sequence))
+      ? Number(parsed.queryParams.sequence)
+      : undefined;
+  const queueId =
+    typeof parsed.queryParams?.queueId === 'string' ? parsed.queryParams.queueId : undefined;
+  const waitForMilestone =
+    typeof parsed.queryParams?.waitForMilestone === 'string' ? parsed.queryParams.waitForMilestone : undefined;
+  const waitTimeoutMs =
+    typeof parsed.queryParams?.waitTimeoutMs === 'string' && Number.isInteger(Number(parsed.queryParams.waitTimeoutMs))
+      ? Number(parsed.queryParams.waitTimeoutMs)
+      : undefined;
+  return { action, scenario, runId, command, commandId, queueId, sequence, waitForMilestone, waitTimeoutMs };
 }
 function queuePendingProfileCommand(command: ProfileSessionCommand) {
@@ -456,17 +524,32 @@ function notifyProfileCommandListeners(command: ProfileSessionCommand) {
   const targetDispatched = dispatchProfileCommandTarget(command);
   if (targetDispatched) {
+    logProfileSession('command', {
+      ...command,
+      status: 'completed',
+      result: 'target-dispatched',
+    });
     return;
   }
   if (profileCommandListeners.size === 0) {
     queuePendingProfileCommand(command);
+    logProfileSession('command', {
+      ...command,
+      status: 'queued',
+      reason: 'no-command-listener',
+    });
     return;
   }
   for (const listener of profileCommandListeners) {
     listener(command);
   }
+  logProfileSession('command', {
+    ...command,
+    status: 'delivered',
+    result: 'listener-notified',
+  });
 }
 function flushPendingProfileCommands(listener: (command: ProfileSessionCommand) => void) {
@@ -560,10 +643,18 @@ export function applyProfileSessionUrl(url: string | null | undefined): boolean
       scenario: route.scenario,
       runId: route.runId,
       command: route.command,
+      ...(route.commandId ? { commandId: route.commandId } : {}),
+      ...(route.queueId ? { queueId: route.queueId } : {}),
+      ...(typeof route.sequence === 'number' ? { sequence: route.sequence } : {}),
       source: 'deeplink' as const,
       timestamp,
+      ...(route.waitForMilestone ? { waitForMilestone: route.waitForMilestone } : {}),
+      ...(typeof route.waitTimeoutMs === 'number' ? { waitTimeoutMs: route.waitTimeoutMs } : {}),
     };
-    logProfileSession('command', command);
+    logProfileSession('command', {
+      ...command,
+      status: 'received',
+    });
     notifyProfileCommandListeners(command);
     return true;
   }
@@ -776,7 +867,10 @@ export function useProfileSessionBootstrap(): void {
         }
         markProfileCommandIdProcessed(storageCommand);
-        logProfileSession('command', storageCommand);
+        logProfileSession('command', {
+          ...storageCommand,
+          status: 'received',
+        });
         notifyProfileCommandListeners(storageCommand);
       }
     };

package/dist/core/agent-summary.d.ts CHANGED Viewed

@@ -1,10 +1,10 @@
 /**
  * Builds the minimum agent-facing markdown summary for a run.
  *
- * @param {{health: Record<string, unknown>, verdict: Record<string, unknown>, comparison?: Record<string, unknown> | null}} options
+ * @param {{health: Record<string, unknown>, verdict: Record<string, unknown>, comparison?: Record<string, unknown> | null, manifest?: Record<string, unknown> | null}} options
  * @returns {string}
  */
-declare function buildAgentSummaryMarkdown({ health, verdict, comparison }: AgentSummaryInput): string;
+declare function buildAgentSummaryMarkdown({ health, verdict, comparison, manifest }: AgentSummaryInput): string;
 export { buildAgentSummaryMarkdown, };
 export type { AgentSummaryInput, SummaryRecord, };
 type SummaryRecord = Record<string, unknown>;
@@ -12,4 +12,5 @@ type AgentSummaryInput = {
     health: SummaryRecord;
     verdict: SummaryRecord;
     comparison?: SummaryRecord | null;
+    manifest?: SummaryRecord | null;
 };

package/dist/core/agent-summary.js CHANGED Viewed

@@ -122,13 +122,54 @@ function formatComparisonBasis(comparison) {
     }
     return lines;
 }
+/**
+ * Formats attempt terminal semantics for agent-readable summaries.
+ *
+ * @param {SummaryRecord | null | undefined} manifest
+ * @returns {string[]}
+ */
+function formatAttempt(manifest) {
+    const attempt = manifest?.attempt;
+    if (!attempt || typeof attempt !== 'object' || Array.isArray(attempt)) {
+        return [];
+    }
+    const attemptRecord = attempt;
+    const classification = attemptRecord.classification && typeof attemptRecord.classification === 'object' && !Array.isArray(attemptRecord.classification)
+        ? attemptRecord.classification
+        : {};
+    const cleanup = attemptRecord.cleanup && typeof attemptRecord.cleanup === 'object' && !Array.isArray(attemptRecord.cleanup)
+        ? attemptRecord.cleanup
+        : {};
+    const partialArtifacts = attemptRecord.partialArtifacts && typeof attemptRecord.partialArtifacts === 'object' && !Array.isArray(attemptRecord.partialArtifacts)
+        ? attemptRecord.partialArtifacts
+        : {};
+    const retryOfAttemptId = firstString([attemptRecord.retryOfAttemptId], '');
+    const retryReason = firstString([attemptRecord.retryReason], '');
+    const lines = [
+        '',
+        '## attempt',
+        '',
+        `- Attempt: ${code(firstString([attemptRecord.attemptId], 'unknown-attempt'))} (${attemptRecord.attemptNumber ?? 'unknown'}/${attemptRecord.maxAttempts ?? 'unknown'})`,
+        `- Terminal state: ${code(firstString([attemptRecord.terminalState], 'unknown'))}`,
+        `- Classification: ${code(firstString([classification.category], 'unknown'))}${classification.code ? ` ${code(classification.code)}` : ''}`,
+        `- Cleanup: ${code(firstString([cleanup.status], 'unknown'))}`,
+        `- Partial artifacts valid: ${partialArtifacts.valid === true ? 'true' : 'false'} - ${firstString([partialArtifacts.reason], 'no reason recorded')}`,
+    ];
+    if (retryOfAttemptId || retryReason) {
+        lines.push(`- Retry lineage: previous=${code(retryOfAttemptId || 'unknown')} reason=${retryReason || 'not recorded'}`);
+    }
+    if (Array.isArray(partialArtifacts.paths) && partialArtifacts.paths.length > 0) {
+        lines.push(`- Partial artifact paths: ${partialArtifacts.paths.map((item) => code(item)).join(', ')}`);
+    }
+    return lines;
+}
 /**
  * Builds the minimum agent-facing markdown summary for a run.
  *
- * @param {{health: Record<string, unknown>, verdict: Record<string, unknown>, comparison?: Record<string, unknown> | null}} options
+ * @param {{health: Record<string, unknown>, verdict: Record<string, unknown>, comparison?: Record<string, unknown> | null, manifest?: Record<string, unknown> | null}} options
  * @returns {string}
  */
-function buildAgentSummaryMarkdown({ health, verdict, comparison = null }) {
+function buildAgentSummaryMarkdown({ health, verdict, comparison = null, manifest = null }) {
     const scenarioId = firstString([health?.scenarioId, verdict?.scenarioId], 'unknown-scenario');
     const runId = firstString([health?.runId, verdict?.runId], 'unknown-run');
     const healthStatus = firstString([health?.healthStatus], 'failed');
@@ -169,6 +210,7 @@ function buildAgentSummaryMarkdown({ health, verdict, comparison = null }) {
     if (failedBudgets.length > 0) {
         lines.push('', '## failed budgets', '', ...failedBudgets);
     }
+    lines.push(...formatAttempt(manifest));
     if (comparison) {
         lines.push('', '## comparison', '', firstString([comparison.summary], 'No comparison summary provided.'));
         lines.push(...formatComparisonBasis(comparison));

package/dist/core/artifact-contract.d.ts CHANGED Viewed

@@ -8,6 +8,12 @@ type ProfileEvent = ArtifactRecord & {
     atMs?: number;
     timestamp?: number | string;
 };
+type ProfileSessionEntry = ArtifactRecord & {
+    kind?: string;
+    scenario?: string;
+    runId?: string;
+    timestamp?: number | string;
+};
 type BudgetCheck = {
     name: string;
     actual: unknown;
@@ -36,6 +42,17 @@ declare function extractProfileEvents(logText: string, filters?: {
     runId?: string;
     scenario?: string;
 }): ProfileEvent[];
+/**
+ * Extracts structured profile-session entries from device logs.
+ *
+ * @param {string} logText
+ * @param {{runId?: string, scenario?: string}} [filters]
+ * @returns {Record<string, unknown>[]}
+ */
+declare function extractProfileSessionEntries(logText: string, filters?: {
+    runId?: string;
+    scenario?: string;
+}): ProfileSessionEntry[];
 /**
  * Builds timing metrics from app-emitted profile events.
  *
@@ -75,8 +92,9 @@ declare function sortValue(value: any): any;
  * @param {{events: Record<string, unknown>[], startedAt?: string, phaseMap?: Record<string, string> | null, owner?: string | null}} options
  * @returns {Record<string, unknown>[]}
  */
-declare function buildCausalTimeline({ events, startedAt, phaseMap, owner, }: {
+declare function buildCausalTimeline({ events, sessionEntries, startedAt, phaseMap, owner, }: {
     events: ProfileEvent[];
+    sessionEntries?: ProfileSessionEntry[];
     startedAt?: string;
     phaseMap?: ArtifactRecord | null;
     owner?: string | null;
@@ -107,7 +125,7 @@ declare function buildCausalRun({ scenario, flowId, runId, platform, buildFlavor
  * @param {Record<string, unknown>} options
  * @returns {Record<string, unknown>}
  */
-declare function buildManifest({ scenario, scenarioHash, runId, platform, status, startedAt, endedAt, interactionDriver, comparisonLane, simulator, bundleId, gitSha, toolVersions, artifacts, failureReason, }: ArtifactRecord): ArtifactRecord;
+declare function buildManifest({ scenario, scenarioHash, runId, attemptId, attemptNumber, maxAttempts, retryOfAttemptId, retryReason, platform, status, terminalState, startedAt, endedAt, interactionDriver, comparisonLane, classification, cleanup, partialArtifacts, preconditions, postconditions, simulator, bundleId, gitSha, toolVersions, cohort, artifacts, failureReason, }: ArtifactRecord): ArtifactRecord;
 /**
  * Builds the human-readable profile summary.
  *
@@ -147,5 +165,5 @@ declare function evaluateUiContract({ rawDescription, requiredIdentifierPatterns
     checks: ArtifactRecord[];
     missingPatterns: string[];
 };
-export { PROFILE_EVENT_PREFIX, buildBudgetVerdict, buildCausalRun, buildCausalTimeline, buildManifest, buildMetricsFromProfileEvents, buildSummaryMarkdown, evaluateUiContract, evaluateProfileBudgets, extractCandidateIdentifiers, extractProfileEvents, findMatchingIdentifier, percentile, sortValue, };
-export type { ArtifactRecord, BudgetCheck, ProfileEvent, };
+export { PROFILE_EVENT_PREFIX, buildBudgetVerdict, buildCausalRun, buildCausalTimeline, buildManifest, buildMetricsFromProfileEvents, buildSummaryMarkdown, evaluateUiContract, evaluateProfileBudgets, extractCandidateIdentifiers, extractProfileEvents, extractProfileSessionEntries, findMatchingIdentifier, percentile, sortValue, };
+export type { ArtifactRecord, BudgetCheck, ProfileEvent, ProfileSessionEntry, };