npm - agent-scenario-loop - Versions diffs - 0.1.2 → 0.1.3 - Mend

agent-scenario-loop 0.1.2 → 0.1.3

This diff compares the contents of two publicly available versions of a package as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (63)

package/README.md +9 -9
package/app/profile-session.ts +98 -4
package/dist/core/agent-summary.d.ts +3 -2
package/dist/core/agent-summary.js +44 -2
package/dist/core/artifact-contract.d.ts +22 -4
package/dist/core/artifact-contract.js +512 -11
package/dist/core/comparison.d.ts +57 -3
package/dist/core/comparison.js +113 -1
package/dist/core/planner.d.ts +32 -1
package/dist/core/planner.js +144 -0
package/dist/core/run-index.d.ts +4 -0
package/dist/core/run-index.js +55 -1
package/dist/core/schema-validator.d.ts +1 -0
package/dist/core/schema-validator.js +1 -0
package/dist/runner/compare-latest.d.ts +8 -4
package/dist/runner/compare-latest.js +24 -5
package/dist/runner/example-android-live.d.ts +10 -1
package/dist/runner/example-android-live.js +55 -0
package/dist/runner/example-ios-live.d.ts +10 -1
package/dist/runner/example-ios-live.js +55 -0
package/dist/runner/ios-simctl.d.ts +5 -0
package/dist/runner/ios-simctl.js +6 -0
package/dist/runner/live-comparison.d.ts +2 -2
package/dist/runner/live-comparison.js +2 -1
package/dist/runner/live-proof-summary.d.ts +5 -4
package/dist/runner/live-proof-summary.js +12 -2
package/dist/runner/live-proof.d.ts +3 -2
package/dist/runner/live-proof.js +9 -2
package/dist/runner/profile-android.d.ts +5 -0
package/dist/runner/profile-android.js +148 -24
package/dist/runner/profile-ios.d.ts +11 -1
package/dist/runner/profile-ios.js +128 -9
package/dist/runner/profile-mobile.d.ts +8 -0
package/dist/runner/profile-mobile.js +267 -28
package/docs/adapters.md +4 -0
package/docs/architecture.md +90 -0
package/docs/authoring.md +5 -1
package/docs/concepts.md +3 -24
package/docs/consumer-rehearsal.md +4 -0
package/docs/contracts.md +30 -100
package/docs/external-adapter-protocol.md +219 -0
package/docs/live-proofs.md +83 -2
package/docs/principles.md +9 -15
package/examples/mobile-app/README.md +12 -0
package/examples/mobile-app/runner-manifests/primary-runner.json +1 -0
package/examples/runners/README.md +1 -0
package/examples/runners/adb-android.json +1 -0
package/examples/runners/agent-device-android.json +1 -0
package/examples/runners/agent-device-ios.json +1 -0
package/examples/runners/argent-android.json +1 -0
package/examples/runners/argent-ios.json +1 -0
package/examples/runners/xcodebuildmcp-ios.json +1 -0
package/package.json +2 -1
package/schemas/causal-run.schema.json +85 -2
package/schemas/comparison.schema.json +130 -2
package/schemas/external-adapter-message.schema.json +693 -0
package/schemas/health.schema.json +72 -0
package/schemas/live-proof-set.schema.json +1 -1
package/schemas/live-proof.schema.json +14 -6
package/schemas/manifest.schema.json +442 -1
package/schemas/runner-capabilities.schema.json +20 -0
package/schemas/scenario.schema.json +16 -0
package/templates/primary-runner.json +1 -0

package/examples/runners/adb-android.json CHANGED Viewed

@@ -12,6 +12,7 @@
   ],
   "driverActions": ["tap", "scroll", "assertVisible", "inspectTree", "screenshot", "record", "readLogs"],
   "artifactOutputs": ["logs", "signals", "screenshot", "video", "uiTree"],
+  "uiContexts": ["app"],
   "lifecycle": [
     "prepare",
     "launch",

package/examples/runners/agent-device-android.json CHANGED Viewed

@@ -14,6 +14,7 @@
   ],
   "driverActions": ["tap", "scroll", "assertVisible", "inspectTree", "screenshot", "readLogs"],
   "artifactOutputs": ["logs", "signals", "screenshot", "uiTree"],
+  "uiContexts": ["app"],
   "lifecycle": [
     "prepare",
     "launch",

package/examples/runners/agent-device-ios.json CHANGED Viewed

@@ -14,6 +14,7 @@
   ],
   "driverActions": ["tap", "scroll", "assertVisible", "inspectTree", "screenshot", "readLogs"],
   "artifactOutputs": ["logs", "signals", "screenshot", "uiTree"],
+  "uiContexts": ["app"],
   "lifecycle": [
     "prepare",
     "launch",

package/examples/runners/argent-android.json CHANGED Viewed

@@ -14,6 +14,7 @@
   ],
   "driverActions": ["tap", "scroll", "assertVisible", "inspectTree", "screenshot"],
   "artifactOutputs": ["logs", "signals", "screenshot", "uiTree"],
+  "uiContexts": ["app"],
   "lifecycle": [
     "prepare",
     "launch",

package/examples/runners/argent-ios.json CHANGED Viewed

@@ -14,6 +14,7 @@
   ],
   "driverActions": ["tap", "scroll", "assertVisible", "inspectTree", "screenshot"],
   "artifactOutputs": ["logs", "signals", "screenshot", "uiTree"],
+  "uiContexts": ["app"],
   "lifecycle": [
     "prepare",
     "launch",

package/examples/runners/xcodebuildmcp-ios.json CHANGED Viewed

@@ -16,6 +16,7 @@
   ],
   "driverActions": ["tap", "scroll", "assertVisible", "inspectTree", "screenshot", "record", "readLogs"],
   "artifactOutputs": ["logs", "signals", "screenshot", "video", "uiTree", "accessibility"],
+  "uiContexts": ["app"],
   "lifecycle": [
     "prepare",
     "launch",

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "agent-scenario-loop",
-  "version": "0.1.2",
+  "version": "0.1.3",
   "private": false,
   "description": "Scenario orchestration and evidence collection for agent-driven software development. Bring your own runner. Keep your scenarios. Keep your evidence.",
   "license": "MIT",
@@ -200,6 +200,7 @@
     "app/profile-session.ts",
     "core/config-template.json",
     "dist",
+    "!dist/**/__tests__",
     "!dist/scripts",
     "docs",
     "examples",

package/schemas/causal-run.schema.json CHANGED Viewed

@@ -98,10 +98,26 @@
         }
       }
     },
+    "provenanceRef": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["manifest", "runId"],
+      "properties": {
+        "manifest": {
+          "type": "string"
+        },
+        "runId": {
+          "type": "string"
+        },
+        "scenarioHash": {
+          "type": "string",
+          "pattern": "^[a-f0-9]{64}$"
+        }
+      }
+    },
     "budgets": {
       "type": "object",
       "description": "Named budget thresholds the run should be evaluated against.",
-      "minProperties": 1,
       "additionalProperties": {
         "$ref": "#/$defs/budgetThreshold"
       }
@@ -112,6 +128,41 @@
         "$ref": "#/$defs/timelineEvent"
       }
     },
+    "iterationSummary": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["expected", "completed", "failed", "timeouts", "incomplete", "status"],
+      "properties": {
+        "expected": {
+          "type": "integer",
+          "minimum": 1
+        },
+        "completed": {
+          "type": "integer",
+          "minimum": 0
+        },
+        "failed": {
+          "type": "integer",
+          "minimum": 0
+        },
+        "timeouts": {
+          "type": "integer",
+          "minimum": 0
+        },
+        "incomplete": {
+          "type": "array",
+          "uniqueItems": true,
+          "items": {
+            "type": "integer",
+            "minimum": 1
+          }
+        },
+        "status": {
+          "type": "string",
+          "enum": ["complete", "partial", "failed", "timeout"]
+        }
+      }
+    },
     "artifacts": {
       "type": "object",
       "additionalProperties": false,
@@ -169,12 +220,31 @@
           "items": {
             "type": "object",
             "additionalProperties": false,
-            "required": ["channel", "kind", "path", "sha256", "sizeBytes", "sourceFileName"],
+            "required": [
+              "channel",
+              "completenessStatus",
+              "corruptionStatus",
+              "kind",
+              "path",
+              "redactionStatus",
+              "sha256",
+              "sizeBytes",
+              "sourceFileName",
+              "transformations"
+            ],
             "properties": {
               "channel": {
                 "type": "string",
                 "enum": ["capture", "provider", "signal"]
               },
+              "completenessStatus": {
+                "type": "string",
+                "enum": ["complete", "truncated", "unknown"]
+              },
+              "corruptionStatus": {
+                "type": "string",
+                "enum": ["valid", "corrupt", "unknown"]
+              },
               "kind": {
                 "type": "string",
                 "enum": ["accessibility", "js", "logs", "memory", "network", "profiler", "screenshot", "uiTree", "video"]
@@ -183,6 +253,10 @@
                 "type": "string",
                 "minLength": 1
               },
+              "redactionStatus": {
+                "type": "string",
+                "enum": ["not-redacted", "redacted", "unknown"]
+              },
               "sha256": {
                 "type": "string",
                 "pattern": "^[a-f0-9]{64}$"
@@ -194,6 +268,15 @@
               "sourceFileName": {
                 "type": "string",
                 "minLength": 1
+              },
+              "transformations": {
+                "type": "array",
+                "minItems": 1,
+                "uniqueItems": true,
+                "items": {
+                  "type": "string",
+                  "enum": ["copied", "normalized", "redacted", "truncated", "compressed", "transcoded", "unknown"]
+                }
               }
             }
           }

package/schemas/comparison.schema.json CHANGED Viewed

@@ -33,7 +33,7 @@
     },
     "comparisonStatus": {
       "type": "string",
-      "enum": ["better", "worse", "unchanged", "mixed", "inconclusive"]
+      "enum": ["better", "worse", "unchanged", "mixed", "inconclusive", "low_confidence"]
     },
     "healthStatus": {
       "type": "string",
@@ -46,6 +46,9 @@
     "comparisonBasis": {
       "$ref": "#/$defs/comparisonBasis"
     },
+    "measurementPolicy": {
+      "$ref": "#/$defs/measurementPolicy"
+    },
     "metricComparisons": {
       "type": "array",
       "items": {
@@ -135,6 +138,10 @@
           "type": "string",
           "pattern": "^[a-f0-9]{64}$"
         },
+        "cohortHash": {
+          "type": "string",
+          "pattern": "^[a-f0-9]{64}$"
+        },
         "selectedRunDir": {
           "type": "string"
         },
@@ -159,6 +166,10 @@
         "trustedScenarioContractCandidates": {
           "type": "integer",
           "minimum": 0
+        },
+        "trustedCohortCandidates": {
+          "type": "integer",
+          "minimum": 0
         }
       }
     },
@@ -185,12 +196,129 @@
         },
         "status": {
           "type": "string",
-          "enum": ["better", "worse", "unchanged", "inconclusive"]
+          "enum": ["better", "worse", "unchanged", "inconclusive", "low_confidence"]
         },
         "notes": {
           "type": "string"
         }
       }
+    },
+    "measurementPolicy": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["baselineSelection", "samples", "tolerance", "confidence"],
+      "properties": {
+        "baselineSelection": {
+          "type": "object",
+          "additionalProperties": false,
+          "required": ["mode", "poisoningProtection"],
+          "properties": {
+            "mode": {
+              "type": "string",
+              "enum": ["explicit", "latestTrustedPrior"]
+            },
+            "poisoningProtection": {
+              "type": "object",
+              "additionalProperties": false,
+              "required": ["requirePassedHealth", "requirePassedVerdict", "requireMatchingScenarioId"],
+              "properties": {
+                "requirePassedHealth": {
+                  "type": "boolean"
+                },
+                "requirePassedVerdict": {
+                  "type": "boolean"
+                },
+                "requireMatchingScenarioId": {
+                  "type": "boolean"
+                },
+                "comparisonLane": {
+                  "type": "string"
+                },
+                "scenarioHash": {
+                  "type": "string",
+                  "pattern": "^[a-f0-9]{64}$"
+                },
+                "cohortHash": {
+                  "type": "string",
+                  "pattern": "^[a-f0-9]{64}$"
+                }
+              }
+            }
+          }
+        },
+        "samples": {
+          "type": "object",
+          "additionalProperties": false,
+          "required": ["baseline", "current"],
+          "properties": {
+            "baseline": {
+              "$ref": "#/$defs/samplePolicy"
+            },
+            "current": {
+              "$ref": "#/$defs/samplePolicy"
+            }
+          }
+        },
+        "tolerance": {
+          "type": "object",
+          "additionalProperties": false,
+          "required": ["timing"],
+          "properties": {
+            "timing": {
+              "type": "object",
+              "additionalProperties": false,
+              "required": ["absoluteMs", "relative"],
+              "properties": {
+                "absoluteMs": {
+                  "type": "number",
+                  "minimum": 0
+                },
+                "relative": {
+                  "type": "number",
+                  "minimum": 0
+                }
+              }
+            }
+          }
+        },
+        "confidence": {
+          "type": "object",
+          "additionalProperties": false,
+          "required": ["level", "minValidSamples"],
+          "properties": {
+            "level": {
+              "type": "string",
+              "enum": ["single_run", "multi_sample", "insufficient", "low_confidence"]
+            },
+            "minValidSamples": {
+              "type": "integer",
+              "minimum": 1
+            },
+            "reason": {
+              "type": "string"
+            }
+          }
+        }
+      }
+    },
+    "samplePolicy": {
+      "type": "object",
+      "additionalProperties": false,
+      "required": ["validSamples", "warmupSamples", "outliersExcluded"],
+      "properties": {
+        "validSamples": {
+          "type": "integer",
+          "minimum": 0
+        },
+        "warmupSamples": {
+          "type": "integer",
+          "minimum": 0
+        },
+        "outliersExcluded": {
+          "type": "integer",
+          "minimum": 0
+        }
+      }
     }
   }
 }