npm - livepilot - Versions diffs - 1.10.9 → 1.13.0 - Mend

livepilot 1.10.9 → 1.13.0

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (61)

package/CHANGELOG.md +327 -0
package/README.md +7 -7
package/m4l_device/LivePilot_Analyzer.amxd +0 -0
package/m4l_device/livepilot_bridge.js +1 -1
package/mcp_server/__init__.py +1 -1
package/mcp_server/branches/__init__.py +32 -0
package/mcp_server/branches/types.py +230 -0
package/mcp_server/composer/__init__.py +10 -1
package/mcp_server/composer/branch_producer.py +229 -0
package/mcp_server/evaluation/policy.py +129 -2
package/mcp_server/experiment/engine.py +47 -11
package/mcp_server/experiment/models.py +72 -7
package/mcp_server/experiment/tools.py +231 -35
package/mcp_server/m4l_bridge.py +488 -13
package/mcp_server/memory/taste_graph.py +84 -11
package/mcp_server/persistence/taste_store.py +21 -5
package/mcp_server/runtime/execution_router.py +7 -0
package/mcp_server/runtime/mcp_dispatch.py +32 -0
package/mcp_server/runtime/remote_commands.py +54 -0
package/mcp_server/runtime/session_kernel.py +46 -0
package/mcp_server/runtime/tools.py +29 -3
package/mcp_server/sample_engine/slice_classifier.py +169 -0
package/mcp_server/server.py +11 -3
package/mcp_server/synthesis_brain/__init__.py +53 -0
package/mcp_server/synthesis_brain/adapters/__init__.py +34 -0
package/mcp_server/synthesis_brain/adapters/analog.py +167 -0
package/mcp_server/synthesis_brain/adapters/base.py +86 -0
package/mcp_server/synthesis_brain/adapters/drift.py +166 -0
package/mcp_server/synthesis_brain/adapters/meld.py +151 -0
package/mcp_server/synthesis_brain/adapters/operator.py +169 -0
package/mcp_server/synthesis_brain/adapters/wavetable.py +228 -0
package/mcp_server/synthesis_brain/engine.py +91 -0
package/mcp_server/synthesis_brain/models.py +121 -0
package/mcp_server/synthesis_brain/timbre.py +194 -0
package/mcp_server/tools/_conductor.py +144 -0
package/mcp_server/tools/analyzer.py +187 -7
package/mcp_server/tools/clips.py +65 -0
package/mcp_server/tools/devices.py +517 -5
package/mcp_server/tools/diagnostics.py +42 -0
package/mcp_server/tools/follow_actions.py +202 -0
package/mcp_server/tools/grooves.py +142 -0
package/mcp_server/tools/miditool.py +280 -0
package/mcp_server/tools/scales.py +126 -0
package/mcp_server/tools/take_lanes.py +135 -0
package/mcp_server/tools/tracks.py +46 -3
package/mcp_server/tools/transport.py +62 -1
package/mcp_server/wonder_mode/engine.py +324 -0
package/mcp_server/wonder_mode/tools.py +153 -1
package/package.json +2 -2
package/remote_script/LivePilot/__init__.py +8 -4
package/remote_script/LivePilot/clips.py +62 -0
package/remote_script/LivePilot/devices.py +444 -0
package/remote_script/LivePilot/diagnostics.py +52 -1
package/remote_script/LivePilot/follow_actions.py +235 -0
package/remote_script/LivePilot/grooves.py +185 -0
package/remote_script/LivePilot/scales.py +138 -0
package/remote_script/LivePilot/take_lanes.py +175 -0
package/remote_script/LivePilot/tracks.py +59 -1
package/remote_script/LivePilot/transport.py +90 -1
package/remote_script/LivePilot/version_detect.py +9 -0
package/server.json +3 -3

package/mcp_server/experiment/tools.py CHANGED

@@ -16,6 +16,7 @@ from typing import Optional
 from fastmcp import Context
 from ..server import mcp
+from ..branches import BranchSeed
 from . import engine
 from .models import BranchSnapshot
 import logging
@@ -63,18 +64,71 @@ def create_experiment(
     request_text: str,
     move_ids: Optional[list] = None,
     limit: int = 3,
+    seeds: Optional[list] = None,
+    compiled_plans: Optional[list] = None,
 ) -> dict:
     """Create an experiment set to compare multiple approaches.
-    If move_ids is provided, creates one branch per move.
-    Otherwise, uses propose_next_best_move to find candidates.
+    Three input modes (in priority order):
-    request_text: what the user wants (e.g., "make this punchier")
-    move_ids: specific moves to try (e.g., ["make_punchier", "tighten_low_end"])
-    limit: max branches when auto-proposing (default 3)
+    1. seeds (PR3+): a list of BranchSeed dicts. Each seed becomes one branch.
+       compiled_plans (optional parallel list) attaches pre-compiled plans
+       for freeform / synthesis / composer producers. Seed dict shape:
+         {seed_id, source, move_id, hypothesis, protected_qualities,
+          affected_scope, distinctness_reason, risk_label, novelty_label,
+          analytical_only}
+       Missing fields default per BranchSeed. This is the canonical path
+       for producers that have already done their own selection work.
+    2. move_ids: legacy path — one semantic_move seed per move_id.
+       Unchanged behavior; internally delegates to the seeds path.
+    3. Auto-proposal: neither seeds nor move_ids provided. Scans the semantic
+       move registry by keyword overlap with request_text and takes the top
+       ``limit`` moves (default 3).
     Returns: experiment set with branch IDs ready for run_experiment.
     """
+    # ── Mode 1: seeds provided ──────────────────────────────────────────
+    if seeds:
+        rehydrated: list[BranchSeed] = []
+        for i, s in enumerate(seeds):
+            if isinstance(s, BranchSeed):
+                rehydrated.append(s)
+            elif isinstance(s, dict):
+                try:
+                    rehydrated.append(BranchSeed(**s))
+                except TypeError as exc:
+                    return {"error": f"seeds[{i}] invalid: {exc}"}
+            else:
+                return {
+                    "error": (
+                        f"seeds[{i}] must be dict or BranchSeed, "
+                        f"got {type(s).__name__}"
+                    )
+                }
+        if compiled_plans is not None and len(compiled_plans) != len(rehydrated):
+            return {
+                "error": (
+                    f"compiled_plans length ({len(compiled_plans)}) must match "
+                    f"seeds length ({len(rehydrated)})"
+                )
+            }
+        ableton = _get_ableton(ctx)
+        ableton.send_command("get_session_info")
+        kernel_id = f"kern_{int(time.time())}"
+        experiment = engine.create_experiment_from_seeds(
+            request_text=request_text,
+            seeds=rehydrated,
+            kernel_id=kernel_id,
+            compiled_plans=compiled_plans,
+        )
+        return experiment.to_dict()
+    # ── Mode 2/3: legacy move_ids path ──────────────────────────────────
     if not move_ids:
         # Auto-propose moves from the registry
         from ..semantic_moves import registry
@@ -119,19 +173,30 @@ def create_experiment(
 async def run_experiment(
     ctx: Context,
     experiment_id: str,
+    exploration_rules: bool = False,
 ) -> dict:
     """Run all pending branches in an experiment.
     For each branch:
     1. Compile the semantic move against current session
+       (skipped when branch.compiled_plan is already set — PR3+)
     2. Capture before state
-    3. Execute the compiled plan (through the async router — v1.10.3 truth)
+    3. Execute the compiled plan (through the async router)
     4. Capture after state
     5. Undo all successful steps (revert to checkpoint)
-    6. Evaluate the branch
+    6. Evaluate the branch and classify its outcome via evaluation.policy
     7. Record per-step results on branch.execution_log
     Branches run sequentially (Ableton has linear undo).
+    exploration_rules (PR7): when True, branches that fail technical gates
+    (score < 0.40, non-positive measurable delta) are classified as
+    "interesting_but_failed" instead of "failed" — they stay in the
+    experiment for audit but don't appear in the ranking. Protection
+    violations STILL force undo regardless of this flag — that's a safety
+    invariant, not a taste judgment.
+    Default False preserves pre-PR7 behavior exactly.
     """
     experiment = engine.get_experiment(experiment_id)
     if not experiment:
@@ -149,19 +214,54 @@ async def run_experiment(
         if branch.status != "pending":
             continue
-        # Compile the move
-        move = registry.get_move(branch.move_id)
-        if not move:
-            branch.status = "failed"
-            branch.score = 0.0
-            branch.evaluation = {"error": f"Move {branch.move_id} not found"}
-            results.append(branch.to_dict())
-            continue
-        session_info = ableton.send_command("get_session_info")
-        kernel = {"session_info": session_info, "mode": "explore"}
-        plan = compiler.compile(move, kernel)
-        compiled_dict = plan.to_dict()
+        # PR3: respect a pre-existing compiled_plan on the branch (freeform /
+        # synthesis / composer producers bring their own). Only compile from
+        # move_id when the branch arrived without a plan — which requires a
+        # semantic_move seed (or a legacy move-only branch).
+        compiled_dict = branch.compiled_plan
+        if compiled_dict is None:
+            # Analytical-only branches short-circuit — no plan to run.
+            # Marked with status="analytical" so ranked_branches()
+            # (which only surfaces "evaluated") excludes them, and
+            # commit_experiment refuses to re-apply them.
+            if branch.seed is not None and branch.seed.analytical_only:
+                branch.status = "analytical"
+                branch.score = 0.0
+                branch.evaluation = {
+                    "score": 0.0,
+                    "keep_change": False,
+                    "status": "analytical",
+                    "note": "analytical_only branch — no execution path",
+                }
+                results.append(branch.to_dict())
+                continue
+            if not branch.move_id:
+                branch.status = "failed"
+                branch.score = 0.0
+                branch.evaluation = {
+                    "error": (
+                        "Branch has no compiled_plan and no move_id — "
+                        "freeform producers must pre-populate compiled_plan"
+                    )
+                }
+                results.append(branch.to_dict())
+                continue
+            # Compile from semantic move
+            move = registry.get_move(branch.move_id)
+            if not move:
+                branch.status = "failed"
+                branch.score = 0.0
+                branch.evaluation = {"error": f"Move {branch.move_id} not found"}
+                results.append(branch.to_dict())
+                continue
+            session_info = ableton.send_command("get_session_info")
+            kernel = {"session_info": session_info, "mode": "explore"}
+            plan = compiler.compile(move, kernel)
+            compiled_dict = plan.to_dict()
         # Run the branch through the async router
         await engine.run_branch_async(
@@ -174,26 +274,78 @@ async def run_experiment(
             ctx=ctx,
         )
-        # Evaluate
+        # Evaluate — score via the inline heuristic, then classify via
+        # evaluation.policy for a unified keep/undo/interesting_but_failed
+        # decision (PR7).
+        from ..evaluation.policy import classify_branch_outcome
         def eval_fn(before, after):
-            # Simple heuristic evaluation when spectral data isn't available
+            # Simple heuristic evaluation when spectral data isn't available.
+            # protection_violated is rough — derived from whether any track
+            # went silent (signal lost on a track = protection violation).
             score = 0.5  # Neutral
+            protection_violated = False
+            lost_tracks = 0
             if before.get("track_meters") and after.get("track_meters"):
-                # Check all tracks still alive
                 before_alive = sum(1 for t in before["track_meters"] if t.get("level", 0) > 0)
                 after_alive = sum(1 for t in after["track_meters"] if t.get("level", 0) > 0)
-                if after_alive >= before_alive:
+                lost_tracks = max(0, before_alive - after_alive)
+                if lost_tracks == 0:
                     score += 0.1
                 else:
-                    score -= 0.2  # Lost a track
+                    score -= 0.2
+                    # A track going silent is a protection violation — always
+                    # undo regardless of exploration mode.
+                    protection_violated = True
             if before.get("spectrum") and after.get("spectrum"):
-                # Spectral balance improvement heuristic
-                score += 0.1  # Bonus for having spectral data
-            return {"score": round(score, 3), "keep_change": score > 0.45}
+                score += 0.1  # presence-of-data bonus
+            score = round(score, 3)
+            outcome = classify_branch_outcome(
+                score=score,
+                protection_violated=protection_violated,
+                # Minimal hard-rule inputs — the heuristic doesn't compute
+                # measurable_count / goal_progress deltas. target_count=0 and
+                # measurable_count=0 lets rule 1 defer to score-only judgment.
+                measurable_count=0,
+                target_count=0,
+                goal_progress=0.0,
+                exploration_rules=exploration_rules,
+            )
+            return {
+                "score": outcome.score,
+                "keep_change": outcome.keep_change,
+                "status": outcome.status,
+                "failure_reasons": outcome.failure_reasons,
+                "note": outcome.note,
+                "lost_tracks": lost_tracks,
+            }
         engine.evaluate_branch(branch, eval_fn)
+        # Promote the classified status onto the branch. ranked_branches()
+        # only surfaces status="evaluated", so branches the classifier
+        # rejected ("undo") or retained for audit ("interesting_but_failed")
+        # are both correctly excluded from winner recommendations.
+        # Without this mapping, a branch the hard-rule classifier explicitly
+        # rejected could still win a ranking and be re-applied by commit.
+        if branch.evaluation and branch.evaluation.get("status"):
+            status = branch.evaluation["status"]
+            if status == "keep":
+                branch.status = "evaluated"
+            elif status == "interesting_but_failed":
+                branch.status = "interesting_but_failed"
+            elif status == "undo":
+                # Undo-classified branches had their steps rolled back by
+                # run_branch_async's undo pass; they must NOT be eligible
+                # winners. "rejected" is a terminal branch status distinct
+                # from "failed" (execution failed) and distinct from
+                # "interesting_but_failed" (exploration-mode retention).
+                branch.status = "rejected"
         results.append(branch.to_dict())
     return {
@@ -221,6 +373,30 @@ def compare_experiments(
         return {"error": f"Experiment {experiment_id} not found"}
     ranked = experiment.ranked_branches()
+    # Surface non-winning branch categories separately. None of these are
+    # candidates for commit — ranked_branches() filters them out — but the
+    # user sees what was tried.
+    interesting_failed = [
+        b for b in experiment.branches if b.status == "interesting_but_failed"
+    ]
+    rejected = [
+        b for b in experiment.branches if b.status == "rejected"
+    ]
+    analytical = [
+        b for b in experiment.branches if b.status == "analytical"
+    ]
+    def _audit_row(b):
+        return {
+            "branch_id": b.branch_id,
+            "name": b.name,
+            "move_id": b.move_id,
+            "score": b.score,
+            "summary": b.compiled_plan.get("summary", "") if b.compiled_plan else "",
+            "evaluation": b.evaluation,
+        }
     return {
         "experiment_id": experiment_id,
         "request": experiment.request_text,
@@ -228,16 +404,14 @@ def compare_experiments(
         "ranking": [
             {
                 "rank": i + 1,
-                "branch_id": b.branch_id,
-                "name": b.name,
-                "move_id": b.move_id,
-                "score": b.score,
-                "summary": b.compiled_plan.get("summary", "") if b.compiled_plan else "",
-                "evaluation": b.evaluation,
+                **_audit_row(b),
             }
             for i, b in enumerate(ranked)
         ],
         "winner": ranked[0].to_dict() if ranked else None,
+        "interesting_but_failed": [_audit_row(b) for b in interesting_failed],
+        "rejected": [_audit_row(b) for b in rejected],
+        "analytical": [_audit_row(b) for b in analytical],
     }
@@ -258,6 +432,28 @@ async def commit_experiment(
     if not experiment:
         return {"error": f"Experiment {experiment_id} not found"}
+    # Refuse to commit branches the classifier rejected or that were
+    # analytical-only. Those statuses exist specifically so callers
+    # can't route them into re-application, and ranked_branches()
+    # already excludes them — so reaching commit with such a branch
+    # means the caller is bypassing the ranking layer.
+    target = experiment.get_branch(branch_id)
+    if target is None:
+        return {"error": f"Branch {branch_id} not found"}
+    if target.status in ("rejected", "analytical", "failed"):
+        return {
+            "error": (
+                f"Cannot commit branch with status '{target.status}'. "
+                f"'rejected' = hard-rule classifier rolled back; "
+                f"'analytical' = no executable plan; "
+                f"'failed' = zero steps applied successfully. "
+                f"Use compare_experiments to see eligible winners "
+                f"(only status='evaluated' branches are ranking candidates)."
+            ),
+            "branch_id": branch_id,
+            "branch_status": target.status,
+        }
     ableton = _get_ableton(ctx)
     bridge = ctx.lifespan_context.get("m4l")
     mcp_registry = ctx.lifespan_context.get("mcp_dispatch", {})