@inspectr/mcplab 1.14.3 → 1.16.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/README.md +0 -35
- package/dist/app/assets/index-BSGuUMv-.js +254 -0
- package/dist/app/assets/index-Bekohuot.css +1 -0
- package/dist/app/index.html +2 -2
- package/dist/app-server/app-context.d.ts +0 -22
- package/dist/app-server/app-context.d.ts.map +1 -1
- package/dist/app-server/assistant-common.d.ts +37 -24
- package/dist/app-server/evals-routes.d.ts.map +1 -1
- package/dist/app-server/evals-routes.js +5 -41
- package/dist/app-server/evals-routes.js.map +1 -1
- package/dist/app-server/libraries-store.d.ts.map +1 -1
- package/dist/app-server/libraries-store.js +2 -3
- package/dist/app-server/libraries-store.js.map +1 -1
- package/dist/app-server/result-assistant-domain.d.ts +81 -65
- package/dist/app-server/result-assistant-domain.js +1 -2
- package/dist/app-server/result-assistant-domain.js.map +1 -1
- package/dist/app-server/result-assistant.d.ts.map +1 -1
- package/dist/app-server/result-assistant.js +7 -1
- package/dist/app-server/result-assistant.js.map +1 -1
- package/dist/app-server/router.d.ts.map +1 -1
- package/dist/app-server/router.js +0 -24
- package/dist/app-server/router.js.map +1 -1
- package/dist/app-server/runs-routes.d.ts +15 -4
- package/dist/app-server/runs-routes.d.ts.map +1 -1
- package/dist/app-server/runs-routes.js +189 -134
- package/dist/app-server/runs-routes.js.map +1 -1
- package/dist/app-server/runs-store.d.ts +6 -1
- package/dist/app-server/runs-store.d.ts.map +1 -1
- package/dist/app-server/runs-store.js +15 -1
- package/dist/app-server/runs-store.js.map +1 -1
- package/dist/app-server/scenario-assistant-domain.d.ts +144 -134
- package/dist/app-server/scenario-assistant-domain.d.ts.map +1 -1
- package/dist/app-server/scenario-assistant-domain.js +5 -8
- package/dist/app-server/scenario-assistant-domain.js.map +1 -1
- package/dist/app-server/scenario-assistant.d.ts.map +1 -1
- package/dist/app-server/scenario-assistant.js +7 -1
- package/dist/app-server/scenario-assistant.js.map +1 -1
- package/dist/app-server/snapshots-routes.d.ts +1 -13
- package/dist/app-server/snapshots-routes.d.ts.map +1 -1
- package/dist/app-server/snapshots-routes.js +9 -79
- package/dist/app-server/snapshots-routes.js.map +1 -1
- package/dist/app-server/types.d.ts +0 -2
- package/dist/app-server/types.d.ts.map +1 -1
- package/dist/cli.js +79 -288
- package/dist/cli.js.map +1 -1
- package/dist/interactive-helpers.d.ts +0 -1
- package/dist/interactive-helpers.d.ts.map +1 -1
- package/dist/interactive-helpers.js +0 -3
- package/dist/interactive-helpers.js.map +1 -1
- package/package.json +4 -4
- package/dist/app/assets/index-BBRB19an.js +0 -250
- package/dist/app/assets/index-DVQdbWhs.css +0 -1
package/README.md
CHANGED
|
@@ -446,40 +446,6 @@ mcplab watch -c examples/eval.yaml \
|
|
|
446
446
|
--agents claude-haiku,gpt-4o-mini
|
|
447
447
|
```
|
|
448
448
|
|
|
449
|
-
### Snapshot Baselines
|
|
450
|
-
|
|
451
|
-
Create a smart baseline from a fully passing run, then compare later runs against it:
|
|
452
|
-
|
|
453
|
-
```bash
|
|
454
|
-
# Create a snapshot (source run must be fully passing)
|
|
455
|
-
mcplab snapshot create --run 20260208-140213 --name "weather-api-baseline-v1"
|
|
456
|
-
|
|
457
|
-
# List snapshots
|
|
458
|
-
mcplab snapshot list
|
|
459
|
-
|
|
460
|
-
# Compare run against snapshot
|
|
461
|
-
mcplab snapshot compare --id <snapshotId> --run 20260208-150045
|
|
462
|
-
```
|
|
463
|
-
|
|
464
|
-
Optional: compare immediately after a run:
|
|
465
|
-
|
|
466
|
-
```bash
|
|
467
|
-
mcplab run -c mcplab/evals/eval.yaml --compare-snapshot <snapshotId>
|
|
468
|
-
```
|
|
469
|
-
|
|
470
|
-
Config-first snapshot eval workflow:
|
|
471
|
-
|
|
472
|
-
```bash
|
|
473
|
-
# Initialize snapshot eval policy in a config from a fully passing run
|
|
474
|
-
mcplab snapshot eval-init --config mcplab/evals/eval.yaml --run 20260208-140213 --name "baseline-v1"
|
|
475
|
-
|
|
476
|
-
# Update snapshot eval policy mode
|
|
477
|
-
mcplab snapshot eval-policy --config mcplab/evals/eval.yaml --enabled true --mode fail_on_drift
|
|
478
|
-
|
|
479
|
-
# Apply config snapshot policy during run (warn or fail_on_drift)
|
|
480
|
-
mcplab run -c mcplab/evals/eval.yaml --snapshot-eval
|
|
481
|
-
```
|
|
482
|
-
|
|
483
449
|
### Generate Reports
|
|
484
450
|
|
|
485
451
|
```bash
|
|
@@ -575,7 +541,6 @@ mcplab/
|
|
|
575
541
|
├── results/
|
|
576
542
|
│ ├── evaluation-runs/ # Run artifacts
|
|
577
543
|
│ └── tool-analysis/ # Saved tool analysis reports
|
|
578
|
-
├── snapshots/ # Snapshot baselines
|
|
579
544
|
├── reports/ # Custom markdown reports
|
|
580
545
|
├── servers.yaml # Library: shared server definitions
|
|
581
546
|
├── agents.yaml # Library: shared agent definitions
|