agentops-cockpit 0.9.7__tar.gz → 0.9.8__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/.gitignore +5 -1
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/Makefile +35 -6
- agentops_cockpit-0.9.8/PKG-INFO +172 -0
- agentops_cockpit-0.9.8/README.md +148 -0
- agentops_cockpit-0.9.8/docs/DEPLOYMENT.md +70 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/index.html +3 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/package.json +1 -1
- agentops_cockpit-0.9.8/public/AGENT_OPS_STORY.md +31 -0
- agentops_cockpit-0.9.8/public/AUDIT_SCENARIOS.md +101 -0
- agentops_cockpit-0.9.8/public/CHANGELOG.md +72 -0
- agentops_cockpit-0.9.8/public/COCKPIT_GUIDE.md +44 -0
- agentops_cockpit-0.9.8/public/DEPLOYMENT.md +70 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GEMINI.md +12 -6
- agentops_cockpit-0.9.8/public/GETTING_STARTED.md +62 -0
- agentops_cockpit-0.9.8/public/PRODUCTION_CHECKLIST.md +40 -0
- agentops_cockpit-0.9.8/public/README.md +140 -0
- agentops_cockpit-0.9.8/public/ROADMAP.md +59 -0
- agentops_cockpit-0.9.8/public/ROADMAP_V13.md +59 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_A2A_GUIDE.md +76 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_ARCH_REVIEW.md +50 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_AUDIT_GUIDE.md +110 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_COMMANDS_MASTER.md +106 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_FINOPS_GUIDE.md +104 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_INFRA_GUIDE.md +122 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_QUALITY_GUIDE.md +92 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_REDTEAM_GUIDE.md +86 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_UVX_MASTER.md +90 -0
- agentops_cockpit-0.9.8/public/TECHNICAL_UX_GUIDE.md +118 -0
- agentops_cockpit-0.9.8/public/arch-review-report.html +93 -0
- agentops_cockpit-0.9.8/public/compliance-evidence.md +262 -0
- agentops_cockpit-0.9.8/public/master-audit-report.html +4056 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/pyproject.toml +1 -1
- agentops_cockpit-0.9.8/src/App.tsx +43 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/a2ui/A2UIRenderer.tsx +16 -4
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/agent.py +104 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/cache/semantic_cache.py +10 -21
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/cli/main.py +243 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/eval/load_test.py +79 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/eval/quality_climber.py +142 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/eval/red_team.py +137 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/mcp_server.py +65 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/arch_review.py +240 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/base.py +50 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/behavioral.py +31 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/compliance.py +35 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/dependency.py +48 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/finops.py +48 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/graph.py +49 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/pivot.py +51 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/reasoning.py +67 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/reliability.py +53 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/security.py +87 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/sme_v12.py +76 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/sovereignty.py +74 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/auditors/sre_a2a.py +179 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/benchmarker.py +97 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/cost_optimizer.py +30 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/discovery.py +214 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/evidence_bridge.py +30 -63
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/frameworks.py +124 -1
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/git_portal.py +74 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/mcp_hub.py +56 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/orchestrator.py +617 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/policy_engine.py +85 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/reliability.py +139 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/remediator.py +54 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/secret_scanner.py +34 -22
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/swarm.py +17 -27
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/ui_auditor.py +67 -6
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/ops/watcher.py +109 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/watchlist.json +30 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/optimizer.py +262 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/tests/test_arch_review.py +6 -6
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_discovery.py +96 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_ops_core.py +56 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_orchestrator_fleet.py +73 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_persona_architect.py +75 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_persona_finops.py +31 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_persona_security.py +55 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_persona_sre.py +43 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_persona_ux.py +42 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/tests/test_quality_climber.py +2 -2
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_remediator.py +75 -0
- agentops_cockpit-0.9.8/src/agent_ops_cockpit/tests/test_ui_auditor.py +52 -0
- agentops_cockpit-0.9.8/src/components/AgentPulse.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/components/Home.tsx +37 -5
- agentops_cockpit-0.9.8/src/components/OperationalJourneys.tsx +567 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/docs/DocPage.tsx +11 -8
- agentops_cockpit-0.9.7/PKG-INFO +0 -246
- agentops_cockpit-0.9.7/README.md +0 -222
- agentops_cockpit-0.9.7/docs/DEPLOYMENT.md +0 -102
- agentops_cockpit-0.9.7/public/A2A_GUIDE.md +0 -58
- agentops_cockpit-0.9.7/public/AGENT_OPS_STORY.md +0 -48
- agentops_cockpit-0.9.7/public/BE_INTEGRATION_GUIDE.md +0 -35
- agentops_cockpit-0.9.7/public/CHANGELOG.md +0 -23
- agentops_cockpit-0.9.7/public/COCKPIT_GUIDE.md +0 -32
- agentops_cockpit-0.9.7/public/DEPLOYMENT.md +0 -102
- agentops_cockpit-0.9.7/public/GETTING_STARTED.md +0 -67
- agentops_cockpit-0.9.7/public/PRODUCTION_CHECKLIST.md +0 -45
- agentops_cockpit-0.9.7/public/README.md +0 -178
- agentops_cockpit-0.9.7/public/ROADMAP.md +0 -56
- agentops_cockpit-0.9.7/src/App.tsx +0 -38
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/agent.py +0 -142
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/cli/main.py +0 -291
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/eval/load_test.py +0 -96
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/eval/quality_climber.py +0 -147
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/eval/red_team.py +0 -104
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/mcp_server.py +0 -132
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/arch_review.py +0 -167
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/cost_optimizer.py +0 -39
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/mcp_hub.py +0 -79
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/orchestrator.py +0 -417
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/policy_engine.py +0 -85
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/reliability.py +0 -84
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/ops/watcher.py +0 -138
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/optimizer.py +0 -512
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/tests/test_optimizer.py +0 -68
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/tests/test_red_team.py +0 -35
- agentops_cockpit-0.9.7/src/agent_ops_cockpit/tests/test_secret_scanner.py +0 -24
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/Dockerfile +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/LICENSE +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/firebase.json +0 -0
- {agentops_cockpit-0.9.7/docs → agentops_cockpit-0.9.8/public}/A2A_GUIDE.md +0 -0
- {agentops_cockpit-0.9.7/docs → agentops_cockpit-0.9.8/public}/BE_INTEGRATION_GUIDE.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/CLI_COMMANDS.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/CONTRIBUTING.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/DEVELOPMENT.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GOOGLE_ARCHITECTURE.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GOVERNANCE_GUIDE.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_ARCH_REVIEW.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_AUDIT.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_DEPLOYMENT.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_LOAD_TEST.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_MCP.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_OPTIMIZER.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_POLICY.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_RED_TEAM.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/GUIDE_RELIABILITY.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/LIMITATIONS.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/OPTIMIZATION_GUIDE.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/PRD.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/SECURITY_GUIDE.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/assets/ecosystem.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/assets/trinity.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/assets/workflow.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/cicd-workflow.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/diagrams/agentic-stack.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/diagrams/value-proposition.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/hero.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/kokpi_branded.jpg +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/kokpi_kun.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/kokpi_simplistic.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/og-image.png +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/sample-report.html +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/public/sample-report.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/a2ui/components/index.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/a2ui/components/lit-component-example.ts +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/a2ui/types.ts +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/__init__.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/cache/__init__.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/cli/__init__.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/cost_control.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/eval/__init__.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/__init__.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/evidence.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/memory_optimizer.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/pii_scrubber.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/ops/policies.json +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/shadow/__init__.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/shadow/router.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/system_prompt.md +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/tests/golden_set.json +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/tests/test_agent.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/agent_ops_cockpit/tests/test_frameworks.py +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/components/FlightRecorder.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/components/OpsDashboard.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/components/ReportSamples.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/components/ThemeToggle.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/docs/DocHome.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/docs/DocLayout.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/index.css +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/knowledge/example_policy.txt +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/src/main.tsx +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/tsconfig.json +0 -0
- {agentops_cockpit-0.9.7 → agentops_cockpit-0.9.8}/vite.config.ts +0 -0
|
@@ -15,8 +15,14 @@ help:
|
|
|
15
15
|
@echo " make audit - [MASTER] Quick Safe-Build (uvx agentops-cockpit report --mode quick)"
|
|
16
16
|
@echo " make audit-deep - [MASTER] Deep System Audit (uvx agentops-cockpit report --mode deep)"
|
|
17
17
|
@echo " make optimizer-audit - [CODE] Quick code audit (uvx agentops-cockpit audit --quick)"
|
|
18
|
-
@echo " make
|
|
18
|
+
@echo " make arch-review - [ARCH] Reasoning-based architecture review (v1.0)"
|
|
19
|
+
@echo " make arch-review-export - [ARCH] Generate Executive v1.1 HTML Report"
|
|
20
|
+
@echo " make arch-benchmark - [ARCH] Run v1.2 Reliability Waterfall (Stress Test)"
|
|
21
|
+
@echo " make apply-fixes - [PHASE 4] Auto-remediate detected architectural gaps"
|
|
22
|
+
@echo " make propose-fixes - [PHASE 5] Create fix branch and commit remediations"
|
|
19
23
|
@echo " make reliability - Run unit tests and regression suite"
|
|
24
|
+
@echo " make smoke-test - [E2E] End-to-End Persona Journey smoke tests"
|
|
25
|
+
@echo " make regression - [FULL] Master Reliability + Smoke Tests"
|
|
20
26
|
@echo " make diagnose - [DevEx] System health check and env diagnosis"
|
|
21
27
|
@echo " make email-report - [GOV] Email the latest Persona-Approved report"
|
|
22
28
|
@echo " make red-team - Run adversarial security audit"
|
|
@@ -53,6 +59,14 @@ audit-all:
|
|
|
53
59
|
reliability:
|
|
54
60
|
@$(PYTHON) src/agent_ops_cockpit/ops/reliability.py
|
|
55
61
|
|
|
62
|
+
# 🧪 Smoke Test: E2E Persona Validation
|
|
63
|
+
smoke-test:
|
|
64
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/reliability.py --smoke
|
|
65
|
+
|
|
66
|
+
# 🚀 Regression: The Full Suite (Unit + Smoke)
|
|
67
|
+
regression:
|
|
68
|
+
@PYTHONPATH=src $(PYTHON) -c "from agent_ops_cockpit.ops.reliability import run_regression_suite; run_regression_suite()"
|
|
69
|
+
|
|
56
70
|
# 🩺 Diagnose: DevEx system check
|
|
57
71
|
diagnose:
|
|
58
72
|
@PYTHONPATH=src $(PYTHON) -m agent_ops_cockpit.cli.main diagnose
|
|
@@ -67,7 +81,23 @@ optimizer-audit-deep:
|
|
|
67
81
|
|
|
68
82
|
# 🏛️ Architecture: Design review against Google Well-Architected Framework
|
|
69
83
|
arch-review:
|
|
70
|
-
@$(PYTHON) src/agent_ops_cockpit/ops/arch_review.py
|
|
84
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/arch_review.py audit
|
|
85
|
+
|
|
86
|
+
# 🏛️ Executive: Generate v1.1 HTML Summary
|
|
87
|
+
arch-review-export:
|
|
88
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/arch_review.py audit --export
|
|
89
|
+
|
|
90
|
+
# 🌊 Reliability: v1.2 Automated Benchmarking
|
|
91
|
+
arch-benchmark:
|
|
92
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/arch_review.py benchmark --count 50
|
|
93
|
+
|
|
94
|
+
# 🚀 The Closer: Auto-remediation engine for architecture gaps
|
|
95
|
+
apply-fixes:
|
|
96
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/arch_review.py apply-fixes
|
|
97
|
+
|
|
98
|
+
# 🌿 The Ambassador: Autonomous PR Factory
|
|
99
|
+
propose-fixes:
|
|
100
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/arch_review.py propose-fixes
|
|
71
101
|
|
|
72
102
|
# 🧗 Quality: Iterative Hill Climbing optimization
|
|
73
103
|
quality-baseline:
|
|
@@ -79,7 +109,7 @@ scan-secrets:
|
|
|
79
109
|
|
|
80
110
|
# 🎨 UI/UX: Face Auditor for frontend quality
|
|
81
111
|
ui-audit:
|
|
82
|
-
@$(PYTHON) src/agent_ops_cockpit/ops/ui_auditor.py
|
|
112
|
+
@$(PYTHON) src/agent_ops_cockpit/ops/ui_auditor.py $(TARGET)
|
|
83
113
|
|
|
84
114
|
# 🔥 Red Team: Unleash self-hacking security audit
|
|
85
115
|
|
|
@@ -95,9 +125,8 @@ URL ?= http://localhost:8000/agent/query?q=healthcheck
|
|
|
95
125
|
load_test:
|
|
96
126
|
@$(PYTHON) src/agent_ops_cockpit/eval/load_test.py run --url $(URL) --requests $(REQUESTS) --concurrency $(CONCURRENCY)
|
|
97
127
|
|
|
98
|
-
# 🚀 Production: The Vercel-style 1-click deploy (using
|
|
99
|
-
deploy-prod:
|
|
100
|
-
|
|
128
|
+
# 🚀 Production: The Vercel-style 1-click deploy (using Full Regression Suite)
|
|
129
|
+
deploy-prod: regression build
|
|
101
130
|
@echo "📦 Containerizing and deploying to Cloud Run..."
|
|
102
131
|
gcloud run deploy $(SERVICE_NAME) --source . --region $(REGION) --allow-unauthenticated --port 80
|
|
103
132
|
@echo "🔥 Deploying frontend to Firebase..."
|
|
@@ -0,0 +1,172 @@
|
|
|
1
|
+
Metadata-Version: 2.4
|
|
2
|
+
Name: agentops-cockpit
|
|
3
|
+
Version: 0.9.8
|
|
4
|
+
Summary: Production-grade Agent Operations (AgentOps) Platform
|
|
5
|
+
Project-URL: Homepage, https://github.com/enriquekalven/agent-ops-cockpit
|
|
6
|
+
Project-URL: Bug Tracker, https://github.com/enriquekalven/agent-ops-cockpit/issues
|
|
7
|
+
Author-email: Enrique <enrique@example.com>
|
|
8
|
+
License-File: LICENSE
|
|
9
|
+
Classifier: License :: OSI Approved :: MIT License
|
|
10
|
+
Classifier: Operating System :: OS Independent
|
|
11
|
+
Classifier: Programming Language :: Python :: 3
|
|
12
|
+
Requires-Python: >=3.10
|
|
13
|
+
Requires-Dist: aiohttp>=3.9.0
|
|
14
|
+
Requires-Dist: fastapi>=0.100.0
|
|
15
|
+
Requires-Dist: gitpython>=3.1.0
|
|
16
|
+
Requires-Dist: mcp>=0.1.0
|
|
17
|
+
Requires-Dist: packaging>=23.0
|
|
18
|
+
Requires-Dist: pydantic>=2.0.0
|
|
19
|
+
Requires-Dist: rich>=13.0.0
|
|
20
|
+
Requires-Dist: tenacity>=8.0.0
|
|
21
|
+
Requires-Dist: typer>=0.9.0
|
|
22
|
+
Requires-Dist: uvicorn>=0.20.0
|
|
23
|
+
Description-Content-Type: text/markdown
|
|
24
|
+
|
|
25
|
+
# 🕹️ AgentOps Cockpit
|
|
26
|
+
|
|
27
|
+
<div align="center">
|
|
28
|
+
<img src="public/assets/trinity.png" alt="AgentOps Cockpit Trinity" width="100%" />
|
|
29
|
+
</div>
|
|
30
|
+
|
|
31
|
+
<div align="center">
|
|
32
|
+
<br />
|
|
33
|
+
<a href="https://agent-cockpit.web.app" target="_blank"><strong>🌐 Official Website & Live Demo</strong></a>
|
|
34
|
+
<br /><br />
|
|
35
|
+
<a href="https://deploy.cloud.google.com?repo=https://github.com/enriquekalven/agent-cockpit">
|
|
36
|
+
<img src="https://deploy.cloud.google.com/button.svg" alt="Deploy to Google Cloud" />
|
|
37
|
+
</a>
|
|
38
|
+
<br />
|
|
39
|
+
<br />
|
|
40
|
+
<img src="https://img.shields.io/github/stars/enriquekalven/agent-cockpit?style=for-the-badge&color=ffd700" alt="GitHub Stars" />
|
|
41
|
+
<img src="https://img.shields.io/github/license/enriquekalven/agent-cockpit?style=for-the-badge&color=007bff" alt="License" />
|
|
42
|
+
<img src="https://img.shields.io/badge/Google-Well--Architected-4285F4?style=for-the-badge&logo=google-cloud" alt="Google Well-Architected" />
|
|
43
|
+
<img src="https://img.shields.io/badge/A2A_Standard-Enabled-10b981?style=for-the-badge" alt="A2A Standard" />
|
|
44
|
+
</div>
|
|
45
|
+
|
|
46
|
+
<br />
|
|
47
|
+
|
|
48
|
+
<div align="center">
|
|
49
|
+
<h3>"Infrastructure gives you the pipes. We give you the Intelligence."</h3>
|
|
50
|
+
<p>The developer distribution for building, optimizing, and securing AI agents on Google Cloud.</p>
|
|
51
|
+
</div>
|
|
52
|
+
|
|
53
|
+
---
|
|
54
|
+
|
|
55
|
+
## 📽️ The Mission
|
|
56
|
+
Most AI agent templates stop at a single Python file and an API key. **The AgentOps Cockpit** is for developers moving into production. It provides framework-agnostic governance, safety, and cost guardrails for the entire agentic ecosystem.
|
|
57
|
+
|
|
58
|
+
- **Governance-as-Code**: Audit your agent against [Google Well-Architected](/docs/GOOGLE_ARCHITECTURE.md) best practices with the **Evidence Bridge**—real-time citations for architectural integrity.
|
|
59
|
+
- **SME Persona Audits**: Parallelized review of your codebase by automated [**Principal SMEs**](docs/TECHNICAL_AUDIT_GUIDE.md) across FinOps, SecOps, Architecture, and Quality.
|
|
60
|
+
- **Agentic Trinity**: Dedicated layers for the Engine (Logic), Face (UX), and Cockpit (Ops).
|
|
61
|
+
- **A2A Connectivity**: Implements the [**Agent-to-Agent Transmission Standard**](docs/TECHNICAL_A2A_GUIDE.md) for secure swarm orchestration.
|
|
62
|
+
- **MCP Native**: Registration as a [Model Context Protocol](https://modelcontextprotocol.io) server for 1P/2P/3P tool consumption.
|
|
63
|
+
|
|
64
|
+
---
|
|
65
|
+
|
|
66
|
+
## 🏗️ The Agentic Trinity
|
|
67
|
+
We divide the complexity of production agents into three focused pillars:
|
|
68
|
+
|
|
69
|
+
```mermaid
|
|
70
|
+
graph TD
|
|
71
|
+
subgraph Trinity [The Agentic Trinity 2.0]
|
|
72
|
+
E(The Engine: Reasoning)
|
|
73
|
+
F(The Face: Interface)
|
|
74
|
+
C(The Cockpit: Operations)
|
|
75
|
+
S{Sovereignty & Compliance}
|
|
76
|
+
end
|
|
77
|
+
E <--> C
|
|
78
|
+
F <--> C
|
|
79
|
+
E <--> F
|
|
80
|
+
E -.-> S
|
|
81
|
+
F -.-> S
|
|
82
|
+
C -.-> S
|
|
83
|
+
style Trinity fill:#f8fafc,stroke:#334155,stroke-width:2px
|
|
84
|
+
style S fill:#0ea5e9,color:#fff,stroke:#0284c7
|
|
85
|
+
```
|
|
86
|
+
|
|
87
|
+
- **⚙️ The Engine**: The reasoning core. Built with **ADK**, FastAPI, and Vertex AI.
|
|
88
|
+
- **🎭 The Face**: The user experience. [Adaptive UI surfaces](docs/TECHNICAL_UX_GUIDE.md) and **GenUI** standards via the A2UI spec.
|
|
89
|
+
- **🕹️ The Cockpit**: The operational brain. [Cost control](docs/TECHNICAL_FINOPS_GUIDE.md), semantic caching, shadow routing, and [adversarial audits](docs/TECHNICAL_REDTEAM_GUIDE.md).
|
|
90
|
+
|
|
91
|
+
<div align="center">
|
|
92
|
+
<img src="public/assets/ecosystem.png" alt="Ecosystem Integrations" width="100%" />
|
|
93
|
+
</div>
|
|
94
|
+
|
|
95
|
+
---
|
|
96
|
+
|
|
97
|
+
## 🏛️ v1.3: The "Autonomous Architect" Standard (NEW)
|
|
98
|
+
Evolving from a compliance tool to an autonomous evolution engine. See the [**v1.3 Roadmap**](/docs/ROADMAP_V13.md).
|
|
99
|
+
|
|
100
|
+
- **🚀 Context-Aware Patching**: Moving from templates to LLM-Synthesized PRs that match your project's style.
|
|
101
|
+
- **🧪 Digital Twin Simulation**: `make simulation-run` for a high-concurrency "Stress-Reasoning" test. [**Read Guide**](docs/TECHNICAL_ARCH_REVIEW.md).
|
|
102
|
+
- **🧗 Hill Climbing Optimization**: Iterative prompt tuning to reach the Global Peak. [**Read Guide**](docs/TECHNICAL_QUALITY_GUIDE.md).
|
|
103
|
+
- **🌍 Strategic Exit Strategy**: Automated TCO reports and migration plans for moving between cloud providers.
|
|
104
|
+
|
|
105
|
+
---
|
|
106
|
+
|
|
107
|
+
## 🚀 Key Innovation: The "Intelligence" Layer
|
|
108
|
+
|
|
109
|
+
### 🛡️ Red Team Auditor (Adversarial SRE)
|
|
110
|
+
Don't wait for your users to find prompt injections. Use the built-in [**Adversarial Evaluator**](docs/TECHNICAL_REDTEAM_GUIDE.md) to launch self-attacks against your agent, testing for PII leaks, instruction overrides, and multilingual jailbreaks.
|
|
111
|
+
|
|
112
|
+
### 🧠 Hive Mind (Semantic Caching)
|
|
113
|
+
**Reduce LLM costs by up to 40%.** The Hive Mind checks for semantically similar queries in 10ms, serving cached answers for common questions without calling the LLM.
|
|
114
|
+
|
|
115
|
+
### 🏛️ Arch Review & Autonomous Evolution
|
|
116
|
+
Every agent in the cockpit is graded against a framework-aware checklist. The Cockpit intelligently detects your stack and runs a tailored [**Architecture Review**](docs/TECHNICAL_ARCH_REVIEW.md). v1.3 introduces **Autonomous Evolution**—the ability to synthesize code fixes directly from audit findings.
|
|
117
|
+
|
|
118
|
+
### 🕹️ MCP Connectivity Hub (Model Context Protocol)
|
|
119
|
+
Stop building one-off tool integrations. The Cockpit provides a unified hub for **MCP Servers**. Connect to 1P/2P/3P tools via the standardized Model Context Protocol for secure, audited tool execution. Start the server with `make mcp-serve`.
|
|
120
|
+
|
|
121
|
+
### 🗄️ Situational Database Audits
|
|
122
|
+
The Cockpit now performs platform-specific performance and security audits for **AlloyDB**, **Pinecone**, **BigQuery**, and **Cloud SQL**.
|
|
123
|
+
|
|
124
|
+
---
|
|
125
|
+
|
|
126
|
+
### 🛡️ Advanced Governance & Discovery
|
|
127
|
+
Modern agents don't just live in `agent.py`. The Cockpit uses a centralized **Discovery Engine** to intelligently map your project:
|
|
128
|
+
- **`.gitignore` Compliance**: Zero-noise scanning that respects your project's ignore rules.
|
|
129
|
+
- **Library Isolation**: Intelligently ignores hits in `venv` or `node_modules` to focus on your code.
|
|
130
|
+
- **Config-Driven**: Use `cockpit.yaml` to define custom entry points, exclusions, and CI/CD thresholds.
|
|
131
|
+
|
|
132
|
+
---
|
|
133
|
+
|
|
134
|
+
## ⌨️ Master Command Registry
|
|
135
|
+
|
|
136
|
+
The Cockpit is available as a first-class CLI and a comprehensive Makefile-based operational toolkit.
|
|
137
|
+
|
|
138
|
+
| Registry | Description |
|
|
139
|
+
| :--- | :--- |
|
|
140
|
+
| 🕹️ [**Makefile Commands**](docs/TECHNICAL_COMMANDS_MASTER.md) | Standard local development and orchestration shortcuts. |
|
|
141
|
+
| 🚀 [**UVX Master Guide**](docs/TECHNICAL_UVX_MASTER.md) | Portable, zero-install commands for CI/CD and automation. |
|
|
142
|
+
|
|
143
|
+
---
|
|
144
|
+
|
|
145
|
+
## 🧑‍💼 Principal SME Persona Approvals
|
|
146
|
+
The Cockpit now features a **Multi-Persona Governance Board**. Every audit result is framed through the lens of a Principal Engineer in that domain:
|
|
147
|
+
* [**🏛️ Architecture**](docs/TECHNICAL_ARCH_REVIEW.md)
|
|
148
|
+
* [**💰 FinOps**](docs/TECHNICAL_FINOPS_GUIDE.md)
|
|
149
|
+
* [**🛡️ Red Team**](docs/TECHNICAL_REDTEAM_GUIDE.md)
|
|
150
|
+
* [**🧗 Quality**](docs/TECHNICAL_QUALITY_GUIDE.md)
|
|
151
|
+
* [**🌐 Infrastructure**](docs/TECHNICAL_INFRA_GUIDE.md)
|
|
152
|
+
* [**🎭 UX/UI**](docs/TECHNICAL_UX_GUIDE.md)
|
|
153
|
+
|
|
154
|
+
---
|
|
155
|
+
|
|
156
|
+
## 🚀 1-Click Production Pipeline
|
|
157
|
+
`make deploy-prod` triggers the following lifecycle:
|
|
158
|
+
1. Runs the Full Regression Suite (`make regression`).
|
|
159
|
+
2. Compiles production frontend assets.
|
|
160
|
+
3. Deploys the Engine to **Google Cloud Run**.
|
|
161
|
+
4. Deploys the Face to **Firebase Hosting**.
|
|
162
|
+
|
|
163
|
+
---
|
|
164
|
+
|
|
165
|
+
## 🤝 Ecosystem & Attribution
|
|
166
|
+
The AgentOps Cockpit is designed to leverage and secure the best-of-breed tools in the Google Cloud ecosystem. We explicitly acknowledge and leverage the excellent work from:
|
|
167
|
+
|
|
168
|
+
* **[GoogleCloudPlatform/agent-starter-pack](https://github.com/GoogleCloudPlatform/agent-starter-pack/)**: We leverage this as a core reference for the **Agent Development Kit (ADK)** patterns and Vertex AI Agent Engine integration.
|
|
169
|
+
* **A2A Standard**: Our implementation follows the Agent-to-Agent Transmission Protocol for swarm intelligence.
|
|
170
|
+
|
|
171
|
+
---
|
|
172
|
+
*Reference: [Google Cloud Architecture Center - Agentic AI Overview](https://docs.cloud.google.com/architecture/agentic-ai-overview)*
|
|
@@ -0,0 +1,148 @@
|
|
|
1
|
+
# 🕹️ AgentOps Cockpit
|
|
2
|
+
|
|
3
|
+
<div align="center">
|
|
4
|
+
<img src="public/assets/trinity.png" alt="AgentOps Cockpit Trinity" width="100%" />
|
|
5
|
+
</div>
|
|
6
|
+
|
|
7
|
+
<div align="center">
|
|
8
|
+
<br />
|
|
9
|
+
<a href="https://agent-cockpit.web.app" target="_blank"><strong>🌐 Official Website & Live Demo</strong></a>
|
|
10
|
+
<br /><br />
|
|
11
|
+
<a href="https://deploy.cloud.google.com?repo=https://github.com/enriquekalven/agent-cockpit">
|
|
12
|
+
<img src="https://deploy.cloud.google.com/button.svg" alt="Deploy to Google Cloud" />
|
|
13
|
+
</a>
|
|
14
|
+
<br />
|
|
15
|
+
<br />
|
|
16
|
+
<img src="https://img.shields.io/github/stars/enriquekalven/agent-cockpit?style=for-the-badge&color=ffd700" alt="GitHub Stars" />
|
|
17
|
+
<img src="https://img.shields.io/github/license/enriquekalven/agent-cockpit?style=for-the-badge&color=007bff" alt="License" />
|
|
18
|
+
<img src="https://img.shields.io/badge/Google-Well--Architected-4285F4?style=for-the-badge&logo=google-cloud" alt="Google Well-Architected" />
|
|
19
|
+
<img src="https://img.shields.io/badge/A2A_Standard-Enabled-10b981?style=for-the-badge" alt="A2A Standard" />
|
|
20
|
+
</div>
|
|
21
|
+
|
|
22
|
+
<br />
|
|
23
|
+
|
|
24
|
+
<div align="center">
|
|
25
|
+
<h3>"Infrastructure gives you the pipes. We give you the Intelligence."</h3>
|
|
26
|
+
<p>The developer distribution for building, optimizing, and securing AI agents on Google Cloud.</p>
|
|
27
|
+
</div>
|
|
28
|
+
|
|
29
|
+
---
|
|
30
|
+
|
|
31
|
+
## 📽️ The Mission
|
|
32
|
+
Most AI agent templates stop at a single Python file and an API key. **The AgentOps Cockpit** is for developers moving into production. It provides framework-agnostic governance, safety, and cost guardrails for the entire agentic ecosystem.
|
|
33
|
+
|
|
34
|
+
- **Governance-as-Code**: Audit your agent against [Google Well-Architected](/docs/GOOGLE_ARCHITECTURE.md) best practices with the **Evidence Bridge**—real-time citations for architectural integrity.
|
|
35
|
+
- **SME Persona Audits**: Parallelized review of your codebase by automated [**Principal SMEs**](docs/TECHNICAL_AUDIT_GUIDE.md) across FinOps, SecOps, Architecture, and Quality.
|
|
36
|
+
- **Agentic Trinity**: Dedicated layers for the Engine (Logic), Face (UX), and Cockpit (Ops).
|
|
37
|
+
- **A2A Connectivity**: Implements the [**Agent-to-Agent Transmission Standard**](docs/TECHNICAL_A2A_GUIDE.md) for secure swarm orchestration.
|
|
38
|
+
- **MCP Native**: Registration as a [Model Context Protocol](https://modelcontextprotocol.io) server for 1P/2P/3P tool consumption.
|
|
39
|
+
|
|
40
|
+
---
|
|
41
|
+
|
|
42
|
+
## 🏗️ The Agentic Trinity
|
|
43
|
+
We divide the complexity of production agents into three focused pillars:
|
|
44
|
+
|
|
45
|
+
```mermaid
|
|
46
|
+
graph TD
|
|
47
|
+
subgraph Trinity [The Agentic Trinity 2.0]
|
|
48
|
+
E(The Engine: Reasoning)
|
|
49
|
+
F(The Face: Interface)
|
|
50
|
+
C(The Cockpit: Operations)
|
|
51
|
+
S{Sovereignty & Compliance}
|
|
52
|
+
end
|
|
53
|
+
E <--> C
|
|
54
|
+
F <--> C
|
|
55
|
+
E <--> F
|
|
56
|
+
E -.-> S
|
|
57
|
+
F -.-> S
|
|
58
|
+
C -.-> S
|
|
59
|
+
style Trinity fill:#f8fafc,stroke:#334155,stroke-width:2px
|
|
60
|
+
style S fill:#0ea5e9,color:#fff,stroke:#0284c7
|
|
61
|
+
```
|
|
62
|
+
|
|
63
|
+
- **⚙️ The Engine**: The reasoning core. Built with **ADK**, FastAPI, and Vertex AI.
|
|
64
|
+
- **🎭 The Face**: The user experience. [Adaptive UI surfaces](docs/TECHNICAL_UX_GUIDE.md) and **GenUI** standards via the A2UI spec.
|
|
65
|
+
- **🕹️ The Cockpit**: The operational brain. [Cost control](docs/TECHNICAL_FINOPS_GUIDE.md), semantic caching, shadow routing, and [adversarial audits](docs/TECHNICAL_REDTEAM_GUIDE.md).
|
|
66
|
+
|
|
67
|
+
<div align="center">
|
|
68
|
+
<img src="public/assets/ecosystem.png" alt="Ecosystem Integrations" width="100%" />
|
|
69
|
+
</div>
|
|
70
|
+
|
|
71
|
+
---
|
|
72
|
+
|
|
73
|
+
## 🏛️ v1.3: The "Autonomous Architect" Standard (NEW)
|
|
74
|
+
Evolving from a compliance tool to an autonomous evolution engine. See the [**v1.3 Roadmap**](/docs/ROADMAP_V13.md).
|
|
75
|
+
|
|
76
|
+
- **🚀 Context-Aware Patching**: Moving from templates to LLM-Synthesized PRs that match your project's style.
|
|
77
|
+
- **🧪 Digital Twin Simulation**: `make simulation-run` for high-concurrency "Stress-Reasoning" tests. [**Read Guide**](docs/TECHNICAL_ARCH_REVIEW.md).
|
|
78
|
+
- **🧗 Hill Climbing Optimization**: Iterative prompt tuning to reach the Global Peak. [**Read Guide**](docs/TECHNICAL_QUALITY_GUIDE.md).
|
|
79
|
+
- **🌍 Strategic Exit Strategy**: Automated TCO reports and migration plans for moving between cloud providers.
|
|
80
|
+
|
|
81
|
+
---
|
|
82
|
+
|
|
83
|
+
## 🚀 Key Innovation: The "Intelligence" Layer
|
|
84
|
+
|
|
85
|
+
### 🛡️ Red Team Auditor (Adversarial SRE)
|
|
86
|
+
Don't wait for your users to find prompt injections. Use the built-in [**Adversarial Evaluator**](docs/TECHNICAL_REDTEAM_GUIDE.md) to launch self-attacks against your agent, testing for PII leaks, instruction overrides, and multilingual jailbreaks.
|
|
87
|
+
|
|
88
|
+
### 🧠 Hive Mind (Semantic Caching)
|
|
89
|
+
**Reduce LLM costs by up to 40%.** The Hive Mind checks for semantically similar queries in 10ms, serving cached answers for common questions without calling the LLM.
|
|
90
|
+
|
|
91
|
+
### 🏛️ Arch Review & Autonomous Evolution
|
|
92
|
+
Every agent in the cockpit is graded against a framework-aware checklist. The Cockpit intelligently detects your stack and runs a tailored [**Architecture Review**](docs/TECHNICAL_ARCH_REVIEW.md). v1.3 introduces **Autonomous Evolution**—the ability to synthesize code fixes directly from audit findings.
|
|
93
|
+
|
|
94
|
+
### 🕹️ MCP Connectivity Hub (Model Context Protocol)
|
|
95
|
+
Stop building one-off tool integrations. The Cockpit provides a unified hub for **MCP Servers**. Connect to 1P/2P/3P tools via the standardized Model Context Protocol for secure, audited tool execution. Start the server with `make mcp-serve`.
|
|
96
|
+
|
|
97
|
+
### 🗄️ Situational Database Audits
|
|
98
|
+
The Cockpit now performs platform-specific performance and security audits for **AlloyDB**, **Pinecone**, **BigQuery**, and **Cloud SQL**.
|
|
99
|
+
|
|
100
|
+
---
|
|
101
|
+
|
|
102
|
+
### 🛡️ Advanced Governance & Discovery
|
|
103
|
+
Modern agents don't just live in `agent.py`. The Cockpit uses a centralized **Discovery Engine** to intelligently map your project:
|
|
104
|
+
- **`.gitignore` Compliance**: Zero-noise scanning that respects your project's ignore rules.
|
|
105
|
+
- **Library Isolation**: Intelligently ignores hits in `venv` or `node_modules` to focus on your code.
|
|
106
|
+
- **Config-Driven**: Use `cockpit.yaml` to define custom entry points, exclusions, and CI/CD thresholds.
|
|
107
|
+
|
|
108
|
+
---
|
|
109
|
+
|
|
110
|
+
## ⌨️ Master Command Registry
|
|
111
|
+
|
|
112
|
+
The Cockpit is available as a first-class CLI and a comprehensive Makefile-based operational toolkit.
|
|
113
|
+
|
|
114
|
+
| Registry | Description |
|
|
115
|
+
| :--- | :--- |
|
|
116
|
+
| 🕹️ [**Makefile Commands**](docs/TECHNICAL_COMMANDS_MASTER.md) | Standard local development and orchestration shortcuts. |
|
|
117
|
+
| 🚀 [**UVX Master Guide**](docs/TECHNICAL_UVX_MASTER.md) | Portable, zero-install commands for CI/CD and automation. |
|
|
118
|
+
|
|
119
|
+
---
|
|
120
|
+
|
|
121
|
+
## 🧑‍💼 Principal SME Persona Approvals
|
|
122
|
+
The Cockpit now features a **Multi-Persona Governance Board**. Every audit result is framed through the lens of a Principal Engineer in that domain:
|
|
123
|
+
* [**🏛️ Architecture**](docs/TECHNICAL_ARCH_REVIEW.md)
|
|
124
|
+
* [**💰 FinOps**](docs/TECHNICAL_FINOPS_GUIDE.md)
|
|
125
|
+
* [**🛡️ Red Team**](docs/TECHNICAL_REDTEAM_GUIDE.md)
|
|
126
|
+
* [**🧗 Quality**](docs/TECHNICAL_QUALITY_GUIDE.md)
|
|
127
|
+
* [**🌐 Infrastructure**](docs/TECHNICAL_INFRA_GUIDE.md)
|
|
128
|
+
* [**🎭 UX/UI**](docs/TECHNICAL_UX_GUIDE.md)
|
|
129
|
+
|
|
130
|
+
---
|
|
131
|
+
|
|
132
|
+
## 🚀 1-Click Production Pipeline
|
|
133
|
+
`make deploy-prod` triggers the following lifecycle:
|
|
134
|
+
1. Runs the Quick Safe-Build (`make audit`).
|
|
135
|
+
2. Compiles production frontend assets.
|
|
136
|
+
3. Deploys the Engine to **Google Cloud Run**.
|
|
137
|
+
4. Deploys the Face to **Firebase Hosting**.
|
|
138
|
+
|
|
139
|
+
---
|
|
140
|
+
|
|
141
|
+
## 🤝 Ecosystem & Attribution
|
|
142
|
+
The AgentOps Cockpit is designed to leverage and secure the best-of-breed tools in the Google Cloud ecosystem. We explicitly acknowledge and leverage the excellent work from:
|
|
143
|
+
|
|
144
|
+
* **[GoogleCloudPlatform/agent-starter-pack](https://github.com/GoogleCloudPlatform/agent-starter-pack/)**: We leverage this as a core reference for the **Agent Development Kit (ADK)** patterns and Vertex AI Agent Engine integration.
|
|
145
|
+
* **A2A Standard**: Our implementation follows the Agent-to-Agent Transmission Protocol for swarm intelligence.
|
|
146
|
+
|
|
147
|
+
---
|
|
148
|
+
*Reference: [Google Cloud Architecture Center - Agentic AI Overview](https://docs.cloud.google.com/architecture/agentic-ai-overview)*
|
|
@@ -0,0 +1,70 @@
|
|
|
1
|
+
# 🚀 Production Deployment
|
|
2
|
+
## The "Autonomous" Standard (v1.3)
|
|
3
|
+
|
|
4
|
+
Deploying a "Well-Architected" agent requires orchestration across two primary Google Cloud environments. The Cockpit automates this through the `make deploy-prod` command.
|
|
5
|
+
|
|
6
|
+
---
|
|
7
|
+
|
|
8
|
+
## ⚙️ The Engine (Cloud Run)
|
|
9
|
+
The Python backend (FastAPI) is deployed as a serverless service.
|
|
10
|
+
- **Scaling**: scale-to-zero enabled.
|
|
11
|
+
- **Regions**: `us-central1` recommended for proximity to Vertex AI.
|
|
12
|
+
- **Best Practice**: Enable **Startup CPU Boost** to reduce cold-start latency (TTR).
|
|
13
|
+
|
|
14
|
+
## 🧠 Agent Engine (Vertex AI)
|
|
15
|
+
Recommended for agents that require deep integration with the Google Cloud agentic ecosystem.
|
|
16
|
+
- **Why**: Managed runtime, built-in tracing, and **Context Caching** support.
|
|
17
|
+
|
|
18
|
+
## ☸️ Enterprise Engine (GKE)
|
|
19
|
+
Recommended for high-intensity or specialized isolation workloads.
|
|
20
|
+
- **Why**: Full control over networking and GPU resources.
|
|
21
|
+
|
|
22
|
+
---
|
|
23
|
+
|
|
24
|
+
## 🏗️ 1-Click Deployment Sequence
|
|
25
|
+
`make deploy-prod` executes the following high-fidelity pipeline:
|
|
26
|
+
|
|
27
|
+
### Stage 1: The Quick "Safe-Build"
|
|
28
|
+
Runs `make audit` (~15s).
|
|
29
|
+
- Architecture sanity check.
|
|
30
|
+
- Secret leakage detection.
|
|
31
|
+
- Fast Red-Team (common injections).
|
|
32
|
+
- Token optimization audit.
|
|
33
|
+
|
|
34
|
+
### Stage 2: Face Build
|
|
35
|
+
Executes `npm run build` to compile the React/Vite frontend into production assets.
|
|
36
|
+
|
|
37
|
+
### Stage 3: Infrastructure Push
|
|
38
|
+
- Containerizes the Engine and pushes to **Artifact Registry**.
|
|
39
|
+
- Deploys the service to **Google Cloud Run**.
|
|
40
|
+
- Deploys static assets to **Firebase Hosting**.
|
|
41
|
+
|
|
42
|
+
---
|
|
43
|
+
|
|
44
|
+
## 📊 Infrastructure Decision Matrix
|
|
45
|
+
|
|
46
|
+
| Feature | Agent Engine | Cloud Run | GKE |
|
|
47
|
+
| :--- | :--- | :--- | :--- |
|
|
48
|
+
| **Orchestration** | Managed (ADK) | Custom (FastAPI) | Custom (K8s) |
|
|
49
|
+
| **Scaling** | Automatic | Scale-to-Zero | Dynamic / GPU |
|
|
50
|
+
| **Observability** | Vertex AI Traces | Cloud Logging | Prometheus / Istio |
|
|
51
|
+
| **Best Case** | Fast Prototyping | Standard Web Agents | High-Perf Enterprise |
|
|
52
|
+
|
|
53
|
+
---
|
|
54
|
+
|
|
55
|
+
## 🛡️ v1.3: Deep System Audit
|
|
56
|
+
For production-gate promotion, move from "Safe-Build" to "Deep Audit":
|
|
57
|
+
```bash
|
|
58
|
+
make audit-deep
|
|
59
|
+
```
|
|
60
|
+
- Full Adversarial Red-Teaming.
|
|
61
|
+
- Iterative Quality Hill Climbing.
|
|
62
|
+
- Precision Load Testing (`make load-test`).
|
|
63
|
+
|
|
64
|
+
---
|
|
65
|
+
|
|
66
|
+
## 🔑 Secret Management
|
|
67
|
+
Never commit `.env` files. Store secrets in **Google Cloud Secret Manager** and map those secrets to environment variables in Cloud Run.
|
|
68
|
+
|
|
69
|
+
---
|
|
70
|
+
*Generated by the AgentOps Cockpit. Sovereign Systems Division (v1.3).*
|
|
@@ -4,6 +4,9 @@
|
|
|
4
4
|
<meta charset="UTF-8" />
|
|
5
5
|
<meta name="viewport" content="width=device-width, initial-scale=1.0" />
|
|
6
6
|
<title>AgentOps Cockpit</title>
|
|
7
|
+
<meta name="description" content="Production-grade AI Agent Governance and Operations Cockpit." />
|
|
8
|
+
<meta property="og:image" content="/og-image.png" />
|
|
9
|
+
<meta property="og:title" content="AgentOps Cockpit" />
|
|
7
10
|
<link rel="preconnect" href="https://fonts.googleapis.com">
|
|
8
11
|
<link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
|
|
9
12
|
<link href="https://fonts.googleapis.com/css2?family=Plus+Jakarta+Sans:wght@400;500;600;700;800&family=JetBrains+Mono:wght@400;500;600&display=swap" rel="stylesheet">
|
|
@@ -0,0 +1,31 @@
|
|
|
1
|
+
# 📖 The Agentic Trinity Vision
|
|
2
|
+
|
|
3
|
+
## "Infrastructure is a solved problem. Intelligence is the new frontier."
|
|
4
|
+
|
|
5
|
+
Most agent templates treat production as an afterthought. They give you a VPC and an API key, but leave you alone when the token bill hits $5,000 or when a user jailbreaks your agent's system prompt.
|
|
6
|
+
|
|
7
|
+
The **AgentOps Cockpit** was born from a simple realization: **Building a demo is easy; running a profitable agent is hard.**
|
|
8
|
+
|
|
9
|
+
---
|
|
10
|
+
|
|
11
|
+
### The Architecture: The Trinity
|
|
12
|
+
We believe every production agent must be built on three balanced pillars:
|
|
13
|
+
|
|
14
|
+
#### 1. The Engine (The Day 0 Brain)
|
|
15
|
+
This is where reasoning happens. By using Google's **Agent Development Kit (ADK)** and **Gemini 2.0**, we ensure that tool orchestration is deterministic and high-fidelity. The Engine isn't just a wrapper; it's a reasoning machine.
|
|
16
|
+
|
|
17
|
+
#### 2. The Face (The Day 1 Experience)
|
|
18
|
+
Text-in / Text-out is for chatbots, not for applications. **The Face** uses the **A2UI (Agent-to-User Interface)** protocol to transform JSON reasoning into interactive React components. It creates "Generative UI" that surfaces exactly what the user needs to see, right when the agent decides it.
|
|
19
|
+
|
|
20
|
+
#### 3. The Cockpit (The Day 2 Governance)
|
|
21
|
+
This is our unique contribution to the ecosystem. The Cockpit manages what happens *after* the agent is live.
|
|
22
|
+
- **Profitability**: Semantic caching and prompt compression.
|
|
23
|
+
- **Safety**: Automated adversarial red-teaming.
|
|
24
|
+
- **Compliance**: VPC-native PII scrubbing.
|
|
25
|
+
|
|
26
|
+
---
|
|
27
|
+
|
|
28
|
+
### Our North Star: 10K Star Governance
|
|
29
|
+
Our goal is to be the **Control Plane** for the agentic era. Whether you use LangChain, CrewAI, or raw custom logic, the Cockpit provides the specialized monitoring and auditing that ensure your AI agents are "Well-Architected" and enterprise-ready.
|
|
30
|
+
|
|
31
|
+
Welcome to the future of **High-Fidelity Agent Ops**.
|
|
@@ -0,0 +1,101 @@
|
|
|
1
|
+
# AgentOps Cockpit v1.0: Audit Scenarios & Capabilities
|
|
2
|
+
|
|
3
|
+
This document showcases the difference between "Heuristic Matching" (v0.9) and "Reasoning-Based Auditing" (v1.0) using the new AST and Semantic Graph Probing engines.
|
|
4
|
+
|
|
5
|
+
---
|
|
6
|
+
|
|
7
|
+
## 🟢 Scenario 1: The "Lazy" PII Masking (Simple)
|
|
8
|
+
|
|
9
|
+
### The Code
|
|
10
|
+
```python
|
|
11
|
+
# agent.py
|
|
12
|
+
user_input = get_user_query()
|
|
13
|
+
# TODO: implement PII mask
|
|
14
|
+
response = llm.invoke(user_input)
|
|
15
|
+
```
|
|
16
|
+
|
|
17
|
+
### ❌ Old v0.9 Auditor Result
|
|
18
|
+
* **Status:** `PASSED`
|
|
19
|
+
* **Rationale:** Found keyword "mask" in comments.
|
|
20
|
+
* **Verdict:** Dangerous false positive.
|
|
21
|
+
|
|
22
|
+
### ✅ New v1.0 Auditor (Reasoning)
|
|
23
|
+
* **Status:** `FAIL (CRITICAL)`
|
|
24
|
+
* **Finding:** `Incomplete PII Protection`
|
|
25
|
+
* **Reasoning:**
|
|
26
|
+
1. AST analysis identifies `user_input` as a raw variable.
|
|
27
|
+
2. No call to a "scrubber" function detected between variable assignment and LLM `invoke`.
|
|
28
|
+
3. Semantic scanner identifies "TODO" comment as an active risk rather than a feature.
|
|
29
|
+
* **ADR Recommendation:** Inject `google-adk` PII Scrubber before `llm.invoke`.
|
|
30
|
+
|
|
31
|
+
---
|
|
32
|
+
|
|
33
|
+
## 🟡 Scenario 2: The "Thundering Herd" Bottleneck (Medium)
|
|
34
|
+
|
|
35
|
+
### The Code
|
|
36
|
+
```python
|
|
37
|
+
async def get_data():
|
|
38
|
+
user = await db.get_user()
|
|
39
|
+
history = await db.get_history()
|
|
40
|
+
profile = await db.get_profile()
|
|
41
|
+
return user, history, profile
|
|
42
|
+
```
|
|
43
|
+
|
|
44
|
+
### ❌ Old v0.9 Auditor Result
|
|
45
|
+
* **Status:** `PASSED`
|
|
46
|
+
* **Rationale:** Code is valid Python/Async.
|
|
47
|
+
* **Verdict:** Ignores performance anti-patterns.
|
|
48
|
+
|
|
49
|
+
### ✅ New v1.0 Auditor (Reasoning)
|
|
50
|
+
* **Status:** `FAIL (MEDIUM IMPACT)`
|
|
51
|
+
* **Finding:** `Sequential Bottleneck Detected`
|
|
52
|
+
* **Reasoning:**
|
|
53
|
+
1. AST walker identifies 3+ `await` calls in a direct sequence.
|
|
54
|
+
2. Analyzes child nodes to determine these are independent data fetches.
|
|
55
|
+
* **Strategic ROI:** "Current latency is `T1 + T2 + T3`. Parallelizing via `asyncio.gather` reduces latency to `MAX(T1, T2, T3)`, improving responsiveness by ~60%."
|
|
56
|
+
|
|
57
|
+
---
|
|
58
|
+
|
|
59
|
+
## 🔴 Scenario 3: Cross-Framework Conflict (Complex)
|
|
60
|
+
|
|
61
|
+
### The Code
|
|
62
|
+
```python
|
|
63
|
+
from langgraph.graph import StateGraph
|
|
64
|
+
from crewai import Agent, Task, Crew
|
|
65
|
+
|
|
66
|
+
# ... logic using a CrewAI Agent as a node in a LangGraph State machine ...
|
|
67
|
+
```
|
|
68
|
+
|
|
69
|
+
### ❌ Old v0.9 Auditor Result
|
|
70
|
+
* **Status:** `PASSED`
|
|
71
|
+
* **Rationale:** Found keywords "langgraph" and "crewai".
|
|
72
|
+
* **Verdict:** Both frameworks are supported, so audit passes.
|
|
73
|
+
|
|
74
|
+
### ✅ New v1.0 Auditor (Reasoning)
|
|
75
|
+
* **Status:** `WARNING (ARCHITECTURAL CONFLICT)`
|
|
76
|
+
* **Finding:** `Orchestration Overlap`
|
|
77
|
+
* **Reasoning:**
|
|
78
|
+
1. Graph analysis detects two competing "Loop Managers" (LangGraph and CrewAI).
|
|
79
|
+
2. Identifies high risk of **Cyclic State Deadlock** where the LangGraph state and CrewAI internal state diverge.
|
|
80
|
+
* **Consulting Edge:** "You are attempting to manage state in two places. Recommend refactoring CrewAI agents into raw `tools` within LangGraph or using CrewAI in a purely sequential sub-task mode."
|
|
81
|
+
|
|
82
|
+
---
|
|
83
|
+
|
|
84
|
+
## 🏆 Scenario 4: The "Silent" Model Waste (FinOps)
|
|
85
|
+
|
|
86
|
+
### The Code
|
|
87
|
+
```python
|
|
88
|
+
# process_batch.py
|
|
89
|
+
results = []
|
|
90
|
+
for item in large_dataset:
|
|
91
|
+
# Processing simple classification
|
|
92
|
+
res = gemini_pro.generate_content(f"Is this category A or B: {item}")
|
|
93
|
+
results.append(res)
|
|
94
|
+
```
|
|
95
|
+
|
|
96
|
+
### ✅ New v1.0 Auditor (Reasoning)
|
|
97
|
+
* **Finding:** `High-Tier Model Inefficiency`
|
|
98
|
+
* **Reasoning:**
|
|
99
|
+
1. Detects `gemini-1.5-pro` (High Performance/Cost) inside a `for-loop`.
|
|
100
|
+
2. Semantic analyzer determines the task is "simple classification" based on the prompt string prefix.
|
|
101
|
+
* **Business Impact:** "You are using a sledgehammer for a nail. Switching this loop to `gemini-1.5-flash` will reduce monthly token spend from $400 to $40 with zero accuracy loss."
|