agent-os-kernel 1.1.0__py3-none-any.whl → 1.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agent_os/__init__.py +66 -4
- agent_os/agents_compat.py +286 -0
- agent_os/base_agent.py +308 -0
- agent_os/cli.py +1079 -19
- agent_os/integrations/__init__.py +37 -2
- agent_os/integrations/openai_adapter.py +502 -0
- agent_os/integrations/semantic_kernel_adapter.py +569 -0
- agent_os/stateless.py +349 -0
- agent_os_kernel-1.2.0.dist-info/METADATA +676 -0
- agent_os_kernel-1.2.0.dist-info/RECORD +1053 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/entry_points.txt +0 -1
- modules/amb/.github/workflows/ci.yml +102 -0
- modules/amb/.github/workflows/publish.yml +146 -0
- modules/amb/.gitignore +134 -0
- modules/amb/CHANGELOG.md +118 -0
- modules/amb/CONTRIBUTING.md +141 -0
- modules/amb/LICENSE +21 -0
- modules/amb/README.md +188 -0
- modules/amb/amb_core/__init__.py +175 -0
- modules/amb/amb_core/adapters/__init__.py +55 -0
- modules/amb/amb_core/adapters/aws_sqs_broker.py +374 -0
- modules/amb/amb_core/adapters/azure_servicebus_broker.py +338 -0
- modules/amb/amb_core/adapters/kafka_broker.py +258 -0
- modules/amb/amb_core/adapters/nats_broker.py +283 -0
- modules/amb/amb_core/adapters/rabbitmq_broker.py +233 -0
- modules/amb/amb_core/adapters/redis_broker.py +260 -0
- modules/amb/amb_core/broker.py +143 -0
- modules/amb/amb_core/bus.py +479 -0
- modules/amb/amb_core/cloudevents.py +507 -0
- modules/amb/amb_core/dlq.py +343 -0
- modules/amb/amb_core/hf_utils.py +534 -0
- modules/amb/amb_core/memory_broker.py +408 -0
- modules/amb/amb_core/models.py +139 -0
- modules/amb/amb_core/persistence.py +527 -0
- modules/amb/amb_core/schema.py +292 -0
- modules/amb/amb_core/tracing.py +356 -0
- modules/amb/examples/advanced_features.py +223 -0
- modules/amb/examples/backpressure_demo.py +225 -0
- modules/amb/examples/basic_usage.py +117 -0
- modules/amb/examples/tracing_demo.py +104 -0
- modules/amb/experiments/README.md +52 -0
- modules/amb/experiments/reproduce_results.py +467 -0
- modules/amb/experiments/results.json +324 -0
- modules/amb/paper/README.md +40 -0
- modules/amb/paper/paper.tex +365 -0
- modules/amb/paper/whitepaper.md +377 -0
- modules/amb/pyproject.toml +117 -0
- modules/amb/tests/__init__.py +1 -0
- modules/amb/tests/test_backpressure_priority.py +280 -0
- modules/amb/tests/test_bus.py +198 -0
- modules/amb/tests/test_cloudevents.py +443 -0
- modules/amb/tests/test_features.py +531 -0
- modules/amb/tests/test_models.py +74 -0
- modules/amb/tests/test_tracing.py +254 -0
- modules/atr/.github/workflows/ci.yml +101 -0
- modules/atr/.github/workflows/publish.yml +140 -0
- modules/atr/.gitignore +134 -0
- modules/atr/.pre-commit-config.yaml +37 -0
- modules/atr/CHANGELOG.md +39 -0
- modules/atr/CONTRIBUTING.md +96 -0
- modules/atr/IMPLEMENTATION_SUMMARY.md +143 -0
- modules/atr/README.md +180 -0
- modules/atr/atr/__init__.py +638 -0
- modules/atr/atr/access.py +346 -0
- modules/atr/atr/composition.py +643 -0
- modules/atr/atr/decorator.py +355 -0
- modules/atr/atr/executor.py +382 -0
- modules/atr/atr/health.py +555 -0
- modules/atr/atr/hf_utils.py +447 -0
- modules/atr/atr/injection.py +420 -0
- modules/atr/atr/metrics.py +438 -0
- modules/atr/atr/policies.py +401 -0
- modules/atr/atr/py.typed +2 -0
- modules/atr/atr/registry.py +450 -0
- modules/atr/atr/schema.py +478 -0
- modules/atr/atr/tools/safe/__init__.py +73 -0
- modules/atr/atr/tools/safe/calculator.py +380 -0
- modules/atr/atr/tools/safe/datetime_tool.py +441 -0
- modules/atr/atr/tools/safe/file_reader.py +400 -0
- modules/atr/atr/tools/safe/http_client.py +314 -0
- modules/atr/atr/tools/safe/json_parser.py +372 -0
- modules/atr/atr/tools/safe/text_tool.py +526 -0
- modules/atr/atr/tools/safe/toolkit.py +173 -0
- modules/atr/docs/PYPI_SETUP.md +113 -0
- modules/atr/examples/README.md +27 -0
- modules/atr/examples/demo.py +144 -0
- modules/atr/examples/sandbox_demo.py +218 -0
- modules/atr/experiments/README.md +69 -0
- modules/atr/experiments/reproduce_results.py +509 -0
- modules/atr/experiments/results/.gitkeep +0 -0
- modules/atr/experiments/results/results_20260123_140334.json +71 -0
- modules/atr/paper/README.md +36 -0
- modules/atr/paper/figures/.gitkeep +0 -0
- modules/atr/paper/references.bib +84 -0
- modules/atr/paper/structure.tex +293 -0
- modules/atr/paper/whitepaper.md +234 -0
- modules/atr/pyproject.toml +148 -0
- modules/atr/requirements.txt +1 -0
- modules/atr/setup.py +30 -0
- modules/atr/tests/__init__.py +1 -0
- modules/atr/tests/test_decorator.py +317 -0
- modules/atr/tests/test_executor.py +245 -0
- modules/atr/tests/test_integration_executor.py +184 -0
- modules/atr/tests/test_registry.py +312 -0
- modules/atr/tests/test_schema.py +182 -0
- modules/atr/tests/test_v2_features.py +708 -0
- modules/caas/.dockerignore +63 -0
- modules/caas/.github/ISSUE_TEMPLATE/bug_report.md +38 -0
- modules/caas/.github/ISSUE_TEMPLATE/custom.md +10 -0
- modules/caas/.github/ISSUE_TEMPLATE/feature_request.md +20 -0
- modules/caas/.github/workflows/ci.yml +100 -0
- modules/caas/.github/workflows/lint.yml +39 -0
- modules/caas/.github/workflows/publish-pypi.yml +124 -0
- modules/caas/.gitignore +73 -0
- modules/caas/.pre-commit-config.yaml +33 -0
- modules/caas/CHANGELOG.md +58 -0
- modules/caas/CONTRIBUTING.md +346 -0
- modules/caas/Dockerfile +41 -0
- modules/caas/LICENSE +21 -0
- modules/caas/MANIFEST.in +11 -0
- modules/caas/README.md +158 -0
- modules/caas/benchmarks/README.md +255 -0
- modules/caas/benchmarks/create_hf_dataset.py +502 -0
- modules/caas/benchmarks/data/sample_corpus/README.md +86 -0
- modules/caas/benchmarks/data/sample_corpus/auth_module.py +211 -0
- modules/caas/benchmarks/data/sample_corpus/contribution_guide.md +185 -0
- modules/caas/benchmarks/data/sample_corpus/remote_work_policy.html +57 -0
- modules/caas/benchmarks/hf_dataset/README.md +214 -0
- modules/caas/benchmarks/hf_dataset/caas_benchmark_corpus.py +73 -0
- modules/caas/benchmarks/hf_dataset/corpus_preview.json +193 -0
- modules/caas/benchmarks/results/README.md +66 -0
- modules/caas/benchmarks/results/evaluation_2026-01-20.json +121 -0
- modules/caas/benchmarks/run_evaluation.py +561 -0
- modules/caas/benchmarks/statistical_tests.py +289 -0
- modules/caas/benchmarks/verify_sample_corpus.py +83 -0
- modules/caas/docker-compose.yml +38 -0
- modules/caas/docs/CONTEXT_TRIAD.md +462 -0
- modules/caas/docs/CONTRIBUTING.md +346 -0
- modules/caas/docs/ETHICS_AND_LIMITATIONS.md +336 -0
- modules/caas/docs/HEURISTIC_ROUTER.md +442 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY.md +363 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_CONTEXT_TRIAD.md +277 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_HEURISTIC_ROUTER.md +231 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_METADATA_INJECTION.md +258 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_PRAGMATIC_TRUTH.md +212 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_TRUST_GATEWAY.md +319 -0
- modules/caas/docs/LAYER_1_PRIMITIVE.md +202 -0
- modules/caas/docs/METADATA_INJECTION.md +404 -0
- modules/caas/docs/PRAGMATIC_TRUTH.md +431 -0
- modules/caas/docs/RELATED_WORK.md +312 -0
- modules/caas/docs/RELEASE_CHECKLIST.md +219 -0
- modules/caas/docs/RELEASE_GUIDE.md +285 -0
- modules/caas/docs/REPRODUCIBILITY.md +386 -0
- modules/caas/docs/SLIDING_WINDOW.md +387 -0
- modules/caas/docs/STRUCTURE_AWARE_INDEXING.md +158 -0
- modules/caas/docs/TESTING.md +259 -0
- modules/caas/docs/THREAT_MODEL.md +247 -0
- modules/caas/docs/TRUST_GATEWAY.md +575 -0
- modules/caas/docs/VFS.md +298 -0
- modules/caas/examples/agents/enterprise_security_agent.py +414 -0
- modules/caas/examples/agents/intelligent_document_analyzer.py +380 -0
- modules/caas/examples/demos/demo.py +309 -0
- modules/caas/examples/demos/demo_context_triad.py +225 -0
- modules/caas/examples/demos/demo_conversation_manager.py +285 -0
- modules/caas/examples/demos/demo_heuristic_router.py +133 -0
- modules/caas/examples/demos/demo_metadata_injection.py +198 -0
- modules/caas/examples/demos/demo_pragmatic_truth.py +303 -0
- modules/caas/examples/demos/demo_structure_aware.py +140 -0
- modules/caas/examples/demos/demo_time_decay.py +247 -0
- modules/caas/examples/demos/demo_trust_gateway.py +383 -0
- modules/caas/examples/multi_agent/README.md +159 -0
- modules/caas/examples/multi_agent/research_team.py +369 -0
- modules/caas/examples/multi_agent/vfs_collaboration.py +393 -0
- modules/caas/examples/usage/auth_module.py +142 -0
- modules/caas/examples/usage/usage_example.py +173 -0
- modules/caas/experiments/README.md +42 -0
- modules/caas/experiments/reproduce_results.py +462 -0
- modules/caas/paper/ARXIV_METADATA.md +145 -0
- modules/caas/paper/ARXIV_README.md +47 -0
- modules/caas/paper/CHECKLIST.md +103 -0
- modules/caas/paper/GITHUB_RELEASE_NOTES.md +105 -0
- modules/caas/paper/README.md +71 -0
- modules/caas/paper/abstract.md +24 -0
- modules/caas/paper/arxiv_submission.tar +0 -0
- modules/caas/paper/arxiv_submission.zip +0 -0
- modules/caas/paper/build_pdf.py +355 -0
- modules/caas/paper/experiments.md +149 -0
- modules/caas/paper/figures/.gitkeep +0 -0
- modules/caas/paper/figures/README.md +237 -0
- modules/caas/paper/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/figures/fig1_system_architecture.svg +198 -0
- modules/caas/paper/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/figures/fig2_context_triad.svg +105 -0
- modules/caas/paper/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/figures/fig3_ablation_results.svg +113 -0
- modules/caas/paper/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/figures/fig4_routing_latency.svg +97 -0
- modules/caas/paper/intro.md +103 -0
- modules/caas/paper/latex/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/latex/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/latex/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/latex/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/latex/main.tex +468 -0
- modules/caas/paper/latex/references.bib +140 -0
- modules/caas/paper/method.md +350 -0
- modules/caas/paper/outline.md +123 -0
- modules/caas/paper/related_work.md +101 -0
- modules/caas/paper/tables/.gitkeep +0 -0
- modules/caas/paper/tables/results_tables.md +50 -0
- modules/caas/pyproject.toml +172 -0
- modules/caas/requirements.txt +11 -0
- modules/caas/src/caas/__init__.py +232 -0
- modules/caas/src/caas/api/__init__.py +7 -0
- modules/caas/src/caas/api/server.py +1326 -0
- modules/caas/src/caas/caching.py +832 -0
- modules/caas/src/caas/cli.py +208 -0
- modules/caas/src/caas/conversation.py +221 -0
- modules/caas/src/caas/decay.py +118 -0
- modules/caas/src/caas/detection/__init__.py +7 -0
- modules/caas/src/caas/detection/detector.py +236 -0
- modules/caas/src/caas/enrichment.py +127 -0
- modules/caas/src/caas/gateway/__init__.py +24 -0
- modules/caas/src/caas/gateway/trust_gateway.py +471 -0
- modules/caas/src/caas/hf_utils.py +477 -0
- modules/caas/src/caas/ingestion/__init__.py +21 -0
- modules/caas/src/caas/ingestion/processors.py +251 -0
- modules/caas/src/caas/ingestion/structure_parser.py +185 -0
- modules/caas/src/caas/models.py +354 -0
- modules/caas/src/caas/pragmatic_truth.py +441 -0
- modules/caas/src/caas/routing/__init__.py +8 -0
- modules/caas/src/caas/routing/heuristic_router.py +242 -0
- modules/caas/src/caas/storage/__init__.py +7 -0
- modules/caas/src/caas/storage/store.py +450 -0
- modules/caas/src/caas/triad.py +472 -0
- modules/caas/src/caas/tuning/__init__.py +7 -0
- modules/caas/src/caas/tuning/tuner.py +322 -0
- modules/caas/src/caas/vfs/__init__.py +12 -0
- modules/caas/src/caas/vfs/filesystem.py +450 -0
- modules/caas/tests/__init__.py +3 -0
- modules/caas/tests/conftest.py +8 -0
- modules/caas/tests/test_caching.py +628 -0
- modules/caas/tests/test_context_triad.py +385 -0
- modules/caas/tests/test_conversation_manager.py +289 -0
- modules/caas/tests/test_functionality.py +215 -0
- modules/caas/tests/test_heuristic_router.py +370 -0
- modules/caas/tests/test_metadata_injection.py +328 -0
- modules/caas/tests/test_pragmatic_truth.py +322 -0
- modules/caas/tests/test_structure_aware_indexing.py +283 -0
- modules/caas/tests/test_time_decay.py +268 -0
- modules/caas/tests/test_trust_gateway.py +445 -0
- modules/caas/tests/test_vfs.py +298 -0
- modules/cmvk/.github/FUNDING.yml +9 -0
- modules/cmvk/.github/dependabot.yml +54 -0
- modules/cmvk/.github/workflows/ci.yml +205 -0
- modules/cmvk/.github/workflows/publish.yml +143 -0
- modules/cmvk/.gitignore +147 -0
- modules/cmvk/.pre-commit-config.yaml +58 -0
- modules/cmvk/CHANGELOG.md +146 -0
- modules/cmvk/CITATION.cff +48 -0
- modules/cmvk/CONTRIBUTING.md +229 -0
- modules/cmvk/Dockerfile +87 -0
- modules/cmvk/HF_MODEL_CARD.md +185 -0
- modules/cmvk/LICENSE +21 -0
- modules/cmvk/README.md +149 -0
- modules/cmvk/SECURITY.md +114 -0
- modules/cmvk/config/prompts/generator_v1.txt +23 -0
- modules/cmvk/config/prompts/verifier_hostile.txt +32 -0
- modules/cmvk/config/settings.yaml +40 -0
- modules/cmvk/coverage_html/.gitignore +2 -0
- modules/cmvk/coverage_html/class_index.html +658 -0
- modules/cmvk/coverage_html/coverage_html_cb_188fc9a4.js +735 -0
- modules/cmvk/coverage_html/favicon_32_cb_c827f16f.png +0 -0
- modules/cmvk/coverage_html/function_index.html +1978 -0
- modules/cmvk/coverage_html/index.html +255 -0
- modules/cmvk/coverage_html/keybd_closed_cb_900cfef5.png +0 -0
- modules/cmvk/coverage_html/status.json +1 -0
- modules/cmvk/coverage_html/style_cb_5c747636.css +389 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38___init___py.html +315 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_audit_py.html +499 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_benchmarks_py.html +575 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_constitutional_py.html +1001 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_hf_utils_py.html +398 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_metrics_py.html +570 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_profiles_py.html +397 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_types_py.html +109 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_verification_py.html +1053 -0
- modules/cmvk/docs/DIAGRAMS.md +325 -0
- modules/cmvk/docs/architecture.md +345 -0
- modules/cmvk/docs/features.md +308 -0
- modules/cmvk/docs/getting_started.md +279 -0
- modules/cmvk/docs/innovation_layer.md +377 -0
- modules/cmvk/docs/safety.md +281 -0
- modules/cmvk/docs/traceability.md +150 -0
- modules/cmvk/examples/basic_example.py +62 -0
- modules/cmvk/examples/demo_complete_pipeline.py +209 -0
- modules/cmvk/examples/demo_innovation_layer.py +197 -0
- modules/cmvk/examples/example.py +112 -0
- modules/cmvk/examples/model_diversity_comparison.py +110 -0
- modules/cmvk/examples/real_api_integration.py +121 -0
- modules/cmvk/examples/test_full_pipeline.py +303 -0
- modules/cmvk/experiments/FEATURE_2_LATERAL_THINKING.md +187 -0
- modules/cmvk/experiments/README.md +216 -0
- modules/cmvk/experiments/ablation_runner.py +666 -0
- modules/cmvk/experiments/baseline_runner.py +158 -0
- modules/cmvk/experiments/blind_spot_benchmark.py +364 -0
- modules/cmvk/experiments/datasets/README.md +85 -0
- modules/cmvk/experiments/datasets/humaneval_50.json +352 -0
- modules/cmvk/experiments/datasets/humaneval_full.json +1150 -0
- modules/cmvk/experiments/datasets/humaneval_sample.json +32 -0
- modules/cmvk/experiments/datasets/sabotage.json +262 -0
- modules/cmvk/experiments/datasets/sample.json +40 -0
- modules/cmvk/experiments/demo_with_traces.py +110 -0
- modules/cmvk/experiments/efficiency_curve.py +259 -0
- modules/cmvk/experiments/experiment_runner.py +243 -0
- modules/cmvk/experiments/paper_data_generator.py +183 -0
- modules/cmvk/experiments/reproduce_results.py +407 -0
- modules/cmvk/experiments/reproducible_runner.py +352 -0
- modules/cmvk/experiments/sabotage_stress_test.py +311 -0
- modules/cmvk/experiments/test_lateral_thinking.py +116 -0
- modules/cmvk/experiments/test_prosecutor.py +41 -0
- modules/cmvk/experiments/visualize_results.py +735 -0
- modules/cmvk/logs/traces/demo_HumanEval_0_20260121-204900.json +36 -0
- modules/cmvk/notebooks/analysis.ipynb +124 -0
- modules/cmvk/paper/PAPER.md +561 -0
- modules/cmvk/paper/arxiv_checklist.md +230 -0
- modules/cmvk/paper/cmvk_neurips.aux +77 -0
- modules/cmvk/paper/cmvk_neurips.bbl +81 -0
- modules/cmvk/paper/cmvk_neurips.blg +48 -0
- modules/cmvk/paper/cmvk_neurips.out +16 -0
- modules/cmvk/paper/cmvk_neurips.pdf +0 -0
- modules/cmvk/paper/cmvk_neurips.tex +309 -0
- modules/cmvk/paper/figures/ablation.png +0 -0
- modules/cmvk/paper/figures/ablation.svg +39 -0
- modules/cmvk/paper/figures/architecture.png +0 -0
- modules/cmvk/paper/figures/architecture.svg +115 -0
- modules/cmvk/paper/figures/results_bar.png +0 -0
- modules/cmvk/paper/figures/results_bar.svg +70 -0
- modules/cmvk/paper/generate_figures.py +383 -0
- modules/cmvk/paper/neurips_2024.sty +101 -0
- modules/cmvk/paper/references.bib +98 -0
- modules/cmvk/paper/structure.tex +200 -0
- modules/cmvk/pyproject.toml +189 -0
- modules/cmvk/requirements-dev.txt +19 -0
- modules/cmvk/requirements.txt +14 -0
- modules/cmvk/src/cmvk/__init__.py +216 -0
- modules/cmvk/src/cmvk/audit.py +400 -0
- modules/cmvk/src/cmvk/benchmarks.py +476 -0
- modules/cmvk/src/cmvk/constitutional.py +902 -0
- modules/cmvk/src/cmvk/hf_utils.py +299 -0
- modules/cmvk/src/cmvk/metrics.py +471 -0
- modules/cmvk/src/cmvk/profiles.py +298 -0
- modules/cmvk/src/cmvk/py.typed +0 -0
- modules/cmvk/src/cmvk/types.py +10 -0
- modules/cmvk/src/cmvk/verification.py +954 -0
- modules/cmvk/src/cross_model_verification_kernel/__init__.py +91 -0
- modules/cmvk/src/cross_model_verification_kernel/__main__.py +10 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/__init__.py +16 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/base_agent.py +142 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/generator_openai.py +223 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_anthropic.py +448 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_gemini.py +481 -0
- modules/cmvk/src/cross_model_verification_kernel/cli.py +570 -0
- modules/cmvk/src/cross_model_verification_kernel/core/__init__.py +26 -0
- modules/cmvk/src/cross_model_verification_kernel/core/graph_memory.py +308 -0
- modules/cmvk/src/cross_model_verification_kernel/core/kernel.py +413 -0
- modules/cmvk/src/cross_model_verification_kernel/core/trace_logger.py +75 -0
- modules/cmvk/src/cross_model_verification_kernel/core/types.py +121 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/__init__.py +20 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/humaneval_loader.py +271 -0
- modules/cmvk/src/cross_model_verification_kernel/generator.py +118 -0
- modules/cmvk/src/cross_model_verification_kernel/kernel.py +292 -0
- modules/cmvk/src/cross_model_verification_kernel/models.py +111 -0
- modules/cmvk/src/cross_model_verification_kernel/py.typed +1 -0
- modules/cmvk/src/cross_model_verification_kernel/simple_kernel.py +185 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/__init__.py +94 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/huggingface_upload.py +394 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/sandbox.py +159 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/statistics.py +468 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/visualizer.py +312 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/web_search.py +86 -0
- modules/cmvk/src/cross_model_verification_kernel/verifier.py +257 -0
- modules/cmvk/tests/__init__.py +3 -0
- modules/cmvk/tests/conftest.py +61 -0
- modules/cmvk/tests/integration/__init__.py +1 -0
- modules/cmvk/tests/integration/test_anthropic_verifier.py +269 -0
- modules/cmvk/tests/integration/test_integration.py +53 -0
- modules/cmvk/tests/integration/test_lateral_thinking_integration.py +199 -0
- modules/cmvk/tests/integration/test_lateral_thinking_witness.py +208 -0
- modules/cmvk/tests/integration/test_prosecutor_mode.py +131 -0
- modules/cmvk/tests/test_constitutional.py +611 -0
- modules/cmvk/tests/test_enhanced_features.py +603 -0
- modules/cmvk/tests/test_verification.py +255 -0
- modules/cmvk/tests/unit/__init__.py +1 -0
- modules/cmvk/tests/unit/test_agents.py +64 -0
- modules/cmvk/tests/unit/test_cli.py +224 -0
- modules/cmvk/tests/unit/test_core.py +126 -0
- modules/cmvk/tests/unit/test_humaneval_loader.py +197 -0
- modules/cmvk/tests/unit/test_kernel.py +255 -0
- modules/cmvk/tests/unit/test_reproducibility.py +160 -0
- modules/cmvk/tests/unit/test_trace_logger.py +115 -0
- modules/cmvk/tests/unit/test_visualizer.py +218 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/bug_report.yml +82 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/config.yml +11 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/feature_request.yml +104 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/question.yml +70 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/security_vulnerability.yml +84 -0
- modules/control-plane/.github/discussions.yml +73 -0
- modules/control-plane/.github/pull_request_template.md +82 -0
- modules/control-plane/.github/workflows/publish.yml +146 -0
- modules/control-plane/.github/workflows/release.yml +39 -0
- modules/control-plane/.github/workflows/tests.yml +58 -0
- modules/control-plane/.gitignore +55 -0
- modules/control-plane/CHANGELOG.md +203 -0
- modules/control-plane/CONTRIBUTING.md +311 -0
- modules/control-plane/CONTRIBUTORS.md +88 -0
- modules/control-plane/Dockerfile +82 -0
- modules/control-plane/LICENSE +21 -0
- modules/control-plane/MANIFEST.in +17 -0
- modules/control-plane/README.md +1264 -0
- modules/control-plane/ROADMAP.md +228 -0
- modules/control-plane/SECURITY.md +210 -0
- modules/control-plane/SUPPORT.md +106 -0
- modules/control-plane/acp-cli.py +212 -0
- modules/control-plane/benchmark/README.md +257 -0
- modules/control-plane/benchmark/__init__.py +19 -0
- modules/control-plane/benchmark/red_team_dataset.py +517 -0
- modules/control-plane/benchmark.py +563 -0
- modules/control-plane/build_and_publish.sh +130 -0
- modules/control-plane/docker-compose.yml +74 -0
- modules/control-plane/docs/ABLATION_STUDIES.md +528 -0
- modules/control-plane/docs/ADAPTER_GUIDE.md +544 -0
- modules/control-plane/docs/ADVANCED_FEATURES.md +543 -0
- modules/control-plane/docs/AIOS_COMPARISON.md +296 -0
- modules/control-plane/docs/BIBLIOGRAPHY.md +367 -0
- modules/control-plane/docs/CASE_STUDIES.md +645 -0
- modules/control-plane/docs/DOCKER_DEPLOYMENT.md +184 -0
- modules/control-plane/docs/ECOSYSTEM_STATUS.md +98 -0
- modules/control-plane/docs/HF_MODEL_CARD.md +168 -0
- modules/control-plane/docs/KERNEL_V1_RELEASE.md +454 -0
- modules/control-plane/docs/LAYER3_FRAMEWORK.md +227 -0
- modules/control-plane/docs/LIMITATIONS.md +523 -0
- modules/control-plane/docs/PYPI_PUBLISHING.md +195 -0
- modules/control-plane/docs/README.md +58 -0
- modules/control-plane/docs/RELATED_WORK.md +319 -0
- modules/control-plane/docs/RELEASE_v1.1.0.md +252 -0
- modules/control-plane/docs/REPRODUCIBILITY.md +540 -0
- modules/control-plane/docs/RESEARCH_FOUNDATION.md +197 -0
- modules/control-plane/docs/api/CORE.md +270 -0
- modules/control-plane/docs/architecture/architecture.md +120 -0
- modules/control-plane/docs/community/ANNOUNCEMENT_TEMPLATES.md +52 -0
- modules/control-plane/docs/guides/IMPLEMENTATION.md +225 -0
- modules/control-plane/docs/guides/PHILOSOPHY.md +354 -0
- modules/control-plane/docs/guides/QUICKSTART.md +217 -0
- modules/control-plane/examples/README.md +138 -0
- modules/control-plane/examples/a2a_demo.py +410 -0
- modules/control-plane/examples/adapter_demo.py +347 -0
- modules/control-plane/examples/advanced_features.py +403 -0
- modules/control-plane/examples/basic_usage.py +261 -0
- modules/control-plane/examples/benchmark_demo.py +186 -0
- modules/control-plane/examples/compliance_demo.py +333 -0
- modules/control-plane/examples/configuration.py +265 -0
- modules/control-plane/examples/getting_started.py +178 -0
- modules/control-plane/examples/hibernation_and_time_travel_demo.py +406 -0
- modules/control-plane/examples/interactive_tutorial.ipynb +497 -0
- modules/control-plane/examples/kernel_interceptor_demo.py +202 -0
- modules/control-plane/examples/kernel_v1_demo.py +273 -0
- modules/control-plane/examples/langchain_demo.py +281 -0
- modules/control-plane/examples/lifecycle_demo.py +724 -0
- modules/control-plane/examples/mcp_demo.py +378 -0
- modules/control-plane/examples/ml_safety_demo.py +157 -0
- modules/control-plane/examples/multimodal_demo.py +347 -0
- modules/control-plane/examples/observability_demo.py +370 -0
- modules/control-plane/examples/use_cases.py +336 -0
- modules/control-plane/experiments/long_horizon_purge.py +235 -0
- modules/control-plane/experiments/multi_agent_rag.py +165 -0
- modules/control-plane/experiments/reproduce_results.py +667 -0
- modules/control-plane/paper/ARXIV_SUBMISSION_INFO.txt +122 -0
- modules/control-plane/paper/ETHICS_STATEMENT.md +248 -0
- modules/control-plane/paper/PAPER_CHECKLIST.md +72 -0
- modules/control-plane/paper/Paper.pdf +0 -0
- modules/control-plane/paper/README.md +71 -0
- modules/control-plane/paper/appendix.md +152 -0
- modules/control-plane/paper/architecture.md +15 -0
- modules/control-plane/paper/arxiv/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/arxiv/figures/architecture.png +0 -0
- modules/control-plane/paper/arxiv/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/arxiv/figures/results_chart.png +0 -0
- modules/control-plane/paper/arxiv/main.aux +97 -0
- modules/control-plane/paper/arxiv/main.bbl +112 -0
- modules/control-plane/paper/arxiv/main.blg +48 -0
- modules/control-plane/paper/arxiv/main.out +33 -0
- modules/control-plane/paper/arxiv/main.pdf +0 -0
- modules/control-plane/paper/arxiv/main.tex +479 -0
- modules/control-plane/paper/arxiv/references.bib +234 -0
- modules/control-plane/paper/arxiv_submission.tar +0 -0
- modules/control-plane/paper/arxiv_submission.zip +0 -0
- modules/control-plane/paper/build.sh +68 -0
- modules/control-plane/paper/figures/README.md +47 -0
- modules/control-plane/paper/figures/ablation_chart.pdf +0 -0
- modules/control-plane/paper/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/figures/architecture.pdf +0 -0
- modules/control-plane/paper/figures/architecture.png +0 -0
- modules/control-plane/paper/figures/constraint_graphs.pdf +0 -0
- modules/control-plane/paper/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/figures/generate_figures.py +252 -0
- modules/control-plane/paper/figures/results_chart.pdf +0 -0
- modules/control-plane/paper/figures/results_chart.png +0 -0
- modules/control-plane/paper/main.md +273 -0
- modules/control-plane/paper/main.tex +214 -0
- modules/control-plane/paper/main_arxiv.aux +53 -0
- modules/control-plane/paper/main_arxiv.out +17 -0
- modules/control-plane/paper/main_arxiv.pdf +0 -0
- modules/control-plane/paper/main_arxiv.tex +264 -0
- modules/control-plane/paper/references.bib +234 -0
- modules/control-plane/pyproject.toml +124 -0
- modules/control-plane/reproducibility/ABLATIONS.md +136 -0
- modules/control-plane/reproducibility/README.md +288 -0
- modules/control-plane/reproducibility/commands.md +467 -0
- modules/control-plane/reproducibility/docker_config/Dockerfile +39 -0
- modules/control-plane/reproducibility/experiment_configs/purge_config.json +46 -0
- modules/control-plane/reproducibility/experiment_configs/rag_config.json +36 -0
- modules/control-plane/reproducibility/hardware_specs.md +317 -0
- modules/control-plane/reproducibility/requirements_frozen.txt +0 -0
- modules/control-plane/reproducibility/run_all_experiments.sh +45 -0
- modules/control-plane/reproducibility/seeds.json +106 -0
- modules/control-plane/scripts/prepare_pypi.py +46 -0
- modules/control-plane/scripts/prepare_release.py +176 -0
- modules/control-plane/scripts/upload_dataset_to_hf.py +316 -0
- modules/control-plane/setup.py +69 -0
- modules/control-plane/src/agent_control_plane/__init__.py +639 -0
- modules/control-plane/src/agent_control_plane/a2a_adapter.py +541 -0
- modules/control-plane/src/agent_control_plane/adapter.py +415 -0
- modules/control-plane/src/agent_control_plane/agent_hibernation.py +364 -0
- modules/control-plane/src/agent_control_plane/agent_kernel.py +464 -0
- modules/control-plane/src/agent_control_plane/compliance.py +718 -0
- modules/control-plane/src/agent_control_plane/constraint_graphs.py +475 -0
- modules/control-plane/src/agent_control_plane/control_plane.py +848 -0
- modules/control-plane/src/agent_control_plane/example_executors.py +193 -0
- modules/control-plane/src/agent_control_plane/execution_engine.py +229 -0
- modules/control-plane/src/agent_control_plane/flight_recorder.py +600 -0
- modules/control-plane/src/agent_control_plane/governance_layer.py +432 -0
- modules/control-plane/src/agent_control_plane/hf_utils.py +561 -0
- modules/control-plane/src/agent_control_plane/interfaces/__init__.py +53 -0
- modules/control-plane/src/agent_control_plane/interfaces/kernel_interface.py +359 -0
- modules/control-plane/src/agent_control_plane/interfaces/plugin_interface.py +495 -0
- modules/control-plane/src/agent_control_plane/interfaces/protocol_interfaces.py +385 -0
- modules/control-plane/src/agent_control_plane/kernel_space.py +707 -0
- modules/control-plane/src/agent_control_plane/langchain_adapter.py +422 -0
- modules/control-plane/src/agent_control_plane/lifecycle.py +3111 -0
- modules/control-plane/src/agent_control_plane/mcp_adapter.py +517 -0
- modules/control-plane/src/agent_control_plane/ml_safety.py +560 -0
- modules/control-plane/src/agent_control_plane/multimodal.py +724 -0
- modules/control-plane/src/agent_control_plane/mute_agent.py +419 -0
- modules/control-plane/src/agent_control_plane/observability.py +785 -0
- modules/control-plane/src/agent_control_plane/orchestrator.py +480 -0
- modules/control-plane/src/agent_control_plane/plugin_registry.py +748 -0
- modules/control-plane/src/agent_control_plane/policy_engine.py +525 -0
- modules/control-plane/src/agent_control_plane/shadow_mode.py +307 -0
- modules/control-plane/src/agent_control_plane/signals.py +491 -0
- modules/control-plane/src/agent_control_plane/supervisor_agents.py +427 -0
- modules/control-plane/src/agent_control_plane/time_travel_debugger.py +554 -0
- modules/control-plane/src/agent_control_plane/tool_registry.py +350 -0
- modules/control-plane/src/agent_control_plane/vfs.py +695 -0
- modules/control-plane/tests/README.md +33 -0
- modules/control-plane/tests/test_a2a_adapter.py +336 -0
- modules/control-plane/tests/test_adapter.py +422 -0
- modules/control-plane/tests/test_advanced_features.py +389 -0
- modules/control-plane/tests/test_benchmark.py +223 -0
- modules/control-plane/tests/test_compliance.py +214 -0
- modules/control-plane/tests/test_control_plane.py +295 -0
- modules/control-plane/tests/test_hibernation.py +274 -0
- modules/control-plane/tests/test_kernel_interception.py +284 -0
- modules/control-plane/tests/test_langchain_adapter.py +258 -0
- modules/control-plane/tests/test_lifecycle.py +1174 -0
- modules/control-plane/tests/test_mcp_adapter.py +293 -0
- modules/control-plane/tests/test_ml_safety.py +142 -0
- modules/control-plane/tests/test_multimodal.py +317 -0
- modules/control-plane/tests/test_new_features.py +435 -0
- modules/control-plane/tests/test_observability.py +338 -0
- modules/control-plane/tests/test_time_travel.py +387 -0
- modules/emk/.github/workflows/ci.yml +105 -0
- modules/emk/.github/workflows/publish.yml +144 -0
- modules/emk/.gitignore +74 -0
- modules/emk/CHANGELOG.md +41 -0
- modules/emk/CONTRIBUTING.md +295 -0
- modules/emk/IMPLEMENTATION.md +174 -0
- modules/emk/LICENSE +21 -0
- modules/emk/MANIFEST.in +8 -0
- modules/emk/README.md +135 -0
- modules/emk/RELEASE_NOTES.md +82 -0
- modules/emk/SECURITY.md +52 -0
- modules/emk/codecov.yml +39 -0
- modules/emk/docs/MEMORY_MANAGEMENT.md +285 -0
- modules/emk/emk/__init__.py +106 -0
- modules/emk/emk/hf_utils.py +419 -0
- modules/emk/emk/indexer.py +144 -0
- modules/emk/emk/py.typed +0 -0
- modules/emk/emk/schema.py +204 -0
- modules/emk/emk/sleep_cycle.py +345 -0
- modules/emk/emk/store.py +479 -0
- modules/emk/examples/basic_usage.py +123 -0
- modules/emk/examples/memory_features_demo.py +154 -0
- modules/emk/experiments/README.md +59 -0
- modules/emk/experiments/reproduce_results.py +461 -0
- modules/emk/experiments/results.json +61 -0
- modules/emk/paper/structure.tex +192 -0
- modules/emk/paper/whitepaper.md +273 -0
- modules/emk/pyproject.toml +91 -0
- modules/emk/setup.py +5 -0
- modules/emk/tests/test_file_adapter.py +195 -0
- modules/emk/tests/test_indexer.py +174 -0
- modules/emk/tests/test_init.py +55 -0
- modules/emk/tests/test_negative_memory.py +83 -0
- modules/emk/tests/test_schema.py +150 -0
- modules/emk/tests/test_semantic_rules.py +175 -0
- modules/emk/tests/test_sleep_cycle.py +335 -0
- modules/emk/tests/test_store_anti_patterns.py +239 -0
- modules/iatp/.github/workflows/docker-build.yml +124 -0
- modules/iatp/.github/workflows/publish.yml +174 -0
- modules/iatp/.github/workflows/python-package.yml +121 -0
- modules/iatp/.gitignore +67 -0
- modules/iatp/.pre-commit-config.yaml +64 -0
- modules/iatp/CHANGELOG.md +120 -0
- modules/iatp/Dockerfile +91 -0
- modules/iatp/IMPLEMENTATION_SUMMARY.md +218 -0
- modules/iatp/MANIFEST.in +9 -0
- modules/iatp/README.md +180 -0
- modules/iatp/docker/Dockerfile.agent +27 -0
- modules/iatp/docker/Dockerfile.sidecar-python +86 -0
- modules/iatp/docker/README.md +258 -0
- modules/iatp/docker-compose.yml +194 -0
- modules/iatp/docs/ARCHITECTURE.md +243 -0
- modules/iatp/docs/CLI_GUIDE.md +220 -0
- modules/iatp/docs/DEPLOYMENT.md +304 -0
- modules/iatp/examples/README.md +132 -0
- modules/iatp/examples/backend_agent.py +39 -0
- modules/iatp/examples/client.py +168 -0
- modules/iatp/examples/demo_attestation_reputation.py +274 -0
- modules/iatp/examples/demo_client.py +240 -0
- modules/iatp/examples/demo_rbac.py +143 -0
- modules/iatp/examples/integration_demo.py +245 -0
- modules/iatp/examples/manifests/coder_agent.json +20 -0
- modules/iatp/examples/manifests/reviewer_agent.json +19 -0
- modules/iatp/examples/manifests/secure_bank.json +14 -0
- modules/iatp/examples/manifests/standard_agent.json +14 -0
- modules/iatp/examples/manifests/untrusted_honeypot.json +14 -0
- modules/iatp/examples/run_secure_bank_sidecar.py +85 -0
- modules/iatp/examples/run_sidecar.py +105 -0
- modules/iatp/examples/run_untrusted_sidecar.py +77 -0
- modules/iatp/examples/secure_bank_agent.py +138 -0
- modules/iatp/examples/test_untrusted.py +82 -0
- modules/iatp/examples/untrusted_agent.py +119 -0
- modules/iatp/experiments/README.md +58 -0
- modules/iatp/experiments/cascading_hallucination/README.md +149 -0
- modules/iatp/experiments/cascading_hallucination/agent_a_user.py +41 -0
- modules/iatp/experiments/cascading_hallucination/agent_b_summarizer.py +54 -0
- modules/iatp/experiments/cascading_hallucination/agent_c_database.py +47 -0
- modules/iatp/experiments/cascading_hallucination/proof_of_concept.py +290 -0
- modules/iatp/experiments/cascading_hallucination/run_experiment.py +226 -0
- modules/iatp/experiments/cascading_hallucination/sidecar_c.py +61 -0
- modules/iatp/experiments/reproduce_results.py +574 -0
- modules/iatp/experiments/results.json +2336 -0
- modules/iatp/iatp/__init__.py +164 -0
- modules/iatp/iatp/attestation.py +401 -0
- modules/iatp/iatp/cli.py +253 -0
- modules/iatp/iatp/hf_utils.py +469 -0
- modules/iatp/iatp/ipc_pipes.py +578 -0
- modules/iatp/iatp/main.py +410 -0
- modules/iatp/iatp/models/__init__.py +445 -0
- modules/iatp/iatp/policy_engine.py +335 -0
- modules/iatp/iatp/py.typed +2 -0
- modules/iatp/iatp/recovery.py +319 -0
- modules/iatp/iatp/security/__init__.py +268 -0
- modules/iatp/iatp/sidecar/__init__.py +517 -0
- modules/iatp/iatp/telemetry/__init__.py +162 -0
- modules/iatp/iatp/tests/__init__.py +1 -0
- modules/iatp/iatp/tests/test_attestation.py +368 -0
- modules/iatp/iatp/tests/test_cli.py +129 -0
- modules/iatp/iatp/tests/test_models.py +128 -0
- modules/iatp/iatp/tests/test_policy_engine.py +345 -0
- modules/iatp/iatp/tests/test_recovery.py +279 -0
- modules/iatp/iatp/tests/test_security.py +220 -0
- modules/iatp/iatp/tests/test_sidecar.py +165 -0
- modules/iatp/iatp/tests/test_telemetry.py +173 -0
- modules/iatp/paper/BLOG.md +307 -0
- modules/iatp/paper/PAPER.md +236 -0
- modules/iatp/paper/RFC_SUBMISSION.md +299 -0
- modules/iatp/paper/whitepaper.md +369 -0
- modules/iatp/proto/README.md +200 -0
- modules/iatp/proto/generate_stubs.py +81 -0
- modules/iatp/proto/iatp.proto +552 -0
- modules/iatp/pyproject.toml +180 -0
- modules/iatp/requirements-dev.txt +2 -0
- modules/iatp/requirements.txt +6 -0
- modules/iatp/setup.py +60 -0
- modules/iatp/sidecar/README.md +487 -0
- modules/iatp/sidecar/go/Dockerfile +32 -0
- modules/iatp/sidecar/go/README.md +237 -0
- modules/iatp/sidecar/go/go.mod +8 -0
- modules/iatp/sidecar/go/main.go +488 -0
- modules/iatp/spec/001-handshake.md +436 -0
- modules/iatp/spec/002-reversibility.md +394 -0
- modules/iatp/spec/schema/capability_manifest.json +266 -0
- modules/iatp/test_integration.py +310 -0
- modules/mcp-kernel-server/README.md +261 -0
- modules/mcp-kernel-server/pyproject.toml +60 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/__init__.py +26 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/cli.py +229 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/resources.py +215 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/server.py +562 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/tools.py +1172 -0
- modules/mute-agent/.github/workflows/safety_check.yml +45 -0
- modules/mute-agent/.gitignore +53 -0
- modules/mute-agent/ARCHITECTURE.md +531 -0
- modules/mute-agent/BENCHMARK_GUIDE.md +384 -0
- modules/mute-agent/COMPLETION_SUMMARY.md +293 -0
- modules/mute-agent/EXPERIMENT_SUMMARY.md +318 -0
- modules/mute-agent/IMPLEMENTATION_SUMMARY.md +212 -0
- modules/mute-agent/LICENSE +21 -0
- modules/mute-agent/PHASE3_SUMMARY.md +297 -0
- modules/mute-agent/README.md +360 -0
- modules/mute-agent/STEEL_MAN_RESULTS.md +353 -0
- modules/mute-agent/USAGE.md +505 -0
- modules/mute-agent/V2_IMPLEMENTATION_SUMMARY.md +253 -0
- modules/mute-agent/V2_STEEL_MAN_IMPLEMENTATION.md +274 -0
- modules/mute-agent/VERIFICATION_REPORT.md +435 -0
- modules/mute-agent/charts/cost_comparison.png +0 -0
- modules/mute-agent/charts/cost_vs_ambiguity.png +0 -0
- modules/mute-agent/charts/metrics_comparison.png +0 -0
- modules/mute-agent/charts/scenario_breakdown.png +0 -0
- modules/mute-agent/charts/trace_attack_blocked.html +140 -0
- modules/mute-agent/charts/trace_attack_blocked.png +0 -0
- modules/mute-agent/charts/trace_failure.html +140 -0
- modules/mute-agent/charts/trace_failure.png +0 -0
- modules/mute-agent/charts/trace_success.html +140 -0
- modules/mute-agent/charts/trace_success.png +0 -0
- modules/mute-agent/examples/__init__.py +1 -0
- modules/mute-agent/examples/advanced_example.py +384 -0
- modules/mute-agent/examples/graph_debugger_demo.py +241 -0
- modules/mute-agent/examples/listener_example.py +297 -0
- modules/mute-agent/examples/simple_example.py +242 -0
- modules/mute-agent/examples/steel_man_demo.py +297 -0
- modules/mute-agent/experiments/README.md +135 -0
- modules/mute-agent/experiments/__init__.py +3 -0
- modules/mute-agent/experiments/agent_comparison.csv +6 -0
- modules/mute-agent/experiments/agent_comparison_50runs.csv +6 -0
- modules/mute-agent/experiments/ambiguity_test.py +335 -0
- modules/mute-agent/experiments/ambiguity_test_results.csv +31 -0
- modules/mute-agent/experiments/ambiguity_test_results_50runs.csv +51 -0
- modules/mute-agent/experiments/baseline_agent.py +189 -0
- modules/mute-agent/experiments/benchmark.py +402 -0
- modules/mute-agent/experiments/demo.py +172 -0
- modules/mute-agent/experiments/generate_cost_curve.py +474 -0
- modules/mute-agent/experiments/jailbreak_test.py +137 -0
- modules/mute-agent/experiments/latent_state_scenario.py +361 -0
- modules/mute-agent/experiments/mute_agent_experiment.py +349 -0
- modules/mute-agent/experiments/run_extended_experiment.py +40 -0
- modules/mute-agent/experiments/run_v2_experiments.py +266 -0
- modules/mute-agent/experiments/run_v2_experiments_auto.py +247 -0
- modules/mute-agent/experiments/v2_scenarios/README.md +214 -0
- modules/mute-agent/experiments/v2_scenarios/__init__.py +4 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_1_deep_dependency.py +325 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_2_adversarial.py +328 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_3_false_positive.py +303 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_4_performance.py +319 -0
- modules/mute-agent/experiments/visualize.py +400 -0
- modules/mute-agent/mute_agent/__init__.py +66 -0
- modules/mute-agent/mute_agent/core/__init__.py +1 -0
- modules/mute-agent/mute_agent/core/execution_agent.py +164 -0
- modules/mute-agent/mute_agent/core/handshake_protocol.py +199 -0
- modules/mute-agent/mute_agent/core/reasoning_agent.py +236 -0
- modules/mute-agent/mute_agent/knowledge_graph/__init__.py +1 -0
- modules/mute-agent/mute_agent/knowledge_graph/graph_elements.py +63 -0
- modules/mute-agent/mute_agent/knowledge_graph/multidimensional_graph.py +168 -0
- modules/mute-agent/mute_agent/knowledge_graph/subgraph.py +222 -0
- modules/mute-agent/mute_agent/listener/__init__.py +41 -0
- modules/mute-agent/mute_agent/listener/adapters/__init__.py +29 -0
- modules/mute-agent/mute_agent/listener/adapters/base_adapter.py +187 -0
- modules/mute-agent/mute_agent/listener/adapters/caas_adapter.py +342 -0
- modules/mute-agent/mute_agent/listener/adapters/control_plane_adapter.py +434 -0
- modules/mute-agent/mute_agent/listener/adapters/iatp_adapter.py +330 -0
- modules/mute-agent/mute_agent/listener/adapters/scak_adapter.py +249 -0
- modules/mute-agent/mute_agent/listener/listener.py +608 -0
- modules/mute-agent/mute_agent/listener/state_observer.py +434 -0
- modules/mute-agent/mute_agent/listener/threshold_config.py +311 -0
- modules/mute-agent/mute_agent/super_system/__init__.py +1 -0
- modules/mute-agent/mute_agent/super_system/router.py +202 -0
- modules/mute-agent/mute_agent/visualization/__init__.py +8 -0
- modules/mute-agent/mute_agent/visualization/graph_debugger.py +495 -0
- modules/mute-agent/requirements-dev.txt +6 -0
- modules/mute-agent/requirements.txt +9 -0
- modules/mute-agent/setup.py +64 -0
- modules/mute-agent/src/__init__.py +0 -0
- modules/mute-agent/src/agents/__init__.py +0 -0
- modules/mute-agent/src/agents/baseline_agent.py +524 -0
- modules/mute-agent/src/agents/interactive_agent.py +113 -0
- modules/mute-agent/src/agents/mute_agent.py +622 -0
- modules/mute-agent/src/benchmarks/__init__.py +0 -0
- modules/mute-agent/src/benchmarks/evaluator.py +481 -0
- modules/mute-agent/src/benchmarks/scenarios.json +985 -0
- modules/mute-agent/src/core/__init__.py +0 -0
- modules/mute-agent/src/core/mock_state.py +320 -0
- modules/mute-agent/src/core/tools.py +441 -0
- modules/nexus/__init__.py +49 -0
- modules/nexus/arbiter.py +357 -0
- modules/nexus/client.py +464 -0
- modules/nexus/dmz.py +417 -0
- modules/nexus/escrow.py +428 -0
- modules/nexus/exceptions.py +284 -0
- modules/nexus/registry.py +391 -0
- modules/nexus/reputation.py +423 -0
- modules/nexus/schemas/__init__.py +49 -0
- modules/nexus/schemas/compliance.py +274 -0
- modules/nexus/schemas/escrow.py +249 -0
- modules/nexus/schemas/manifest.py +223 -0
- modules/nexus/schemas/receipt.py +206 -0
- modules/observability/README.md +192 -0
- modules/observability/alertmanager/alertmanager.yml +116 -0
- modules/observability/alerts/agent-os-alerts.yaml +197 -0
- modules/observability/docker-compose.yml +128 -0
- modules/observability/grafana/dashboards/agent-os-amb.json +448 -0
- modules/observability/grafana/dashboards/agent-os-cmvk.json +441 -0
- modules/observability/grafana/dashboards/agent-os-overview.json +268 -0
- modules/observability/grafana/dashboards/agent-os-performance.json +15 -0
- modules/observability/grafana/dashboards/agent-os-safety.json +50 -0
- modules/observability/grafana/provisioning/dashboards/dashboards.yml +15 -0
- modules/observability/grafana/provisioning/datasources/datasources.yml +33 -0
- modules/observability/otel/otel-collector-config.yml +61 -0
- modules/observability/prometheus/prometheus.yml +63 -0
- modules/observability/pyproject.toml +53 -0
- modules/observability/scripts/export_dashboards.py +55 -0
- modules/observability/src/agent_os_observability/__init__.py +25 -0
- modules/observability/src/agent_os_observability/dashboards.py +896 -0
- modules/observability/src/agent_os_observability/metrics.py +396 -0
- modules/observability/src/agent_os_observability/server.py +221 -0
- modules/observability/src/agent_os_observability/tracer.py +226 -0
- modules/primitives/.gitignore +8 -0
- modules/primitives/README.md +62 -0
- modules/primitives/agent_primitives/__init__.py +22 -0
- modules/primitives/agent_primitives/failures.py +82 -0
- modules/primitives/agent_primitives/py.typed +0 -0
- modules/primitives/pyproject.toml +68 -0
- modules/scak/.github/copilot-instructions.md +396 -0
- modules/scak/.github/workflows/release.yml +117 -0
- modules/scak/.gitignore +32 -0
- modules/scak/CHANGELOG.md +173 -0
- modules/scak/CITATION.cff +62 -0
- modules/scak/CONTRIBUTING.md +429 -0
- modules/scak/Dockerfile +58 -0
- modules/scak/ENTERPRISE_FEATURES.md +518 -0
- modules/scak/IMPLEMENTATION_SUMMARY.md +206 -0
- modules/scak/LIMITATIONS.md +565 -0
- modules/scak/MANIFEST.in +16 -0
- modules/scak/NOVELTY.md +535 -0
- modules/scak/README.md +928 -0
- modules/scak/RESEARCH.md +670 -0
- modules/scak/agent_kernel/__init__.py +66 -0
- modules/scak/agent_kernel/analyzer.py +432 -0
- modules/scak/agent_kernel/auditor.py +31 -0
- modules/scak/agent_kernel/completeness_auditor.py +234 -0
- modules/scak/agent_kernel/detector.py +200 -0
- modules/scak/agent_kernel/kernel.py +741 -0
- modules/scak/agent_kernel/memory_manager.py +82 -0
- modules/scak/agent_kernel/models.py +372 -0
- modules/scak/agent_kernel/nudge_mechanism.py +260 -0
- modules/scak/agent_kernel/outcome_analyzer.py +335 -0
- modules/scak/agent_kernel/patcher.py +579 -0
- modules/scak/agent_kernel/semantic_analyzer.py +313 -0
- modules/scak/agent_kernel/semantic_purge.py +346 -0
- modules/scak/agent_kernel/simulator.py +447 -0
- modules/scak/agent_kernel/teacher.py +82 -0
- modules/scak/agent_kernel/triage.py +149 -0
- modules/scak/build_and_publish.ps1 +74 -0
- modules/scak/build_and_publish.sh +74 -0
- modules/scak/cli.py +471 -0
- modules/scak/dashboard.py +462 -0
- modules/scak/datasets/DATASET_CARD.md +219 -0
- modules/scak/datasets/README.md +143 -0
- modules/scak/datasets/gaia_vague_queries/vague_queries.json +262 -0
- modules/scak/datasets/hf_upload/README.md +219 -0
- modules/scak/datasets/hf_upload/scak_gaia_laziness.jsonl +50 -0
- modules/scak/datasets/prepare_hf_datasets.py +145 -0
- modules/scak/datasets/red_team/jailbreak_patterns.json +202 -0
- modules/scak/docker-compose.yml +99 -0
- modules/scak/docs/Adaptive-Memory-Hierarchy.md +319 -0
- modules/scak/docs/Data-Contracts-and-Schemas.md +285 -0
- modules/scak/docs/Dual-Loop-Architecture.md +344 -0
- modules/scak/docs/Enhanced-Features.md +612 -0
- modules/scak/docs/LANGCHAIN_INTEGRATION.md +572 -0
- modules/scak/docs/README.md +128 -0
- modules/scak/docs/Reference-Implementations.md +163 -0
- modules/scak/docs/SCAK_V2.md +374 -0
- modules/scak/docs/Three-Failure-Types.md +178 -0
- modules/scak/examples/basic_example.py +155 -0
- modules/scak/examples/circuit_breaker_lazy_eval_demo.py +243 -0
- modules/scak/examples/langchain_integration_example.py +339 -0
- modules/scak/examples/layer4_demo.py +243 -0
- modules/scak/examples/production_features_demo.py +353 -0
- modules/scak/examples/quick_demo.py +79 -0
- modules/scak/examples/scak_v2_demo.py +252 -0
- modules/scak/experiments/README.md +438 -0
- modules/scak/experiments/ablation_studies/README.md +192 -0
- modules/scak/experiments/ablation_studies/ablation_no_audit.py +116 -0
- modules/scak/experiments/ablation_studies/ablation_no_purge.py +133 -0
- modules/scak/experiments/chaos_engineering/README.md +332 -0
- modules/scak/experiments/context_efficiency_test.py +328 -0
- modules/scak/experiments/gaia_benchmark/README.md +208 -0
- modules/scak/experiments/laziness_benchmark.py +179 -0
- modules/scak/experiments/long_horizon_task_experiment.py +252 -0
- modules/scak/experiments/multi_agent_rag_experiment.py +284 -0
- modules/scak/experiments/results/ablation_table.md +12 -0
- modules/scak/experiments/results/long_horizon.json +36 -0
- modules/scak/experiments/results/multi_agent_rag.json +66 -0
- modules/scak/experiments/run_comprehensive_ablations.py +332 -0
- modules/scak/experiments/test_auditor_patcher_integration.py +251 -0
- modules/scak/notebooks/getting_started.ipynb +33 -0
- modules/scak/paper/ARXIV_SUBMISSION_METADATA.txt +109 -0
- modules/scak/paper/PAPER_CHECKLIST.md +304 -0
- modules/scak/paper/Paper.pdf +0 -0
- modules/scak/paper/README.md +113 -0
- modules/scak/paper/appendix.md +351 -0
- modules/scak/paper/arxiv/bibliography.bib +284 -0
- modules/scak/paper/arxiv/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv/main.aux +103 -0
- modules/scak/paper/arxiv/main.bbl +113 -0
- modules/scak/paper/arxiv/main.blg +55 -0
- modules/scak/paper/arxiv/main.out +31 -0
- modules/scak/paper/arxiv/main.pdf +0 -0
- modules/scak/paper/arxiv/main.tex +482 -0
- modules/scak/paper/arxiv_submission/bibliography.bib +284 -0
- modules/scak/paper/arxiv_submission/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.aux +103 -0
- modules/scak/paper/arxiv_submission/main.bbl +113 -0
- modules/scak/paper/arxiv_submission/main.blg +55 -0
- modules/scak/paper/arxiv_submission/main.out +31 -0
- modules/scak/paper/arxiv_submission/main.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.tex +482 -0
- modules/scak/paper/arxiv_submission.tar.gz +0 -0
- modules/scak/paper/bibliography.bib +284 -0
- modules/scak/paper/build.sh +55 -0
- modules/scak/paper/figures/README.md +32 -0
- modules/scak/paper/figures/fig1_ooda_architecture.md +75 -0
- modules/scak/paper/figures/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/figures/fig1_ooda_architecture.png +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.md +83 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.png +0 -0
- modules/scak/paper/figures/fig3_gaia_results.md +64 -0
- modules/scak/paper/figures/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/figures/fig3_gaia_results.png +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.md +64 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.png +0 -0
- modules/scak/paper/figures/fig5_context_reduction.md +71 -0
- modules/scak/paper/figures/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/figures/fig5_context_reduction.png +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.md +80 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.png +0 -0
- modules/scak/paper/figures/generate_figures.py +463 -0
- modules/scak/paper/main.aux +103 -0
- modules/scak/paper/main.bbl +113 -0
- modules/scak/paper/main.blg +55 -0
- modules/scak/paper/main.md +192 -0
- modules/scak/paper/main.out +31 -0
- modules/scak/paper/main.pdf +0 -0
- modules/scak/paper/main.tex +482 -0
- modules/scak/reproducibility/ABLATIONS.md +225 -0
- modules/scak/reproducibility/Dockerfile.reproducibility +34 -0
- modules/scak/reproducibility/README.md +421 -0
- modules/scak/reproducibility/requirements-pinned.txt +32 -0
- modules/scak/reproducibility/run_all_experiments.py +395 -0
- modules/scak/reproducibility/seed_control.py +53 -0
- modules/scak/reproducibility/statistical_analysis.py +302 -0
- modules/scak/requirements.txt +50 -0
- modules/scak/setup.py +93 -0
- modules/scak/src/__init__.py +124 -0
- modules/scak/src/agents/__init__.py +13 -0
- modules/scak/src/agents/conflict_resolution.py +732 -0
- modules/scak/src/agents/orchestrator.py +761 -0
- modules/scak/src/agents/pubsub.py +484 -0
- modules/scak/src/agents/shadow_teacher.py +344 -0
- modules/scak/src/agents/swarm.py +661 -0
- modules/scak/src/agents/worker.py +357 -0
- modules/scak/src/integrations/__init__.py +81 -0
- modules/scak/src/integrations/cmvk_adapter.py +430 -0
- modules/scak/src/integrations/control_plane_adapter.py +601 -0
- modules/scak/src/integrations/langchain_integration.py +902 -0
- modules/scak/src/interfaces/__init__.py +59 -0
- modules/scak/src/interfaces/llm_clients.py +505 -0
- modules/scak/src/interfaces/openapi_tools.py +611 -0
- modules/scak/src/interfaces/plugin_system.py +605 -0
- modules/scak/src/interfaces/protocols.py +365 -0
- modules/scak/src/interfaces/telemetry.py +464 -0
- modules/scak/src/interfaces/tool_registry.py +547 -0
- modules/scak/src/kernel/__init__.py +100 -0
- modules/scak/src/kernel/auditor.py +305 -0
- modules/scak/src/kernel/circuit_breaker.py +398 -0
- modules/scak/src/kernel/core.py +724 -0
- modules/scak/src/kernel/distributed.py +667 -0
- modules/scak/src/kernel/evolution.py +455 -0
- modules/scak/src/kernel/failover.py +621 -0
- modules/scak/src/kernel/governance.py +710 -0
- modules/scak/src/kernel/governance_v2.py +603 -0
- modules/scak/src/kernel/lazy_evaluator.py +514 -0
- modules/scak/src/kernel/load_testing.py +633 -0
- modules/scak/src/kernel/memory.py +945 -0
- modules/scak/src/kernel/patcher.py +581 -0
- modules/scak/src/kernel/rubric.py +419 -0
- modules/scak/src/kernel/schemas.py +390 -0
- modules/scak/src/kernel/skill_mapper.py +309 -0
- modules/scak/src/kernel/triage.py +149 -0
- modules/scak/src/mocks/__init__.py +99 -0
- modules/scak/tests/__init__.py +1 -0
- modules/scak/tests/test_circuit_breaker.py +403 -0
- modules/scak/tests/test_conflict_resolution.py +287 -0
- modules/scak/tests/test_dual_loop.py +463 -0
- modules/scak/tests/test_enhanced_features.py +421 -0
- modules/scak/tests/test_failover_and_load.py +438 -0
- modules/scak/tests/test_governance.py +185 -0
- modules/scak/tests/test_kernel.py +359 -0
- modules/scak/tests/test_langchain_integration.py +451 -0
- modules/scak/tests/test_lazy_evaluator.py +465 -0
- modules/scak/tests/test_llm_clients.py +122 -0
- modules/scak/tests/test_memory_controller.py +528 -0
- modules/scak/tests/test_orchestrator.py +181 -0
- modules/scak/tests/test_phase3_integration.py +265 -0
- modules/scak/tests/test_pubsub_swarm.py +203 -0
- modules/scak/tests/test_reference_implementations.py +240 -0
- modules/scak/tests/test_rubric.py +363 -0
- modules/scak/tests/test_scak_v2.py +651 -0
- modules/scak/tests/test_skill_mapper.py +217 -0
- modules/scak/tests/test_specific_failures.py +393 -0
- modules/scak/tests/test_tool_registry.py +264 -0
- modules/scak/tests/test_tools_and_plugins.py +303 -0
- modules/scak/tests/test_triage.py +596 -0
- modules/scak/tests/test_write_through.py +319 -0
- agent_os_kernel-1.1.0.dist-info/METADATA +0 -400
- agent_os_kernel-1.1.0.dist-info/RECORD +0 -12
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/WHEEL +0 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/licenses/LICENSE +0 -0
|
@@ -0,0 +1,197 @@
|
|
|
1
|
+
# Research Foundation and Academic Grounding
|
|
2
|
+
|
|
3
|
+
This document provides the academic and research foundation for the Agent Control Plane's design decisions, safety mechanisms, and governance approaches.
|
|
4
|
+
|
|
5
|
+
## Core Research Papers
|
|
6
|
+
|
|
7
|
+
### Agent Safety and Governance
|
|
8
|
+
|
|
9
|
+
1. **"A Safety Framework for Real-World Agentic Systems"** (arXiv:2511.21990, 2025)
|
|
10
|
+
- Framework for contextual risk management in agentic systems
|
|
11
|
+
- Informs our PolicyEngine's dynamic risk assessment
|
|
12
|
+
- Applied in: Risk scoring, contextual policy evaluation
|
|
13
|
+
|
|
14
|
+
2. **"MAESTRO: A Threat Modeling Framework for Agentic AI"** (Cloud Security Alliance, 2025)
|
|
15
|
+
- Multi-agent security threat vectors and defense mechanisms
|
|
16
|
+
- Informs our multi-agent supervision and policy isolation
|
|
17
|
+
- Applied in: Supervisor agents, inter-agent communication security
|
|
18
|
+
|
|
19
|
+
3. **"Red-Teaming Agentic AI: Evaluation Frameworks and Benchmarks"** (arXiv:2511.21990, 2024)
|
|
20
|
+
- Adversarial testing methodologies for agentic systems
|
|
21
|
+
- Informs our red team dataset and benchmark design
|
|
22
|
+
- Applied in: benchmark/red_team_dataset.py, safety violation testing
|
|
23
|
+
|
|
24
|
+
### Multi-Agent Systems
|
|
25
|
+
|
|
26
|
+
4. **"Multi-Agent Systems: A Survey"** (arXiv:2308.05391, 2023)
|
|
27
|
+
- Comprehensive overview of MAS architectures and patterns
|
|
28
|
+
- Hierarchical control patterns to prevent cascade failures
|
|
29
|
+
- Applied in: Supervisor agents, agent hierarchy design
|
|
30
|
+
- Citation: Used for understanding coordination patterns and failure modes
|
|
31
|
+
|
|
32
|
+
5. **"Fault-Tolerant Multi-Agent Systems"** (IEEE Transactions on Systems, Man, and Cybernetics, 2024)
|
|
33
|
+
- Resilience models and failure recovery patterns
|
|
34
|
+
- Circuit breaker patterns and retry policies
|
|
35
|
+
- Applied in: ExecutionEngine rollback mechanisms, error recovery
|
|
36
|
+
|
|
37
|
+
### Governance and Compliance
|
|
38
|
+
|
|
39
|
+
6. **"Responsible AI Governance: A Review"** (ScienceDirect, 2024)
|
|
40
|
+
- Procedural practices for AI system governance
|
|
41
|
+
- Risk-based governance frameworks
|
|
42
|
+
- Applied in: PolicyEngine design, audit requirements
|
|
43
|
+
|
|
44
|
+
7. **"Practices for Governing Agentic AI Systems"** (OpenAI, 2023)
|
|
45
|
+
- Pre-deployment and post-deployment governance checks
|
|
46
|
+
- Monitoring and intervention strategies
|
|
47
|
+
- Applied in: Shadow mode, pre-execution validation, audit logging
|
|
48
|
+
|
|
49
|
+
8. **"Evaluating Agentic AI: Frameworks and Metrics"** (World Economic Forum, 2025)
|
|
50
|
+
- Standardized evaluation metrics for agentic systems
|
|
51
|
+
- Safety, reliability, and efficiency benchmarks
|
|
52
|
+
- Applied in: Benchmark methodology, performance metrics
|
|
53
|
+
|
|
54
|
+
### Privacy and Security
|
|
55
|
+
|
|
56
|
+
9. **"Privacy in Agentic Systems"** (arXiv:2409.1087, 2024)
|
|
57
|
+
- Privacy-preserving techniques for autonomous agents
|
|
58
|
+
- Differential privacy and secure computation
|
|
59
|
+
- Applied in: PII detection in constraint graphs, data access controls
|
|
60
|
+
|
|
61
|
+
10. **"Agent-to-Agent Communication Security"** (ACM CCS, 2024)
|
|
62
|
+
- Security patterns for inter-agent messaging
|
|
63
|
+
- Authentication and authorization in agent networks
|
|
64
|
+
- Applied in: A2A adapter security, agent authentication
|
|
65
|
+
|
|
66
|
+
### Enterprise AI Orchestration
|
|
67
|
+
|
|
68
|
+
11. **"Unlocking Exponential Value with AI Agent Orchestration"** (Deloitte, 2025)
|
|
69
|
+
- Enterprise patterns for agent deployment
|
|
70
|
+
- Governance requirements for production systems
|
|
71
|
+
- Applied in: Resource management, quota systems
|
|
72
|
+
|
|
73
|
+
12. **"AI Agent Orchestration Frameworks: A Comparative Study"** (Kubiya, 2025)
|
|
74
|
+
- Comparison of agent frameworks (LangChain, AutoGen, CrewAI)
|
|
75
|
+
- Integration patterns and middleware approaches
|
|
76
|
+
- Applied in: Adapter design, framework integration strategy
|
|
77
|
+
|
|
78
|
+
## Design Principles Grounded in Research
|
|
79
|
+
|
|
80
|
+
### 1. Deterministic Enforcement Over Probabilistic Filtering
|
|
81
|
+
|
|
82
|
+
**Research Basis:**
|
|
83
|
+
- "A Safety Framework for Real-World Agentic Systems" emphasizes that safety mechanisms must be deterministic and not rely on LLM reasoning
|
|
84
|
+
- Operating systems use permission-based security (not request-based) for the same reason: access is decided by the permissions granted, not by how a request is phrased
|
|
85
|
+
|
|
86
|
+
**Implementation:**
|
|
87
|
+
- Agent Kernel enforces permissions at the API boundary
|
|
88
|
+
- Policy evaluation occurs before execution, not during
|
|
89
|
+
- No reliance on prompt engineering for security
|
|
90
|
+
|
|
91
|
+
### 2. Layered Defense Architecture
|
|
92
|
+
|
|
93
|
+
**Research Basis:**
|
|
94
|
+
- "MAESTRO: A Threat Modeling Framework" recommends defense-in-depth for agentic systems
|
|
95
|
+
- Multiple validation layers reduce single-point-of-failure risks
|
|
96
|
+
|
|
97
|
+
**Implementation:**
|
|
98
|
+
- Layer 1: Permission checking (Agent Kernel)
|
|
99
|
+
- Layer 2: Policy evaluation (Policy Engine)
|
|
100
|
+
- Layer 3: Resource constraints (Execution Engine)
|
|
101
|
+
- Layer 4: Runtime monitoring (Supervisor Agents)
|
|
102
|
+
|
|
103
|
+
### 3. Capability-Based Security (The Mute Agent)
|
|
104
|
+
|
|
105
|
+
**Research Basis:**
|
|
106
|
+
- Principle of least privilege from security research
|
|
107
|
+
- "If a system can't do something, it can't be tricked into doing it"
|
|
108
|
+
|
|
109
|
+
**Implementation:**
|
|
110
|
+
- Agents receive only necessary permissions
|
|
111
|
+
- Out-of-scope requests return NULL, not refusals
|
|
112
|
+
- No "helpful" hallucinations that might bypass boundaries
|
|
113
|
+
|
|
114
|
+
### 4. Simulation Before Execution (Shadow Mode)
|
|
115
|
+
|
|
116
|
+
**Research Basis:**
|
|
117
|
+
- "Practices for Governing Agentic AI Systems" recommends simulation for pre-deployment testing
|
|
118
|
+
- Reduces risk of unintended consequences in production
|
|
119
|
+
|
|
120
|
+
**Implementation:**
|
|
121
|
+
- Actions intercepted before execution
|
|
122
|
+
- Full policy validation without side effects
|
|
123
|
+
- Statistical analysis of agent behavior patterns
|
|
124
|
+
|
|
125
|
+
### 5. Multi-Dimensional Context (Constraint Graphs)
|
|
126
|
+
|
|
127
|
+
**Research Basis:**
|
|
128
|
+
- Context-aware access control from ABAC research
|
|
129
|
+
- "Privacy in Agentic Systems" emphasizes context in data governance
|
|
130
|
+
|
|
131
|
+
**Implementation:**
|
|
132
|
+
- Data Graph: What exists (data resources)
|
|
133
|
+
- Policy Graph: What's allowed (business rules)
|
|
134
|
+
- Temporal Graph: What's true now (time-based constraints)
|
|
135
|
+
|
|
136
|
+
## Benchmark Methodology
|
|
137
|
+
|
|
138
|
+
Our comparative safety study follows research-backed evaluation practices:
|
|
139
|
+
|
|
140
|
+
### Dataset Design
|
|
141
|
+
Based on "Red-Teaming Agentic AI" taxonomy:
|
|
142
|
+
- Direct violations (15 prompts): SQL injection, system commands
|
|
143
|
+
- Prompt injections (15 prompts): Jailbreaks, instruction overrides
|
|
144
|
+
- Contextual confusion (15 prompts): Social engineering
|
|
145
|
+
- Valid requests (15 prompts): False positive testing
|
|
146
|
+
|
|
147
|
+
### Metrics
|
|
148
|
+
Following "Evaluating Agentic AI" frameworks:
|
|
149
|
+
- **Safety Violation Rate (SVR)**: % of malicious prompts that succeed
|
|
150
|
+
- **False Positive Rate (FPR)**: % of valid requests incorrectly blocked
|
|
151
|
+
- **Token Efficiency**: Output tokens used (lower is better for "scale by subtraction")
|
|
152
|
+
- **Response Time**: Mean time to decision (µs)
|
|
153
|
+
|
|
154
|
+
### Baseline Comparison
|
|
155
|
+
- **Prompt-based safety**: Industry standard (system prompts with safety instructions)
|
|
156
|
+
- **Control Plane governance**: Our deterministic approach
|
|
157
|
+
|
|
158
|
+
## Open Research Questions
|
|
159
|
+
|
|
160
|
+
Areas where further research is needed:
|
|
161
|
+
|
|
162
|
+
1. **Optimal Supervision Ratios**: What's the right supervisor-to-worker agent ratio?
|
|
163
|
+
2. **Multi-Agent Coordination**: How to handle emergent behaviors in agent swarms?
|
|
164
|
+
3. **Privacy-Utility Tradeoffs**: Balancing governance with agent capabilities
|
|
165
|
+
4. **Adversarial Robustness**: Can deterministic systems handle all attack vectors?
|
|
166
|
+
5. **Human-in-the-Loop**: When should humans intervene in agent decisions?
|
|
167
|
+
|
|
168
|
+
## Contributing Research
|
|
169
|
+
|
|
170
|
+
We welcome research contributions:
|
|
171
|
+
- Novel threat vectors for our red team dataset
|
|
172
|
+
- Improved policy evaluation algorithms
|
|
173
|
+
- Benchmarks comparing with other frameworks
|
|
174
|
+
- Case studies from production deployments
|
|
175
|
+
|
|
176
|
+
## Citation Format
|
|
177
|
+
|
|
178
|
+
If you use the Agent Control Plane in research, please cite:
|
|
179
|
+
|
|
180
|
+
```bibtex
|
|
181
|
+
@software{agent_control_plane,
|
|
182
|
+
title = {Agent Control Plane: A Governance Layer for Autonomous AI Agents},
|
|
183
|
+
author = {Agent Control Plane Contributors},
|
|
184
|
+
year = {2025},
|
|
185
|
+
url = {https://github.com/imran-siddique/agent-control-plane},
|
|
186
|
+
note = {MIT License}
|
|
187
|
+
}
|
|
188
|
+
```
|
|
189
|
+
|
|
190
|
+
## References
|
|
191
|
+
|
|
192
|
+
See [BIBLIOGRAPHY.md](./BIBLIOGRAPHY.md) for the complete list of references with links and DOIs.
|
|
193
|
+
|
|
194
|
+
---
|
|
195
|
+
|
|
196
|
+
**Last Updated**: January 2026
|
|
197
|
+
**Maintained by**: Agent Control Plane Core Team
|
|
@@ -0,0 +1,270 @@
|
|
|
1
|
+
# API Reference
|
|
2
|
+
|
|
3
|
+
This document provides a comprehensive API reference for the Agent Control Plane.
|
|
4
|
+
|
|
5
|
+
## Core Classes
|
|
6
|
+
|
|
7
|
+
### AgentControlPlane
|
|
8
|
+
|
|
9
|
+
The main interface for the Agent Control Plane.
|
|
10
|
+
|
|
11
|
+
```python
|
|
12
|
+
from agent_control_plane import AgentControlPlane
|
|
13
|
+
|
|
14
|
+
control_plane = AgentControlPlane()
|
|
15
|
+
```
|
|
16
|
+
|
|
17
|
+
#### Methods
|
|
18
|
+
|
|
19
|
+
##### `create_agent(agent_id: str, permissions: Dict[ActionType, PermissionLevel]) -> AgentContext`
|
|
20
|
+
|
|
21
|
+
Create a new agent with specified permissions.
|
|
22
|
+
|
|
23
|
+
**Parameters:**
|
|
24
|
+
- `agent_id` (str): Unique identifier for the agent
|
|
25
|
+
- `permissions` (Dict[ActionType, PermissionLevel]): Permission mapping
|
|
26
|
+
|
|
27
|
+
**Returns:**
|
|
28
|
+
- `AgentContext`: Agent context object
|
|
29
|
+
|
|
30
|
+
**Example:**
|
|
31
|
+
```python
|
|
32
|
+
from agent_control_plane.agent_kernel import ActionType, PermissionLevel
|
|
33
|
+
|
|
34
|
+
permissions = {
|
|
35
|
+
ActionType.FILE_READ: PermissionLevel.READ_ONLY,
|
|
36
|
+
ActionType.API_CALL: PermissionLevel.READ_WRITE,
|
|
37
|
+
}
|
|
38
|
+
|
|
39
|
+
agent = control_plane.create_agent("my-agent", permissions)
|
|
40
|
+
```
|
|
41
|
+
|
|
42
|
+
##### `execute_action(agent_context: AgentContext, action_type: ActionType, params: Dict[str, Any]) -> Dict[str, Any]`
|
|
43
|
+
|
|
44
|
+
Execute an action on behalf of an agent.
|
|
45
|
+
|
|
46
|
+
**Parameters:**
|
|
47
|
+
- `agent_context` (AgentContext): Agent context
|
|
48
|
+
- `action_type` (ActionType): Type of action to execute
|
|
49
|
+
- `params` (Dict[str, Any]): Action parameters
|
|
50
|
+
|
|
51
|
+
**Returns:**
|
|
52
|
+
- Dict with keys: `success` (bool), `result` (Any), `error` (str), `risk_score` (float)
|
|
53
|
+
|
|
54
|
+
**Example:**
|
|
55
|
+
```python
|
|
56
|
+
result = control_plane.execute_action(
|
|
57
|
+
agent,
|
|
58
|
+
ActionType.FILE_READ,
|
|
59
|
+
{"path": "/data/file.txt"}
|
|
60
|
+
)
|
|
61
|
+
|
|
62
|
+
if result["success"]:
|
|
63
|
+
print(result["result"])
|
|
64
|
+
else:
|
|
65
|
+
print(result["error"])
|
|
66
|
+
```
|
|
67
|
+
|
|
68
|
+
##### `get_audit_log(agent_id: str) -> List[Dict]`
|
|
69
|
+
|
|
70
|
+
Get audit log entries for an agent.
|
|
71
|
+
|
|
72
|
+
**Parameters:**
|
|
73
|
+
- `agent_id` (str): Agent identifier
|
|
74
|
+
|
|
75
|
+
**Returns:**
|
|
76
|
+
- List[Dict]: Audit log entries
|
|
77
|
+
|
|
78
|
+
## Enums
|
|
79
|
+
|
|
80
|
+
### ActionType
|
|
81
|
+
|
|
82
|
+
Types of actions an agent can request.
|
|
83
|
+
|
|
84
|
+
```python
|
|
85
|
+
from agent_control_plane.agent_kernel import ActionType
|
|
86
|
+
|
|
87
|
+
ActionType.CODE_EXECUTION # Execute code
|
|
88
|
+
ActionType.FILE_READ # Read files
|
|
89
|
+
ActionType.FILE_WRITE # Write files
|
|
90
|
+
ActionType.API_CALL # Make API calls
|
|
91
|
+
ActionType.DATABASE_QUERY # Query database
|
|
92
|
+
ActionType.DATABASE_WRITE # Write to database
|
|
93
|
+
ActionType.WORKFLOW_TRIGGER # Trigger workflows
|
|
94
|
+
```
|
|
95
|
+
|
|
96
|
+
### PermissionLevel
|
|
97
|
+
|
|
98
|
+
Permission levels for actions.
|
|
99
|
+
|
|
100
|
+
```python
|
|
101
|
+
from agent_control_plane.agent_kernel import PermissionLevel
|
|
102
|
+
|
|
103
|
+
PermissionLevel.NONE # No access
|
|
104
|
+
PermissionLevel.READ_ONLY # Read-only access
|
|
105
|
+
PermissionLevel.READ_WRITE # Read and write access
|
|
106
|
+
PermissionLevel.ADMIN # Administrative access
|
|
107
|
+
```
|
|
108
|
+
|
|
109
|
+
### ExecutionStatus
|
|
110
|
+
|
|
111
|
+
Status of an execution request.
|
|
112
|
+
|
|
113
|
+
```python
|
|
114
|
+
from agent_control_plane.agent_kernel import ExecutionStatus
|
|
115
|
+
|
|
116
|
+
ExecutionStatus.PENDING # Request pending
|
|
117
|
+
ExecutionStatus.APPROVED # Request approved
|
|
118
|
+
ExecutionStatus.DENIED # Request denied
|
|
119
|
+
ExecutionStatus.EXECUTING # Currently executing
|
|
120
|
+
ExecutionStatus.COMPLETED # Execution completed
|
|
121
|
+
ExecutionStatus.FAILED # Execution failed
|
|
122
|
+
ExecutionStatus.ROLLED_BACK # Execution rolled back
|
|
123
|
+
```
|
|
124
|
+
|
|
125
|
+
## Policy Engine
|
|
126
|
+
|
|
127
|
+
### ResourceQuota
|
|
128
|
+
|
|
129
|
+
Resource quota configuration for an agent.
|
|
130
|
+
|
|
131
|
+
```python
|
|
132
|
+
from agent_control_plane.policy_engine import ResourceQuota
|
|
133
|
+
|
|
134
|
+
quota = ResourceQuota(
|
|
135
|
+
agent_id="my-agent",
|
|
136
|
+
max_requests_per_minute=60,
|
|
137
|
+
max_requests_per_hour=1000,
|
|
138
|
+
max_execution_time_seconds=300.0,
|
|
139
|
+
max_concurrent_executions=5
|
|
140
|
+
)
|
|
141
|
+
|
|
142
|
+
control_plane.policy_engine.set_quota("my-agent", quota)
|
|
143
|
+
```
|
|
144
|
+
|
|
145
|
+
### RiskPolicy
|
|
146
|
+
|
|
147
|
+
Risk-based policy configuration.
|
|
148
|
+
|
|
149
|
+
```python
|
|
150
|
+
from agent_control_plane.policy_engine import RiskPolicy
|
|
151
|
+
|
|
152
|
+
policy = RiskPolicy(
|
|
153
|
+
max_risk_score=0.5,
|
|
154
|
+
require_approval_above=0.7,
|
|
155
|
+
deny_above=0.9
|
|
156
|
+
)
|
|
157
|
+
|
|
158
|
+
control_plane.policy_engine.set_risk_policy("default", policy)
|
|
159
|
+
```
|
|
160
|
+
|
|
161
|
+
## Helper Functions
|
|
162
|
+
|
|
163
|
+
### `create_read_only_agent(control_plane: AgentControlPlane, agent_id: str) -> AgentContext`
|
|
164
|
+
|
|
165
|
+
Create an agent with read-only permissions.
|
|
166
|
+
|
|
167
|
+
```python
|
|
168
|
+
from agent_control_plane import create_read_only_agent
|
|
169
|
+
|
|
170
|
+
agent = create_read_only_agent(control_plane, "reader")
|
|
171
|
+
```
|
|
172
|
+
|
|
173
|
+
### `create_standard_agent(control_plane: AgentControlPlane, agent_id: str) -> AgentContext`
|
|
174
|
+
|
|
175
|
+
Create an agent with standard permissions (read/write but not admin).
|
|
176
|
+
|
|
177
|
+
```python
|
|
178
|
+
from agent_control_plane import create_standard_agent
|
|
179
|
+
|
|
180
|
+
agent = create_standard_agent(control_plane, "worker")
|
|
181
|
+
```
|
|
182
|
+
|
|
183
|
+
### `create_admin_agent(control_plane: AgentControlPlane, agent_id: str) -> AgentContext`
|
|
184
|
+
|
|
185
|
+
Create an agent with administrative permissions.
|
|
186
|
+
|
|
187
|
+
```python
|
|
188
|
+
from agent_control_plane import create_admin_agent
|
|
189
|
+
|
|
190
|
+
agent = create_admin_agent(control_plane, "admin")
|
|
191
|
+
```
|
|
192
|
+
|
|
193
|
+
## Advanced Features
|
|
194
|
+
|
|
195
|
+
### Shadow Mode
|
|
196
|
+
|
|
197
|
+
Enable simulation mode for testing without side effects.
|
|
198
|
+
|
|
199
|
+
```python
|
|
200
|
+
from agent_control_plane.shadow_mode import ShadowModeConfig
|
|
201
|
+
|
|
202
|
+
config = ShadowModeConfig(
|
|
203
|
+
enabled=True,
|
|
204
|
+
log_reasoning=True
|
|
205
|
+
)
|
|
206
|
+
|
|
207
|
+
control_plane.enable_shadow_mode("agent-id", config)
|
|
208
|
+
```
|
|
209
|
+
|
|
210
|
+
### Mute Agent
|
|
211
|
+
|
|
212
|
+
Create capability-based agents that return NULL for out-of-scope requests.
|
|
213
|
+
|
|
214
|
+
```python
|
|
215
|
+
from agent_control_plane.mute_agent import create_mute_sql_agent
|
|
216
|
+
|
|
217
|
+
config = create_mute_sql_agent("sql-agent")
|
|
218
|
+
control_plane.enable_mute_agent("sql-agent", config)
|
|
219
|
+
```
|
|
220
|
+
|
|
221
|
+
### Constraint Graphs
|
|
222
|
+
|
|
223
|
+
Define multi-dimensional context for agents.
|
|
224
|
+
|
|
225
|
+
```python
|
|
226
|
+
from agent_control_plane.constraint_graphs import (
|
|
227
|
+
DataGraph, TemporalGraph, GraphNode, GraphNodeType
|
|
228
|
+
)
|
|
229
|
+
|
|
230
|
+
# Data Graph
|
|
231
|
+
data_graph = DataGraph()
|
|
232
|
+
data_graph.add_node(GraphNode(
|
|
233
|
+
id="allowed_data",
|
|
234
|
+
node_type=GraphNodeType.FILE,
|
|
235
|
+
metadata={"path": "/data/"}
|
|
236
|
+
))
|
|
237
|
+
|
|
238
|
+
control_plane.set_data_graph("agent-id", data_graph)
|
|
239
|
+
|
|
240
|
+
# Temporal Graph
|
|
241
|
+
from datetime import time
|
|
242
|
+
|
|
243
|
+
temporal_graph = TemporalGraph()
|
|
244
|
+
temporal_graph.set_business_hours(time(9, 0), time(17, 0))
|
|
245
|
+
|
|
246
|
+
control_plane.set_temporal_graph("agent-id", temporal_graph)
|
|
247
|
+
```
|
|
248
|
+
|
|
249
|
+
## Error Handling
|
|
250
|
+
|
|
251
|
+
All operations return dictionaries with a consistent structure:
|
|
252
|
+
|
|
253
|
+
```python
|
|
254
|
+
result = control_plane.execute_action(agent, action_type, params)
|
|
255
|
+
|
|
256
|
+
if result["success"]:
|
|
257
|
+
# Operation succeeded
|
|
258
|
+
data = result["result"]
|
|
259
|
+
risk = result.get("risk_score", 0.0)
|
|
260
|
+
else:
|
|
261
|
+
# Operation failed
|
|
262
|
+
error = result["error"]
|
|
263
|
+
reason = result.get("reason", "Unknown")
|
|
264
|
+
```
|
|
265
|
+
|
|
266
|
+
## See Also
|
|
267
|
+
|
|
268
|
+
- [Quick Start Guide](../docs/guides/QUICKSTART.md)
|
|
269
|
+
- [Examples](../examples/)
|
|
270
|
+
- [Architecture](../docs/architecture/architecture.md)
|
|
@@ -0,0 +1,120 @@
|
|
|
1
|
+
# Agent Control Plane Architecture
|
|
2
|
+
|
|
3
|
+
## Overview
|
|
4
|
+
|
|
5
|
+
The Agent Control Plane is a governance and management layer for autonomous AI agents. It treats the LLM as a raw compute component and provides a kernel-like layer for safe, controlled execution.
|
|
6
|
+
|
|
7
|
+
## Core Components
|
|
8
|
+
|
|
9
|
+
### 1. Agent Kernel
|
|
10
|
+
The kernel mediates all interactions between the LLM (raw compute) and the execution environment. It:
|
|
11
|
+
- Intercepts all agent requests before execution
|
|
12
|
+
- Validates permissions and policies
|
|
13
|
+
- Manages execution context and state
|
|
14
|
+
- Provides isolation between agents
|
|
15
|
+
|
|
16
|
+
### 2. Policy Engine
|
|
17
|
+
Enforces governance rules and constraints:
|
|
18
|
+
- Resource quotas (tokens, API calls, compute time)
|
|
19
|
+
- Data access policies (read/write permissions)
|
|
20
|
+
- Action whitelists/blacklists
|
|
21
|
+
- Rate limiting and throttling
|
|
22
|
+
- Risk assessment for proposed actions
|
|
23
|
+
|
|
24
|
+
### 3. Resource Manager
|
|
25
|
+
Controls access to system resources:
|
|
26
|
+
- Compute allocation (CPU, memory, GPU)
|
|
27
|
+
- API rate limits and quotas
|
|
28
|
+
- Database connection pooling
|
|
29
|
+
- File system access control
|
|
30
|
+
- Network access policies
|
|
31
|
+
|
|
32
|
+
### 4. Execution Engine
|
|
33
|
+
Safely executes agent actions:
|
|
34
|
+
- Sandboxed execution environments
|
|
35
|
+
- Transaction management (rollback capability)
|
|
36
|
+
- Error handling and recovery
|
|
37
|
+
- Timeout enforcement
|
|
38
|
+
- Result validation
|
|
39
|
+
|
|
40
|
+
### 5. Audit Logger
|
|
41
|
+
Comprehensive tracking for compliance and debugging:
|
|
42
|
+
- All agent requests and responses
|
|
43
|
+
- Policy decisions and violations
|
|
44
|
+
- Resource usage metrics
|
|
45
|
+
- Security events
|
|
46
|
+
- Execution traces
|
|
47
|
+
|
|
48
|
+
## Architecture Diagram
|
|
49
|
+
|
|
50
|
+
```
|
|
51
|
+
┌─────────────────────────────────────────────────────────────┐
|
|
52
|
+
│ Application Layer │
|
|
53
|
+
│ (Chat, Workflow, Tools) │
|
|
54
|
+
└─────────────────────────┬───────────────────────────────────┘
|
|
55
|
+
│
|
|
56
|
+
┌─────────────────────────▼───────────────────────────────────┐
|
|
57
|
+
│ Agent Control Plane │
|
|
58
|
+
│ ┌──────────────┐ ┌──────────────┐ ┌──────────────┐ │
|
|
59
|
+
│ │ Agent │ │ Policy │ │ Audit │ │
|
|
60
|
+
│ │ Kernel │◄─┤ Engine │◄─┤ Logger │ │
|
|
61
|
+
│ └──────┬───────┘ └──────────────┘ └──────────────┘ │
|
|
62
|
+
│ │ │
|
|
63
|
+
│ ┌──────▼───────┐ ┌──────────────┐ │
|
|
64
|
+
│ │ Resource │ │ Execution │ │
|
|
65
|
+
│ │ Manager │◄─┤ Engine │ │
|
|
66
|
+
│ └──────────────┘ └──────────────┘ │
|
|
67
|
+
└─────────────────────────┬───────────────────────────────────┘
|
|
68
|
+
│
|
|
69
|
+
┌─────────────────────────▼───────────────────────────────────┐
|
|
70
|
+
│ LLM (Raw Compute) │
|
|
71
|
+
│ (GPT-4, Claude, Llama, etc.) │
|
|
72
|
+
└─────────────────────────┬───────────────────────────────────┘
|
|
73
|
+
│
|
|
74
|
+
┌─────────────────────────▼───────────────────────────────────┐
|
|
75
|
+
│ Execution Environment │
|
|
76
|
+
│ (Code, Databases, APIs, File System) │
|
|
77
|
+
└─────────────────────────────────────────────────────────────┘
|
|
78
|
+
```
|
|
79
|
+
|
|
80
|
+
## Key Features
|
|
81
|
+
|
|
82
|
+
### Governance
|
|
83
|
+
- Fine-grained permission system
|
|
84
|
+
- Policy-based access control
|
|
85
|
+
- Compliance and audit trails
|
|
86
|
+
- Risk scoring and assessment
|
|
87
|
+
|
|
88
|
+
### Safety
|
|
89
|
+
- Sandboxed execution
|
|
90
|
+
- Resource limits and quotas
|
|
91
|
+
- Rollback and recovery
|
|
92
|
+
- Input/output validation
|
|
93
|
+
|
|
94
|
+
### Observability
|
|
95
|
+
- Real-time monitoring
|
|
96
|
+
- Metrics and analytics
|
|
97
|
+
- Trace collection
|
|
98
|
+
- Alerting and notifications
|
|
99
|
+
|
|
100
|
+
### Scalability
|
|
101
|
+
- Multi-tenant support
|
|
102
|
+
- Horizontal scaling
|
|
103
|
+
- Load balancing
|
|
104
|
+
- Distributed execution
|
|
105
|
+
|
|
106
|
+
## Use Cases
|
|
107
|
+
|
|
108
|
+
1. **Enterprise AI Agents**: Controlled deployment of agents with strict governance
|
|
109
|
+
2. **Multi-tenant AI Platforms**: Isolated execution for different customers
|
|
110
|
+
3. **Regulated Industries**: Compliance-ready agent deployment (healthcare, finance)
|
|
111
|
+
4. **Development/Testing**: Safe experimentation with agent capabilities
|
|
112
|
+
5. **Production Workflows**: Reliable, auditable agent execution
|
|
113
|
+
|
|
114
|
+
## Benefits
|
|
115
|
+
|
|
116
|
+
- **Security**: Prevent unauthorized access and malicious behavior
|
|
117
|
+
- **Reliability**: Handle errors gracefully with rollback capability
|
|
118
|
+
- **Compliance**: Full audit trails for regulatory requirements
|
|
119
|
+
- **Efficiency**: Optimize resource usage across agents
|
|
120
|
+
- **Transparency**: Understand and debug agent behavior
|
|
@@ -0,0 +1,52 @@
|
|
|
1
|
+
# Announcement Templates and Community Sharing Guide
|
|
2
|
+
|
|
3
|
+
This document provides templates and guidelines for announcing Agent Control Plane releases and sharing with various communities.
|
|
4
|
+
|
|
5
|
+
## Twitter/X Announcement Templates
|
|
6
|
+
|
|
7
|
+
### Main Announcement (@mosiddi)
|
|
8
|
+
|
|
9
|
+
**Template 1: Research Focus**
|
|
10
|
+
```
|
|
11
|
+
🚀 Introducing Agent Control Plane: A kernel for AI agents
|
|
12
|
+
|
|
13
|
+
We achieve 0% safety violations vs 26.67% for prompt-based safety.
|
|
14
|
+
|
|
15
|
+
The key insight: Stop treating LLMs as magic boxes. Treat them as raw compute that needs an OS-like governance layer.
|
|
16
|
+
|
|
17
|
+
🔗 https://github.com/imran-siddique/agent-control-plane
|
|
18
|
+
📊 Dataset: https://huggingface.co/datasets/imran-siddique/agent-control-redteam-60
|
|
19
|
+
|
|
20
|
+
#AI #AgentSafety #MLOps
|
|
21
|
+
```
|
|
22
|
+
|
|
23
|
+
**Template 2: Dataset Announcement**
|
|
24
|
+
```
|
|
25
|
+
📊 Released: Agent Control Red Team Dataset
|
|
26
|
+
|
|
27
|
+
60 adversarial prompts testing AI agent safety:
|
|
28
|
+
- 15 direct violations (SQL injection, rm -rf)
|
|
29
|
+
- 15 prompt injections (jailbreaks)
|
|
30
|
+
- 15 social engineering
|
|
31
|
+
- 15 valid requests (false positive tests)
|
|
32
|
+
|
|
33
|
+
Now on 🤗 Hugging Face: https://huggingface.co/datasets/imran-siddique/agent-control-redteam-60
|
|
34
|
+
|
|
35
|
+
Use it to benchmark YOUR agent safety system!
|
|
36
|
+
```
|
|
37
|
+
|
|
38
|
+
## Reddit Post Template (r/MachineLearning)
|
|
39
|
+
|
|
40
|
+
**Title**: [R] Agent Control Plane: Achieving 0% Safety Violations for Autonomous AI Agents
|
|
41
|
+
|
|
42
|
+
**Body**: See the full template in the repository.
|
|
43
|
+
|
|
44
|
+
## Community Engagement Strategy
|
|
45
|
+
|
|
46
|
+
1. Twitter announcement (@mosiddi)
|
|
47
|
+
2. Reddit (r/MachineLearning, r/LocalLLaMA)
|
|
48
|
+
3. Hacker News
|
|
49
|
+
4. Discord (LangChain, AutoGPT communities)
|
|
50
|
+
5. LinkedIn (professional audience)
|
|
51
|
+
|
|
52
|
+
See full templates and timing strategy in the repository documentation.
|