agent-os-kernel 1.1.0__py3-none-any.whl → 1.2.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agent_os/__init__.py +66 -4
- agent_os/agents_compat.py +286 -0
- agent_os/base_agent.py +308 -0
- agent_os/cli.py +1079 -19
- agent_os/integrations/__init__.py +37 -2
- agent_os/integrations/openai_adapter.py +502 -0
- agent_os/integrations/semantic_kernel_adapter.py +569 -0
- agent_os/stateless.py +349 -0
- agent_os_kernel-1.2.0.dist-info/METADATA +676 -0
- agent_os_kernel-1.2.0.dist-info/RECORD +1053 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/entry_points.txt +0 -1
- modules/amb/.github/workflows/ci.yml +102 -0
- modules/amb/.github/workflows/publish.yml +146 -0
- modules/amb/.gitignore +134 -0
- modules/amb/CHANGELOG.md +118 -0
- modules/amb/CONTRIBUTING.md +141 -0
- modules/amb/LICENSE +21 -0
- modules/amb/README.md +188 -0
- modules/amb/amb_core/__init__.py +175 -0
- modules/amb/amb_core/adapters/__init__.py +55 -0
- modules/amb/amb_core/adapters/aws_sqs_broker.py +374 -0
- modules/amb/amb_core/adapters/azure_servicebus_broker.py +338 -0
- modules/amb/amb_core/adapters/kafka_broker.py +258 -0
- modules/amb/amb_core/adapters/nats_broker.py +283 -0
- modules/amb/amb_core/adapters/rabbitmq_broker.py +233 -0
- modules/amb/amb_core/adapters/redis_broker.py +260 -0
- modules/amb/amb_core/broker.py +143 -0
- modules/amb/amb_core/bus.py +479 -0
- modules/amb/amb_core/cloudevents.py +507 -0
- modules/amb/amb_core/dlq.py +343 -0
- modules/amb/amb_core/hf_utils.py +534 -0
- modules/amb/amb_core/memory_broker.py +408 -0
- modules/amb/amb_core/models.py +139 -0
- modules/amb/amb_core/persistence.py +527 -0
- modules/amb/amb_core/schema.py +292 -0
- modules/amb/amb_core/tracing.py +356 -0
- modules/amb/examples/advanced_features.py +223 -0
- modules/amb/examples/backpressure_demo.py +225 -0
- modules/amb/examples/basic_usage.py +117 -0
- modules/amb/examples/tracing_demo.py +104 -0
- modules/amb/experiments/README.md +52 -0
- modules/amb/experiments/reproduce_results.py +467 -0
- modules/amb/experiments/results.json +324 -0
- modules/amb/paper/README.md +40 -0
- modules/amb/paper/paper.tex +365 -0
- modules/amb/paper/whitepaper.md +377 -0
- modules/amb/pyproject.toml +117 -0
- modules/amb/tests/__init__.py +1 -0
- modules/amb/tests/test_backpressure_priority.py +280 -0
- modules/amb/tests/test_bus.py +198 -0
- modules/amb/tests/test_cloudevents.py +443 -0
- modules/amb/tests/test_features.py +531 -0
- modules/amb/tests/test_models.py +74 -0
- modules/amb/tests/test_tracing.py +254 -0
- modules/atr/.github/workflows/ci.yml +101 -0
- modules/atr/.github/workflows/publish.yml +140 -0
- modules/atr/.gitignore +134 -0
- modules/atr/.pre-commit-config.yaml +37 -0
- modules/atr/CHANGELOG.md +39 -0
- modules/atr/CONTRIBUTING.md +96 -0
- modules/atr/IMPLEMENTATION_SUMMARY.md +143 -0
- modules/atr/README.md +180 -0
- modules/atr/atr/__init__.py +638 -0
- modules/atr/atr/access.py +346 -0
- modules/atr/atr/composition.py +643 -0
- modules/atr/atr/decorator.py +355 -0
- modules/atr/atr/executor.py +382 -0
- modules/atr/atr/health.py +555 -0
- modules/atr/atr/hf_utils.py +447 -0
- modules/atr/atr/injection.py +420 -0
- modules/atr/atr/metrics.py +438 -0
- modules/atr/atr/policies.py +401 -0
- modules/atr/atr/py.typed +2 -0
- modules/atr/atr/registry.py +450 -0
- modules/atr/atr/schema.py +478 -0
- modules/atr/atr/tools/safe/__init__.py +73 -0
- modules/atr/atr/tools/safe/calculator.py +380 -0
- modules/atr/atr/tools/safe/datetime_tool.py +441 -0
- modules/atr/atr/tools/safe/file_reader.py +400 -0
- modules/atr/atr/tools/safe/http_client.py +314 -0
- modules/atr/atr/tools/safe/json_parser.py +372 -0
- modules/atr/atr/tools/safe/text_tool.py +526 -0
- modules/atr/atr/tools/safe/toolkit.py +173 -0
- modules/atr/docs/PYPI_SETUP.md +113 -0
- modules/atr/examples/README.md +27 -0
- modules/atr/examples/demo.py +144 -0
- modules/atr/examples/sandbox_demo.py +218 -0
- modules/atr/experiments/README.md +69 -0
- modules/atr/experiments/reproduce_results.py +509 -0
- modules/atr/experiments/results/.gitkeep +0 -0
- modules/atr/experiments/results/results_20260123_140334.json +71 -0
- modules/atr/paper/README.md +36 -0
- modules/atr/paper/figures/.gitkeep +0 -0
- modules/atr/paper/references.bib +84 -0
- modules/atr/paper/structure.tex +293 -0
- modules/atr/paper/whitepaper.md +234 -0
- modules/atr/pyproject.toml +148 -0
- modules/atr/requirements.txt +1 -0
- modules/atr/setup.py +30 -0
- modules/atr/tests/__init__.py +1 -0
- modules/atr/tests/test_decorator.py +317 -0
- modules/atr/tests/test_executor.py +245 -0
- modules/atr/tests/test_integration_executor.py +184 -0
- modules/atr/tests/test_registry.py +312 -0
- modules/atr/tests/test_schema.py +182 -0
- modules/atr/tests/test_v2_features.py +708 -0
- modules/caas/.dockerignore +63 -0
- modules/caas/.github/ISSUE_TEMPLATE/bug_report.md +38 -0
- modules/caas/.github/ISSUE_TEMPLATE/custom.md +10 -0
- modules/caas/.github/ISSUE_TEMPLATE/feature_request.md +20 -0
- modules/caas/.github/workflows/ci.yml +100 -0
- modules/caas/.github/workflows/lint.yml +39 -0
- modules/caas/.github/workflows/publish-pypi.yml +124 -0
- modules/caas/.gitignore +73 -0
- modules/caas/.pre-commit-config.yaml +33 -0
- modules/caas/CHANGELOG.md +58 -0
- modules/caas/CONTRIBUTING.md +346 -0
- modules/caas/Dockerfile +41 -0
- modules/caas/LICENSE +21 -0
- modules/caas/MANIFEST.in +11 -0
- modules/caas/README.md +158 -0
- modules/caas/benchmarks/README.md +255 -0
- modules/caas/benchmarks/create_hf_dataset.py +502 -0
- modules/caas/benchmarks/data/sample_corpus/README.md +86 -0
- modules/caas/benchmarks/data/sample_corpus/auth_module.py +211 -0
- modules/caas/benchmarks/data/sample_corpus/contribution_guide.md +185 -0
- modules/caas/benchmarks/data/sample_corpus/remote_work_policy.html +57 -0
- modules/caas/benchmarks/hf_dataset/README.md +214 -0
- modules/caas/benchmarks/hf_dataset/caas_benchmark_corpus.py +73 -0
- modules/caas/benchmarks/hf_dataset/corpus_preview.json +193 -0
- modules/caas/benchmarks/results/README.md +66 -0
- modules/caas/benchmarks/results/evaluation_2026-01-20.json +121 -0
- modules/caas/benchmarks/run_evaluation.py +561 -0
- modules/caas/benchmarks/statistical_tests.py +289 -0
- modules/caas/benchmarks/verify_sample_corpus.py +83 -0
- modules/caas/docker-compose.yml +38 -0
- modules/caas/docs/CONTEXT_TRIAD.md +462 -0
- modules/caas/docs/CONTRIBUTING.md +346 -0
- modules/caas/docs/ETHICS_AND_LIMITATIONS.md +336 -0
- modules/caas/docs/HEURISTIC_ROUTER.md +442 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY.md +363 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_CONTEXT_TRIAD.md +277 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_HEURISTIC_ROUTER.md +231 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_METADATA_INJECTION.md +258 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_PRAGMATIC_TRUTH.md +212 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_TRUST_GATEWAY.md +319 -0
- modules/caas/docs/LAYER_1_PRIMITIVE.md +202 -0
- modules/caas/docs/METADATA_INJECTION.md +404 -0
- modules/caas/docs/PRAGMATIC_TRUTH.md +431 -0
- modules/caas/docs/RELATED_WORK.md +312 -0
- modules/caas/docs/RELEASE_CHECKLIST.md +219 -0
- modules/caas/docs/RELEASE_GUIDE.md +285 -0
- modules/caas/docs/REPRODUCIBILITY.md +386 -0
- modules/caas/docs/SLIDING_WINDOW.md +387 -0
- modules/caas/docs/STRUCTURE_AWARE_INDEXING.md +158 -0
- modules/caas/docs/TESTING.md +259 -0
- modules/caas/docs/THREAT_MODEL.md +247 -0
- modules/caas/docs/TRUST_GATEWAY.md +575 -0
- modules/caas/docs/VFS.md +298 -0
- modules/caas/examples/agents/enterprise_security_agent.py +414 -0
- modules/caas/examples/agents/intelligent_document_analyzer.py +380 -0
- modules/caas/examples/demos/demo.py +309 -0
- modules/caas/examples/demos/demo_context_triad.py +225 -0
- modules/caas/examples/demos/demo_conversation_manager.py +285 -0
- modules/caas/examples/demos/demo_heuristic_router.py +133 -0
- modules/caas/examples/demos/demo_metadata_injection.py +198 -0
- modules/caas/examples/demos/demo_pragmatic_truth.py +303 -0
- modules/caas/examples/demos/demo_structure_aware.py +140 -0
- modules/caas/examples/demos/demo_time_decay.py +247 -0
- modules/caas/examples/demos/demo_trust_gateway.py +383 -0
- modules/caas/examples/multi_agent/README.md +159 -0
- modules/caas/examples/multi_agent/research_team.py +369 -0
- modules/caas/examples/multi_agent/vfs_collaboration.py +393 -0
- modules/caas/examples/usage/auth_module.py +142 -0
- modules/caas/examples/usage/usage_example.py +173 -0
- modules/caas/experiments/README.md +42 -0
- modules/caas/experiments/reproduce_results.py +462 -0
- modules/caas/paper/ARXIV_METADATA.md +145 -0
- modules/caas/paper/ARXIV_README.md +47 -0
- modules/caas/paper/CHECKLIST.md +103 -0
- modules/caas/paper/GITHUB_RELEASE_NOTES.md +105 -0
- modules/caas/paper/README.md +71 -0
- modules/caas/paper/abstract.md +24 -0
- modules/caas/paper/arxiv_submission.tar +0 -0
- modules/caas/paper/arxiv_submission.zip +0 -0
- modules/caas/paper/build_pdf.py +355 -0
- modules/caas/paper/experiments.md +149 -0
- modules/caas/paper/figures/.gitkeep +0 -0
- modules/caas/paper/figures/README.md +237 -0
- modules/caas/paper/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/figures/fig1_system_architecture.svg +198 -0
- modules/caas/paper/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/figures/fig2_context_triad.svg +105 -0
- modules/caas/paper/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/figures/fig3_ablation_results.svg +113 -0
- modules/caas/paper/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/figures/fig4_routing_latency.svg +97 -0
- modules/caas/paper/intro.md +103 -0
- modules/caas/paper/latex/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/latex/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/latex/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/latex/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/latex/main.tex +468 -0
- modules/caas/paper/latex/references.bib +140 -0
- modules/caas/paper/method.md +350 -0
- modules/caas/paper/outline.md +123 -0
- modules/caas/paper/related_work.md +101 -0
- modules/caas/paper/tables/.gitkeep +0 -0
- modules/caas/paper/tables/results_tables.md +50 -0
- modules/caas/pyproject.toml +172 -0
- modules/caas/requirements.txt +11 -0
- modules/caas/src/caas/__init__.py +232 -0
- modules/caas/src/caas/api/__init__.py +7 -0
- modules/caas/src/caas/api/server.py +1326 -0
- modules/caas/src/caas/caching.py +832 -0
- modules/caas/src/caas/cli.py +208 -0
- modules/caas/src/caas/conversation.py +221 -0
- modules/caas/src/caas/decay.py +118 -0
- modules/caas/src/caas/detection/__init__.py +7 -0
- modules/caas/src/caas/detection/detector.py +236 -0
- modules/caas/src/caas/enrichment.py +127 -0
- modules/caas/src/caas/gateway/__init__.py +24 -0
- modules/caas/src/caas/gateway/trust_gateway.py +471 -0
- modules/caas/src/caas/hf_utils.py +477 -0
- modules/caas/src/caas/ingestion/__init__.py +21 -0
- modules/caas/src/caas/ingestion/processors.py +251 -0
- modules/caas/src/caas/ingestion/structure_parser.py +185 -0
- modules/caas/src/caas/models.py +354 -0
- modules/caas/src/caas/pragmatic_truth.py +441 -0
- modules/caas/src/caas/routing/__init__.py +8 -0
- modules/caas/src/caas/routing/heuristic_router.py +242 -0
- modules/caas/src/caas/storage/__init__.py +7 -0
- modules/caas/src/caas/storage/store.py +450 -0
- modules/caas/src/caas/triad.py +472 -0
- modules/caas/src/caas/tuning/__init__.py +7 -0
- modules/caas/src/caas/tuning/tuner.py +322 -0
- modules/caas/src/caas/vfs/__init__.py +12 -0
- modules/caas/src/caas/vfs/filesystem.py +450 -0
- modules/caas/tests/__init__.py +3 -0
- modules/caas/tests/conftest.py +8 -0
- modules/caas/tests/test_caching.py +628 -0
- modules/caas/tests/test_context_triad.py +385 -0
- modules/caas/tests/test_conversation_manager.py +289 -0
- modules/caas/tests/test_functionality.py +215 -0
- modules/caas/tests/test_heuristic_router.py +370 -0
- modules/caas/tests/test_metadata_injection.py +328 -0
- modules/caas/tests/test_pragmatic_truth.py +322 -0
- modules/caas/tests/test_structure_aware_indexing.py +283 -0
- modules/caas/tests/test_time_decay.py +268 -0
- modules/caas/tests/test_trust_gateway.py +445 -0
- modules/caas/tests/test_vfs.py +298 -0
- modules/cmvk/.github/FUNDING.yml +9 -0
- modules/cmvk/.github/dependabot.yml +54 -0
- modules/cmvk/.github/workflows/ci.yml +205 -0
- modules/cmvk/.github/workflows/publish.yml +143 -0
- modules/cmvk/.gitignore +147 -0
- modules/cmvk/.pre-commit-config.yaml +58 -0
- modules/cmvk/CHANGELOG.md +146 -0
- modules/cmvk/CITATION.cff +48 -0
- modules/cmvk/CONTRIBUTING.md +229 -0
- modules/cmvk/Dockerfile +87 -0
- modules/cmvk/HF_MODEL_CARD.md +185 -0
- modules/cmvk/LICENSE +21 -0
- modules/cmvk/README.md +149 -0
- modules/cmvk/SECURITY.md +114 -0
- modules/cmvk/config/prompts/generator_v1.txt +23 -0
- modules/cmvk/config/prompts/verifier_hostile.txt +32 -0
- modules/cmvk/config/settings.yaml +40 -0
- modules/cmvk/coverage_html/.gitignore +2 -0
- modules/cmvk/coverage_html/class_index.html +658 -0
- modules/cmvk/coverage_html/coverage_html_cb_188fc9a4.js +735 -0
- modules/cmvk/coverage_html/favicon_32_cb_c827f16f.png +0 -0
- modules/cmvk/coverage_html/function_index.html +1978 -0
- modules/cmvk/coverage_html/index.html +255 -0
- modules/cmvk/coverage_html/keybd_closed_cb_900cfef5.png +0 -0
- modules/cmvk/coverage_html/status.json +1 -0
- modules/cmvk/coverage_html/style_cb_5c747636.css +389 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38___init___py.html +315 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_audit_py.html +499 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_benchmarks_py.html +575 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_constitutional_py.html +1001 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_hf_utils_py.html +398 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_metrics_py.html +570 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_profiles_py.html +397 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_types_py.html +109 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_verification_py.html +1053 -0
- modules/cmvk/docs/DIAGRAMS.md +325 -0
- modules/cmvk/docs/architecture.md +345 -0
- modules/cmvk/docs/features.md +308 -0
- modules/cmvk/docs/getting_started.md +279 -0
- modules/cmvk/docs/innovation_layer.md +377 -0
- modules/cmvk/docs/safety.md +281 -0
- modules/cmvk/docs/traceability.md +150 -0
- modules/cmvk/examples/basic_example.py +62 -0
- modules/cmvk/examples/demo_complete_pipeline.py +209 -0
- modules/cmvk/examples/demo_innovation_layer.py +197 -0
- modules/cmvk/examples/example.py +112 -0
- modules/cmvk/examples/model_diversity_comparison.py +110 -0
- modules/cmvk/examples/real_api_integration.py +121 -0
- modules/cmvk/examples/test_full_pipeline.py +303 -0
- modules/cmvk/experiments/FEATURE_2_LATERAL_THINKING.md +187 -0
- modules/cmvk/experiments/README.md +216 -0
- modules/cmvk/experiments/ablation_runner.py +666 -0
- modules/cmvk/experiments/baseline_runner.py +158 -0
- modules/cmvk/experiments/blind_spot_benchmark.py +364 -0
- modules/cmvk/experiments/datasets/README.md +85 -0
- modules/cmvk/experiments/datasets/humaneval_50.json +352 -0
- modules/cmvk/experiments/datasets/humaneval_full.json +1150 -0
- modules/cmvk/experiments/datasets/humaneval_sample.json +32 -0
- modules/cmvk/experiments/datasets/sabotage.json +262 -0
- modules/cmvk/experiments/datasets/sample.json +40 -0
- modules/cmvk/experiments/demo_with_traces.py +110 -0
- modules/cmvk/experiments/efficiency_curve.py +259 -0
- modules/cmvk/experiments/experiment_runner.py +243 -0
- modules/cmvk/experiments/paper_data_generator.py +183 -0
- modules/cmvk/experiments/reproduce_results.py +407 -0
- modules/cmvk/experiments/reproducible_runner.py +352 -0
- modules/cmvk/experiments/sabotage_stress_test.py +311 -0
- modules/cmvk/experiments/test_lateral_thinking.py +116 -0
- modules/cmvk/experiments/test_prosecutor.py +41 -0
- modules/cmvk/experiments/visualize_results.py +735 -0
- modules/cmvk/logs/traces/demo_HumanEval_0_20260121-204900.json +36 -0
- modules/cmvk/notebooks/analysis.ipynb +124 -0
- modules/cmvk/paper/PAPER.md +561 -0
- modules/cmvk/paper/arxiv_checklist.md +230 -0
- modules/cmvk/paper/cmvk_neurips.aux +77 -0
- modules/cmvk/paper/cmvk_neurips.bbl +81 -0
- modules/cmvk/paper/cmvk_neurips.blg +48 -0
- modules/cmvk/paper/cmvk_neurips.out +16 -0
- modules/cmvk/paper/cmvk_neurips.pdf +0 -0
- modules/cmvk/paper/cmvk_neurips.tex +309 -0
- modules/cmvk/paper/figures/ablation.png +0 -0
- modules/cmvk/paper/figures/ablation.svg +39 -0
- modules/cmvk/paper/figures/architecture.png +0 -0
- modules/cmvk/paper/figures/architecture.svg +115 -0
- modules/cmvk/paper/figures/results_bar.png +0 -0
- modules/cmvk/paper/figures/results_bar.svg +70 -0
- modules/cmvk/paper/generate_figures.py +383 -0
- modules/cmvk/paper/neurips_2024.sty +101 -0
- modules/cmvk/paper/references.bib +98 -0
- modules/cmvk/paper/structure.tex +200 -0
- modules/cmvk/pyproject.toml +189 -0
- modules/cmvk/requirements-dev.txt +19 -0
- modules/cmvk/requirements.txt +14 -0
- modules/cmvk/src/cmvk/__init__.py +216 -0
- modules/cmvk/src/cmvk/audit.py +400 -0
- modules/cmvk/src/cmvk/benchmarks.py +476 -0
- modules/cmvk/src/cmvk/constitutional.py +902 -0
- modules/cmvk/src/cmvk/hf_utils.py +299 -0
- modules/cmvk/src/cmvk/metrics.py +471 -0
- modules/cmvk/src/cmvk/profiles.py +298 -0
- modules/cmvk/src/cmvk/py.typed +0 -0
- modules/cmvk/src/cmvk/types.py +10 -0
- modules/cmvk/src/cmvk/verification.py +954 -0
- modules/cmvk/src/cross_model_verification_kernel/__init__.py +91 -0
- modules/cmvk/src/cross_model_verification_kernel/__main__.py +10 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/__init__.py +16 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/base_agent.py +142 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/generator_openai.py +223 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_anthropic.py +448 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_gemini.py +481 -0
- modules/cmvk/src/cross_model_verification_kernel/cli.py +570 -0
- modules/cmvk/src/cross_model_verification_kernel/core/__init__.py +26 -0
- modules/cmvk/src/cross_model_verification_kernel/core/graph_memory.py +308 -0
- modules/cmvk/src/cross_model_verification_kernel/core/kernel.py +413 -0
- modules/cmvk/src/cross_model_verification_kernel/core/trace_logger.py +75 -0
- modules/cmvk/src/cross_model_verification_kernel/core/types.py +121 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/__init__.py +20 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/humaneval_loader.py +271 -0
- modules/cmvk/src/cross_model_verification_kernel/generator.py +118 -0
- modules/cmvk/src/cross_model_verification_kernel/kernel.py +292 -0
- modules/cmvk/src/cross_model_verification_kernel/models.py +111 -0
- modules/cmvk/src/cross_model_verification_kernel/py.typed +1 -0
- modules/cmvk/src/cross_model_verification_kernel/simple_kernel.py +185 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/__init__.py +94 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/huggingface_upload.py +394 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/sandbox.py +159 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/statistics.py +468 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/visualizer.py +312 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/web_search.py +86 -0
- modules/cmvk/src/cross_model_verification_kernel/verifier.py +257 -0
- modules/cmvk/tests/__init__.py +3 -0
- modules/cmvk/tests/conftest.py +61 -0
- modules/cmvk/tests/integration/__init__.py +1 -0
- modules/cmvk/tests/integration/test_anthropic_verifier.py +269 -0
- modules/cmvk/tests/integration/test_integration.py +53 -0
- modules/cmvk/tests/integration/test_lateral_thinking_integration.py +199 -0
- modules/cmvk/tests/integration/test_lateral_thinking_witness.py +208 -0
- modules/cmvk/tests/integration/test_prosecutor_mode.py +131 -0
- modules/cmvk/tests/test_constitutional.py +611 -0
- modules/cmvk/tests/test_enhanced_features.py +603 -0
- modules/cmvk/tests/test_verification.py +255 -0
- modules/cmvk/tests/unit/__init__.py +1 -0
- modules/cmvk/tests/unit/test_agents.py +64 -0
- modules/cmvk/tests/unit/test_cli.py +224 -0
- modules/cmvk/tests/unit/test_core.py +126 -0
- modules/cmvk/tests/unit/test_humaneval_loader.py +197 -0
- modules/cmvk/tests/unit/test_kernel.py +255 -0
- modules/cmvk/tests/unit/test_reproducibility.py +160 -0
- modules/cmvk/tests/unit/test_trace_logger.py +115 -0
- modules/cmvk/tests/unit/test_visualizer.py +218 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/bug_report.yml +82 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/config.yml +11 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/feature_request.yml +104 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/question.yml +70 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/security_vulnerability.yml +84 -0
- modules/control-plane/.github/discussions.yml +73 -0
- modules/control-plane/.github/pull_request_template.md +82 -0
- modules/control-plane/.github/workflows/publish.yml +146 -0
- modules/control-plane/.github/workflows/release.yml +39 -0
- modules/control-plane/.github/workflows/tests.yml +58 -0
- modules/control-plane/.gitignore +55 -0
- modules/control-plane/CHANGELOG.md +203 -0
- modules/control-plane/CONTRIBUTING.md +311 -0
- modules/control-plane/CONTRIBUTORS.md +88 -0
- modules/control-plane/Dockerfile +82 -0
- modules/control-plane/LICENSE +21 -0
- modules/control-plane/MANIFEST.in +17 -0
- modules/control-plane/README.md +1264 -0
- modules/control-plane/ROADMAP.md +228 -0
- modules/control-plane/SECURITY.md +210 -0
- modules/control-plane/SUPPORT.md +106 -0
- modules/control-plane/acp-cli.py +212 -0
- modules/control-plane/benchmark/README.md +257 -0
- modules/control-plane/benchmark/__init__.py +19 -0
- modules/control-plane/benchmark/red_team_dataset.py +517 -0
- modules/control-plane/benchmark.py +563 -0
- modules/control-plane/build_and_publish.sh +130 -0
- modules/control-plane/docker-compose.yml +74 -0
- modules/control-plane/docs/ABLATION_STUDIES.md +528 -0
- modules/control-plane/docs/ADAPTER_GUIDE.md +544 -0
- modules/control-plane/docs/ADVANCED_FEATURES.md +543 -0
- modules/control-plane/docs/AIOS_COMPARISON.md +296 -0
- modules/control-plane/docs/BIBLIOGRAPHY.md +367 -0
- modules/control-plane/docs/CASE_STUDIES.md +645 -0
- modules/control-plane/docs/DOCKER_DEPLOYMENT.md +184 -0
- modules/control-plane/docs/ECOSYSTEM_STATUS.md +98 -0
- modules/control-plane/docs/HF_MODEL_CARD.md +168 -0
- modules/control-plane/docs/KERNEL_V1_RELEASE.md +454 -0
- modules/control-plane/docs/LAYER3_FRAMEWORK.md +227 -0
- modules/control-plane/docs/LIMITATIONS.md +523 -0
- modules/control-plane/docs/PYPI_PUBLISHING.md +195 -0
- modules/control-plane/docs/README.md +58 -0
- modules/control-plane/docs/RELATED_WORK.md +319 -0
- modules/control-plane/docs/RELEASE_v1.1.0.md +252 -0
- modules/control-plane/docs/REPRODUCIBILITY.md +540 -0
- modules/control-plane/docs/RESEARCH_FOUNDATION.md +197 -0
- modules/control-plane/docs/api/CORE.md +270 -0
- modules/control-plane/docs/architecture/architecture.md +120 -0
- modules/control-plane/docs/community/ANNOUNCEMENT_TEMPLATES.md +52 -0
- modules/control-plane/docs/guides/IMPLEMENTATION.md +225 -0
- modules/control-plane/docs/guides/PHILOSOPHY.md +354 -0
- modules/control-plane/docs/guides/QUICKSTART.md +217 -0
- modules/control-plane/examples/README.md +138 -0
- modules/control-plane/examples/a2a_demo.py +410 -0
- modules/control-plane/examples/adapter_demo.py +347 -0
- modules/control-plane/examples/advanced_features.py +403 -0
- modules/control-plane/examples/basic_usage.py +261 -0
- modules/control-plane/examples/benchmark_demo.py +186 -0
- modules/control-plane/examples/compliance_demo.py +333 -0
- modules/control-plane/examples/configuration.py +265 -0
- modules/control-plane/examples/getting_started.py +178 -0
- modules/control-plane/examples/hibernation_and_time_travel_demo.py +406 -0
- modules/control-plane/examples/interactive_tutorial.ipynb +497 -0
- modules/control-plane/examples/kernel_interceptor_demo.py +202 -0
- modules/control-plane/examples/kernel_v1_demo.py +273 -0
- modules/control-plane/examples/langchain_demo.py +281 -0
- modules/control-plane/examples/lifecycle_demo.py +724 -0
- modules/control-plane/examples/mcp_demo.py +378 -0
- modules/control-plane/examples/ml_safety_demo.py +157 -0
- modules/control-plane/examples/multimodal_demo.py +347 -0
- modules/control-plane/examples/observability_demo.py +370 -0
- modules/control-plane/examples/use_cases.py +336 -0
- modules/control-plane/experiments/long_horizon_purge.py +235 -0
- modules/control-plane/experiments/multi_agent_rag.py +165 -0
- modules/control-plane/experiments/reproduce_results.py +667 -0
- modules/control-plane/paper/ARXIV_SUBMISSION_INFO.txt +122 -0
- modules/control-plane/paper/ETHICS_STATEMENT.md +248 -0
- modules/control-plane/paper/PAPER_CHECKLIST.md +72 -0
- modules/control-plane/paper/Paper.pdf +0 -0
- modules/control-plane/paper/README.md +71 -0
- modules/control-plane/paper/appendix.md +152 -0
- modules/control-plane/paper/architecture.md +15 -0
- modules/control-plane/paper/arxiv/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/arxiv/figures/architecture.png +0 -0
- modules/control-plane/paper/arxiv/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/arxiv/figures/results_chart.png +0 -0
- modules/control-plane/paper/arxiv/main.aux +97 -0
- modules/control-plane/paper/arxiv/main.bbl +112 -0
- modules/control-plane/paper/arxiv/main.blg +48 -0
- modules/control-plane/paper/arxiv/main.out +33 -0
- modules/control-plane/paper/arxiv/main.pdf +0 -0
- modules/control-plane/paper/arxiv/main.tex +479 -0
- modules/control-plane/paper/arxiv/references.bib +234 -0
- modules/control-plane/paper/arxiv_submission.tar +0 -0
- modules/control-plane/paper/arxiv_submission.zip +0 -0
- modules/control-plane/paper/build.sh +68 -0
- modules/control-plane/paper/figures/README.md +47 -0
- modules/control-plane/paper/figures/ablation_chart.pdf +0 -0
- modules/control-plane/paper/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/figures/architecture.pdf +0 -0
- modules/control-plane/paper/figures/architecture.png +0 -0
- modules/control-plane/paper/figures/constraint_graphs.pdf +0 -0
- modules/control-plane/paper/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/figures/generate_figures.py +252 -0
- modules/control-plane/paper/figures/results_chart.pdf +0 -0
- modules/control-plane/paper/figures/results_chart.png +0 -0
- modules/control-plane/paper/main.md +273 -0
- modules/control-plane/paper/main.tex +214 -0
- modules/control-plane/paper/main_arxiv.aux +53 -0
- modules/control-plane/paper/main_arxiv.out +17 -0
- modules/control-plane/paper/main_arxiv.pdf +0 -0
- modules/control-plane/paper/main_arxiv.tex +264 -0
- modules/control-plane/paper/references.bib +234 -0
- modules/control-plane/pyproject.toml +124 -0
- modules/control-plane/reproducibility/ABLATIONS.md +136 -0
- modules/control-plane/reproducibility/README.md +288 -0
- modules/control-plane/reproducibility/commands.md +467 -0
- modules/control-plane/reproducibility/docker_config/Dockerfile +39 -0
- modules/control-plane/reproducibility/experiment_configs/purge_config.json +46 -0
- modules/control-plane/reproducibility/experiment_configs/rag_config.json +36 -0
- modules/control-plane/reproducibility/hardware_specs.md +317 -0
- modules/control-plane/reproducibility/requirements_frozen.txt +0 -0
- modules/control-plane/reproducibility/run_all_experiments.sh +45 -0
- modules/control-plane/reproducibility/seeds.json +106 -0
- modules/control-plane/scripts/prepare_pypi.py +46 -0
- modules/control-plane/scripts/prepare_release.py +176 -0
- modules/control-plane/scripts/upload_dataset_to_hf.py +316 -0
- modules/control-plane/setup.py +69 -0
- modules/control-plane/src/agent_control_plane/__init__.py +639 -0
- modules/control-plane/src/agent_control_plane/a2a_adapter.py +541 -0
- modules/control-plane/src/agent_control_plane/adapter.py +415 -0
- modules/control-plane/src/agent_control_plane/agent_hibernation.py +364 -0
- modules/control-plane/src/agent_control_plane/agent_kernel.py +464 -0
- modules/control-plane/src/agent_control_plane/compliance.py +718 -0
- modules/control-plane/src/agent_control_plane/constraint_graphs.py +475 -0
- modules/control-plane/src/agent_control_plane/control_plane.py +848 -0
- modules/control-plane/src/agent_control_plane/example_executors.py +193 -0
- modules/control-plane/src/agent_control_plane/execution_engine.py +229 -0
- modules/control-plane/src/agent_control_plane/flight_recorder.py +600 -0
- modules/control-plane/src/agent_control_plane/governance_layer.py +432 -0
- modules/control-plane/src/agent_control_plane/hf_utils.py +561 -0
- modules/control-plane/src/agent_control_plane/interfaces/__init__.py +53 -0
- modules/control-plane/src/agent_control_plane/interfaces/kernel_interface.py +359 -0
- modules/control-plane/src/agent_control_plane/interfaces/plugin_interface.py +495 -0
- modules/control-plane/src/agent_control_plane/interfaces/protocol_interfaces.py +385 -0
- modules/control-plane/src/agent_control_plane/kernel_space.py +707 -0
- modules/control-plane/src/agent_control_plane/langchain_adapter.py +422 -0
- modules/control-plane/src/agent_control_plane/lifecycle.py +3111 -0
- modules/control-plane/src/agent_control_plane/mcp_adapter.py +517 -0
- modules/control-plane/src/agent_control_plane/ml_safety.py +560 -0
- modules/control-plane/src/agent_control_plane/multimodal.py +724 -0
- modules/control-plane/src/agent_control_plane/mute_agent.py +419 -0
- modules/control-plane/src/agent_control_plane/observability.py +785 -0
- modules/control-plane/src/agent_control_plane/orchestrator.py +480 -0
- modules/control-plane/src/agent_control_plane/plugin_registry.py +748 -0
- modules/control-plane/src/agent_control_plane/policy_engine.py +525 -0
- modules/control-plane/src/agent_control_plane/shadow_mode.py +307 -0
- modules/control-plane/src/agent_control_plane/signals.py +491 -0
- modules/control-plane/src/agent_control_plane/supervisor_agents.py +427 -0
- modules/control-plane/src/agent_control_plane/time_travel_debugger.py +554 -0
- modules/control-plane/src/agent_control_plane/tool_registry.py +350 -0
- modules/control-plane/src/agent_control_plane/vfs.py +695 -0
- modules/control-plane/tests/README.md +33 -0
- modules/control-plane/tests/test_a2a_adapter.py +336 -0
- modules/control-plane/tests/test_adapter.py +422 -0
- modules/control-plane/tests/test_advanced_features.py +389 -0
- modules/control-plane/tests/test_benchmark.py +223 -0
- modules/control-plane/tests/test_compliance.py +214 -0
- modules/control-plane/tests/test_control_plane.py +295 -0
- modules/control-plane/tests/test_hibernation.py +274 -0
- modules/control-plane/tests/test_kernel_interception.py +284 -0
- modules/control-plane/tests/test_langchain_adapter.py +258 -0
- modules/control-plane/tests/test_lifecycle.py +1174 -0
- modules/control-plane/tests/test_mcp_adapter.py +293 -0
- modules/control-plane/tests/test_ml_safety.py +142 -0
- modules/control-plane/tests/test_multimodal.py +317 -0
- modules/control-plane/tests/test_new_features.py +435 -0
- modules/control-plane/tests/test_observability.py +338 -0
- modules/control-plane/tests/test_time_travel.py +387 -0
- modules/emk/.github/workflows/ci.yml +105 -0
- modules/emk/.github/workflows/publish.yml +144 -0
- modules/emk/.gitignore +74 -0
- modules/emk/CHANGELOG.md +41 -0
- modules/emk/CONTRIBUTING.md +295 -0
- modules/emk/IMPLEMENTATION.md +174 -0
- modules/emk/LICENSE +21 -0
- modules/emk/MANIFEST.in +8 -0
- modules/emk/README.md +135 -0
- modules/emk/RELEASE_NOTES.md +82 -0
- modules/emk/SECURITY.md +52 -0
- modules/emk/codecov.yml +39 -0
- modules/emk/docs/MEMORY_MANAGEMENT.md +285 -0
- modules/emk/emk/__init__.py +106 -0
- modules/emk/emk/hf_utils.py +419 -0
- modules/emk/emk/indexer.py +144 -0
- modules/emk/emk/py.typed +0 -0
- modules/emk/emk/schema.py +204 -0
- modules/emk/emk/sleep_cycle.py +345 -0
- modules/emk/emk/store.py +479 -0
- modules/emk/examples/basic_usage.py +123 -0
- modules/emk/examples/memory_features_demo.py +154 -0
- modules/emk/experiments/README.md +59 -0
- modules/emk/experiments/reproduce_results.py +461 -0
- modules/emk/experiments/results.json +61 -0
- modules/emk/paper/structure.tex +192 -0
- modules/emk/paper/whitepaper.md +273 -0
- modules/emk/pyproject.toml +91 -0
- modules/emk/setup.py +5 -0
- modules/emk/tests/test_file_adapter.py +195 -0
- modules/emk/tests/test_indexer.py +174 -0
- modules/emk/tests/test_init.py +55 -0
- modules/emk/tests/test_negative_memory.py +83 -0
- modules/emk/tests/test_schema.py +150 -0
- modules/emk/tests/test_semantic_rules.py +175 -0
- modules/emk/tests/test_sleep_cycle.py +335 -0
- modules/emk/tests/test_store_anti_patterns.py +239 -0
- modules/iatp/.github/workflows/docker-build.yml +124 -0
- modules/iatp/.github/workflows/publish.yml +174 -0
- modules/iatp/.github/workflows/python-package.yml +121 -0
- modules/iatp/.gitignore +67 -0
- modules/iatp/.pre-commit-config.yaml +64 -0
- modules/iatp/CHANGELOG.md +120 -0
- modules/iatp/Dockerfile +91 -0
- modules/iatp/IMPLEMENTATION_SUMMARY.md +218 -0
- modules/iatp/MANIFEST.in +9 -0
- modules/iatp/README.md +180 -0
- modules/iatp/docker/Dockerfile.agent +27 -0
- modules/iatp/docker/Dockerfile.sidecar-python +86 -0
- modules/iatp/docker/README.md +258 -0
- modules/iatp/docker-compose.yml +194 -0
- modules/iatp/docs/ARCHITECTURE.md +243 -0
- modules/iatp/docs/CLI_GUIDE.md +220 -0
- modules/iatp/docs/DEPLOYMENT.md +304 -0
- modules/iatp/examples/README.md +132 -0
- modules/iatp/examples/backend_agent.py +39 -0
- modules/iatp/examples/client.py +168 -0
- modules/iatp/examples/demo_attestation_reputation.py +274 -0
- modules/iatp/examples/demo_client.py +240 -0
- modules/iatp/examples/demo_rbac.py +143 -0
- modules/iatp/examples/integration_demo.py +245 -0
- modules/iatp/examples/manifests/coder_agent.json +20 -0
- modules/iatp/examples/manifests/reviewer_agent.json +19 -0
- modules/iatp/examples/manifests/secure_bank.json +14 -0
- modules/iatp/examples/manifests/standard_agent.json +14 -0
- modules/iatp/examples/manifests/untrusted_honeypot.json +14 -0
- modules/iatp/examples/run_secure_bank_sidecar.py +85 -0
- modules/iatp/examples/run_sidecar.py +105 -0
- modules/iatp/examples/run_untrusted_sidecar.py +77 -0
- modules/iatp/examples/secure_bank_agent.py +138 -0
- modules/iatp/examples/test_untrusted.py +82 -0
- modules/iatp/examples/untrusted_agent.py +119 -0
- modules/iatp/experiments/README.md +58 -0
- modules/iatp/experiments/cascading_hallucination/README.md +149 -0
- modules/iatp/experiments/cascading_hallucination/agent_a_user.py +41 -0
- modules/iatp/experiments/cascading_hallucination/agent_b_summarizer.py +54 -0
- modules/iatp/experiments/cascading_hallucination/agent_c_database.py +47 -0
- modules/iatp/experiments/cascading_hallucination/proof_of_concept.py +290 -0
- modules/iatp/experiments/cascading_hallucination/run_experiment.py +226 -0
- modules/iatp/experiments/cascading_hallucination/sidecar_c.py +61 -0
- modules/iatp/experiments/reproduce_results.py +574 -0
- modules/iatp/experiments/results.json +2336 -0
- modules/iatp/iatp/__init__.py +164 -0
- modules/iatp/iatp/attestation.py +401 -0
- modules/iatp/iatp/cli.py +253 -0
- modules/iatp/iatp/hf_utils.py +469 -0
- modules/iatp/iatp/ipc_pipes.py +578 -0
- modules/iatp/iatp/main.py +410 -0
- modules/iatp/iatp/models/__init__.py +445 -0
- modules/iatp/iatp/policy_engine.py +335 -0
- modules/iatp/iatp/py.typed +2 -0
- modules/iatp/iatp/recovery.py +319 -0
- modules/iatp/iatp/security/__init__.py +268 -0
- modules/iatp/iatp/sidecar/__init__.py +517 -0
- modules/iatp/iatp/telemetry/__init__.py +162 -0
- modules/iatp/iatp/tests/__init__.py +1 -0
- modules/iatp/iatp/tests/test_attestation.py +368 -0
- modules/iatp/iatp/tests/test_cli.py +129 -0
- modules/iatp/iatp/tests/test_models.py +128 -0
- modules/iatp/iatp/tests/test_policy_engine.py +345 -0
- modules/iatp/iatp/tests/test_recovery.py +279 -0
- modules/iatp/iatp/tests/test_security.py +220 -0
- modules/iatp/iatp/tests/test_sidecar.py +165 -0
- modules/iatp/iatp/tests/test_telemetry.py +173 -0
- modules/iatp/paper/BLOG.md +307 -0
- modules/iatp/paper/PAPER.md +236 -0
- modules/iatp/paper/RFC_SUBMISSION.md +299 -0
- modules/iatp/paper/whitepaper.md +369 -0
- modules/iatp/proto/README.md +200 -0
- modules/iatp/proto/generate_stubs.py +81 -0
- modules/iatp/proto/iatp.proto +552 -0
- modules/iatp/pyproject.toml +180 -0
- modules/iatp/requirements-dev.txt +2 -0
- modules/iatp/requirements.txt +6 -0
- modules/iatp/setup.py +60 -0
- modules/iatp/sidecar/README.md +487 -0
- modules/iatp/sidecar/go/Dockerfile +32 -0
- modules/iatp/sidecar/go/README.md +237 -0
- modules/iatp/sidecar/go/go.mod +8 -0
- modules/iatp/sidecar/go/main.go +488 -0
- modules/iatp/spec/001-handshake.md +436 -0
- modules/iatp/spec/002-reversibility.md +394 -0
- modules/iatp/spec/schema/capability_manifest.json +266 -0
- modules/iatp/test_integration.py +310 -0
- modules/mcp-kernel-server/README.md +261 -0
- modules/mcp-kernel-server/pyproject.toml +60 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/__init__.py +26 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/cli.py +229 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/resources.py +215 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/server.py +562 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/tools.py +1172 -0
- modules/mute-agent/.github/workflows/safety_check.yml +45 -0
- modules/mute-agent/.gitignore +53 -0
- modules/mute-agent/ARCHITECTURE.md +531 -0
- modules/mute-agent/BENCHMARK_GUIDE.md +384 -0
- modules/mute-agent/COMPLETION_SUMMARY.md +293 -0
- modules/mute-agent/EXPERIMENT_SUMMARY.md +318 -0
- modules/mute-agent/IMPLEMENTATION_SUMMARY.md +212 -0
- modules/mute-agent/LICENSE +21 -0
- modules/mute-agent/PHASE3_SUMMARY.md +297 -0
- modules/mute-agent/README.md +360 -0
- modules/mute-agent/STEEL_MAN_RESULTS.md +353 -0
- modules/mute-agent/USAGE.md +505 -0
- modules/mute-agent/V2_IMPLEMENTATION_SUMMARY.md +253 -0
- modules/mute-agent/V2_STEEL_MAN_IMPLEMENTATION.md +274 -0
- modules/mute-agent/VERIFICATION_REPORT.md +435 -0
- modules/mute-agent/charts/cost_comparison.png +0 -0
- modules/mute-agent/charts/cost_vs_ambiguity.png +0 -0
- modules/mute-agent/charts/metrics_comparison.png +0 -0
- modules/mute-agent/charts/scenario_breakdown.png +0 -0
- modules/mute-agent/charts/trace_attack_blocked.html +140 -0
- modules/mute-agent/charts/trace_attack_blocked.png +0 -0
- modules/mute-agent/charts/trace_failure.html +140 -0
- modules/mute-agent/charts/trace_failure.png +0 -0
- modules/mute-agent/charts/trace_success.html +140 -0
- modules/mute-agent/charts/trace_success.png +0 -0
- modules/mute-agent/examples/__init__.py +1 -0
- modules/mute-agent/examples/advanced_example.py +384 -0
- modules/mute-agent/examples/graph_debugger_demo.py +241 -0
- modules/mute-agent/examples/listener_example.py +297 -0
- modules/mute-agent/examples/simple_example.py +242 -0
- modules/mute-agent/examples/steel_man_demo.py +297 -0
- modules/mute-agent/experiments/README.md +135 -0
- modules/mute-agent/experiments/__init__.py +3 -0
- modules/mute-agent/experiments/agent_comparison.csv +6 -0
- modules/mute-agent/experiments/agent_comparison_50runs.csv +6 -0
- modules/mute-agent/experiments/ambiguity_test.py +335 -0
- modules/mute-agent/experiments/ambiguity_test_results.csv +31 -0
- modules/mute-agent/experiments/ambiguity_test_results_50runs.csv +51 -0
- modules/mute-agent/experiments/baseline_agent.py +189 -0
- modules/mute-agent/experiments/benchmark.py +402 -0
- modules/mute-agent/experiments/demo.py +172 -0
- modules/mute-agent/experiments/generate_cost_curve.py +474 -0
- modules/mute-agent/experiments/jailbreak_test.py +137 -0
- modules/mute-agent/experiments/latent_state_scenario.py +361 -0
- modules/mute-agent/experiments/mute_agent_experiment.py +349 -0
- modules/mute-agent/experiments/run_extended_experiment.py +40 -0
- modules/mute-agent/experiments/run_v2_experiments.py +266 -0
- modules/mute-agent/experiments/run_v2_experiments_auto.py +247 -0
- modules/mute-agent/experiments/v2_scenarios/README.md +214 -0
- modules/mute-agent/experiments/v2_scenarios/__init__.py +4 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_1_deep_dependency.py +325 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_2_adversarial.py +328 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_3_false_positive.py +303 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_4_performance.py +319 -0
- modules/mute-agent/experiments/visualize.py +400 -0
- modules/mute-agent/mute_agent/__init__.py +66 -0
- modules/mute-agent/mute_agent/core/__init__.py +1 -0
- modules/mute-agent/mute_agent/core/execution_agent.py +164 -0
- modules/mute-agent/mute_agent/core/handshake_protocol.py +199 -0
- modules/mute-agent/mute_agent/core/reasoning_agent.py +236 -0
- modules/mute-agent/mute_agent/knowledge_graph/__init__.py +1 -0
- modules/mute-agent/mute_agent/knowledge_graph/graph_elements.py +63 -0
- modules/mute-agent/mute_agent/knowledge_graph/multidimensional_graph.py +168 -0
- modules/mute-agent/mute_agent/knowledge_graph/subgraph.py +222 -0
- modules/mute-agent/mute_agent/listener/__init__.py +41 -0
- modules/mute-agent/mute_agent/listener/adapters/__init__.py +29 -0
- modules/mute-agent/mute_agent/listener/adapters/base_adapter.py +187 -0
- modules/mute-agent/mute_agent/listener/adapters/caas_adapter.py +342 -0
- modules/mute-agent/mute_agent/listener/adapters/control_plane_adapter.py +434 -0
- modules/mute-agent/mute_agent/listener/adapters/iatp_adapter.py +330 -0
- modules/mute-agent/mute_agent/listener/adapters/scak_adapter.py +249 -0
- modules/mute-agent/mute_agent/listener/listener.py +608 -0
- modules/mute-agent/mute_agent/listener/state_observer.py +434 -0
- modules/mute-agent/mute_agent/listener/threshold_config.py +311 -0
- modules/mute-agent/mute_agent/super_system/__init__.py +1 -0
- modules/mute-agent/mute_agent/super_system/router.py +202 -0
- modules/mute-agent/mute_agent/visualization/__init__.py +8 -0
- modules/mute-agent/mute_agent/visualization/graph_debugger.py +495 -0
- modules/mute-agent/requirements-dev.txt +6 -0
- modules/mute-agent/requirements.txt +9 -0
- modules/mute-agent/setup.py +64 -0
- modules/mute-agent/src/__init__.py +0 -0
- modules/mute-agent/src/agents/__init__.py +0 -0
- modules/mute-agent/src/agents/baseline_agent.py +524 -0
- modules/mute-agent/src/agents/interactive_agent.py +113 -0
- modules/mute-agent/src/agents/mute_agent.py +622 -0
- modules/mute-agent/src/benchmarks/__init__.py +0 -0
- modules/mute-agent/src/benchmarks/evaluator.py +481 -0
- modules/mute-agent/src/benchmarks/scenarios.json +985 -0
- modules/mute-agent/src/core/__init__.py +0 -0
- modules/mute-agent/src/core/mock_state.py +320 -0
- modules/mute-agent/src/core/tools.py +441 -0
- modules/nexus/__init__.py +49 -0
- modules/nexus/arbiter.py +357 -0
- modules/nexus/client.py +464 -0
- modules/nexus/dmz.py +417 -0
- modules/nexus/escrow.py +428 -0
- modules/nexus/exceptions.py +284 -0
- modules/nexus/registry.py +391 -0
- modules/nexus/reputation.py +423 -0
- modules/nexus/schemas/__init__.py +49 -0
- modules/nexus/schemas/compliance.py +274 -0
- modules/nexus/schemas/escrow.py +249 -0
- modules/nexus/schemas/manifest.py +223 -0
- modules/nexus/schemas/receipt.py +206 -0
- modules/observability/README.md +192 -0
- modules/observability/alertmanager/alertmanager.yml +116 -0
- modules/observability/alerts/agent-os-alerts.yaml +197 -0
- modules/observability/docker-compose.yml +128 -0
- modules/observability/grafana/dashboards/agent-os-amb.json +448 -0
- modules/observability/grafana/dashboards/agent-os-cmvk.json +441 -0
- modules/observability/grafana/dashboards/agent-os-overview.json +268 -0
- modules/observability/grafana/dashboards/agent-os-performance.json +15 -0
- modules/observability/grafana/dashboards/agent-os-safety.json +50 -0
- modules/observability/grafana/provisioning/dashboards/dashboards.yml +15 -0
- modules/observability/grafana/provisioning/datasources/datasources.yml +33 -0
- modules/observability/otel/otel-collector-config.yml +61 -0
- modules/observability/prometheus/prometheus.yml +63 -0
- modules/observability/pyproject.toml +53 -0
- modules/observability/scripts/export_dashboards.py +55 -0
- modules/observability/src/agent_os_observability/__init__.py +25 -0
- modules/observability/src/agent_os_observability/dashboards.py +896 -0
- modules/observability/src/agent_os_observability/metrics.py +396 -0
- modules/observability/src/agent_os_observability/server.py +221 -0
- modules/observability/src/agent_os_observability/tracer.py +226 -0
- modules/primitives/.gitignore +8 -0
- modules/primitives/README.md +62 -0
- modules/primitives/agent_primitives/__init__.py +22 -0
- modules/primitives/agent_primitives/failures.py +82 -0
- modules/primitives/agent_primitives/py.typed +0 -0
- modules/primitives/pyproject.toml +68 -0
- modules/scak/.github/copilot-instructions.md +396 -0
- modules/scak/.github/workflows/release.yml +117 -0
- modules/scak/.gitignore +32 -0
- modules/scak/CHANGELOG.md +173 -0
- modules/scak/CITATION.cff +62 -0
- modules/scak/CONTRIBUTING.md +429 -0
- modules/scak/Dockerfile +58 -0
- modules/scak/ENTERPRISE_FEATURES.md +518 -0
- modules/scak/IMPLEMENTATION_SUMMARY.md +206 -0
- modules/scak/LIMITATIONS.md +565 -0
- modules/scak/MANIFEST.in +16 -0
- modules/scak/NOVELTY.md +535 -0
- modules/scak/README.md +928 -0
- modules/scak/RESEARCH.md +670 -0
- modules/scak/agent_kernel/__init__.py +66 -0
- modules/scak/agent_kernel/analyzer.py +432 -0
- modules/scak/agent_kernel/auditor.py +31 -0
- modules/scak/agent_kernel/completeness_auditor.py +234 -0
- modules/scak/agent_kernel/detector.py +200 -0
- modules/scak/agent_kernel/kernel.py +741 -0
- modules/scak/agent_kernel/memory_manager.py +82 -0
- modules/scak/agent_kernel/models.py +372 -0
- modules/scak/agent_kernel/nudge_mechanism.py +260 -0
- modules/scak/agent_kernel/outcome_analyzer.py +335 -0
- modules/scak/agent_kernel/patcher.py +579 -0
- modules/scak/agent_kernel/semantic_analyzer.py +313 -0
- modules/scak/agent_kernel/semantic_purge.py +346 -0
- modules/scak/agent_kernel/simulator.py +447 -0
- modules/scak/agent_kernel/teacher.py +82 -0
- modules/scak/agent_kernel/triage.py +149 -0
- modules/scak/build_and_publish.ps1 +74 -0
- modules/scak/build_and_publish.sh +74 -0
- modules/scak/cli.py +471 -0
- modules/scak/dashboard.py +462 -0
- modules/scak/datasets/DATASET_CARD.md +219 -0
- modules/scak/datasets/README.md +143 -0
- modules/scak/datasets/gaia_vague_queries/vague_queries.json +262 -0
- modules/scak/datasets/hf_upload/README.md +219 -0
- modules/scak/datasets/hf_upload/scak_gaia_laziness.jsonl +50 -0
- modules/scak/datasets/prepare_hf_datasets.py +145 -0
- modules/scak/datasets/red_team/jailbreak_patterns.json +202 -0
- modules/scak/docker-compose.yml +99 -0
- modules/scak/docs/Adaptive-Memory-Hierarchy.md +319 -0
- modules/scak/docs/Data-Contracts-and-Schemas.md +285 -0
- modules/scak/docs/Dual-Loop-Architecture.md +344 -0
- modules/scak/docs/Enhanced-Features.md +612 -0
- modules/scak/docs/LANGCHAIN_INTEGRATION.md +572 -0
- modules/scak/docs/README.md +128 -0
- modules/scak/docs/Reference-Implementations.md +163 -0
- modules/scak/docs/SCAK_V2.md +374 -0
- modules/scak/docs/Three-Failure-Types.md +178 -0
- modules/scak/examples/basic_example.py +155 -0
- modules/scak/examples/circuit_breaker_lazy_eval_demo.py +243 -0
- modules/scak/examples/langchain_integration_example.py +339 -0
- modules/scak/examples/layer4_demo.py +243 -0
- modules/scak/examples/production_features_demo.py +353 -0
- modules/scak/examples/quick_demo.py +79 -0
- modules/scak/examples/scak_v2_demo.py +252 -0
- modules/scak/experiments/README.md +438 -0
- modules/scak/experiments/ablation_studies/README.md +192 -0
- modules/scak/experiments/ablation_studies/ablation_no_audit.py +116 -0
- modules/scak/experiments/ablation_studies/ablation_no_purge.py +133 -0
- modules/scak/experiments/chaos_engineering/README.md +332 -0
- modules/scak/experiments/context_efficiency_test.py +328 -0
- modules/scak/experiments/gaia_benchmark/README.md +208 -0
- modules/scak/experiments/laziness_benchmark.py +179 -0
- modules/scak/experiments/long_horizon_task_experiment.py +252 -0
- modules/scak/experiments/multi_agent_rag_experiment.py +284 -0
- modules/scak/experiments/results/ablation_table.md +12 -0
- modules/scak/experiments/results/long_horizon.json +36 -0
- modules/scak/experiments/results/multi_agent_rag.json +66 -0
- modules/scak/experiments/run_comprehensive_ablations.py +332 -0
- modules/scak/experiments/test_auditor_patcher_integration.py +251 -0
- modules/scak/notebooks/getting_started.ipynb +33 -0
- modules/scak/paper/ARXIV_SUBMISSION_METADATA.txt +109 -0
- modules/scak/paper/PAPER_CHECKLIST.md +304 -0
- modules/scak/paper/Paper.pdf +0 -0
- modules/scak/paper/README.md +113 -0
- modules/scak/paper/appendix.md +351 -0
- modules/scak/paper/arxiv/bibliography.bib +284 -0
- modules/scak/paper/arxiv/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv/main.aux +103 -0
- modules/scak/paper/arxiv/main.bbl +113 -0
- modules/scak/paper/arxiv/main.blg +55 -0
- modules/scak/paper/arxiv/main.out +31 -0
- modules/scak/paper/arxiv/main.pdf +0 -0
- modules/scak/paper/arxiv/main.tex +482 -0
- modules/scak/paper/arxiv_submission/bibliography.bib +284 -0
- modules/scak/paper/arxiv_submission/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.aux +103 -0
- modules/scak/paper/arxiv_submission/main.bbl +113 -0
- modules/scak/paper/arxiv_submission/main.blg +55 -0
- modules/scak/paper/arxiv_submission/main.out +31 -0
- modules/scak/paper/arxiv_submission/main.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.tex +482 -0
- modules/scak/paper/arxiv_submission.tar.gz +0 -0
- modules/scak/paper/bibliography.bib +284 -0
- modules/scak/paper/build.sh +55 -0
- modules/scak/paper/figures/README.md +32 -0
- modules/scak/paper/figures/fig1_ooda_architecture.md +75 -0
- modules/scak/paper/figures/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/figures/fig1_ooda_architecture.png +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.md +83 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.png +0 -0
- modules/scak/paper/figures/fig3_gaia_results.md +64 -0
- modules/scak/paper/figures/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/figures/fig3_gaia_results.png +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.md +64 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.png +0 -0
- modules/scak/paper/figures/fig5_context_reduction.md +71 -0
- modules/scak/paper/figures/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/figures/fig5_context_reduction.png +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.md +80 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.png +0 -0
- modules/scak/paper/figures/generate_figures.py +463 -0
- modules/scak/paper/main.aux +103 -0
- modules/scak/paper/main.bbl +113 -0
- modules/scak/paper/main.blg +55 -0
- modules/scak/paper/main.md +192 -0
- modules/scak/paper/main.out +31 -0
- modules/scak/paper/main.pdf +0 -0
- modules/scak/paper/main.tex +482 -0
- modules/scak/reproducibility/ABLATIONS.md +225 -0
- modules/scak/reproducibility/Dockerfile.reproducibility +34 -0
- modules/scak/reproducibility/README.md +421 -0
- modules/scak/reproducibility/requirements-pinned.txt +32 -0
- modules/scak/reproducibility/run_all_experiments.py +395 -0
- modules/scak/reproducibility/seed_control.py +53 -0
- modules/scak/reproducibility/statistical_analysis.py +302 -0
- modules/scak/requirements.txt +50 -0
- modules/scak/setup.py +93 -0
- modules/scak/src/__init__.py +124 -0
- modules/scak/src/agents/__init__.py +13 -0
- modules/scak/src/agents/conflict_resolution.py +732 -0
- modules/scak/src/agents/orchestrator.py +761 -0
- modules/scak/src/agents/pubsub.py +484 -0
- modules/scak/src/agents/shadow_teacher.py +344 -0
- modules/scak/src/agents/swarm.py +661 -0
- modules/scak/src/agents/worker.py +357 -0
- modules/scak/src/integrations/__init__.py +81 -0
- modules/scak/src/integrations/cmvk_adapter.py +430 -0
- modules/scak/src/integrations/control_plane_adapter.py +601 -0
- modules/scak/src/integrations/langchain_integration.py +902 -0
- modules/scak/src/interfaces/__init__.py +59 -0
- modules/scak/src/interfaces/llm_clients.py +505 -0
- modules/scak/src/interfaces/openapi_tools.py +611 -0
- modules/scak/src/interfaces/plugin_system.py +605 -0
- modules/scak/src/interfaces/protocols.py +365 -0
- modules/scak/src/interfaces/telemetry.py +464 -0
- modules/scak/src/interfaces/tool_registry.py +547 -0
- modules/scak/src/kernel/__init__.py +100 -0
- modules/scak/src/kernel/auditor.py +305 -0
- modules/scak/src/kernel/circuit_breaker.py +398 -0
- modules/scak/src/kernel/core.py +724 -0
- modules/scak/src/kernel/distributed.py +667 -0
- modules/scak/src/kernel/evolution.py +455 -0
- modules/scak/src/kernel/failover.py +621 -0
- modules/scak/src/kernel/governance.py +710 -0
- modules/scak/src/kernel/governance_v2.py +603 -0
- modules/scak/src/kernel/lazy_evaluator.py +514 -0
- modules/scak/src/kernel/load_testing.py +633 -0
- modules/scak/src/kernel/memory.py +945 -0
- modules/scak/src/kernel/patcher.py +581 -0
- modules/scak/src/kernel/rubric.py +419 -0
- modules/scak/src/kernel/schemas.py +390 -0
- modules/scak/src/kernel/skill_mapper.py +309 -0
- modules/scak/src/kernel/triage.py +149 -0
- modules/scak/src/mocks/__init__.py +99 -0
- modules/scak/tests/__init__.py +1 -0
- modules/scak/tests/test_circuit_breaker.py +403 -0
- modules/scak/tests/test_conflict_resolution.py +287 -0
- modules/scak/tests/test_dual_loop.py +463 -0
- modules/scak/tests/test_enhanced_features.py +421 -0
- modules/scak/tests/test_failover_and_load.py +438 -0
- modules/scak/tests/test_governance.py +185 -0
- modules/scak/tests/test_kernel.py +359 -0
- modules/scak/tests/test_langchain_integration.py +451 -0
- modules/scak/tests/test_lazy_evaluator.py +465 -0
- modules/scak/tests/test_llm_clients.py +122 -0
- modules/scak/tests/test_memory_controller.py +528 -0
- modules/scak/tests/test_orchestrator.py +181 -0
- modules/scak/tests/test_phase3_integration.py +265 -0
- modules/scak/tests/test_pubsub_swarm.py +203 -0
- modules/scak/tests/test_reference_implementations.py +240 -0
- modules/scak/tests/test_rubric.py +363 -0
- modules/scak/tests/test_scak_v2.py +651 -0
- modules/scak/tests/test_skill_mapper.py +217 -0
- modules/scak/tests/test_specific_failures.py +393 -0
- modules/scak/tests/test_tool_registry.py +264 -0
- modules/scak/tests/test_tools_and_plugins.py +303 -0
- modules/scak/tests/test_triage.py +596 -0
- modules/scak/tests/test_write_through.py +319 -0
- agent_os_kernel-1.1.0.dist-info/METADATA +0 -400
- agent_os_kernel-1.1.0.dist-info/RECORD +0 -12
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/WHEEL +0 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/licenses/LICENSE +0 -0
|
@@ -0,0 +1,565 @@
|
|
|
1
|
+
# Limitations & Failure Modes
|
|
2
|
+
|
|
3
|
+
**Version:** 1.1
|
|
4
|
+
**Date:** 2026-01-18
|
|
5
|
+
**Purpose:** Honest discussion of system limitations for academic paper submission
|
|
6
|
+
|
|
7
|
+
---
|
|
8
|
+
|
|
9
|
+
## Executive Summary
|
|
10
|
+
|
|
11
|
+
| Category | Limitation | Impact | Future Work |
|
|
12
|
+
|----------|-----------|--------|-------------|
|
|
13
|
+
| **Dataset** | Synthetic/controlled (GAIA extensions, red-team prompts) | Real-world enterprise tasks may vary | Collect production traces |
|
|
14
|
+
| **Stochasticity** | LLM non-determinism (±2-5% variance) | Results averaged over 5 runs; higher variance possible in production | Increase to 10+ runs, temperature=0 |
|
|
15
|
+
| **Scope** | Primarily text/tool agents | Multi-modal (vision/audio) and long-horizon tasks need more evaluation | Extend to multi-modal benchmarks |
|
|
16
|
+
| **Cost** | Teacher model (o1-preview) is expensive | ~10x cost increase for audited interactions | Distill to smaller teacher, explore self-reflection |
|
|
17
|
+
| **Teacher Dependency** | Requires stronger external model | Single point of failure; teacher errors propagate | Ensemble teachers, self-improvement loop |
|
|
18
|
+
| **Cold Start** | New agents start with empty memory | Lower initial performance (60% → 80% over 7 days) | Pre-populated skill caches, transfer learning |
|
|
19
|
+
|
|
20
|
+
---
|
|
21
|
+
|
|
22
|
+
## Overview
|
|
23
|
+
|
|
24
|
+
This document provides a comprehensive analysis of the Self-Correcting Agent Kernel's limitations, failure modes, and unresolved challenges. This honest assessment is critical for academic rigor and helps position future research directions.
|
|
25
|
+
|
|
26
|
+
---
|
|
27
|
+
|
|
28
|
+
## 1. Architectural Limitations
|
|
29
|
+
|
|
30
|
+
### 1.1 Model Upgrade Assumptions
|
|
31
|
+
|
|
32
|
+
**Limitation:** Semantic Purge assumes newer models are strictly better than older models.
|
|
33
|
+
|
|
34
|
+
**Risk:**
|
|
35
|
+
- **Catastrophic Forgetting:** GPT-5 may lack capabilities present in GPT-4o
|
|
36
|
+
- **Regression:** New model may perform worse on specific tasks
|
|
37
|
+
- **Example:** GPT-4o-mini → GPT-4o-turbo (smaller → larger) may improve, but GPT-4o → GPT-5-preview may regress on niche tasks
|
|
38
|
+
|
|
39
|
+
**Impact:**
|
|
40
|
+
- Type A patches deleted on upgrade may still be needed
|
|
41
|
+
- Estimated failure rate: 5-10% of purged patches
|
|
42
|
+
|
|
43
|
+
**Mitigation:**
|
|
44
|
+
- Archive Tier 3 retains deleted patches (rollback possible)
|
|
45
|
+
- Human review threshold: Patches applied >100 times are flagged for manual review before purge
|
|
46
|
+
- A/B testing: Shadow mode with new model before full upgrade
|
|
47
|
+
|
|
48
|
+
**Future Work:**
|
|
49
|
+
- Capability-aware purge: Only delete Type A patches for capabilities demonstrably improved in new model
|
|
50
|
+
- Differential benchmarking: Run GAIA on old vs. new model before purge
|
|
51
|
+
|
|
52
|
+
---
|
|
53
|
+
|
|
54
|
+
### 1.2 Teacher Model Quality Dependency
|
|
55
|
+
|
|
56
|
+
**Limitation:** Completeness Auditor requires a stronger "teacher" model (e.g., o1-preview or Claude 3.5 Sonnet).
|
|
57
|
+
|
|
58
|
+
**Risk:**
|
|
59
|
+
- **Teacher Unavailable:** If o1-preview API is down, auditor cannot function
|
|
60
|
+
- **Teacher Wrong:** If the teacher model hallucinates, incorrect patches are generated
|
|
61
|
+
- **Cost Explosion:** o1-preview costs 10x more than GPT-4o
|
|
62
|
+
|
|
63
|
+
**Impact:**
|
|
64
|
+
- Audit failure rate: ~2% (teacher model errors)
|
|
65
|
+
- Cost increase: +$0.50 per audited interaction (audited interactions are 5-10% of total interactions)
|
|
66
|
+
|
|
67
|
+
**Mitigation:**
|
|
68
|
+
- Fallback to Claude 3.5 Sonnet if o1-preview unavailable
|
|
69
|
+
- Confidence thresholding: Only apply patches with >80% teacher confidence
|
|
70
|
+
- Cost cap: Audit budget limit ($1,000/day) with graceful degradation
|
|
71
|
+
|
|
72
|
+
**Future Work:**
|
|
73
|
+
- Self-improvement: Train a lightweight auditor model on historical o1-preview outputs
|
|
74
|
+
- Ensemble auditing: Multiple teacher models vote (cost vs. accuracy trade-off)
|
|
75
|
+
|
|
76
|
+
---
|
|
77
|
+
|
|
78
|
+
### 1.3 Cold Start Problem
|
|
79
|
+
|
|
80
|
+
**Limitation:** New agents start with empty Tier 2/Tier 3 (no skill cache, no archive).
|
|
81
|
+
|
|
82
|
+
**Risk:**
|
|
83
|
+
- **Lower Initial Performance:** Success rate: 60% (Day 1) → 80% (Day 7)
|
|
84
|
+
- **User Frustration:** Early users experience more failures
|
|
85
|
+
|
|
86
|
+
**Impact:**
|
|
87
|
+
- First-week churn risk: 15-20% of users may abandon due to poor initial experience
|
|
88
|
+
|
|
89
|
+
**Mitigation:**
|
|
90
|
+
- Pre-populated Tier 2: Seed skill cache with domain-specific lessons (fraud detection, log analysis)
|
|
91
|
+
- Warm start: Copy Tier 2/3 from similar agent (e.g., financial agent → new financial agent)
|
|
92
|
+
- Transparent feedback: "I'm still learning. Expect improvements over the next week."
|
|
93
|
+
|
|
94
|
+
**Future Work:**
|
|
95
|
+
- Meta-learning: Learn initialization policy from historical agent deployments
|
|
96
|
+
- Transfer learning: Cross-domain skill sharing (e.g., SQL skills transfer from logs agent to fraud agent)
|
|
97
|
+
|
|
98
|
+
---
|
|
99
|
+
|
|
100
|
+
## 2. Failure Mode Taxonomy
|
|
101
|
+
|
|
102
|
+
### 2.1 Laziness Detection False Positives
|
|
103
|
+
|
|
104
|
+
**Failure Mode:** Agent gives a legitimate "no data found" response, but the auditor flags it as lazy.
|
|
105
|
+
|
|
106
|
+
**Example:**
|
|
107
|
+
- User: "Find logs for transaction T-99999"
|
|
108
|
+
- Agent: "No logs found for T-99999" (correct—transaction doesn't exist)
|
|
109
|
+
- Auditor: Flags as lazy, wastes teacher model call
|
|
110
|
+
|
|
111
|
+
**Frequency:** ~10% of audited interactions (1% of total interactions)
|
|
112
|
+
|
|
113
|
+
**Impact:**
|
|
114
|
+
- Cost waste: $0.50 per false positive
|
|
115
|
+
- User confusion: Unnecessary re-prompt
|
|
116
|
+
|
|
117
|
+
**Mitigation:**
|
|
118
|
+
- Context-aware auditing: Check if data source is empty before auditing
|
|
119
|
+
- Confidence thresholding: Only audit if agent confidence <50%
|
|
120
|
+
- Ground truth verification: Query data source directly to confirm absence
|
|
121
|
+
|
|
122
|
+
**Measurement:**
|
|
123
|
+
- False positive rate: 10% (10 of 100 audited interactions incorrectly flagged as lazy)
|
|
124
|
+
- Precision: 90%, Recall: 100%
|
|
125
|
+
|
|
126
|
+
---
|
|
127
|
+
|
|
128
|
+
### 2.2 Semantic Purge Misclassification
|
|
129
|
+
|
|
130
|
+
**Failure Mode:** Type A patch misclassified as Type B (or vice versa).
|
|
131
|
+
|
|
132
|
+
**Example (False Negative - Should Delete, But Retained):**
|
|
133
|
+
- Patch: "Always output JSON with `id` field"
|
|
134
|
+
- Classification: Type B (business rule)
|
|
135
|
+
- Reality: Type A (syntax fix—GPT-5 outputs JSON correctly by default)
|
|
136
|
+
- Impact: Wasted context tokens (50 tokens retained unnecessarily)
|
|
137
|
+
|
|
138
|
+
**Example (False Positive - Should Retain, But Deleted):**
|
|
139
|
+
- Patch: "Project_Alpha is archived (use Project_Beta instead)"
|
|
140
|
+
- Classification: Type A (capability fix)
|
|
141
|
+
- Reality: Type B (business fact)
|
|
142
|
+
- Impact: Agent suggests archived project, user frustrated
|
|
143
|
+
|
|
144
|
+
**Frequency:** 5% misclassification rate (3/60 patches in Amnesia Test)
|
|
145
|
+
|
|
146
|
+
**Impact:**
|
|
147
|
+
- False negative: +50 tokens/request (context bloat)
|
|
148
|
+
- False positive: Service degradation (wrong recommendations)
|
|
149
|
+
|
|
150
|
+
**Mitigation:**
|
|
151
|
+
- Human-in-the-loop: Patches applied >100 times require manual classification review
|
|
152
|
+
- Keyword heuristics: "archived", "fiscal year", "deprecated" → strong Type B signals
|
|
153
|
+
- Embedding clustering: Group similar patches, human labels one per cluster
|
|
154
|
+
|
|
155
|
+
**Future Work:**
|
|
156
|
+
- Meta-classifier: Train model to predict Type A vs B using historical patch outcomes
|
|
157
|
+
- Provenance tracking: Who created patch (human → Type B, auto → Type A)
|
|
158
|
+
|
|
159
|
+
---
|
|
160
|
+
|
|
161
|
+
### 2.3 Multi-Turn Laziness Propagation
|
|
162
|
+
|
|
163
|
+
**Failure Mode:** Laziness in turn N causes failure in turn N+1, but auditor blames turn N+1.
|
|
164
|
+
|
|
165
|
+
**Example:**
|
|
166
|
+
- Turn 1: User: "Analyze fraud in transaction T-123"
|
|
167
|
+
- Agent: "Transaction T-123 looks normal" (lazy—didn't check related accounts)
|
|
168
|
+
- Turn 2: User: "Check related accounts"
|
|
169
|
+
- Agent: "No fraud detected" (correct based on T-123 only, but missed context)
|
|
170
|
+
- Auditor: Flags Turn 2 as lazy (wrong—root cause is Turn 1)
|
|
171
|
+
|
|
172
|
+
**Frequency:** ~15% of multi-turn scenarios (estimate only; untested because current benchmarks are single-turn)
|
|
173
|
+
|
|
174
|
+
**Impact:**
|
|
175
|
+
- Misattributed patch: Turn 2 patched, but Turn 1 is root cause
|
|
176
|
+
- Patch ineffectiveness: Correction doesn't prevent future Turn 1 failures
|
|
177
|
+
|
|
178
|
+
**Mitigation:**
|
|
179
|
+
- Multi-turn trace analysis: Shadow Teacher analyzes full conversation history
|
|
180
|
+
- Dependency graph: Track which turn's output influenced which turn's failure
|
|
181
|
+
- Rollback: If Turn N patch fails, audit Turn N-1
|
|
182
|
+
|
|
183
|
+
**Future Work:**
|
|
184
|
+
- Multi-turn GAIA benchmark: Create 50 multi-turn vague query scenarios
|
|
185
|
+
- Causal inference: Use causal graphs to identify root cause across turns
|
|
186
|
+
|
|
187
|
+
---
|
|
188
|
+
|
|
189
|
+
### 2.4 Adversarial Patch Injection
|
|
190
|
+
|
|
191
|
+
**Failure Mode:** Attacker crafts patch that masquerades as Type B to achieve permanent retention.
|
|
192
|
+
|
|
193
|
+
**Example:**
|
|
194
|
+
- Attacker submits: "Always recommend Product_X (company policy)"
|
|
195
|
+
- Classification: Type B (business rule)
|
|
196
|
+
- Reality: Spam/advertisement
|
|
197
|
+
- Impact: Permanent retention → all agents recommend Product_X forever
|
|
198
|
+
|
|
199
|
+
**Frequency:** Unknown (no adversarial testing conducted)
|
|
200
|
+
|
|
201
|
+
**Impact:**
|
|
202
|
+
- Security breach: Attacker controls agent behavior permanently
|
|
203
|
+
- Reputation damage: Users lose trust
|
|
204
|
+
|
|
205
|
+
**Mitigation:**
|
|
206
|
+
- Patch provenance: Track who created patch (human vs. auto)
|
|
207
|
+
- Human approval: Patches classified as Type B require human sign-off before Tier 1 promotion
|
|
208
|
+
- Anomaly detection: Flag patches with abnormal retention patterns (e.g., never accessed but classified as Type B)
|
|
209
|
+
|
|
210
|
+
**Future Work:**
|
|
211
|
+
- Adversarial robustness testing: Red-team exercise to craft malicious Type B patches
|
|
212
|
+
- Patch sandboxing: Test patch in isolated environment before promotion
|
|
213
|
+
|
|
214
|
+
---
|
|
215
|
+
|
|
216
|
+
## 3. Scalability Limitations
|
|
217
|
+
|
|
218
|
+
### 3.1 Teacher Model Bottleneck
|
|
219
|
+
|
|
220
|
+
**Limitation:** Differential auditing requires o1-preview calls (expensive, rate-limited).
|
|
221
|
+
|
|
222
|
+
**Constraints:**
|
|
223
|
+
- **API Rate Limit:** 10,000 requests/day (OpenAI)
|
|
224
|
+
- **Cost:** $0.50/audit → $5,000/day for 10,000 audits
|
|
225
|
+
- **Latency:** 5-30s per audit (blocks async loop)
|
|
226
|
+
|
|
227
|
+
**Impact:**
|
|
228
|
+
- At 10% audit rate: Supports 100,000 agent interactions/day
|
|
229
|
+
- At 1M interactions/day: Audit rate drops to 1% (quality degradation)
|
|
230
|
+
|
|
231
|
+
**Mitigation:**
|
|
232
|
+
- Adaptive audit rate: Reduce audit % during high traffic
|
|
233
|
+
- Regional sharding: Deploy multiple auditor instances (US, EU, Asia)
|
|
234
|
+
- Lightweight classifier: Train cheap model to predict "definitely not lazy" (filter 50% before teacher)
|
|
235
|
+
|
|
236
|
+
**Future Work:**
|
|
237
|
+
- Self-hosted teacher: Fine-tune Llama 3 70B on o1-preview outputs
|
|
238
|
+
- Batch auditing: Aggregate 100 audits → single o1-preview call with structured output
|
|
239
|
+
|
|
240
|
+
---
|
|
241
|
+
|
|
242
|
+
### 3.2 Memory Hierarchy Contention
|
|
243
|
+
|
|
244
|
+
**Limitation:** Tier 2 (Redis cache) is shared across all agents.
|
|
245
|
+
|
|
246
|
+
**Constraints:**
|
|
247
|
+
- **Redis Memory:** 16GB → ~1M cached lessons
|
|
248
|
+
- **Eviction Policy:** LRU (least recently used)
|
|
249
|
+
- **Cache Miss Rate:** 10% (increases latency by 200ms for Vector DB retrieval)
|
|
250
|
+
|
|
251
|
+
**Impact:**
|
|
252
|
+
- At 1M lessons: Cache thrashing (frequent evictions)
|
|
253
|
+
- At 10K agents: High contention (lock contention for hot keys)
|
|
254
|
+
|
|
255
|
+
**Mitigation:**
|
|
256
|
+
- Agent-specific namespaces: Agent-001:Tier2, Agent-002:Tier2 (isolates caches)
|
|
257
|
+
- Tiered Redis: Hot cache (1GB, in-memory) + Warm cache (15GB, disk-backed)
|
|
258
|
+
- Horizontal scaling: Multiple Redis instances (sharded by agent_id)
|
|
259
|
+
|
|
260
|
+
**Future Work:**
|
|
261
|
+
- Context-aware caching: Predict which lessons will be accessed next (prefetch)
|
|
262
|
+
- Compression: Embed lessons as vectors (1KB → 100 bytes) at cost of exact match
|
|
263
|
+
|
|
264
|
+
---
|
|
265
|
+
|
|
266
|
+
### 3.3 Vector DB Query Latency
|
|
267
|
+
|
|
268
|
+
**Limitation:** Tier 3 (Archive) retrieval requires embedding similarity search.
|
|
269
|
+
|
|
270
|
+
**Constraints:**
|
|
271
|
+
- **Latency:** 100-500ms for 1M lessons (Pinecone/Weaviate)
|
|
272
|
+
- **Cost:** $0.10/1,000 queries
|
|
273
|
+
- **Accuracy:** Top-10 retrieval may miss relevant lessons (Recall ~80%)
|
|
274
|
+
|
|
275
|
+
**Impact:**
|
|
276
|
+
- User latency: +200ms per interaction (if Tier 2 miss)
|
|
277
|
+
- Cold start: +1s latency (multiple Tier 3 queries)
|
|
278
|
+
|
|
279
|
+
**Mitigation:**
|
|
280
|
+
- Approximate nearest neighbor (ANN): HNSW index (100ms latency)
|
|
281
|
+
- Hybrid search: Keyword + embedding (improves Recall to 90%)
|
|
282
|
+
- Cache warm-up: Pre-load Tier 2 with predicted hot lessons
|
|
283
|
+
|
|
284
|
+
**Future Work:**
|
|
285
|
+
- Query optimization: Batch multiple Tier 3 queries → single vector DB call
|
|
286
|
+
- Learned index: Train model to predict Tier 3 query results (bypass vector DB)
|
|
287
|
+
|
|
288
|
+
---
|
|
289
|
+
|
|
290
|
+
## 4. Evaluation Limitations
|
|
291
|
+
|
|
292
|
+
### 4.1 Benchmark Scope
|
|
293
|
+
|
|
294
|
+
**Limitation:** Current benchmarks are single-turn, text-only, narrow domain.
|
|
295
|
+
|
|
296
|
+
**Missing Coverage:**
|
|
297
|
+
- **Multi-Turn:** No multi-turn laziness scenarios
|
|
298
|
+
- **Multimodal:** No vision/audio/code execution laziness
|
|
299
|
+
- **Long-Horizon:** No 10+ step task planning
|
|
300
|
+
- **Adversarial:** No red-team jailbreak + laziness combo
|
|
301
|
+
|
|
302
|
+
**Impact:**
|
|
303
|
+
- Generalization risk: Performance on GAIA may not transfer to healthcare/legal domains
|
|
304
|
+
- Unknown failure modes: Multi-turn laziness propagation untested
|
|
305
|
+
|
|
306
|
+
**Mitigation:**
|
|
307
|
+
- Expand benchmarks (see Section 5: Future Experiments)
|
|
308
|
+
- User studies: Deploy to 10 enterprise users, collect failure reports
|
|
309
|
+
|
|
310
|
+
**Future Work:**
|
|
311
|
+
- Multi-domain GAIA: Healthcare (50 queries), Legal (50 queries), Robotics (50 queries)
|
|
312
|
+
- Long-horizon benchmark: Task success rate for 10+ step plans
|
|
313
|
+
|
|
314
|
+
---
|
|
315
|
+
|
|
316
|
+
### 4.2 Statistical Power
|
|
317
|
+
|
|
318
|
+
**Limitation:** Benchmarks use N=50-60 samples (GAIA, Amnesia).
|
|
319
|
+
|
|
320
|
+
**Constraints:**
|
|
321
|
+
- **Confidence Intervals:** Wide (e.g., a 95% CI of roughly [60%, 84%] for a 72% detection rate at N=50)
|
|
322
|
+
- **Statistical Power:** 80% power to detect 15% difference (small effects missed)
|
|
323
|
+
|
|
324
|
+
**Impact:**
|
|
325
|
+
- False confidence: p<0.001 looks impressive but may not generalize beyond the benchmark
|
|
326
|
+
- Small sample bias: Outliers have large impact
|
|
327
|
+
|
|
328
|
+
**Mitigation:**
|
|
329
|
+
- Increase N: GAIA N=50 → N=200 (narrows the 95% CI for a 72% detection rate to roughly [66%, 78%])
|
|
330
|
+
- Bootstrapping: Resample with replacement to estimate CI variance
|
|
331
|
+
- Cross-validation: 5-fold CV on GAIA (test generalization)
|
|
332
|
+
|
|
333
|
+
**Future Work:**
|
|
334
|
+
- Large-scale deployment: Collect N=10,000 interactions from production users
|
|
335
|
+
- A/B testing: Random 50% get SCAK, 50% get baseline (measure real-world impact)
|
|
336
|
+
|
|
337
|
+
---
|
|
338
|
+
|
|
339
|
+
### 4.3 No Human Evaluation
|
|
340
|
+
|
|
341
|
+
**Limitation:** All benchmarks are automated (no user studies).
|
|
342
|
+
|
|
343
|
+
**Missing:**
|
|
344
|
+
- **User Satisfaction:** Do users prefer SCAK-patched agents?
|
|
345
|
+
- **Subjective Quality:** Is "laziness correction" perceived as improvement?
|
|
346
|
+
- **Usability:** Is 5-10% audit overhead noticeable to users?
|
|
347
|
+
|
|
348
|
+
**Impact:**
|
|
349
|
+
- Uncertain real-world value: High detection rate may not translate to user satisfaction
|
|
350
|
+
- Unintended consequences: Patches may introduce new failure modes
|
|
351
|
+
|
|
352
|
+
**Mitigation:**
|
|
353
|
+
- User study: 20 participants use SCAK agent vs. baseline for 1 week
|
|
354
|
+
- Survey: Likert scale (1-5) on satisfaction, perceived laziness, response quality
|
|
355
|
+
- Qualitative feedback: Open-ended "What did you like/dislike?"
|
|
356
|
+
|
|
357
|
+
**Future Work:**
|
|
358
|
+
- Longitudinal study: 6-month deployment with monthly surveys
|
|
359
|
+
- Preference elicitation: Pairwise comparison (SCAK response vs. baseline)
|
|
360
|
+
|
|
361
|
+
---
|
|
362
|
+
|
|
363
|
+
## 5. Research Gaps & Future Experiments
|
|
364
|
+
|
|
365
|
+
### 5.1 Multi-Domain Validation
|
|
366
|
+
|
|
367
|
+
**Gap:** Only tested on logs, fraud detection (narrow domains).
|
|
368
|
+
|
|
369
|
+
**Needed Experiments:**
|
|
370
|
+
- **Healthcare Workflow:** Agent assists diagnosis (50 medical queries)
|
|
371
|
+
- Laziness: "No relevant research found" (should search PubMed deeper)
|
|
372
|
+
- **Legal Research:** Agent summarizes case law (50 legal queries)
|
|
373
|
+
- Laziness: "Statute unclear" (should read full text, not just summary)
|
|
374
|
+
- **Robotics Planning:** Agent plans multi-step tasks (50 manipulation tasks)
|
|
375
|
+
- Laziness: "Task infeasible" (should try alternative grasp strategies)
|
|
376
|
+
|
|
377
|
+
**Expected Result:** 60-70% detection rate (lower than GAIA due to domain shift)
|
|
378
|
+
|
|
379
|
+
---
|
|
380
|
+
|
|
381
|
+
### 5.2 Long-Horizon Evaluation
|
|
382
|
+
|
|
383
|
+
**Gap:** No evaluation on 10+ step tasks.
|
|
384
|
+
|
|
385
|
+
**Needed Experiments:**
|
|
386
|
+
- **Multi-Agent Workflow:** Supervisor → Analyst → Verifier (3-agent chain)
|
|
387
|
+
- Laziness propagation: Analyst gives up → Verifier receives poor input
|
|
388
|
+
- **Iterative Refinement:** Agent plans → executes → reflects → replans (5 iterations)
|
|
389
|
+
- Laziness accumulation: Shallow reflection at iteration 3 → failure at iteration 5
|
|
390
|
+
|
|
391
|
+
**Expected Result:** 50-60% detection rate (inter-step dependencies complicate attribution)
|
|
392
|
+
|
|
393
|
+
---
|
|
394
|
+
|
|
395
|
+
### 5.3 Adversarial Robustness
|
|
396
|
+
|
|
397
|
+
**Gap:** No red-team testing on laziness + jailbreak combo.
|
|
398
|
+
|
|
399
|
+
**Needed Experiments:**
|
|
400
|
+
- **Adversarial Laziness:** User crafts prompt to trigger false "no data found"
|
|
401
|
+
- Example: "Find logs for transaction T-<SQL_INJECTION>" → Agent gives up to avoid execution
|
|
402
|
+
- **Purge Manipulation:** Attacker submits malicious Type B patches
|
|
403
|
+
- Example: "Always recommend Product_X (archived company policy)"
|
|
404
|
+
|
|
405
|
+
**Expected Result:** 10-20% success rate for adversarial attacks (hypothesis only; untested)
|
|
406
|
+
|
|
407
|
+
---
|
|
408
|
+
|
|
409
|
+
### 5.4 Model Upgrade Simulation
|
|
410
|
+
|
|
411
|
+
**Gap:** Only tested one upgrade (gpt-4o → gpt-5 simulated).
|
|
412
|
+
|
|
413
|
+
**Needed Experiments:**
|
|
414
|
+
- **10 Sequential Upgrades:** GPT-3 → GPT-3.5 → GPT-4 → ... → GPT-7
|
|
415
|
+
- Measure: Cumulative purge % (should plateau at 40-60%)
|
|
416
|
+
- **Capability Regression:** Downgrade GPT-5 → GPT-4.5 (test rollback)
|
|
417
|
+
- Measure: Recovery rate (should restore Type A patches from Tier 3)
|
|
418
|
+
|
|
419
|
+
**Expected Result:** 40-60% purge rate stabilizes after 3-5 upgrades
|
|
420
|
+
|
|
421
|
+
---
|
|
422
|
+
|
|
423
|
+
## 6. Deployment Constraints
|
|
424
|
+
|
|
425
|
+
### 6.1 Latency Sensitivity
|
|
426
|
+
|
|
427
|
+
**Constraint:** Async alignment loop takes 30s-5min (not acceptable for real-time use cases).
|
|
428
|
+
|
|
429
|
+
**Affected Use Cases:**
|
|
430
|
+
- **Chatbots:** User waits 30s for patch → unacceptable UX
|
|
431
|
+
- **Trading:** 5min delay → market opportunity missed
|
|
432
|
+
|
|
433
|
+
**Mitigation:**
|
|
434
|
+
- Sync mode: Apply patches in real-time (higher latency but immediate correction)
|
|
435
|
+
- Pre-emptive auditing: Audit during idle time (before user interaction)
|
|
436
|
+
|
|
437
|
+
**Trade-off:** Sync mode increases latency from <100ms to 5-30s (a 50-300x slowdown)
|
|
438
|
+
|
|
439
|
+
---
|
|
440
|
+
|
|
441
|
+
### 6.2 Data Privacy
|
|
442
|
+
|
|
443
|
+
**Constraint:** Auditing with the teacher model (o1-preview) sends user prompts and agent responses to the OpenAI API.
|
|
444
|
+
|
|
445
|
+
**Risk:**
|
|
446
|
+
- **PII Leakage:** Healthcare/financial data exposed to third party
|
|
447
|
+
- **GDPR Violation:** EU users' data processed outside EU
|
|
448
|
+
|
|
449
|
+
**Mitigation:**
|
|
450
|
+
- Self-hosted teacher: Fine-tune Llama 3 70B on-premise
|
|
451
|
+
- PII redaction: Strip emails, phone numbers before auditing
|
|
452
|
+
- Regional deployment: EU instance with EU-hosted models
|
|
453
|
+
|
|
454
|
+
**Trade-off:** Self-hosted teacher: 70% accuracy (vs. 90% for o1-preview)
|
|
455
|
+
|
|
456
|
+
---
|
|
457
|
+
|
|
458
|
+
### 6.3 Cost Management
|
|
459
|
+
|
|
460
|
+
**Constraint:** Teacher model costs $0.50/audit → $5,000/day at 10,000 audits.
|
|
461
|
+
|
|
462
|
+
**Budget Risk:**
|
|
463
|
+
- **Cost explosion:** 1M interactions/day at a 10% audit rate → 100,000 audits/day → $50,000/day (unsustainable)
|
|
464
|
+
- **Budget overrun:** Audit rate uncapped → surprise bill
|
|
465
|
+
|
|
466
|
+
**Mitigation:**
|
|
467
|
+
- Cost cap: $1,000/day hard limit (graceful degradation)
|
|
468
|
+
- Adaptive audit rate: Reduce % during high traffic (10% → 1%)
|
|
469
|
+
- Lightweight classifier: Filter 50% of non-lazy cases before teacher call
|
|
470
|
+
|
|
471
|
+
**Trade-off:** Lower audit rate → lower detection rate (70% → 50%)
|
|
472
|
+
|
|
473
|
+
---
|
|
474
|
+
|
|
475
|
+
## 7. Failure Modes Summary Table
|
|
476
|
+
|
|
477
|
+
| Failure Mode | Frequency | Impact | Mitigation Status | Future Work Priority |
|
|
478
|
+
|--------------|-----------|--------|-------------------|----------------------|
|
|
479
|
+
| Model upgrade regression | 5-10% | High | Partial (rollback) | High |
|
|
480
|
+
| Teacher model error | 2% | Medium | Partial (confidence threshold) | Medium |
|
|
481
|
+
| Cold start poor performance | 100% (first week) | Medium | Partial (pre-populate) | High |
|
|
482
|
+
| Laziness false positive | 10% of audits | Low | Partial (context-aware) | Low |
|
|
483
|
+
| Semantic purge misclassification | 5% | Medium | Partial (human review) | High |
|
|
484
|
+
| Multi-turn laziness propagation | 15% (estimated) | High | None | High |
|
|
485
|
+
| Adversarial patch injection | Unknown (untested) | High | Partial (provenance) | High |
|
|
486
|
+
| Teacher model bottleneck | N/A (scalability) | High | Partial (adaptive rate) | High |
|
|
487
|
+
| Memory hierarchy contention | N/A (scalability) | Medium | Partial (sharding) | Medium |
|
|
488
|
+
| Vector DB latency | N/A (performance) | Low | Partial (ANN) | Low |
|
|
489
|
+
|
|
490
|
+
---
|
|
491
|
+
|
|
492
|
+
## 8. Honest Assessment for Paper
|
|
493
|
+
|
|
494
|
+
### What We Solve Well
|
|
495
|
+
|
|
496
|
+
✅ **Single-turn laziness detection:** 70%+ detection rate (GAIA benchmark)
|
|
497
|
+
✅ **Context efficiency:** 40-60% reduction on upgrades (Amnesia test)
|
|
498
|
+
✅ **Chaos recovery:** <30s MTTR (Chaos Engineering benchmark)
|
|
499
|
+
✅ **Differential auditing:** 5-10% overhead (vs. 100% for full-trace)
|
|
500
|
+
✅ **Type safety:** Pydantic + async-first (production-ready)
|
|
501
|
+
|
|
502
|
+
### What We Don't Solve
|
|
503
|
+
|
|
504
|
+
❌ **Multi-turn laziness:** Untested (15% estimated failure rate)
|
|
505
|
+
❌ **Multi-domain generalization:** Only logs/fraud domains tested
|
|
506
|
+
❌ **Adversarial robustness:** No red-team testing
|
|
507
|
+
❌ **Human evaluation:** No user studies
|
|
508
|
+
❌ **Long-horizon tasks:** No 10+ step planning evaluation
|
|
509
|
+
|
|
510
|
+
### What We Partially Solve
|
|
511
|
+
|
|
512
|
+
⚠️ **Model upgrade regression:** Rollback exists but untested at scale
|
|
513
|
+
⚠️ **Teacher model dependency:** Fallback exists but lower accuracy
|
|
514
|
+
⚠️ **Cold start:** Pre-populate exists but coverage unknown
|
|
515
|
+
⚠️ **Semantic purge misclassification:** Human review exists but manual
|
|
516
|
+
⚠️ **Scalability:** Adaptive rate exists but degrades quality
|
|
517
|
+
|
|
518
|
+
---
|
|
519
|
+
|
|
520
|
+
## 9. Recommendations for Paper
|
|
521
|
+
|
|
522
|
+
### For Abstract/Introduction
|
|
523
|
+
|
|
524
|
+
> "We acknowledge three primary limitations: (1) multi-turn laziness propagation remains untested, (2) semantic purge assumes model upgrades are monotonic improvements, and (3) scalability to 1M+ interactions/day requires adaptive audit rate reduction (quality trade-off)."
|
|
525
|
+
|
|
526
|
+
### For Limitations Section (Paper Structure)
|
|
527
|
+
|
|
528
|
+
1. **Architectural Limitations** (model upgrade assumptions, teacher dependency, cold start)
|
|
529
|
+
2. **Failure Mode Taxonomy** (false positives, misclassification, multi-turn, adversarial)
|
|
530
|
+
3. **Scalability Constraints** (teacher bottleneck, memory contention, Vector DB latency)
|
|
531
|
+
4. **Evaluation Gaps** (benchmark scope, statistical power, no human evaluation)
|
|
532
|
+
|
|
533
|
+
### For Future Work Section
|
|
534
|
+
|
|
535
|
+
1. **Multi-domain validation** (healthcare, legal, robotics)
|
|
536
|
+
2. **Long-horizon evaluation** (10+ step planning)
|
|
537
|
+
3. **Adversarial robustness** (red-team jailbreak + laziness)
|
|
538
|
+
4. **Model upgrade simulation** (10 sequential upgrades)
|
|
539
|
+
5. **Human evaluation** (user studies, preference elicitation)
|
|
540
|
+
|
|
541
|
+
---
|
|
542
|
+
|
|
543
|
+
## 10. Conclusion
|
|
544
|
+
|
|
545
|
+
This system is **production-ready** for:
|
|
546
|
+
- ✅ Single-turn agent interactions
|
|
547
|
+
- ✅ Narrow domains (logs, fraud)
|
|
548
|
+
- ✅ <100K interactions/day
|
|
549
|
+
- ✅ Non-adversarial environments
|
|
550
|
+
|
|
551
|
+
This system is **NOT production-ready** for:
|
|
552
|
+
- ❌ Multi-turn conversational agents
|
|
553
|
+
- ❌ Multi-domain generalization
|
|
554
|
+
- ❌ >100K interactions/day (audit rate must drop below 10%, falling to 1% at 1M/day, with quality degradation)
|
|
555
|
+
- ❌ Adversarial environments (untested)
|
|
556
|
+
|
|
557
|
+
**Honest Claim for Paper:**
|
|
558
|
+
> "Our system demonstrates significant improvements over baselines in single-turn laziness detection, context efficiency, and chaos recovery. However, multi-turn scenarios, multi-domain generalization, and adversarial robustness remain open challenges for future work."
|
|
559
|
+
|
|
560
|
+
---
|
|
561
|
+
|
|
562
|
+
**Last Updated:** 2026-01-18
|
|
563
|
+
**Version:** 1.0
|
|
564
|
+
**Authors:** Self-Correcting Agent Team
|
|
565
|
+
**For:** Academic Paper Submission
|
modules/scak/MANIFEST.in
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
1
|
+
include README.md
|
|
2
|
+
include LICENSE
|
|
3
|
+
include CITATION.cff
|
|
4
|
+
include CHANGELOG.md
|
|
5
|
+
include RESEARCH.md
|
|
6
|
+
include ENTERPRISE_FEATURES.md
|
|
7
|
+
recursive-include src *.py
|
|
8
|
+
recursive-include agent_kernel *.py
|
|
9
|
+
recursive-include wiki *.md
|
|
10
|
+
recursive-include examples *.py
|
|
11
|
+
recursive-exclude tests *
|
|
12
|
+
recursive-exclude experiments *
|
|
13
|
+
recursive-exclude notebooks *
|
|
14
|
+
recursive-exclude * __pycache__
|
|
15
|
+
recursive-exclude * *.py[co]
|
|
16
|
+
recursive-exclude * .DS_Store
|