agent-os-kernel 1.1.0__py3-none-any.whl → 1.3.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- agent_os/__init__.py +66 -4
- agent_os/agents_compat.py +286 -0
- agent_os/base_agent.py +308 -0
- agent_os/cli.py +1079 -19
- agent_os/integrations/__init__.py +37 -2
- agent_os/integrations/openai_adapter.py +502 -0
- agent_os/integrations/semantic_kernel_adapter.py +569 -0
- agent_os/stateless.py +349 -0
- agent_os_kernel-1.3.0.dist-info/METADATA +676 -0
- agent_os_kernel-1.3.0.dist-info/RECORD +1053 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.3.0.dist-info}/entry_points.txt +0 -1
- modules/amb/.github/workflows/ci.yml +102 -0
- modules/amb/.github/workflows/publish.yml +146 -0
- modules/amb/.gitignore +134 -0
- modules/amb/CHANGELOG.md +118 -0
- modules/amb/CONTRIBUTING.md +141 -0
- modules/amb/LICENSE +21 -0
- modules/amb/README.md +188 -0
- modules/amb/amb_core/__init__.py +175 -0
- modules/amb/amb_core/adapters/__init__.py +55 -0
- modules/amb/amb_core/adapters/aws_sqs_broker.py +374 -0
- modules/amb/amb_core/adapters/azure_servicebus_broker.py +338 -0
- modules/amb/amb_core/adapters/kafka_broker.py +258 -0
- modules/amb/amb_core/adapters/nats_broker.py +283 -0
- modules/amb/amb_core/adapters/rabbitmq_broker.py +233 -0
- modules/amb/amb_core/adapters/redis_broker.py +260 -0
- modules/amb/amb_core/broker.py +143 -0
- modules/amb/amb_core/bus.py +479 -0
- modules/amb/amb_core/cloudevents.py +507 -0
- modules/amb/amb_core/dlq.py +343 -0
- modules/amb/amb_core/hf_utils.py +534 -0
- modules/amb/amb_core/memory_broker.py +408 -0
- modules/amb/amb_core/models.py +139 -0
- modules/amb/amb_core/persistence.py +527 -0
- modules/amb/amb_core/schema.py +292 -0
- modules/amb/amb_core/tracing.py +356 -0
- modules/amb/examples/advanced_features.py +223 -0
- modules/amb/examples/backpressure_demo.py +225 -0
- modules/amb/examples/basic_usage.py +117 -0
- modules/amb/examples/tracing_demo.py +104 -0
- modules/amb/experiments/README.md +52 -0
- modules/amb/experiments/reproduce_results.py +467 -0
- modules/amb/experiments/results.json +324 -0
- modules/amb/paper/README.md +40 -0
- modules/amb/paper/paper.tex +365 -0
- modules/amb/paper/whitepaper.md +377 -0
- modules/amb/pyproject.toml +117 -0
- modules/amb/tests/__init__.py +1 -0
- modules/amb/tests/test_backpressure_priority.py +280 -0
- modules/amb/tests/test_bus.py +198 -0
- modules/amb/tests/test_cloudevents.py +443 -0
- modules/amb/tests/test_features.py +531 -0
- modules/amb/tests/test_models.py +74 -0
- modules/amb/tests/test_tracing.py +254 -0
- modules/atr/.github/workflows/ci.yml +101 -0
- modules/atr/.github/workflows/publish.yml +140 -0
- modules/atr/.gitignore +134 -0
- modules/atr/.pre-commit-config.yaml +37 -0
- modules/atr/CHANGELOG.md +39 -0
- modules/atr/CONTRIBUTING.md +96 -0
- modules/atr/IMPLEMENTATION_SUMMARY.md +143 -0
- modules/atr/README.md +180 -0
- modules/atr/atr/__init__.py +638 -0
- modules/atr/atr/access.py +346 -0
- modules/atr/atr/composition.py +643 -0
- modules/atr/atr/decorator.py +355 -0
- modules/atr/atr/executor.py +382 -0
- modules/atr/atr/health.py +555 -0
- modules/atr/atr/hf_utils.py +447 -0
- modules/atr/atr/injection.py +420 -0
- modules/atr/atr/metrics.py +438 -0
- modules/atr/atr/policies.py +401 -0
- modules/atr/atr/py.typed +2 -0
- modules/atr/atr/registry.py +450 -0
- modules/atr/atr/schema.py +478 -0
- modules/atr/atr/tools/safe/__init__.py +73 -0
- modules/atr/atr/tools/safe/calculator.py +380 -0
- modules/atr/atr/tools/safe/datetime_tool.py +441 -0
- modules/atr/atr/tools/safe/file_reader.py +400 -0
- modules/atr/atr/tools/safe/http_client.py +314 -0
- modules/atr/atr/tools/safe/json_parser.py +372 -0
- modules/atr/atr/tools/safe/text_tool.py +526 -0
- modules/atr/atr/tools/safe/toolkit.py +173 -0
- modules/atr/docs/PYPI_SETUP.md +113 -0
- modules/atr/examples/README.md +27 -0
- modules/atr/examples/demo.py +144 -0
- modules/atr/examples/sandbox_demo.py +218 -0
- modules/atr/experiments/README.md +69 -0
- modules/atr/experiments/reproduce_results.py +509 -0
- modules/atr/experiments/results/.gitkeep +0 -0
- modules/atr/experiments/results/results_20260123_140334.json +71 -0
- modules/atr/paper/README.md +36 -0
- modules/atr/paper/figures/.gitkeep +0 -0
- modules/atr/paper/references.bib +84 -0
- modules/atr/paper/structure.tex +293 -0
- modules/atr/paper/whitepaper.md +234 -0
- modules/atr/pyproject.toml +148 -0
- modules/atr/requirements.txt +1 -0
- modules/atr/setup.py +30 -0
- modules/atr/tests/__init__.py +1 -0
- modules/atr/tests/test_decorator.py +317 -0
- modules/atr/tests/test_executor.py +245 -0
- modules/atr/tests/test_integration_executor.py +184 -0
- modules/atr/tests/test_registry.py +312 -0
- modules/atr/tests/test_schema.py +182 -0
- modules/atr/tests/test_v2_features.py +708 -0
- modules/caas/.dockerignore +63 -0
- modules/caas/.github/ISSUE_TEMPLATE/bug_report.md +38 -0
- modules/caas/.github/ISSUE_TEMPLATE/custom.md +10 -0
- modules/caas/.github/ISSUE_TEMPLATE/feature_request.md +20 -0
- modules/caas/.github/workflows/ci.yml +100 -0
- modules/caas/.github/workflows/lint.yml +39 -0
- modules/caas/.github/workflows/publish-pypi.yml +124 -0
- modules/caas/.gitignore +73 -0
- modules/caas/.pre-commit-config.yaml +33 -0
- modules/caas/CHANGELOG.md +58 -0
- modules/caas/CONTRIBUTING.md +346 -0
- modules/caas/Dockerfile +41 -0
- modules/caas/LICENSE +21 -0
- modules/caas/MANIFEST.in +11 -0
- modules/caas/README.md +158 -0
- modules/caas/benchmarks/README.md +255 -0
- modules/caas/benchmarks/create_hf_dataset.py +502 -0
- modules/caas/benchmarks/data/sample_corpus/README.md +86 -0
- modules/caas/benchmarks/data/sample_corpus/auth_module.py +211 -0
- modules/caas/benchmarks/data/sample_corpus/contribution_guide.md +185 -0
- modules/caas/benchmarks/data/sample_corpus/remote_work_policy.html +57 -0
- modules/caas/benchmarks/hf_dataset/README.md +214 -0
- modules/caas/benchmarks/hf_dataset/caas_benchmark_corpus.py +73 -0
- modules/caas/benchmarks/hf_dataset/corpus_preview.json +193 -0
- modules/caas/benchmarks/results/README.md +66 -0
- modules/caas/benchmarks/results/evaluation_2026-01-20.json +121 -0
- modules/caas/benchmarks/run_evaluation.py +561 -0
- modules/caas/benchmarks/statistical_tests.py +289 -0
- modules/caas/benchmarks/verify_sample_corpus.py +83 -0
- modules/caas/docker-compose.yml +38 -0
- modules/caas/docs/CONTEXT_TRIAD.md +462 -0
- modules/caas/docs/CONTRIBUTING.md +346 -0
- modules/caas/docs/ETHICS_AND_LIMITATIONS.md +336 -0
- modules/caas/docs/HEURISTIC_ROUTER.md +442 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY.md +363 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_CONTEXT_TRIAD.md +277 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_HEURISTIC_ROUTER.md +231 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_METADATA_INJECTION.md +258 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_PRAGMATIC_TRUTH.md +212 -0
- modules/caas/docs/IMPLEMENTATION_SUMMARY_TRUST_GATEWAY.md +319 -0
- modules/caas/docs/LAYER_1_PRIMITIVE.md +202 -0
- modules/caas/docs/METADATA_INJECTION.md +404 -0
- modules/caas/docs/PRAGMATIC_TRUTH.md +431 -0
- modules/caas/docs/RELATED_WORK.md +312 -0
- modules/caas/docs/RELEASE_CHECKLIST.md +219 -0
- modules/caas/docs/RELEASE_GUIDE.md +285 -0
- modules/caas/docs/REPRODUCIBILITY.md +386 -0
- modules/caas/docs/SLIDING_WINDOW.md +387 -0
- modules/caas/docs/STRUCTURE_AWARE_INDEXING.md +158 -0
- modules/caas/docs/TESTING.md +259 -0
- modules/caas/docs/THREAT_MODEL.md +247 -0
- modules/caas/docs/TRUST_GATEWAY.md +575 -0
- modules/caas/docs/VFS.md +298 -0
- modules/caas/examples/agents/enterprise_security_agent.py +414 -0
- modules/caas/examples/agents/intelligent_document_analyzer.py +380 -0
- modules/caas/examples/demos/demo.py +309 -0
- modules/caas/examples/demos/demo_context_triad.py +225 -0
- modules/caas/examples/demos/demo_conversation_manager.py +285 -0
- modules/caas/examples/demos/demo_heuristic_router.py +133 -0
- modules/caas/examples/demos/demo_metadata_injection.py +198 -0
- modules/caas/examples/demos/demo_pragmatic_truth.py +303 -0
- modules/caas/examples/demos/demo_structure_aware.py +140 -0
- modules/caas/examples/demos/demo_time_decay.py +247 -0
- modules/caas/examples/demos/demo_trust_gateway.py +383 -0
- modules/caas/examples/multi_agent/README.md +159 -0
- modules/caas/examples/multi_agent/research_team.py +369 -0
- modules/caas/examples/multi_agent/vfs_collaboration.py +393 -0
- modules/caas/examples/usage/auth_module.py +142 -0
- modules/caas/examples/usage/usage_example.py +173 -0
- modules/caas/experiments/README.md +42 -0
- modules/caas/experiments/reproduce_results.py +462 -0
- modules/caas/paper/ARXIV_METADATA.md +145 -0
- modules/caas/paper/ARXIV_README.md +47 -0
- modules/caas/paper/CHECKLIST.md +103 -0
- modules/caas/paper/GITHUB_RELEASE_NOTES.md +105 -0
- modules/caas/paper/README.md +71 -0
- modules/caas/paper/abstract.md +24 -0
- modules/caas/paper/arxiv_submission.tar +0 -0
- modules/caas/paper/arxiv_submission.zip +0 -0
- modules/caas/paper/build_pdf.py +355 -0
- modules/caas/paper/experiments.md +149 -0
- modules/caas/paper/figures/.gitkeep +0 -0
- modules/caas/paper/figures/README.md +237 -0
- modules/caas/paper/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/figures/fig1_system_architecture.svg +198 -0
- modules/caas/paper/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/figures/fig2_context_triad.svg +105 -0
- modules/caas/paper/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/figures/fig3_ablation_results.svg +113 -0
- modules/caas/paper/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/figures/fig4_routing_latency.svg +97 -0
- modules/caas/paper/intro.md +103 -0
- modules/caas/paper/latex/figures/fig1_system_architecture.png +0 -0
- modules/caas/paper/latex/figures/fig2_context_triad.png +0 -0
- modules/caas/paper/latex/figures/fig3_ablation_results.png +0 -0
- modules/caas/paper/latex/figures/fig4_routing_latency.png +0 -0
- modules/caas/paper/latex/main.tex +468 -0
- modules/caas/paper/latex/references.bib +140 -0
- modules/caas/paper/method.md +350 -0
- modules/caas/paper/outline.md +123 -0
- modules/caas/paper/related_work.md +101 -0
- modules/caas/paper/tables/.gitkeep +0 -0
- modules/caas/paper/tables/results_tables.md +50 -0
- modules/caas/pyproject.toml +172 -0
- modules/caas/requirements.txt +11 -0
- modules/caas/src/caas/__init__.py +232 -0
- modules/caas/src/caas/api/__init__.py +7 -0
- modules/caas/src/caas/api/server.py +1326 -0
- modules/caas/src/caas/caching.py +832 -0
- modules/caas/src/caas/cli.py +208 -0
- modules/caas/src/caas/conversation.py +221 -0
- modules/caas/src/caas/decay.py +118 -0
- modules/caas/src/caas/detection/__init__.py +7 -0
- modules/caas/src/caas/detection/detector.py +236 -0
- modules/caas/src/caas/enrichment.py +127 -0
- modules/caas/src/caas/gateway/__init__.py +24 -0
- modules/caas/src/caas/gateway/trust_gateway.py +471 -0
- modules/caas/src/caas/hf_utils.py +477 -0
- modules/caas/src/caas/ingestion/__init__.py +21 -0
- modules/caas/src/caas/ingestion/processors.py +251 -0
- modules/caas/src/caas/ingestion/structure_parser.py +185 -0
- modules/caas/src/caas/models.py +354 -0
- modules/caas/src/caas/pragmatic_truth.py +441 -0
- modules/caas/src/caas/routing/__init__.py +8 -0
- modules/caas/src/caas/routing/heuristic_router.py +242 -0
- modules/caas/src/caas/storage/__init__.py +7 -0
- modules/caas/src/caas/storage/store.py +450 -0
- modules/caas/src/caas/triad.py +472 -0
- modules/caas/src/caas/tuning/__init__.py +7 -0
- modules/caas/src/caas/tuning/tuner.py +322 -0
- modules/caas/src/caas/vfs/__init__.py +12 -0
- modules/caas/src/caas/vfs/filesystem.py +450 -0
- modules/caas/tests/__init__.py +3 -0
- modules/caas/tests/conftest.py +8 -0
- modules/caas/tests/test_caching.py +628 -0
- modules/caas/tests/test_context_triad.py +385 -0
- modules/caas/tests/test_conversation_manager.py +289 -0
- modules/caas/tests/test_functionality.py +215 -0
- modules/caas/tests/test_heuristic_router.py +370 -0
- modules/caas/tests/test_metadata_injection.py +328 -0
- modules/caas/tests/test_pragmatic_truth.py +322 -0
- modules/caas/tests/test_structure_aware_indexing.py +283 -0
- modules/caas/tests/test_time_decay.py +268 -0
- modules/caas/tests/test_trust_gateway.py +445 -0
- modules/caas/tests/test_vfs.py +298 -0
- modules/cmvk/.github/FUNDING.yml +9 -0
- modules/cmvk/.github/dependabot.yml +54 -0
- modules/cmvk/.github/workflows/ci.yml +205 -0
- modules/cmvk/.github/workflows/publish.yml +143 -0
- modules/cmvk/.gitignore +147 -0
- modules/cmvk/.pre-commit-config.yaml +58 -0
- modules/cmvk/CHANGELOG.md +146 -0
- modules/cmvk/CITATION.cff +48 -0
- modules/cmvk/CONTRIBUTING.md +229 -0
- modules/cmvk/Dockerfile +87 -0
- modules/cmvk/HF_MODEL_CARD.md +185 -0
- modules/cmvk/LICENSE +21 -0
- modules/cmvk/README.md +149 -0
- modules/cmvk/SECURITY.md +114 -0
- modules/cmvk/config/prompts/generator_v1.txt +23 -0
- modules/cmvk/config/prompts/verifier_hostile.txt +32 -0
- modules/cmvk/config/settings.yaml +40 -0
- modules/cmvk/coverage_html/.gitignore +2 -0
- modules/cmvk/coverage_html/class_index.html +658 -0
- modules/cmvk/coverage_html/coverage_html_cb_188fc9a4.js +735 -0
- modules/cmvk/coverage_html/favicon_32_cb_c827f16f.png +0 -0
- modules/cmvk/coverage_html/function_index.html +1978 -0
- modules/cmvk/coverage_html/index.html +255 -0
- modules/cmvk/coverage_html/keybd_closed_cb_900cfef5.png +0 -0
- modules/cmvk/coverage_html/status.json +1 -0
- modules/cmvk/coverage_html/style_cb_5c747636.css +389 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38___init___py.html +315 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_audit_py.html +499 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_benchmarks_py.html +575 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_constitutional_py.html +1001 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_hf_utils_py.html +398 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_metrics_py.html +570 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_profiles_py.html +397 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_types_py.html +109 -0
- modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_verification_py.html +1053 -0
- modules/cmvk/docs/DIAGRAMS.md +325 -0
- modules/cmvk/docs/architecture.md +345 -0
- modules/cmvk/docs/features.md +308 -0
- modules/cmvk/docs/getting_started.md +279 -0
- modules/cmvk/docs/innovation_layer.md +377 -0
- modules/cmvk/docs/safety.md +281 -0
- modules/cmvk/docs/traceability.md +150 -0
- modules/cmvk/examples/basic_example.py +62 -0
- modules/cmvk/examples/demo_complete_pipeline.py +209 -0
- modules/cmvk/examples/demo_innovation_layer.py +197 -0
- modules/cmvk/examples/example.py +112 -0
- modules/cmvk/examples/model_diversity_comparison.py +110 -0
- modules/cmvk/examples/real_api_integration.py +121 -0
- modules/cmvk/examples/test_full_pipeline.py +303 -0
- modules/cmvk/experiments/FEATURE_2_LATERAL_THINKING.md +187 -0
- modules/cmvk/experiments/README.md +216 -0
- modules/cmvk/experiments/ablation_runner.py +666 -0
- modules/cmvk/experiments/baseline_runner.py +158 -0
- modules/cmvk/experiments/blind_spot_benchmark.py +364 -0
- modules/cmvk/experiments/datasets/README.md +85 -0
- modules/cmvk/experiments/datasets/humaneval_50.json +352 -0
- modules/cmvk/experiments/datasets/humaneval_full.json +1150 -0
- modules/cmvk/experiments/datasets/humaneval_sample.json +32 -0
- modules/cmvk/experiments/datasets/sabotage.json +262 -0
- modules/cmvk/experiments/datasets/sample.json +40 -0
- modules/cmvk/experiments/demo_with_traces.py +110 -0
- modules/cmvk/experiments/efficiency_curve.py +259 -0
- modules/cmvk/experiments/experiment_runner.py +243 -0
- modules/cmvk/experiments/paper_data_generator.py +183 -0
- modules/cmvk/experiments/reproduce_results.py +407 -0
- modules/cmvk/experiments/reproducible_runner.py +352 -0
- modules/cmvk/experiments/sabotage_stress_test.py +311 -0
- modules/cmvk/experiments/test_lateral_thinking.py +116 -0
- modules/cmvk/experiments/test_prosecutor.py +41 -0
- modules/cmvk/experiments/visualize_results.py +735 -0
- modules/cmvk/logs/traces/demo_HumanEval_0_20260121-204900.json +36 -0
- modules/cmvk/notebooks/analysis.ipynb +124 -0
- modules/cmvk/paper/PAPER.md +561 -0
- modules/cmvk/paper/arxiv_checklist.md +230 -0
- modules/cmvk/paper/cmvk_neurips.aux +77 -0
- modules/cmvk/paper/cmvk_neurips.bbl +81 -0
- modules/cmvk/paper/cmvk_neurips.blg +48 -0
- modules/cmvk/paper/cmvk_neurips.out +16 -0
- modules/cmvk/paper/cmvk_neurips.pdf +0 -0
- modules/cmvk/paper/cmvk_neurips.tex +309 -0
- modules/cmvk/paper/figures/ablation.png +0 -0
- modules/cmvk/paper/figures/ablation.svg +39 -0
- modules/cmvk/paper/figures/architecture.png +0 -0
- modules/cmvk/paper/figures/architecture.svg +115 -0
- modules/cmvk/paper/figures/results_bar.png +0 -0
- modules/cmvk/paper/figures/results_bar.svg +70 -0
- modules/cmvk/paper/generate_figures.py +383 -0
- modules/cmvk/paper/neurips_2024.sty +101 -0
- modules/cmvk/paper/references.bib +98 -0
- modules/cmvk/paper/structure.tex +200 -0
- modules/cmvk/pyproject.toml +189 -0
- modules/cmvk/requirements-dev.txt +19 -0
- modules/cmvk/requirements.txt +14 -0
- modules/cmvk/src/cmvk/__init__.py +216 -0
- modules/cmvk/src/cmvk/audit.py +400 -0
- modules/cmvk/src/cmvk/benchmarks.py +476 -0
- modules/cmvk/src/cmvk/constitutional.py +902 -0
- modules/cmvk/src/cmvk/hf_utils.py +299 -0
- modules/cmvk/src/cmvk/metrics.py +471 -0
- modules/cmvk/src/cmvk/profiles.py +298 -0
- modules/cmvk/src/cmvk/py.typed +0 -0
- modules/cmvk/src/cmvk/types.py +10 -0
- modules/cmvk/src/cmvk/verification.py +954 -0
- modules/cmvk/src/cross_model_verification_kernel/__init__.py +91 -0
- modules/cmvk/src/cross_model_verification_kernel/__main__.py +10 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/__init__.py +16 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/base_agent.py +142 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/generator_openai.py +223 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_anthropic.py +448 -0
- modules/cmvk/src/cross_model_verification_kernel/agents/verifier_gemini.py +481 -0
- modules/cmvk/src/cross_model_verification_kernel/cli.py +570 -0
- modules/cmvk/src/cross_model_verification_kernel/core/__init__.py +26 -0
- modules/cmvk/src/cross_model_verification_kernel/core/graph_memory.py +308 -0
- modules/cmvk/src/cross_model_verification_kernel/core/kernel.py +413 -0
- modules/cmvk/src/cross_model_verification_kernel/core/trace_logger.py +75 -0
- modules/cmvk/src/cross_model_verification_kernel/core/types.py +121 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/__init__.py +20 -0
- modules/cmvk/src/cross_model_verification_kernel/datasets/humaneval_loader.py +271 -0
- modules/cmvk/src/cross_model_verification_kernel/generator.py +118 -0
- modules/cmvk/src/cross_model_verification_kernel/kernel.py +292 -0
- modules/cmvk/src/cross_model_verification_kernel/models.py +111 -0
- modules/cmvk/src/cross_model_verification_kernel/py.typed +1 -0
- modules/cmvk/src/cross_model_verification_kernel/simple_kernel.py +185 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/__init__.py +94 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/huggingface_upload.py +394 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/sandbox.py +159 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/statistics.py +468 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/visualizer.py +312 -0
- modules/cmvk/src/cross_model_verification_kernel/tools/web_search.py +86 -0
- modules/cmvk/src/cross_model_verification_kernel/verifier.py +257 -0
- modules/cmvk/tests/__init__.py +3 -0
- modules/cmvk/tests/conftest.py +61 -0
- modules/cmvk/tests/integration/__init__.py +1 -0
- modules/cmvk/tests/integration/test_anthropic_verifier.py +269 -0
- modules/cmvk/tests/integration/test_integration.py +53 -0
- modules/cmvk/tests/integration/test_lateral_thinking_integration.py +199 -0
- modules/cmvk/tests/integration/test_lateral_thinking_witness.py +208 -0
- modules/cmvk/tests/integration/test_prosecutor_mode.py +131 -0
- modules/cmvk/tests/test_constitutional.py +611 -0
- modules/cmvk/tests/test_enhanced_features.py +603 -0
- modules/cmvk/tests/test_verification.py +255 -0
- modules/cmvk/tests/unit/__init__.py +1 -0
- modules/cmvk/tests/unit/test_agents.py +64 -0
- modules/cmvk/tests/unit/test_cli.py +224 -0
- modules/cmvk/tests/unit/test_core.py +126 -0
- modules/cmvk/tests/unit/test_humaneval_loader.py +197 -0
- modules/cmvk/tests/unit/test_kernel.py +255 -0
- modules/cmvk/tests/unit/test_reproducibility.py +160 -0
- modules/cmvk/tests/unit/test_trace_logger.py +115 -0
- modules/cmvk/tests/unit/test_visualizer.py +218 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/bug_report.yml +82 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/config.yml +11 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/feature_request.yml +104 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/question.yml +70 -0
- modules/control-plane/.github/ISSUE_TEMPLATE/security_vulnerability.yml +84 -0
- modules/control-plane/.github/discussions.yml +73 -0
- modules/control-plane/.github/pull_request_template.md +82 -0
- modules/control-plane/.github/workflows/publish.yml +146 -0
- modules/control-plane/.github/workflows/release.yml +39 -0
- modules/control-plane/.github/workflows/tests.yml +58 -0
- modules/control-plane/.gitignore +55 -0
- modules/control-plane/CHANGELOG.md +203 -0
- modules/control-plane/CONTRIBUTING.md +311 -0
- modules/control-plane/CONTRIBUTORS.md +88 -0
- modules/control-plane/Dockerfile +82 -0
- modules/control-plane/LICENSE +21 -0
- modules/control-plane/MANIFEST.in +17 -0
- modules/control-plane/README.md +1264 -0
- modules/control-plane/ROADMAP.md +228 -0
- modules/control-plane/SECURITY.md +210 -0
- modules/control-plane/SUPPORT.md +106 -0
- modules/control-plane/acp-cli.py +212 -0
- modules/control-plane/benchmark/README.md +257 -0
- modules/control-plane/benchmark/__init__.py +19 -0
- modules/control-plane/benchmark/red_team_dataset.py +517 -0
- modules/control-plane/benchmark.py +563 -0
- modules/control-plane/build_and_publish.sh +130 -0
- modules/control-plane/docker-compose.yml +74 -0
- modules/control-plane/docs/ABLATION_STUDIES.md +528 -0
- modules/control-plane/docs/ADAPTER_GUIDE.md +544 -0
- modules/control-plane/docs/ADVANCED_FEATURES.md +543 -0
- modules/control-plane/docs/AIOS_COMPARISON.md +296 -0
- modules/control-plane/docs/BIBLIOGRAPHY.md +367 -0
- modules/control-plane/docs/CASE_STUDIES.md +645 -0
- modules/control-plane/docs/DOCKER_DEPLOYMENT.md +184 -0
- modules/control-plane/docs/ECOSYSTEM_STATUS.md +98 -0
- modules/control-plane/docs/HF_MODEL_CARD.md +168 -0
- modules/control-plane/docs/KERNEL_V1_RELEASE.md +454 -0
- modules/control-plane/docs/LAYER3_FRAMEWORK.md +227 -0
- modules/control-plane/docs/LIMITATIONS.md +523 -0
- modules/control-plane/docs/PYPI_PUBLISHING.md +195 -0
- modules/control-plane/docs/README.md +58 -0
- modules/control-plane/docs/RELATED_WORK.md +319 -0
- modules/control-plane/docs/RELEASE_v1.1.0.md +252 -0
- modules/control-plane/docs/REPRODUCIBILITY.md +540 -0
- modules/control-plane/docs/RESEARCH_FOUNDATION.md +197 -0
- modules/control-plane/docs/api/CORE.md +270 -0
- modules/control-plane/docs/architecture/architecture.md +120 -0
- modules/control-plane/docs/community/ANNOUNCEMENT_TEMPLATES.md +52 -0
- modules/control-plane/docs/guides/IMPLEMENTATION.md +225 -0
- modules/control-plane/docs/guides/PHILOSOPHY.md +354 -0
- modules/control-plane/docs/guides/QUICKSTART.md +217 -0
- modules/control-plane/examples/README.md +138 -0
- modules/control-plane/examples/a2a_demo.py +410 -0
- modules/control-plane/examples/adapter_demo.py +347 -0
- modules/control-plane/examples/advanced_features.py +403 -0
- modules/control-plane/examples/basic_usage.py +261 -0
- modules/control-plane/examples/benchmark_demo.py +186 -0
- modules/control-plane/examples/compliance_demo.py +333 -0
- modules/control-plane/examples/configuration.py +265 -0
- modules/control-plane/examples/getting_started.py +178 -0
- modules/control-plane/examples/hibernation_and_time_travel_demo.py +406 -0
- modules/control-plane/examples/interactive_tutorial.ipynb +497 -0
- modules/control-plane/examples/kernel_interceptor_demo.py +202 -0
- modules/control-plane/examples/kernel_v1_demo.py +273 -0
- modules/control-plane/examples/langchain_demo.py +281 -0
- modules/control-plane/examples/lifecycle_demo.py +724 -0
- modules/control-plane/examples/mcp_demo.py +378 -0
- modules/control-plane/examples/ml_safety_demo.py +157 -0
- modules/control-plane/examples/multimodal_demo.py +347 -0
- modules/control-plane/examples/observability_demo.py +370 -0
- modules/control-plane/examples/use_cases.py +336 -0
- modules/control-plane/experiments/long_horizon_purge.py +235 -0
- modules/control-plane/experiments/multi_agent_rag.py +165 -0
- modules/control-plane/experiments/reproduce_results.py +667 -0
- modules/control-plane/paper/ARXIV_SUBMISSION_INFO.txt +122 -0
- modules/control-plane/paper/ETHICS_STATEMENT.md +248 -0
- modules/control-plane/paper/PAPER_CHECKLIST.md +72 -0
- modules/control-plane/paper/Paper.pdf +0 -0
- modules/control-plane/paper/README.md +71 -0
- modules/control-plane/paper/appendix.md +152 -0
- modules/control-plane/paper/architecture.md +15 -0
- modules/control-plane/paper/arxiv/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/arxiv/figures/architecture.png +0 -0
- modules/control-plane/paper/arxiv/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/arxiv/figures/results_chart.png +0 -0
- modules/control-plane/paper/arxiv/main.aux +97 -0
- modules/control-plane/paper/arxiv/main.bbl +112 -0
- modules/control-plane/paper/arxiv/main.blg +48 -0
- modules/control-plane/paper/arxiv/main.out +33 -0
- modules/control-plane/paper/arxiv/main.pdf +0 -0
- modules/control-plane/paper/arxiv/main.tex +479 -0
- modules/control-plane/paper/arxiv/references.bib +234 -0
- modules/control-plane/paper/arxiv_submission.tar +0 -0
- modules/control-plane/paper/arxiv_submission.zip +0 -0
- modules/control-plane/paper/build.sh +68 -0
- modules/control-plane/paper/figures/README.md +47 -0
- modules/control-plane/paper/figures/ablation_chart.pdf +0 -0
- modules/control-plane/paper/figures/ablation_chart.png +0 -0
- modules/control-plane/paper/figures/architecture.pdf +0 -0
- modules/control-plane/paper/figures/architecture.png +0 -0
- modules/control-plane/paper/figures/constraint_graphs.pdf +0 -0
- modules/control-plane/paper/figures/constraint_graphs.png +0 -0
- modules/control-plane/paper/figures/generate_figures.py +252 -0
- modules/control-plane/paper/figures/results_chart.pdf +0 -0
- modules/control-plane/paper/figures/results_chart.png +0 -0
- modules/control-plane/paper/main.md +273 -0
- modules/control-plane/paper/main.tex +214 -0
- modules/control-plane/paper/main_arxiv.aux +53 -0
- modules/control-plane/paper/main_arxiv.out +17 -0
- modules/control-plane/paper/main_arxiv.pdf +0 -0
- modules/control-plane/paper/main_arxiv.tex +264 -0
- modules/control-plane/paper/references.bib +234 -0
- modules/control-plane/pyproject.toml +124 -0
- modules/control-plane/reproducibility/ABLATIONS.md +136 -0
- modules/control-plane/reproducibility/README.md +288 -0
- modules/control-plane/reproducibility/commands.md +467 -0
- modules/control-plane/reproducibility/docker_config/Dockerfile +39 -0
- modules/control-plane/reproducibility/experiment_configs/purge_config.json +46 -0
- modules/control-plane/reproducibility/experiment_configs/rag_config.json +36 -0
- modules/control-plane/reproducibility/hardware_specs.md +317 -0
- modules/control-plane/reproducibility/requirements_frozen.txt +0 -0
- modules/control-plane/reproducibility/run_all_experiments.sh +45 -0
- modules/control-plane/reproducibility/seeds.json +106 -0
- modules/control-plane/scripts/prepare_pypi.py +46 -0
- modules/control-plane/scripts/prepare_release.py +176 -0
- modules/control-plane/scripts/upload_dataset_to_hf.py +316 -0
- modules/control-plane/setup.py +69 -0
- modules/control-plane/src/agent_control_plane/__init__.py +639 -0
- modules/control-plane/src/agent_control_plane/a2a_adapter.py +541 -0
- modules/control-plane/src/agent_control_plane/adapter.py +415 -0
- modules/control-plane/src/agent_control_plane/agent_hibernation.py +364 -0
- modules/control-plane/src/agent_control_plane/agent_kernel.py +464 -0
- modules/control-plane/src/agent_control_plane/compliance.py +718 -0
- modules/control-plane/src/agent_control_plane/constraint_graphs.py +475 -0
- modules/control-plane/src/agent_control_plane/control_plane.py +848 -0
- modules/control-plane/src/agent_control_plane/example_executors.py +193 -0
- modules/control-plane/src/agent_control_plane/execution_engine.py +229 -0
- modules/control-plane/src/agent_control_plane/flight_recorder.py +600 -0
- modules/control-plane/src/agent_control_plane/governance_layer.py +432 -0
- modules/control-plane/src/agent_control_plane/hf_utils.py +561 -0
- modules/control-plane/src/agent_control_plane/interfaces/__init__.py +53 -0
- modules/control-plane/src/agent_control_plane/interfaces/kernel_interface.py +359 -0
- modules/control-plane/src/agent_control_plane/interfaces/plugin_interface.py +495 -0
- modules/control-plane/src/agent_control_plane/interfaces/protocol_interfaces.py +385 -0
- modules/control-plane/src/agent_control_plane/kernel_space.py +707 -0
- modules/control-plane/src/agent_control_plane/langchain_adapter.py +422 -0
- modules/control-plane/src/agent_control_plane/lifecycle.py +3111 -0
- modules/control-plane/src/agent_control_plane/mcp_adapter.py +517 -0
- modules/control-plane/src/agent_control_plane/ml_safety.py +560 -0
- modules/control-plane/src/agent_control_plane/multimodal.py +724 -0
- modules/control-plane/src/agent_control_plane/mute_agent.py +419 -0
- modules/control-plane/src/agent_control_plane/observability.py +785 -0
- modules/control-plane/src/agent_control_plane/orchestrator.py +480 -0
- modules/control-plane/src/agent_control_plane/plugin_registry.py +748 -0
- modules/control-plane/src/agent_control_plane/policy_engine.py +525 -0
- modules/control-plane/src/agent_control_plane/shadow_mode.py +307 -0
- modules/control-plane/src/agent_control_plane/signals.py +491 -0
- modules/control-plane/src/agent_control_plane/supervisor_agents.py +427 -0
- modules/control-plane/src/agent_control_plane/time_travel_debugger.py +554 -0
- modules/control-plane/src/agent_control_plane/tool_registry.py +350 -0
- modules/control-plane/src/agent_control_plane/vfs.py +695 -0
- modules/control-plane/tests/README.md +33 -0
- modules/control-plane/tests/test_a2a_adapter.py +336 -0
- modules/control-plane/tests/test_adapter.py +422 -0
- modules/control-plane/tests/test_advanced_features.py +389 -0
- modules/control-plane/tests/test_benchmark.py +223 -0
- modules/control-plane/tests/test_compliance.py +214 -0
- modules/control-plane/tests/test_control_plane.py +295 -0
- modules/control-plane/tests/test_hibernation.py +274 -0
- modules/control-plane/tests/test_kernel_interception.py +284 -0
- modules/control-plane/tests/test_langchain_adapter.py +258 -0
- modules/control-plane/tests/test_lifecycle.py +1174 -0
- modules/control-plane/tests/test_mcp_adapter.py +293 -0
- modules/control-plane/tests/test_ml_safety.py +142 -0
- modules/control-plane/tests/test_multimodal.py +317 -0
- modules/control-plane/tests/test_new_features.py +435 -0
- modules/control-plane/tests/test_observability.py +338 -0
- modules/control-plane/tests/test_time_travel.py +387 -0
- modules/emk/.github/workflows/ci.yml +105 -0
- modules/emk/.github/workflows/publish.yml +144 -0
- modules/emk/.gitignore +74 -0
- modules/emk/CHANGELOG.md +41 -0
- modules/emk/CONTRIBUTING.md +295 -0
- modules/emk/IMPLEMENTATION.md +174 -0
- modules/emk/LICENSE +21 -0
- modules/emk/MANIFEST.in +8 -0
- modules/emk/README.md +135 -0
- modules/emk/RELEASE_NOTES.md +82 -0
- modules/emk/SECURITY.md +52 -0
- modules/emk/codecov.yml +39 -0
- modules/emk/docs/MEMORY_MANAGEMENT.md +285 -0
- modules/emk/emk/__init__.py +106 -0
- modules/emk/emk/hf_utils.py +419 -0
- modules/emk/emk/indexer.py +144 -0
- modules/emk/emk/py.typed +0 -0
- modules/emk/emk/schema.py +204 -0
- modules/emk/emk/sleep_cycle.py +345 -0
- modules/emk/emk/store.py +479 -0
- modules/emk/examples/basic_usage.py +123 -0
- modules/emk/examples/memory_features_demo.py +154 -0
- modules/emk/experiments/README.md +59 -0
- modules/emk/experiments/reproduce_results.py +461 -0
- modules/emk/experiments/results.json +61 -0
- modules/emk/paper/structure.tex +192 -0
- modules/emk/paper/whitepaper.md +273 -0
- modules/emk/pyproject.toml +91 -0
- modules/emk/setup.py +5 -0
- modules/emk/tests/test_file_adapter.py +195 -0
- modules/emk/tests/test_indexer.py +174 -0
- modules/emk/tests/test_init.py +55 -0
- modules/emk/tests/test_negative_memory.py +83 -0
- modules/emk/tests/test_schema.py +150 -0
- modules/emk/tests/test_semantic_rules.py +175 -0
- modules/emk/tests/test_sleep_cycle.py +335 -0
- modules/emk/tests/test_store_anti_patterns.py +239 -0
- modules/iatp/.github/workflows/docker-build.yml +124 -0
- modules/iatp/.github/workflows/publish.yml +174 -0
- modules/iatp/.github/workflows/python-package.yml +121 -0
- modules/iatp/.gitignore +67 -0
- modules/iatp/.pre-commit-config.yaml +64 -0
- modules/iatp/CHANGELOG.md +120 -0
- modules/iatp/Dockerfile +91 -0
- modules/iatp/IMPLEMENTATION_SUMMARY.md +218 -0
- modules/iatp/MANIFEST.in +9 -0
- modules/iatp/README.md +180 -0
- modules/iatp/docker/Dockerfile.agent +27 -0
- modules/iatp/docker/Dockerfile.sidecar-python +86 -0
- modules/iatp/docker/README.md +258 -0
- modules/iatp/docker-compose.yml +194 -0
- modules/iatp/docs/ARCHITECTURE.md +243 -0
- modules/iatp/docs/CLI_GUIDE.md +220 -0
- modules/iatp/docs/DEPLOYMENT.md +304 -0
- modules/iatp/examples/README.md +132 -0
- modules/iatp/examples/backend_agent.py +39 -0
- modules/iatp/examples/client.py +168 -0
- modules/iatp/examples/demo_attestation_reputation.py +274 -0
- modules/iatp/examples/demo_client.py +240 -0
- modules/iatp/examples/demo_rbac.py +143 -0
- modules/iatp/examples/integration_demo.py +245 -0
- modules/iatp/examples/manifests/coder_agent.json +20 -0
- modules/iatp/examples/manifests/reviewer_agent.json +19 -0
- modules/iatp/examples/manifests/secure_bank.json +14 -0
- modules/iatp/examples/manifests/standard_agent.json +14 -0
- modules/iatp/examples/manifests/untrusted_honeypot.json +14 -0
- modules/iatp/examples/run_secure_bank_sidecar.py +85 -0
- modules/iatp/examples/run_sidecar.py +105 -0
- modules/iatp/examples/run_untrusted_sidecar.py +77 -0
- modules/iatp/examples/secure_bank_agent.py +138 -0
- modules/iatp/examples/test_untrusted.py +82 -0
- modules/iatp/examples/untrusted_agent.py +119 -0
- modules/iatp/experiments/README.md +58 -0
- modules/iatp/experiments/cascading_hallucination/README.md +149 -0
- modules/iatp/experiments/cascading_hallucination/agent_a_user.py +41 -0
- modules/iatp/experiments/cascading_hallucination/agent_b_summarizer.py +54 -0
- modules/iatp/experiments/cascading_hallucination/agent_c_database.py +47 -0
- modules/iatp/experiments/cascading_hallucination/proof_of_concept.py +290 -0
- modules/iatp/experiments/cascading_hallucination/run_experiment.py +226 -0
- modules/iatp/experiments/cascading_hallucination/sidecar_c.py +61 -0
- modules/iatp/experiments/reproduce_results.py +574 -0
- modules/iatp/experiments/results.json +2336 -0
- modules/iatp/iatp/__init__.py +164 -0
- modules/iatp/iatp/attestation.py +401 -0
- modules/iatp/iatp/cli.py +253 -0
- modules/iatp/iatp/hf_utils.py +469 -0
- modules/iatp/iatp/ipc_pipes.py +578 -0
- modules/iatp/iatp/main.py +410 -0
- modules/iatp/iatp/models/__init__.py +445 -0
- modules/iatp/iatp/policy_engine.py +335 -0
- modules/iatp/iatp/py.typed +2 -0
- modules/iatp/iatp/recovery.py +319 -0
- modules/iatp/iatp/security/__init__.py +268 -0
- modules/iatp/iatp/sidecar/__init__.py +517 -0
- modules/iatp/iatp/telemetry/__init__.py +162 -0
- modules/iatp/iatp/tests/__init__.py +1 -0
- modules/iatp/iatp/tests/test_attestation.py +368 -0
- modules/iatp/iatp/tests/test_cli.py +129 -0
- modules/iatp/iatp/tests/test_models.py +128 -0
- modules/iatp/iatp/tests/test_policy_engine.py +345 -0
- modules/iatp/iatp/tests/test_recovery.py +279 -0
- modules/iatp/iatp/tests/test_security.py +220 -0
- modules/iatp/iatp/tests/test_sidecar.py +165 -0
- modules/iatp/iatp/tests/test_telemetry.py +173 -0
- modules/iatp/paper/BLOG.md +307 -0
- modules/iatp/paper/PAPER.md +236 -0
- modules/iatp/paper/RFC_SUBMISSION.md +299 -0
- modules/iatp/paper/whitepaper.md +369 -0
- modules/iatp/proto/README.md +200 -0
- modules/iatp/proto/generate_stubs.py +81 -0
- modules/iatp/proto/iatp.proto +552 -0
- modules/iatp/pyproject.toml +180 -0
- modules/iatp/requirements-dev.txt +2 -0
- modules/iatp/requirements.txt +6 -0
- modules/iatp/setup.py +60 -0
- modules/iatp/sidecar/README.md +487 -0
- modules/iatp/sidecar/go/Dockerfile +32 -0
- modules/iatp/sidecar/go/README.md +237 -0
- modules/iatp/sidecar/go/go.mod +8 -0
- modules/iatp/sidecar/go/main.go +488 -0
- modules/iatp/spec/001-handshake.md +436 -0
- modules/iatp/spec/002-reversibility.md +394 -0
- modules/iatp/spec/schema/capability_manifest.json +266 -0
- modules/iatp/test_integration.py +310 -0
- modules/mcp-kernel-server/README.md +261 -0
- modules/mcp-kernel-server/pyproject.toml +60 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/__init__.py +26 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/cli.py +229 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/resources.py +215 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/server.py +562 -0
- modules/mcp-kernel-server/src/mcp_kernel_server/tools.py +1172 -0
- modules/mute-agent/.github/workflows/safety_check.yml +45 -0
- modules/mute-agent/.gitignore +53 -0
- modules/mute-agent/ARCHITECTURE.md +531 -0
- modules/mute-agent/BENCHMARK_GUIDE.md +384 -0
- modules/mute-agent/COMPLETION_SUMMARY.md +293 -0
- modules/mute-agent/EXPERIMENT_SUMMARY.md +318 -0
- modules/mute-agent/IMPLEMENTATION_SUMMARY.md +212 -0
- modules/mute-agent/LICENSE +21 -0
- modules/mute-agent/PHASE3_SUMMARY.md +297 -0
- modules/mute-agent/README.md +360 -0
- modules/mute-agent/STEEL_MAN_RESULTS.md +353 -0
- modules/mute-agent/USAGE.md +505 -0
- modules/mute-agent/V2_IMPLEMENTATION_SUMMARY.md +253 -0
- modules/mute-agent/V2_STEEL_MAN_IMPLEMENTATION.md +274 -0
- modules/mute-agent/VERIFICATION_REPORT.md +435 -0
- modules/mute-agent/charts/cost_comparison.png +0 -0
- modules/mute-agent/charts/cost_vs_ambiguity.png +0 -0
- modules/mute-agent/charts/metrics_comparison.png +0 -0
- modules/mute-agent/charts/scenario_breakdown.png +0 -0
- modules/mute-agent/charts/trace_attack_blocked.html +140 -0
- modules/mute-agent/charts/trace_attack_blocked.png +0 -0
- modules/mute-agent/charts/trace_failure.html +140 -0
- modules/mute-agent/charts/trace_failure.png +0 -0
- modules/mute-agent/charts/trace_success.html +140 -0
- modules/mute-agent/charts/trace_success.png +0 -0
- modules/mute-agent/examples/__init__.py +1 -0
- modules/mute-agent/examples/advanced_example.py +384 -0
- modules/mute-agent/examples/graph_debugger_demo.py +241 -0
- modules/mute-agent/examples/listener_example.py +297 -0
- modules/mute-agent/examples/simple_example.py +242 -0
- modules/mute-agent/examples/steel_man_demo.py +297 -0
- modules/mute-agent/experiments/README.md +135 -0
- modules/mute-agent/experiments/__init__.py +3 -0
- modules/mute-agent/experiments/agent_comparison.csv +6 -0
- modules/mute-agent/experiments/agent_comparison_50runs.csv +6 -0
- modules/mute-agent/experiments/ambiguity_test.py +335 -0
- modules/mute-agent/experiments/ambiguity_test_results.csv +31 -0
- modules/mute-agent/experiments/ambiguity_test_results_50runs.csv +51 -0
- modules/mute-agent/experiments/baseline_agent.py +189 -0
- modules/mute-agent/experiments/benchmark.py +402 -0
- modules/mute-agent/experiments/demo.py +172 -0
- modules/mute-agent/experiments/generate_cost_curve.py +474 -0
- modules/mute-agent/experiments/jailbreak_test.py +137 -0
- modules/mute-agent/experiments/latent_state_scenario.py +361 -0
- modules/mute-agent/experiments/mute_agent_experiment.py +349 -0
- modules/mute-agent/experiments/run_extended_experiment.py +40 -0
- modules/mute-agent/experiments/run_v2_experiments.py +266 -0
- modules/mute-agent/experiments/run_v2_experiments_auto.py +247 -0
- modules/mute-agent/experiments/v2_scenarios/README.md +214 -0
- modules/mute-agent/experiments/v2_scenarios/__init__.py +4 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_1_deep_dependency.py +325 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_2_adversarial.py +328 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_3_false_positive.py +303 -0
- modules/mute-agent/experiments/v2_scenarios/scenario_4_performance.py +319 -0
- modules/mute-agent/experiments/visualize.py +400 -0
- modules/mute-agent/mute_agent/__init__.py +66 -0
- modules/mute-agent/mute_agent/core/__init__.py +1 -0
- modules/mute-agent/mute_agent/core/execution_agent.py +164 -0
- modules/mute-agent/mute_agent/core/handshake_protocol.py +199 -0
- modules/mute-agent/mute_agent/core/reasoning_agent.py +236 -0
- modules/mute-agent/mute_agent/knowledge_graph/__init__.py +1 -0
- modules/mute-agent/mute_agent/knowledge_graph/graph_elements.py +63 -0
- modules/mute-agent/mute_agent/knowledge_graph/multidimensional_graph.py +168 -0
- modules/mute-agent/mute_agent/knowledge_graph/subgraph.py +222 -0
- modules/mute-agent/mute_agent/listener/__init__.py +41 -0
- modules/mute-agent/mute_agent/listener/adapters/__init__.py +29 -0
- modules/mute-agent/mute_agent/listener/adapters/base_adapter.py +187 -0
- modules/mute-agent/mute_agent/listener/adapters/caas_adapter.py +342 -0
- modules/mute-agent/mute_agent/listener/adapters/control_plane_adapter.py +434 -0
- modules/mute-agent/mute_agent/listener/adapters/iatp_adapter.py +330 -0
- modules/mute-agent/mute_agent/listener/adapters/scak_adapter.py +249 -0
- modules/mute-agent/mute_agent/listener/listener.py +608 -0
- modules/mute-agent/mute_agent/listener/state_observer.py +434 -0
- modules/mute-agent/mute_agent/listener/threshold_config.py +311 -0
- modules/mute-agent/mute_agent/super_system/__init__.py +1 -0
- modules/mute-agent/mute_agent/super_system/router.py +202 -0
- modules/mute-agent/mute_agent/visualization/__init__.py +8 -0
- modules/mute-agent/mute_agent/visualization/graph_debugger.py +495 -0
- modules/mute-agent/requirements-dev.txt +6 -0
- modules/mute-agent/requirements.txt +9 -0
- modules/mute-agent/setup.py +64 -0
- modules/mute-agent/src/__init__.py +0 -0
- modules/mute-agent/src/agents/__init__.py +0 -0
- modules/mute-agent/src/agents/baseline_agent.py +524 -0
- modules/mute-agent/src/agents/interactive_agent.py +113 -0
- modules/mute-agent/src/agents/mute_agent.py +622 -0
- modules/mute-agent/src/benchmarks/__init__.py +0 -0
- modules/mute-agent/src/benchmarks/evaluator.py +481 -0
- modules/mute-agent/src/benchmarks/scenarios.json +985 -0
- modules/mute-agent/src/core/__init__.py +0 -0
- modules/mute-agent/src/core/mock_state.py +320 -0
- modules/mute-agent/src/core/tools.py +441 -0
- modules/nexus/__init__.py +49 -0
- modules/nexus/arbiter.py +357 -0
- modules/nexus/client.py +464 -0
- modules/nexus/dmz.py +417 -0
- modules/nexus/escrow.py +428 -0
- modules/nexus/exceptions.py +284 -0
- modules/nexus/registry.py +391 -0
- modules/nexus/reputation.py +423 -0
- modules/nexus/schemas/__init__.py +49 -0
- modules/nexus/schemas/compliance.py +274 -0
- modules/nexus/schemas/escrow.py +249 -0
- modules/nexus/schemas/manifest.py +223 -0
- modules/nexus/schemas/receipt.py +206 -0
- modules/observability/README.md +192 -0
- modules/observability/alertmanager/alertmanager.yml +116 -0
- modules/observability/alerts/agent-os-alerts.yaml +197 -0
- modules/observability/docker-compose.yml +128 -0
- modules/observability/grafana/dashboards/agent-os-amb.json +448 -0
- modules/observability/grafana/dashboards/agent-os-cmvk.json +441 -0
- modules/observability/grafana/dashboards/agent-os-overview.json +268 -0
- modules/observability/grafana/dashboards/agent-os-performance.json +15 -0
- modules/observability/grafana/dashboards/agent-os-safety.json +50 -0
- modules/observability/grafana/provisioning/dashboards/dashboards.yml +15 -0
- modules/observability/grafana/provisioning/datasources/datasources.yml +33 -0
- modules/observability/otel/otel-collector-config.yml +61 -0
- modules/observability/prometheus/prometheus.yml +63 -0
- modules/observability/pyproject.toml +53 -0
- modules/observability/scripts/export_dashboards.py +55 -0
- modules/observability/src/agent_os_observability/__init__.py +25 -0
- modules/observability/src/agent_os_observability/dashboards.py +896 -0
- modules/observability/src/agent_os_observability/metrics.py +396 -0
- modules/observability/src/agent_os_observability/server.py +221 -0
- modules/observability/src/agent_os_observability/tracer.py +226 -0
- modules/primitives/.gitignore +8 -0
- modules/primitives/README.md +62 -0
- modules/primitives/agent_primitives/__init__.py +22 -0
- modules/primitives/agent_primitives/failures.py +82 -0
- modules/primitives/agent_primitives/py.typed +0 -0
- modules/primitives/pyproject.toml +68 -0
- modules/scak/.github/copilot-instructions.md +396 -0
- modules/scak/.github/workflows/release.yml +117 -0
- modules/scak/.gitignore +32 -0
- modules/scak/CHANGELOG.md +173 -0
- modules/scak/CITATION.cff +62 -0
- modules/scak/CONTRIBUTING.md +429 -0
- modules/scak/Dockerfile +58 -0
- modules/scak/ENTERPRISE_FEATURES.md +518 -0
- modules/scak/IMPLEMENTATION_SUMMARY.md +206 -0
- modules/scak/LIMITATIONS.md +565 -0
- modules/scak/MANIFEST.in +16 -0
- modules/scak/NOVELTY.md +535 -0
- modules/scak/README.md +928 -0
- modules/scak/RESEARCH.md +670 -0
- modules/scak/agent_kernel/__init__.py +66 -0
- modules/scak/agent_kernel/analyzer.py +432 -0
- modules/scak/agent_kernel/auditor.py +31 -0
- modules/scak/agent_kernel/completeness_auditor.py +234 -0
- modules/scak/agent_kernel/detector.py +200 -0
- modules/scak/agent_kernel/kernel.py +741 -0
- modules/scak/agent_kernel/memory_manager.py +82 -0
- modules/scak/agent_kernel/models.py +372 -0
- modules/scak/agent_kernel/nudge_mechanism.py +260 -0
- modules/scak/agent_kernel/outcome_analyzer.py +335 -0
- modules/scak/agent_kernel/patcher.py +579 -0
- modules/scak/agent_kernel/semantic_analyzer.py +313 -0
- modules/scak/agent_kernel/semantic_purge.py +346 -0
- modules/scak/agent_kernel/simulator.py +447 -0
- modules/scak/agent_kernel/teacher.py +82 -0
- modules/scak/agent_kernel/triage.py +149 -0
- modules/scak/build_and_publish.ps1 +74 -0
- modules/scak/build_and_publish.sh +74 -0
- modules/scak/cli.py +471 -0
- modules/scak/dashboard.py +462 -0
- modules/scak/datasets/DATASET_CARD.md +219 -0
- modules/scak/datasets/README.md +143 -0
- modules/scak/datasets/gaia_vague_queries/vague_queries.json +262 -0
- modules/scak/datasets/hf_upload/README.md +219 -0
- modules/scak/datasets/hf_upload/scak_gaia_laziness.jsonl +50 -0
- modules/scak/datasets/prepare_hf_datasets.py +145 -0
- modules/scak/datasets/red_team/jailbreak_patterns.json +202 -0
- modules/scak/docker-compose.yml +99 -0
- modules/scak/docs/Adaptive-Memory-Hierarchy.md +319 -0
- modules/scak/docs/Data-Contracts-and-Schemas.md +285 -0
- modules/scak/docs/Dual-Loop-Architecture.md +344 -0
- modules/scak/docs/Enhanced-Features.md +612 -0
- modules/scak/docs/LANGCHAIN_INTEGRATION.md +572 -0
- modules/scak/docs/README.md +128 -0
- modules/scak/docs/Reference-Implementations.md +163 -0
- modules/scak/docs/SCAK_V2.md +374 -0
- modules/scak/docs/Three-Failure-Types.md +178 -0
- modules/scak/examples/basic_example.py +155 -0
- modules/scak/examples/circuit_breaker_lazy_eval_demo.py +243 -0
- modules/scak/examples/langchain_integration_example.py +339 -0
- modules/scak/examples/layer4_demo.py +243 -0
- modules/scak/examples/production_features_demo.py +353 -0
- modules/scak/examples/quick_demo.py +79 -0
- modules/scak/examples/scak_v2_demo.py +252 -0
- modules/scak/experiments/README.md +438 -0
- modules/scak/experiments/ablation_studies/README.md +192 -0
- modules/scak/experiments/ablation_studies/ablation_no_audit.py +116 -0
- modules/scak/experiments/ablation_studies/ablation_no_purge.py +133 -0
- modules/scak/experiments/chaos_engineering/README.md +332 -0
- modules/scak/experiments/context_efficiency_test.py +328 -0
- modules/scak/experiments/gaia_benchmark/README.md +208 -0
- modules/scak/experiments/laziness_benchmark.py +179 -0
- modules/scak/experiments/long_horizon_task_experiment.py +252 -0
- modules/scak/experiments/multi_agent_rag_experiment.py +284 -0
- modules/scak/experiments/results/ablation_table.md +12 -0
- modules/scak/experiments/results/long_horizon.json +36 -0
- modules/scak/experiments/results/multi_agent_rag.json +66 -0
- modules/scak/experiments/run_comprehensive_ablations.py +332 -0
- modules/scak/experiments/test_auditor_patcher_integration.py +251 -0
- modules/scak/notebooks/getting_started.ipynb +33 -0
- modules/scak/paper/ARXIV_SUBMISSION_METADATA.txt +109 -0
- modules/scak/paper/PAPER_CHECKLIST.md +304 -0
- modules/scak/paper/Paper.pdf +0 -0
- modules/scak/paper/README.md +113 -0
- modules/scak/paper/appendix.md +351 -0
- modules/scak/paper/arxiv/bibliography.bib +284 -0
- modules/scak/paper/arxiv/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv/main.aux +103 -0
- modules/scak/paper/arxiv/main.bbl +113 -0
- modules/scak/paper/arxiv/main.blg +55 -0
- modules/scak/paper/arxiv/main.out +31 -0
- modules/scak/paper/arxiv/main.pdf +0 -0
- modules/scak/paper/arxiv/main.tex +482 -0
- modules/scak/paper/arxiv_submission/bibliography.bib +284 -0
- modules/scak/paper/arxiv_submission/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/arxiv_submission/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.aux +103 -0
- modules/scak/paper/arxiv_submission/main.bbl +113 -0
- modules/scak/paper/arxiv_submission/main.blg +55 -0
- modules/scak/paper/arxiv_submission/main.out +31 -0
- modules/scak/paper/arxiv_submission/main.pdf +0 -0
- modules/scak/paper/arxiv_submission/main.tex +482 -0
- modules/scak/paper/arxiv_submission.tar.gz +0 -0
- modules/scak/paper/bibliography.bib +284 -0
- modules/scak/paper/build.sh +55 -0
- modules/scak/paper/figures/README.md +32 -0
- modules/scak/paper/figures/fig1_ooda_architecture.md +75 -0
- modules/scak/paper/figures/fig1_ooda_architecture.pdf +0 -0
- modules/scak/paper/figures/fig1_ooda_architecture.png +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.md +83 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.pdf +0 -0
- modules/scak/paper/figures/fig2_memory_hierarchy.png +0 -0
- modules/scak/paper/figures/fig3_gaia_results.md +64 -0
- modules/scak/paper/figures/fig3_gaia_results.pdf +0 -0
- modules/scak/paper/figures/fig3_gaia_results.png +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.md +64 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.pdf +0 -0
- modules/scak/paper/figures/fig4_ablation_heatmap.png +0 -0
- modules/scak/paper/figures/fig5_context_reduction.md +71 -0
- modules/scak/paper/figures/fig5_context_reduction.pdf +0 -0
- modules/scak/paper/figures/fig5_context_reduction.png +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.md +80 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.pdf +0 -0
- modules/scak/paper/figures/fig6_mttr_boxplot.png +0 -0
- modules/scak/paper/figures/generate_figures.py +463 -0
- modules/scak/paper/main.aux +103 -0
- modules/scak/paper/main.bbl +113 -0
- modules/scak/paper/main.blg +55 -0
- modules/scak/paper/main.md +192 -0
- modules/scak/paper/main.out +31 -0
- modules/scak/paper/main.pdf +0 -0
- modules/scak/paper/main.tex +482 -0
- modules/scak/reproducibility/ABLATIONS.md +225 -0
- modules/scak/reproducibility/Dockerfile.reproducibility +34 -0
- modules/scak/reproducibility/README.md +421 -0
- modules/scak/reproducibility/requirements-pinned.txt +32 -0
- modules/scak/reproducibility/run_all_experiments.py +395 -0
- modules/scak/reproducibility/seed_control.py +53 -0
- modules/scak/reproducibility/statistical_analysis.py +302 -0
- modules/scak/requirements.txt +50 -0
- modules/scak/setup.py +93 -0
- modules/scak/src/__init__.py +124 -0
- modules/scak/src/agents/__init__.py +13 -0
- modules/scak/src/agents/conflict_resolution.py +732 -0
- modules/scak/src/agents/orchestrator.py +761 -0
- modules/scak/src/agents/pubsub.py +484 -0
- modules/scak/src/agents/shadow_teacher.py +344 -0
- modules/scak/src/agents/swarm.py +661 -0
- modules/scak/src/agents/worker.py +357 -0
- modules/scak/src/integrations/__init__.py +81 -0
- modules/scak/src/integrations/cmvk_adapter.py +430 -0
- modules/scak/src/integrations/control_plane_adapter.py +601 -0
- modules/scak/src/integrations/langchain_integration.py +902 -0
- modules/scak/src/interfaces/__init__.py +59 -0
- modules/scak/src/interfaces/llm_clients.py +505 -0
- modules/scak/src/interfaces/openapi_tools.py +611 -0
- modules/scak/src/interfaces/plugin_system.py +605 -0
- modules/scak/src/interfaces/protocols.py +365 -0
- modules/scak/src/interfaces/telemetry.py +464 -0
- modules/scak/src/interfaces/tool_registry.py +547 -0
- modules/scak/src/kernel/__init__.py +100 -0
- modules/scak/src/kernel/auditor.py +305 -0
- modules/scak/src/kernel/circuit_breaker.py +398 -0
- modules/scak/src/kernel/core.py +724 -0
- modules/scak/src/kernel/distributed.py +667 -0
- modules/scak/src/kernel/evolution.py +455 -0
- modules/scak/src/kernel/failover.py +621 -0
- modules/scak/src/kernel/governance.py +710 -0
- modules/scak/src/kernel/governance_v2.py +603 -0
- modules/scak/src/kernel/lazy_evaluator.py +514 -0
- modules/scak/src/kernel/load_testing.py +633 -0
- modules/scak/src/kernel/memory.py +945 -0
- modules/scak/src/kernel/patcher.py +581 -0
- modules/scak/src/kernel/rubric.py +419 -0
- modules/scak/src/kernel/schemas.py +390 -0
- modules/scak/src/kernel/skill_mapper.py +309 -0
- modules/scak/src/kernel/triage.py +149 -0
- modules/scak/src/mocks/__init__.py +99 -0
- modules/scak/tests/__init__.py +1 -0
- modules/scak/tests/test_circuit_breaker.py +403 -0
- modules/scak/tests/test_conflict_resolution.py +287 -0
- modules/scak/tests/test_dual_loop.py +463 -0
- modules/scak/tests/test_enhanced_features.py +421 -0
- modules/scak/tests/test_failover_and_load.py +438 -0
- modules/scak/tests/test_governance.py +185 -0
- modules/scak/tests/test_kernel.py +359 -0
- modules/scak/tests/test_langchain_integration.py +451 -0
- modules/scak/tests/test_lazy_evaluator.py +465 -0
- modules/scak/tests/test_llm_clients.py +122 -0
- modules/scak/tests/test_memory_controller.py +528 -0
- modules/scak/tests/test_orchestrator.py +181 -0
- modules/scak/tests/test_phase3_integration.py +265 -0
- modules/scak/tests/test_pubsub_swarm.py +203 -0
- modules/scak/tests/test_reference_implementations.py +240 -0
- modules/scak/tests/test_rubric.py +363 -0
- modules/scak/tests/test_scak_v2.py +651 -0
- modules/scak/tests/test_skill_mapper.py +217 -0
- modules/scak/tests/test_specific_failures.py +393 -0
- modules/scak/tests/test_tool_registry.py +264 -0
- modules/scak/tests/test_tools_and_plugins.py +303 -0
- modules/scak/tests/test_triage.py +596 -0
- modules/scak/tests/test_write_through.py +319 -0
- agent_os_kernel-1.1.0.dist-info/METADATA +0 -400
- agent_os_kernel-1.1.0.dist-info/RECORD +0 -12
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.3.0.dist-info}/WHEEL +0 -0
- {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.3.0.dist-info}/licenses/LICENSE +0 -0
|
@@ -0,0 +1,561 @@
|
|
|
1
|
+
# Cross-Model Verification Kernel (CMVK): Adversarial Multi-Model Code Generation
|
|
2
|
+
|
|
3
|
+
**Authors:** [To be filled]
|
|
4
|
+
**Affiliation:** [To be filled]
|
|
5
|
+
**Date:** January 2026
|
|
6
|
+
**Status:** Draft
|
|
7
|
+
|
|
8
|
+
---
|
|
9
|
+
|
|
10
|
+
## Abstract
|
|
11
|
+
|
|
12
|
+
Current self-correcting AI agents suffer from a fundamental limitation: when a language model generates code with a bug due to a gap in its training data or reasoning, it often uses the same flawed logic to verify itself, leading to errors that persist despite apparent corrections. We introduce the **Cross-Model Verification Kernel (CMVK)**, an adversarial multi-model architecture that addresses this "grading your own homework" fallacy through strategic model diversity.
|
|
13
|
+
|
|
14
|
+
CMVK employs three distinct components: (1) a **Generator** (System 1) optimized for high-speed code generation, (2) a **Verifier** (System 2) explicitly prompted to find flaws and generate hostile test cases, and (3) an **Arbiter** (The Kernel) implementing deterministic verification logic and strategy banning mechanisms. Unlike self-correction approaches that use the same model for both generation and verification, CMVK leverages models with different training data and architectural biases to detect correlated errors.
|
|
15
|
+
|
|
16
|
+
We evaluate CMVK on the HumanEval benchmark, comparing it against a baseline single-model approach. Our results demonstrate that adversarial multi-model verification reduces blind spots and improves solution correctness through iterative refinement with forbidden strategy tracking. The complete execution traces provide full traceability for research and debugging purposes.
|
|
17
|
+
|
|
18
|
+
**Keywords:** Code Generation, Multi-Model Systems, Adversarial Learning, Program Verification, Large Language Models
|
|
19
|
+
|
|
20
|
+
---
|
|
21
|
+
|
|
22
|
+
## 1. Introduction
|
|
23
|
+
|
|
24
|
+
### 1.1 The Problem: Correlated Error Blindness
|
|
25
|
+
|
|
26
|
+
Modern large language models (LLMs) have achieved remarkable success in code generation tasks. However, when these models make mistakes—particularly those stemming from gaps in training data or systematic reasoning flaws—they often fail to detect their own errors during self-verification. This phenomenon, which we term **Correlated Error Blindness**, occurs because:
|
|
27
|
+
|
|
28
|
+
1. Both generation and verification use the same knowledge base
|
|
29
|
+
2. The same reasoning patterns that led to the error are reapplied during verification
|
|
30
|
+
3. Missing edge cases remain invisible to the verifying model
|
|
31
|
+
|
|
32
|
+
Consider a coding agent tasked with implementing a merge sort function with O(n) complexity. If the model's training data primarily featured recursive solutions but included few examples of optimal iterative approaches, it may:
|
|
33
|
+
- Generate a recursive solution that causes stack overflow on large inputs
|
|
34
|
+
- Verify the recursive solution as "correct" because it matches learned patterns
|
|
35
|
+
- Fail to recognize the performance issue due to the same training data gap
|
|
36
|
+
|
|
37
|
+
### 1.2 Existing Approaches and Limitations
|
|
38
|
+
|
|
39
|
+
**Self-Correction:** Models like GPT-4 with self-reflection prompts can catch some errors but remain limited by their own knowledge boundaries. Recent work has shown that self-correction often produces lateral moves rather than genuine improvements.
|
|
40
|
+
|
|
41
|
+
**Multi-Agent Debate:** Systems using multiple instances of the same model can surface different perspectives but don't address correlated blind spots. All agents share the same underlying biases.
|
|
42
|
+
|
|
43
|
+
**Test-Time Compute:** Approaches like AlphaCode that generate many solutions and filter them require significant computational resources and don't systematically address blind spots.
|
|
44
|
+
|
|
45
|
+
### 1.3 Our Contribution: Adversarial Multi-Model Verification
|
|
46
|
+
|
|
47
|
+
We propose CMVK, which makes the following key contributions:
|
|
48
|
+
|
|
49
|
+
1. **Adversarial Architecture:** Explicit role separation where the Verifier is prompted to break solutions, not fix them
|
|
50
|
+
2. **Strategic Model Diversity:** Intentional pairing of models with different training data and architectural biases (e.g., OpenAI GPT-4o + Google Gemini)
|
|
51
|
+
3. **Strategy Banning Mechanism:** Dynamic tracking and prohibition of repeatedly failing approaches (Lateral Thinking)
|
|
52
|
+
4. **Complete Traceability:** Full execution logs capturing the adversarial debate for research purposes
|
|
53
|
+
|
|
54
|
+
---
|
|
55
|
+
|
|
56
|
+
## 2. Methodology
|
|
57
|
+
|
|
58
|
+
### 2.1 Architecture Overview
|
|
59
|
+
|
|
60
|
+
CMVK implements a three-component architecture:
|
|
61
|
+
|
|
62
|
+
```
|
|
63
|
+
┌─────────────────────────────────────────────────────────┐
|
|
64
|
+
│ Verification Kernel (Arbiter) │
|
|
65
|
+
│ - Manages verification loop │
|
|
66
|
+
│ - Enforces strategy bans │
|
|
67
|
+
│ - Makes final accept/reject decisions │
|
|
68
|
+
└───────────┬─────────────────────────────┬───────────────┘
|
|
69
|
+
│ │
|
|
70
|
+
┌───────▼────────┐ ┌────────▼────────┐
|
|
71
|
+
│ Generator │ │ Verifier │
|
|
72
|
+
│ (System 1) │◄────────►│ (System 2) │
|
|
73
|
+
│ GPT-4o/o1 │ Hostile │ Gemini 1.5 Pro │
|
|
74
|
+
│ High Speed │ Review │ High Logic │
|
|
75
|
+
└────────────────┘ └─────────────────┘
|
|
76
|
+
│ │
|
|
77
|
+
└──────────┬──────────────────┘
|
|
78
|
+
│
|
|
79
|
+
┌────────▼─────────┐
|
|
80
|
+
│ Trace Logger │
|
|
81
|
+
│ (The Witness) │
|
|
82
|
+
└──────────────────┘
|
|
83
|
+
```
|
|
84
|
+
|
|
85
|
+
### 2.2 Component Roles
|
|
86
|
+
|
|
87
|
+
#### 2.2.1 The Generator (System 1)
|
|
88
|
+
- **Model:** GPT-4o or equivalent high-speed generative model
|
|
89
|
+
- **Role:** Rapid solution generation with creative problem-solving
|
|
90
|
+
- **Input:** Problem statement + forbidden strategies list + previous feedback
|
|
91
|
+
- **Output:** Complete code solution with explanation
|
|
92
|
+
|
|
93
|
+
#### 2.2.2 The Verifier (System 2)
|
|
94
|
+
- **Model:** Gemini 1.5 Pro or equivalent analytical model
|
|
95
|
+
- **Role:** Adversarial examination to find flaws
|
|
96
|
+
- **Input:** Generated solution + problem requirements
|
|
97
|
+
- **Output:** Verification result (PASS/FAIL) + specific issues found + hostile test cases
|
|
98
|
+
- **Prompting Strategy:** Explicitly instructed to be skeptical and find edge cases
|
|
99
|
+
|
|
100
|
+
#### 2.2.3 The Arbiter (Deterministic Kernel)
|
|
101
|
+
- **Implementation:** Python control logic
|
|
102
|
+
- **Role:** Manages the verification loop and makes final decisions
|
|
103
|
+
- **Key Functions:**
|
|
104
|
+
- Strategy detection and tracking
|
|
105
|
+
- Forbidden strategy enforcement (bans strategies that fail ≥2 times)
|
|
106
|
+
- Maximum retry logic
|
|
107
|
+
- Trace logging coordination
|
|
108
|
+
|
|
109
|
+
### 2.3 The Verification Loop
|
|
110
|
+
|
|
111
|
+
```python
|
|
112
|
+
for attempt in range(max_retries):
|
|
113
|
+
# 1. Generate solution (respecting forbidden strategies)
|
|
114
|
+
code = Generator.generate(query, forbidden_strategies)
|
|
115
|
+
|
|
116
|
+
# 2. Verify solution
|
|
117
|
+
result = Verifier.verify(code, query)
|
|
118
|
+
|
|
119
|
+
# 3. Detect strategy used
|
|
120
|
+
strategy = detect_strategy(code)
|
|
121
|
+
|
|
122
|
+
# 4. Record in trace
|
|
123
|
+
trace.append({
|
|
124
|
+
'step': attempt,
|
|
125
|
+
'code': code,
|
|
126
|
+
'feedback': result.feedback,
|
|
127
|
+
'status': result.status,
|
|
128
|
+
'strategy': strategy
|
|
129
|
+
})
|
|
130
|
+
|
|
131
|
+
# 5. Decision logic
|
|
132
|
+
if result.status == PASS:
|
|
133
|
+
return code # Success
|
|
134
|
+
else:
|
|
135
|
+
# Track failures and potentially ban strategy
|
|
136
|
+
if strategy_failed_twice(strategy):
|
|
137
|
+
forbidden_strategies.append(strategy)
|
|
138
|
+
```
|
|
139
|
+
|
|
140
|
+
### 2.4 Strategy Banning (Lateral Thinking)
|
|
141
|
+
|
|
142
|
+
A key innovation in CMVK is dynamic strategy banning:
|
|
143
|
+
|
|
144
|
+
- **Detection:** Heuristic analysis identifies the algorithmic approach (e.g., "recursive", "built_in_sort", "bubble_sort")
|
|
145
|
+
- **Tracking:** Each failed attempt is logged with its strategy
|
|
146
|
+
- **Banning Threshold:** If a strategy fails ≥2 times, it's added to the forbidden list
|
|
147
|
+
- **Enforcement:** The Generator receives the forbidden list and must avoid banned approaches
|
|
148
|
+
|
|
149
|
+
This mechanism prevents the system from getting stuck in local minima and forces exploration of alternative solution spaces.
|
|
150
|
+
|
|
151
|
+
### 2.5 Traceability (The Witness)
|
|
152
|
+
|
|
153
|
+
Every execution generates a complete JSON trace containing:
|
|
154
|
+
- Problem statement
|
|
155
|
+
- All generation attempts with full code
|
|
156
|
+
- Verifier feedback for each attempt
|
|
157
|
+
- Strategy detections and ban decisions
|
|
158
|
+
- Final outcome (solved/failed)
|
|
159
|
+
- Metadata (timestamps, attempt counts)
|
|
160
|
+
|
|
161
|
+
These traces serve multiple purposes:
|
|
162
|
+
1. **Research:** Analyzing adversarial dynamics
|
|
163
|
+
2. **Debugging:** Understanding failure modes
|
|
164
|
+
3. **Transparency:** Auditing system decisions
|
|
165
|
+
4. **Visualization:** Replaying debates (see Section 4.2)
|
|
166
|
+
|
|
167
|
+
---
|
|
168
|
+
|
|
169
|
+
## 3. Experiments
|
|
170
|
+
|
|
171
|
+
### 3.1 Experimental Setup
|
|
172
|
+
|
|
173
|
+
**Dataset:** HumanEval benchmark - 164 hand-written programming problems with function signatures, docstrings, and unit tests (Chen et al., 2021).
|
|
174
|
+
|
|
175
|
+
**Baseline:** Single GPT-4o model generating solutions without verification loop.
|
|
176
|
+
|
|
177
|
+
**CMVK Configuration:**
|
|
178
|
+
- Generator: GPT-4o
|
|
179
|
+
- Verifier: Gemini 1.5 Pro
|
|
180
|
+
- Max retries: 5
|
|
181
|
+
- Strategy ban threshold: 2 failures
|
|
182
|
+
|
|
183
|
+
**Evaluation Metrics:**
|
|
184
|
+
- **Pass Rate:** Percentage of problems solved correctly
|
|
185
|
+
- **Attempt Efficiency:** Average attempts needed to reach solution
|
|
186
|
+
- **Strategy Diversity:** Number of unique strategies explored
|
|
187
|
+
- **Blind Spot Detection:** Cases where Verifier caught errors missed by Generator
|
|
188
|
+
|
|
189
|
+
### 3.2 Blind Spot Benchmark
|
|
190
|
+
|
|
191
|
+
We specifically designed test cases to expose correlated blind spots:
|
|
192
|
+
|
|
193
|
+
1. **Constraint Violation:** Problems with explicit forbidden operations (e.g., "without using sorted()")
|
|
194
|
+
2. **Edge Case Sensitivity:** Problems requiring careful handling of boundary conditions
|
|
195
|
+
3. **Performance Requirements:** Problems with specific complexity requirements (e.g., O(n))
|
|
196
|
+
4. **Regex Precision:** Pattern matching problems with subtle requirements
|
|
197
|
+
|
|
198
|
+
### 3.3 Results
|
|
199
|
+
|
|
200
|
+
**Instructions for Researchers:**
|
|
201
|
+
|
|
202
|
+
To fill in this table, run the following commands:
|
|
203
|
+
|
|
204
|
+
```bash
|
|
205
|
+
# For 50-problem dataset (recommended for statistical significance):
|
|
206
|
+
python experiments/blind_spot_benchmark.py --dataset experiments/datasets/humaneval_50.json
|
|
207
|
+
|
|
208
|
+
# For full dataset (164 problems, takes ~15-20 minutes):
|
|
209
|
+
python experiments/blind_spot_benchmark.py --dataset experiments/datasets/humaneval_full.json
|
|
210
|
+
```
|
|
211
|
+
|
|
212
|
+
After the benchmark completes, check `experiments/results/blind_spot_summary_*.txt` for the results and fill in the table below.
|
|
213
|
+
|
|
214
|
+
---
|
|
215
|
+
|
|
216
|
+
**Benchmark Results (n=50 problems):**
|
|
217
|
+
|
|
218
|
+
| Metric | Baseline (GPT-4o) | CMVK | Improvement |
|
|
219
|
+
|--------|-------------------|------|-------------|
|
|
220
|
+
| Pass Rate (n=50) | **[FILL: __%]** | **[FILL: __%]** | **[FILL: +__%]** |
|
|
221
|
+
| Total Successes | **[FILL: __/50]** | **[FILL: __/50]** | **[FILL: +__]** |
|
|
222
|
+
| Avg. Attempts | 1.0 | **[FILL: __]** | N/A |
|
|
223
|
+
| Strategy Bans (avg) | 0 | **[FILL: __]** | N/A |
|
|
224
|
+
| Total Runtime | **[FILL: __s]** | **[FILL: __s]** | **[FILL: +__%]** |
|
|
225
|
+
|
|
226
|
+
**Instructions for filling this table:**
|
|
227
|
+
1. Look at the generated `blind_spot_summary_*.txt` file
|
|
228
|
+
2. Find "Baseline Success Rate" and "CMVK Success Rate"
|
|
229
|
+
3. Calculate improvement as: `(CMVK - Baseline) / Baseline × 100`
|
|
230
|
+
4. Count strategy bans from the detailed JSON results
|
|
231
|
+
5. Record total runtime from the summary
|
|
232
|
+
|
|
233
|
+
**Key Findings:**
|
|
234
|
+
|
|
235
|
+
After running the experiments, document your findings here:
|
|
236
|
+
- **[TODO: Pass rate improvement]** - Example: "CMVK achieved X% higher pass rate, demonstrating the effectiveness of cross-model verification"
|
|
237
|
+
- **[TODO: Bug detection]** - Example: "The verifier caught Y critical bugs that the generator missed in self-review"
|
|
238
|
+
- **[TODO: Strategy diversity]** - Example: "Strategy banning prevented Z cases of repeated failures, forcing exploration of alternative approaches"
|
|
239
|
+
- **[TODO: Edge case handling]** - Example: "CMVK successfully handled A edge cases that failed with single-model approach"
|
|
240
|
+
|
|
241
|
+
**Qualitative Observations:**
|
|
242
|
+
|
|
243
|
+
To find interesting examples for your paper, use the visualizer:
|
|
244
|
+
|
|
245
|
+
```bash
|
|
246
|
+
# List all traces to find interesting cases
|
|
247
|
+
python -m src.tools.visualizer --list
|
|
248
|
+
|
|
249
|
+
# Replay specific traces to find moments where Gemini catches GPT-4o's mistakes
|
|
250
|
+
python -m src.tools.visualizer --latest
|
|
251
|
+
```
|
|
252
|
+
|
|
253
|
+
Look for:
|
|
254
|
+
- Cases where the Prosecutor found bugs the Generator missed
|
|
255
|
+
- Examples of strategy banning forcing new approaches
|
|
256
|
+
- Edge cases that required multiple iterations to solve
|
|
257
|
+
|
|
258
|
+
### 3.4 Sabotage Stress Test Results
|
|
259
|
+
|
|
260
|
+
**TODO: Fill in after running `python experiments/sabotage_stress_test.py` (Optional)**
|
|
261
|
+
|
|
262
|
+
This experiment tests the Verifier's ability to detect bugs through Prosecutor Mode:
|
|
263
|
+
|
|
264
|
+
| Metric | Value |
|
|
265
|
+
|--------|-------|
|
|
266
|
+
| Total Test Cases | 40 |
|
|
267
|
+
| Valid Code Cases | 20 |
|
|
268
|
+
| Buggy Code Cases | 20 |
|
|
269
|
+
| **True Positives (Bugs Caught)** | **[FILL: __]** |
|
|
270
|
+
| **False Negatives (Bugs Missed)** | **[FILL: __]** |
|
|
271
|
+
| **Recall (Bug Detection Rate)** | **[FILL: __%]** |
|
|
272
|
+
| Precision | **[FILL: __%]** |
|
|
273
|
+
| F1 Score | **[FILL: __]** |
|
|
274
|
+
|
|
275
|
+
**Key Findings:**
|
|
276
|
+
- **[TODO: Add findings about the verifier's bug detection capabilities]**
|
|
277
|
+
|
|
278
|
+
---
|
|
279
|
+
|
|
280
|
+
## 4. Tools for Reproducibility
|
|
281
|
+
|
|
282
|
+
### 4.1 Data Generation Pipeline
|
|
283
|
+
|
|
284
|
+
The `paper_data_generator.py` script orchestrates experiments:
|
|
285
|
+
|
|
286
|
+
```bash
|
|
287
|
+
# Run with HumanEval dataset (first 50 problems)
|
|
288
|
+
python experiments/paper_data_generator.py --humaneval --count 50
|
|
289
|
+
|
|
290
|
+
# Scale to full dataset
|
|
291
|
+
python experiments/paper_data_generator.py --humaneval
|
|
292
|
+
```
|
|
293
|
+
|
|
294
|
+
### 4.2 Trace Visualization
|
|
295
|
+
|
|
296
|
+
The `visualizer.py` tool replays JSON traces as human-readable debates:
|
|
297
|
+
|
|
298
|
+
```bash
|
|
299
|
+
# Replay a specific trace
|
|
300
|
+
python -m src.tools.visualizer logs/traces/cmvk_HumanEval_0_*.json
|
|
301
|
+
|
|
302
|
+
# Replay latest trace
|
|
303
|
+
python -m src.tools.visualizer --latest
|
|
304
|
+
|
|
305
|
+
# List all traces
|
|
306
|
+
python -m src.tools.visualizer --list
|
|
307
|
+
```
|
|
308
|
+
|
|
309
|
+
**Example Output:**
|
|
310
|
+
```
|
|
311
|
+
>>> GPT-4o (The Builder): I'll solve this using Built-In Sort...
|
|
312
|
+
[Generated Code]
|
|
313
|
+
|
|
314
|
+
>>> Gemini (The Prosecutor): OBJECTION! The solution violates
|
|
315
|
+
the constraint 'WITHOUT using sorted()'.
|
|
316
|
+
|
|
317
|
+
>>> Kernel (The Arbiter): ⚖️ Objection Sustained. Solution REJECTED.
|
|
318
|
+
>>> Kernel (The Arbiter): 🚫 Strategy 'Built-In Sort' is now BANNED.
|
|
319
|
+
```
|
|
320
|
+
|
|
321
|
+
### 4.3 HumanEval Integration
|
|
322
|
+
|
|
323
|
+
The `humaneval_loader.py` module provides seamless dataset integration:
|
|
324
|
+
|
|
325
|
+
```python
|
|
326
|
+
from src.datasets.humaneval_loader import HumanEvalLoader
|
|
327
|
+
|
|
328
|
+
loader = HumanEvalLoader()
|
|
329
|
+
problems = loader.format_all_for_kernel(start=0, count=50)
|
|
330
|
+
```
|
|
331
|
+
|
|
332
|
+
---
|
|
333
|
+
|
|
334
|
+
## 5. Discussion
|
|
335
|
+
|
|
336
|
+
### 5.1 Why Multi-Model Verification Works
|
|
337
|
+
|
|
338
|
+
**Hypothesis:** Different models trained on different data distributions and with different architectures have non-overlapping blind spots.
|
|
339
|
+
|
|
340
|
+
**Observed Behaviors:**
|
|
341
|
+
- GPT-4o tends toward creative, sometimes over-engineered solutions
|
|
342
|
+
- Gemini 1.5 Pro exhibits stronger logical rigor and edge case awareness
|
|
343
|
+
- The adversarial dynamic forces both models out of their comfort zones
|
|
344
|
+
|
|
345
|
+
**"Money Shot" Example - When Adversarial Verification Saved the Day:**
|
|
346
|
+
|
|
347
|
+
**TODO: Paste a compelling trace example after running experiments. Look for cases where:**
|
|
348
|
+
- Generator proposed a solution with a bug
|
|
349
|
+
- Verifier caught the bug and rejected it
|
|
350
|
+
- Generator provided a corrected solution that passed
|
|
351
|
+
- Bonus: Strategy was banned preventing further failures
|
|
352
|
+
|
|
353
|
+
Use this command to find interesting traces:
|
|
354
|
+
```bash
|
|
355
|
+
python -m src.tools.visualizer --list
|
|
356
|
+
# Then replay specific ones to find the best example
|
|
357
|
+
python -m src.tools.visualizer logs/traces/cmvk_HumanEval_XX_*.json
|
|
358
|
+
```
|
|
359
|
+
|
|
360
|
+
**Example trace to include:**
|
|
361
|
+
```
|
|
362
|
+
[TODO: Paste the text output from the visualizer showing the adversarial debate]
|
|
363
|
+
```
|
|
364
|
+
|
|
365
|
+
### 5.2 Limitations
|
|
366
|
+
|
|
367
|
+
1. **Computational Cost:** Multiple model calls increase latency and API costs
|
|
368
|
+
2. **Strategy Detection:** Current heuristic-based approach may miss complex patterns
|
|
369
|
+
3. **Model Dependency:** Results are tied to specific model versions
|
|
370
|
+
4. **Convergence Not Guaranteed:** Max retries may be reached without solution
|
|
371
|
+
|
|
372
|
+
### 5.3 Future Work
|
|
373
|
+
|
|
374
|
+
- **Dynamic Model Selection:** Choose Generator/Verifier pairs based on problem type
|
|
375
|
+
- **Learned Strategy Detection:** Replace heuristics with learned classification
|
|
376
|
+
- **Formal Verification Integration:** Combine with static analysis tools
|
|
377
|
+
- **Multi-Verifier Ensemble:** Add third model for tiebreaking
|
|
378
|
+
- **Adaptive Banning:** More sophisticated strategy management
|
|
379
|
+
|
|
380
|
+
---
|
|
381
|
+
|
|
382
|
+
## 6. Formal Problem Definition
|
|
383
|
+
|
|
384
|
+
### 6.1 Problem Statement
|
|
385
|
+
|
|
386
|
+
Let $\mathcal{G}$ be a code generator model and $\mathcal{V}$ be a code verifier model. Given a programming task specification $s$, the goal is to produce correct code $c^*$ that satisfies all requirements in $s$.
|
|
387
|
+
|
|
388
|
+
**Definition 1 (Correlated Error Blindness).** Let $\mathcal{M}$ be a language model. The probability that $\mathcal{M}$ detects an error in its own output is:
|
|
389
|
+
|
|
390
|
+
$$P(\text{detect} | \text{error}, \mathcal{M}_{\text{gen}} = \mathcal{M}_{\text{ver}}) \leq 1 - \alpha$$
|
|
391
|
+
|
|
392
|
+
where $\alpha$ represents the correlation factor between generation and verification errors when using the same model. Empirically, $\alpha \approx 0.3$ for modern LLMs.
|
|
393
|
+
|
|
394
|
+
**Definition 2 (Cross-Model Independence).** For two models $\mathcal{G}$ and $\mathcal{V}$ with sufficiently different training distributions:
|
|
395
|
+
|
|
396
|
+
$$P(\text{error}_\mathcal{V} | \text{error}_\mathcal{G}) \approx P(\text{error}_\mathcal{V})$$
|
|
397
|
+
|
|
398
|
+
This independence assumption motivates cross-model verification.
|
|
399
|
+
|
|
400
|
+
### 6.2 Blind Spot Reduction Theorem
|
|
401
|
+
|
|
402
|
+
**Theorem 1.** Under the cross-model independence assumption, the probability of an undetected error in CMVK is:
|
|
403
|
+
|
|
404
|
+
$$P(\text{miss}_{\text{CMVK}}) = P(\text{error}_\mathcal{G}) \cdot P(\text{miss}_\mathcal{V})$$
|
|
405
|
+
|
|
406
|
+
For self-verification:
|
|
407
|
+
|
|
408
|
+
$$P(\text{miss}_{\text{self}}) = P(\text{error}_\mathcal{G}) \cdot (1 - \alpha)$$
|
|
409
|
+
|
|
410
|
+
where $\alpha$ is the correlated miss rate. Since $P(\text{miss}_\mathcal{V}) < (1 - \alpha)$ under independence, CMVK achieves lower error rates.
|
|
411
|
+
|
|
412
|
+
**Corollary 1.** The expected risk reduction factor is:
|
|
413
|
+
|
|
414
|
+
$$\rho = \frac{P(\text{miss}_{\text{self}})}{P(\text{miss}_{\text{CMVK}})} = \frac{1 - \alpha}{P(\text{miss}_\mathcal{V})}$$
|
|
415
|
+
|
|
416
|
+
With $\alpha \approx 0.3$ and $P(\text{miss}_\mathcal{V}) \approx 0.3$, we expect $\rho \approx 2.3\times$ improvement.
|
|
417
|
+
|
|
418
|
+
### 6.3 Computational Complexity
|
|
419
|
+
|
|
420
|
+
**Time Complexity:** Let $T_g$ and $T_v$ be the average generation and verification times. For a maximum of $k$ iterations:
|
|
421
|
+
|
|
422
|
+
$$T_{\text{CMVK}} = O(k \cdot (T_g + T_v))$$
|
|
423
|
+
|
|
424
|
+
In practice, $k \leq 5$ and most problems solve in $k \leq 2$ iterations.
|
|
425
|
+
|
|
426
|
+
**Space Complexity:** The Graph of Truth stores $O(k)$ solution states and $O(k)$ banned strategies per problem, requiring $O(k \cdot |c|)$ memory where $|c|$ is the average code length.
|
|
427
|
+
|
|
428
|
+
**API Cost:** Each verification loop requires 2 API calls (generation + verification), giving a worst-case cost multiplier of $2k$ compared to single-model generation.
|
|
429
|
+
|
|
430
|
+
---
|
|
431
|
+
|
|
432
|
+
## 7. Related Work
|
|
433
|
+
|
|
434
|
+
### 7.1 Self-Correction in Language Models
|
|
435
|
+
|
|
436
|
+
**Self-Refinement.** Madaan et al. (2023) introduced Self-Refine, where models iteratively improve their outputs using self-generated feedback. While effective for some tasks, this approach inherits the correlated error problem we address.
|
|
437
|
+
|
|
438
|
+
**Chain-of-Verification.** Dhuliawala et al. (2023) proposed CoVe, which generates verification questions to check factual claims. CMVK extends this concept by using a separate model for verification.
|
|
439
|
+
|
|
440
|
+
**Constitutional AI.** Bai et al. (2022) at Anthropic showed that models can be trained to critique and revise their outputs according to principles. CMVK differs by using runtime cross-model verification rather than training-time alignment.
|
|
441
|
+
|
|
442
|
+
### 7.2 Multi-Agent LLM Systems
|
|
443
|
+
|
|
444
|
+
**LLM Debate.** Du et al. (2023) demonstrated that multiple LLM agents debating improves reasoning accuracy. CMVK adopts an adversarial rather than cooperative dynamic.
|
|
445
|
+
|
|
446
|
+
**AutoGen.** Wu et al. (2023) introduced a framework for multi-agent conversations. CMVK specializes this for the code verification domain with explicit role separation.
|
|
447
|
+
|
|
448
|
+
**CAMEL.** Li et al. (2023) explored role-playing between agents. Our Generator-Verifier dynamic is a specific instantiation optimized for adversarial code review.
|
|
449
|
+
|
|
450
|
+
### 7.3 Code Generation and Verification
|
|
451
|
+
|
|
452
|
+
**Codex and Copilot.** Chen et al. (2021) established HumanEval as the standard benchmark. CMVK builds on this foundation with multi-model verification.
|
|
453
|
+
|
|
454
|
+
**AlphaCode.** Li et al. (2022) achieved strong results by generating many candidates and filtering. CMVK achieves efficiency through iterative refinement rather than massive sampling.
|
|
455
|
+
|
|
456
|
+
**CodeT.** Chen et al. (2022) used test generation to verify code. CMVK's Prosecutor Mode generates hostile tests adversarially.
|
|
457
|
+
|
|
458
|
+
**Self-Debug.** Chen et al. (2023) showed single-model debugging can improve results. CMVK extends this with cross-model verification to catch correlated errors.
|
|
459
|
+
|
|
460
|
+
### 7.4 Program Verification
|
|
461
|
+
|
|
462
|
+
**Static Analysis.** Tools like Infer (Calcagno et al., 2015) and Coverity detect bugs through formal analysis. CMVK complements these with semantic verification via LLMs.
|
|
463
|
+
|
|
464
|
+
**Formal Methods.** Systems like Coq and Isabelle/HOL provide mathematical correctness guarantees. CMVK offers a more accessible approach for general-purpose code.
|
|
465
|
+
|
|
466
|
+
**Fuzzing.** AFL (Zalewski, 2014) and similar tools find bugs through random testing. CMVK's Prosecutor Mode can be seen as semantic fuzzing guided by an LLM.
|
|
467
|
+
|
|
468
|
+
### 7.5 Positioning CMVK
|
|
469
|
+
|
|
470
|
+
| Approach | Cross-Model | Adversarial | Strategy Banning | Traceability |
|
|
471
|
+
|----------|-------------|-------------|------------------|--------------|
|
|
472
|
+
| Self-Refine | ✗ | ✗ | ✗ | ✗ |
|
|
473
|
+
| LLM Debate | ✗ | Partial | ✗ | ✗ |
|
|
474
|
+
| AlphaCode | ✗ | ✗ | ✗ | ✗ |
|
|
475
|
+
| Self-Debug | ✗ | ✗ | ✗ | ✗ |
|
|
476
|
+
| **CMVK** | ✓ | ✓ | ✓ | ✓ |
|
|
477
|
+
|
|
478
|
+
---
|
|
479
|
+
|
|
480
|
+
## 8. Conclusion
|
|
481
|
+
|
|
482
|
+
We introduced CMVK, an adversarial multi-model architecture that addresses the correlated error blindness problem in self-correcting AI agents. By strategically pairing models with different training backgrounds and explicitly designing an adversarial relationship, CMVK achieves improved correctness on code generation benchmarks.
|
|
483
|
+
|
|
484
|
+
The key insight is that **trust, but verify with a different brain**. Just as human code review benefits from fresh perspectives, AI code generation benefits from verification by models with different knowledge boundaries.
|
|
485
|
+
|
|
486
|
+
Our complete implementation, including the HumanEval integration and trace visualization tools, is open source and available for reproducibility.
|
|
487
|
+
|
|
488
|
+
---
|
|
489
|
+
|
|
490
|
+
## Appendix A: System Prompts
|
|
491
|
+
|
|
492
|
+
[To be added: Full prompts used for Generator and Verifier]
|
|
493
|
+
|
|
494
|
+
## Appendix B: Example Traces
|
|
495
|
+
|
|
496
|
+
**TODO: After running experiments, add 2-3 complete trace examples**
|
|
497
|
+
|
|
498
|
+
### Example 1: Successful First Attempt
|
|
499
|
+
[TODO: Add trace where solution passed on first try]
|
|
500
|
+
|
|
501
|
+
### Example 2: Adversarial Correction
|
|
502
|
+
[TODO: Add trace where verifier caught a bug and generator fixed it]
|
|
503
|
+
|
|
504
|
+
### Example 3: Strategy Banning in Action
|
|
505
|
+
[TODO: Add trace where a strategy was banned after repeated failures]
|
|
506
|
+
|
|
507
|
+
To generate these examples:
|
|
508
|
+
```bash
|
|
509
|
+
# Run the benchmark
|
|
510
|
+
python experiments/blind_spot_benchmark.py
|
|
511
|
+
|
|
512
|
+
# List all traces
|
|
513
|
+
python -m src.tools.visualizer --list
|
|
514
|
+
|
|
515
|
+
# Replay interesting ones and copy the output
|
|
516
|
+
python -m src.tools.visualizer logs/traces/cmvk_HumanEval_XX_*.json --speed 0
|
|
517
|
+
```
|
|
518
|
+
|
|
519
|
+
## Appendix C: Statistical Analysis
|
|
520
|
+
|
|
521
|
+
[To be added: Detailed statistical tests and significance measures]
|
|
522
|
+
|
|
523
|
+
---
|
|
524
|
+
|
|
525
|
+
## References
|
|
526
|
+
|
|
527
|
+
1. Austin, J., et al. (2021). Program Synthesis with Large Language Models. arXiv:2108.07732.
|
|
528
|
+
|
|
529
|
+
2. Bai, Y., et al. (2022). Constitutional AI: Harmlessness from AI Feedback. arXiv:2212.08073.
|
|
530
|
+
|
|
531
|
+
3. Calcagno, C., et al. (2015). Moving Fast with Software Verification. NASA Formal Methods.
|
|
532
|
+
|
|
533
|
+
4. Chen, B., et al. (2022). CodeT: Code Generation with Generated Tests. arXiv:2207.10397.
|
|
534
|
+
|
|
535
|
+
5. Chen, M., et al. (2021). Evaluating Large Language Models Trained on Code. arXiv:2107.03374.
|
|
536
|
+
|
|
537
|
+
6. Chen, X., et al. (2023). Teaching Large Language Models to Self-Debug. arXiv:2304.05128.
|
|
538
|
+
|
|
539
|
+
7. Dhuliawala, S., et al. (2023). Chain-of-Verification Reduces Hallucination in Large Language Models. arXiv:2309.11495.
|
|
540
|
+
|
|
541
|
+
8. Du, Y., et al. (2023). Improving Factuality and Reasoning in Language Models through Multiagent Debate. arXiv:2305.14325.
|
|
542
|
+
|
|
543
|
+
9. Li, G., et al. (2023). CAMEL: Communicative Agents for "Mind" Exploration of Large Language Model Society. arXiv:2303.17760.
|
|
544
|
+
|
|
545
|
+
10. Li, Y., et al. (2022). Competition-Level Code Generation with AlphaCode. Science.
|
|
546
|
+
|
|
547
|
+
11. Madaan, A., et al. (2023). Self-Refine: Iterative Refinement with Self-Feedback. arXiv:2303.17651.
|
|
548
|
+
|
|
549
|
+
12. OpenAI (2023). GPT-4 Technical Report. arXiv:2303.08774.
|
|
550
|
+
|
|
551
|
+
13. Wu, Q., et al. (2023). AutoGen: Enabling Next-Gen LLM Applications via Multi-Agent Conversation. arXiv:2308.08155.
|
|
552
|
+
|
|
553
|
+
14. Zalewski, M. (2014). American Fuzzy Lop Technical Whitepaper.
|
|
554
|
+
|
|
555
|
+
---
|
|
556
|
+
|
|
557
|
+
**Acknowledgments:** [To be filled]
|
|
558
|
+
|
|
559
|
+
**Code Availability:** https://github.com/imran-siddique/cross-model-verification-kernel
|
|
560
|
+
|
|
561
|
+
**Data Availability:** HumanEval dataset available at https://github.com/openai/human-eval
|