agent-os-kernel 1.1.0__py3-none-any.whl → 1.2.0__py3-none-any.whl

This diff compares the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.
Files changed (1051)
  1. agent_os/__init__.py +66 -4
  2. agent_os/agents_compat.py +286 -0
  3. agent_os/base_agent.py +308 -0
  4. agent_os/cli.py +1079 -19
  5. agent_os/integrations/__init__.py +37 -2
  6. agent_os/integrations/openai_adapter.py +502 -0
  7. agent_os/integrations/semantic_kernel_adapter.py +569 -0
  8. agent_os/stateless.py +349 -0
  9. agent_os_kernel-1.2.0.dist-info/METADATA +676 -0
  10. agent_os_kernel-1.2.0.dist-info/RECORD +1053 -0
  11. {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/entry_points.txt +0 -1
  12. modules/amb/.github/workflows/ci.yml +102 -0
  13. modules/amb/.github/workflows/publish.yml +146 -0
  14. modules/amb/.gitignore +134 -0
  15. modules/amb/CHANGELOG.md +118 -0
  16. modules/amb/CONTRIBUTING.md +141 -0
  17. modules/amb/LICENSE +21 -0
  18. modules/amb/README.md +188 -0
  19. modules/amb/amb_core/__init__.py +175 -0
  20. modules/amb/amb_core/adapters/__init__.py +55 -0
  21. modules/amb/amb_core/adapters/aws_sqs_broker.py +374 -0
  22. modules/amb/amb_core/adapters/azure_servicebus_broker.py +338 -0
  23. modules/amb/amb_core/adapters/kafka_broker.py +258 -0
  24. modules/amb/amb_core/adapters/nats_broker.py +283 -0
  25. modules/amb/amb_core/adapters/rabbitmq_broker.py +233 -0
  26. modules/amb/amb_core/adapters/redis_broker.py +260 -0
  27. modules/amb/amb_core/broker.py +143 -0
  28. modules/amb/amb_core/bus.py +479 -0
  29. modules/amb/amb_core/cloudevents.py +507 -0
  30. modules/amb/amb_core/dlq.py +343 -0
  31. modules/amb/amb_core/hf_utils.py +534 -0
  32. modules/amb/amb_core/memory_broker.py +408 -0
  33. modules/amb/amb_core/models.py +139 -0
  34. modules/amb/amb_core/persistence.py +527 -0
  35. modules/amb/amb_core/schema.py +292 -0
  36. modules/amb/amb_core/tracing.py +356 -0
  37. modules/amb/examples/advanced_features.py +223 -0
  38. modules/amb/examples/backpressure_demo.py +225 -0
  39. modules/amb/examples/basic_usage.py +117 -0
  40. modules/amb/examples/tracing_demo.py +104 -0
  41. modules/amb/experiments/README.md +52 -0
  42. modules/amb/experiments/reproduce_results.py +467 -0
  43. modules/amb/experiments/results.json +324 -0
  44. modules/amb/paper/README.md +40 -0
  45. modules/amb/paper/paper.tex +365 -0
  46. modules/amb/paper/whitepaper.md +377 -0
  47. modules/amb/pyproject.toml +117 -0
  48. modules/amb/tests/__init__.py +1 -0
  49. modules/amb/tests/test_backpressure_priority.py +280 -0
  50. modules/amb/tests/test_bus.py +198 -0
  51. modules/amb/tests/test_cloudevents.py +443 -0
  52. modules/amb/tests/test_features.py +531 -0
  53. modules/amb/tests/test_models.py +74 -0
  54. modules/amb/tests/test_tracing.py +254 -0
  55. modules/atr/.github/workflows/ci.yml +101 -0
  56. modules/atr/.github/workflows/publish.yml +140 -0
  57. modules/atr/.gitignore +134 -0
  58. modules/atr/.pre-commit-config.yaml +37 -0
  59. modules/atr/CHANGELOG.md +39 -0
  60. modules/atr/CONTRIBUTING.md +96 -0
  61. modules/atr/IMPLEMENTATION_SUMMARY.md +143 -0
  62. modules/atr/README.md +180 -0
  63. modules/atr/atr/__init__.py +638 -0
  64. modules/atr/atr/access.py +346 -0
  65. modules/atr/atr/composition.py +643 -0
  66. modules/atr/atr/decorator.py +355 -0
  67. modules/atr/atr/executor.py +382 -0
  68. modules/atr/atr/health.py +555 -0
  69. modules/atr/atr/hf_utils.py +447 -0
  70. modules/atr/atr/injection.py +420 -0
  71. modules/atr/atr/metrics.py +438 -0
  72. modules/atr/atr/policies.py +401 -0
  73. modules/atr/atr/py.typed +2 -0
  74. modules/atr/atr/registry.py +450 -0
  75. modules/atr/atr/schema.py +478 -0
  76. modules/atr/atr/tools/safe/__init__.py +73 -0
  77. modules/atr/atr/tools/safe/calculator.py +380 -0
  78. modules/atr/atr/tools/safe/datetime_tool.py +441 -0
  79. modules/atr/atr/tools/safe/file_reader.py +400 -0
  80. modules/atr/atr/tools/safe/http_client.py +314 -0
  81. modules/atr/atr/tools/safe/json_parser.py +372 -0
  82. modules/atr/atr/tools/safe/text_tool.py +526 -0
  83. modules/atr/atr/tools/safe/toolkit.py +173 -0
  84. modules/atr/docs/PYPI_SETUP.md +113 -0
  85. modules/atr/examples/README.md +27 -0
  86. modules/atr/examples/demo.py +144 -0
  87. modules/atr/examples/sandbox_demo.py +218 -0
  88. modules/atr/experiments/README.md +69 -0
  89. modules/atr/experiments/reproduce_results.py +509 -0
  90. modules/atr/experiments/results/.gitkeep +0 -0
  91. modules/atr/experiments/results/results_20260123_140334.json +71 -0
  92. modules/atr/paper/README.md +36 -0
  93. modules/atr/paper/figures/.gitkeep +0 -0
  94. modules/atr/paper/references.bib +84 -0
  95. modules/atr/paper/structure.tex +293 -0
  96. modules/atr/paper/whitepaper.md +234 -0
  97. modules/atr/pyproject.toml +148 -0
  98. modules/atr/requirements.txt +1 -0
  99. modules/atr/setup.py +30 -0
  100. modules/atr/tests/__init__.py +1 -0
  101. modules/atr/tests/test_decorator.py +317 -0
  102. modules/atr/tests/test_executor.py +245 -0
  103. modules/atr/tests/test_integration_executor.py +184 -0
  104. modules/atr/tests/test_registry.py +312 -0
  105. modules/atr/tests/test_schema.py +182 -0
  106. modules/atr/tests/test_v2_features.py +708 -0
  107. modules/caas/.dockerignore +63 -0
  108. modules/caas/.github/ISSUE_TEMPLATE/bug_report.md +38 -0
  109. modules/caas/.github/ISSUE_TEMPLATE/custom.md +10 -0
  110. modules/caas/.github/ISSUE_TEMPLATE/feature_request.md +20 -0
  111. modules/caas/.github/workflows/ci.yml +100 -0
  112. modules/caas/.github/workflows/lint.yml +39 -0
  113. modules/caas/.github/workflows/publish-pypi.yml +124 -0
  114. modules/caas/.gitignore +73 -0
  115. modules/caas/.pre-commit-config.yaml +33 -0
  116. modules/caas/CHANGELOG.md +58 -0
  117. modules/caas/CONTRIBUTING.md +346 -0
  118. modules/caas/Dockerfile +41 -0
  119. modules/caas/LICENSE +21 -0
  120. modules/caas/MANIFEST.in +11 -0
  121. modules/caas/README.md +158 -0
  122. modules/caas/benchmarks/README.md +255 -0
  123. modules/caas/benchmarks/create_hf_dataset.py +502 -0
  124. modules/caas/benchmarks/data/sample_corpus/README.md +86 -0
  125. modules/caas/benchmarks/data/sample_corpus/auth_module.py +211 -0
  126. modules/caas/benchmarks/data/sample_corpus/contribution_guide.md +185 -0
  127. modules/caas/benchmarks/data/sample_corpus/remote_work_policy.html +57 -0
  128. modules/caas/benchmarks/hf_dataset/README.md +214 -0
  129. modules/caas/benchmarks/hf_dataset/caas_benchmark_corpus.py +73 -0
  130. modules/caas/benchmarks/hf_dataset/corpus_preview.json +193 -0
  131. modules/caas/benchmarks/results/README.md +66 -0
  132. modules/caas/benchmarks/results/evaluation_2026-01-20.json +121 -0
  133. modules/caas/benchmarks/run_evaluation.py +561 -0
  134. modules/caas/benchmarks/statistical_tests.py +289 -0
  135. modules/caas/benchmarks/verify_sample_corpus.py +83 -0
  136. modules/caas/docker-compose.yml +38 -0
  137. modules/caas/docs/CONTEXT_TRIAD.md +462 -0
  138. modules/caas/docs/CONTRIBUTING.md +346 -0
  139. modules/caas/docs/ETHICS_AND_LIMITATIONS.md +336 -0
  140. modules/caas/docs/HEURISTIC_ROUTER.md +442 -0
  141. modules/caas/docs/IMPLEMENTATION_SUMMARY.md +363 -0
  142. modules/caas/docs/IMPLEMENTATION_SUMMARY_CONTEXT_TRIAD.md +277 -0
  143. modules/caas/docs/IMPLEMENTATION_SUMMARY_HEURISTIC_ROUTER.md +231 -0
  144. modules/caas/docs/IMPLEMENTATION_SUMMARY_METADATA_INJECTION.md +258 -0
  145. modules/caas/docs/IMPLEMENTATION_SUMMARY_PRAGMATIC_TRUTH.md +212 -0
  146. modules/caas/docs/IMPLEMENTATION_SUMMARY_TRUST_GATEWAY.md +319 -0
  147. modules/caas/docs/LAYER_1_PRIMITIVE.md +202 -0
  148. modules/caas/docs/METADATA_INJECTION.md +404 -0
  149. modules/caas/docs/PRAGMATIC_TRUTH.md +431 -0
  150. modules/caas/docs/RELATED_WORK.md +312 -0
  151. modules/caas/docs/RELEASE_CHECKLIST.md +219 -0
  152. modules/caas/docs/RELEASE_GUIDE.md +285 -0
  153. modules/caas/docs/REPRODUCIBILITY.md +386 -0
  154. modules/caas/docs/SLIDING_WINDOW.md +387 -0
  155. modules/caas/docs/STRUCTURE_AWARE_INDEXING.md +158 -0
  156. modules/caas/docs/TESTING.md +259 -0
  157. modules/caas/docs/THREAT_MODEL.md +247 -0
  158. modules/caas/docs/TRUST_GATEWAY.md +575 -0
  159. modules/caas/docs/VFS.md +298 -0
  160. modules/caas/examples/agents/enterprise_security_agent.py +414 -0
  161. modules/caas/examples/agents/intelligent_document_analyzer.py +380 -0
  162. modules/caas/examples/demos/demo.py +309 -0
  163. modules/caas/examples/demos/demo_context_triad.py +225 -0
  164. modules/caas/examples/demos/demo_conversation_manager.py +285 -0
  165. modules/caas/examples/demos/demo_heuristic_router.py +133 -0
  166. modules/caas/examples/demos/demo_metadata_injection.py +198 -0
  167. modules/caas/examples/demos/demo_pragmatic_truth.py +303 -0
  168. modules/caas/examples/demos/demo_structure_aware.py +140 -0
  169. modules/caas/examples/demos/demo_time_decay.py +247 -0
  170. modules/caas/examples/demos/demo_trust_gateway.py +383 -0
  171. modules/caas/examples/multi_agent/README.md +159 -0
  172. modules/caas/examples/multi_agent/research_team.py +369 -0
  173. modules/caas/examples/multi_agent/vfs_collaboration.py +393 -0
  174. modules/caas/examples/usage/auth_module.py +142 -0
  175. modules/caas/examples/usage/usage_example.py +173 -0
  176. modules/caas/experiments/README.md +42 -0
  177. modules/caas/experiments/reproduce_results.py +462 -0
  178. modules/caas/paper/ARXIV_METADATA.md +145 -0
  179. modules/caas/paper/ARXIV_README.md +47 -0
  180. modules/caas/paper/CHECKLIST.md +103 -0
  181. modules/caas/paper/GITHUB_RELEASE_NOTES.md +105 -0
  182. modules/caas/paper/README.md +71 -0
  183. modules/caas/paper/abstract.md +24 -0
  184. modules/caas/paper/arxiv_submission.tar +0 -0
  185. modules/caas/paper/arxiv_submission.zip +0 -0
  186. modules/caas/paper/build_pdf.py +355 -0
  187. modules/caas/paper/experiments.md +149 -0
  188. modules/caas/paper/figures/.gitkeep +0 -0
  189. modules/caas/paper/figures/README.md +237 -0
  190. modules/caas/paper/figures/fig1_system_architecture.png +0 -0
  191. modules/caas/paper/figures/fig1_system_architecture.svg +198 -0
  192. modules/caas/paper/figures/fig2_context_triad.png +0 -0
  193. modules/caas/paper/figures/fig2_context_triad.svg +105 -0
  194. modules/caas/paper/figures/fig3_ablation_results.png +0 -0
  195. modules/caas/paper/figures/fig3_ablation_results.svg +113 -0
  196. modules/caas/paper/figures/fig4_routing_latency.png +0 -0
  197. modules/caas/paper/figures/fig4_routing_latency.svg +97 -0
  198. modules/caas/paper/intro.md +103 -0
  199. modules/caas/paper/latex/figures/fig1_system_architecture.png +0 -0
  200. modules/caas/paper/latex/figures/fig2_context_triad.png +0 -0
  201. modules/caas/paper/latex/figures/fig3_ablation_results.png +0 -0
  202. modules/caas/paper/latex/figures/fig4_routing_latency.png +0 -0
  203. modules/caas/paper/latex/main.tex +468 -0
  204. modules/caas/paper/latex/references.bib +140 -0
  205. modules/caas/paper/method.md +350 -0
  206. modules/caas/paper/outline.md +123 -0
  207. modules/caas/paper/related_work.md +101 -0
  208. modules/caas/paper/tables/.gitkeep +0 -0
  209. modules/caas/paper/tables/results_tables.md +50 -0
  210. modules/caas/pyproject.toml +172 -0
  211. modules/caas/requirements.txt +11 -0
  212. modules/caas/src/caas/__init__.py +232 -0
  213. modules/caas/src/caas/api/__init__.py +7 -0
  214. modules/caas/src/caas/api/server.py +1326 -0
  215. modules/caas/src/caas/caching.py +832 -0
  216. modules/caas/src/caas/cli.py +208 -0
  217. modules/caas/src/caas/conversation.py +221 -0
  218. modules/caas/src/caas/decay.py +118 -0
  219. modules/caas/src/caas/detection/__init__.py +7 -0
  220. modules/caas/src/caas/detection/detector.py +236 -0
  221. modules/caas/src/caas/enrichment.py +127 -0
  222. modules/caas/src/caas/gateway/__init__.py +24 -0
  223. modules/caas/src/caas/gateway/trust_gateway.py +471 -0
  224. modules/caas/src/caas/hf_utils.py +477 -0
  225. modules/caas/src/caas/ingestion/__init__.py +21 -0
  226. modules/caas/src/caas/ingestion/processors.py +251 -0
  227. modules/caas/src/caas/ingestion/structure_parser.py +185 -0
  228. modules/caas/src/caas/models.py +354 -0
  229. modules/caas/src/caas/pragmatic_truth.py +441 -0
  230. modules/caas/src/caas/routing/__init__.py +8 -0
  231. modules/caas/src/caas/routing/heuristic_router.py +242 -0
  232. modules/caas/src/caas/storage/__init__.py +7 -0
  233. modules/caas/src/caas/storage/store.py +450 -0
  234. modules/caas/src/caas/triad.py +472 -0
  235. modules/caas/src/caas/tuning/__init__.py +7 -0
  236. modules/caas/src/caas/tuning/tuner.py +322 -0
  237. modules/caas/src/caas/vfs/__init__.py +12 -0
  238. modules/caas/src/caas/vfs/filesystem.py +450 -0
  239. modules/caas/tests/__init__.py +3 -0
  240. modules/caas/tests/conftest.py +8 -0
  241. modules/caas/tests/test_caching.py +628 -0
  242. modules/caas/tests/test_context_triad.py +385 -0
  243. modules/caas/tests/test_conversation_manager.py +289 -0
  244. modules/caas/tests/test_functionality.py +215 -0
  245. modules/caas/tests/test_heuristic_router.py +370 -0
  246. modules/caas/tests/test_metadata_injection.py +328 -0
  247. modules/caas/tests/test_pragmatic_truth.py +322 -0
  248. modules/caas/tests/test_structure_aware_indexing.py +283 -0
  249. modules/caas/tests/test_time_decay.py +268 -0
  250. modules/caas/tests/test_trust_gateway.py +445 -0
  251. modules/caas/tests/test_vfs.py +298 -0
  252. modules/cmvk/.github/FUNDING.yml +9 -0
  253. modules/cmvk/.github/dependabot.yml +54 -0
  254. modules/cmvk/.github/workflows/ci.yml +205 -0
  255. modules/cmvk/.github/workflows/publish.yml +143 -0
  256. modules/cmvk/.gitignore +147 -0
  257. modules/cmvk/.pre-commit-config.yaml +58 -0
  258. modules/cmvk/CHANGELOG.md +146 -0
  259. modules/cmvk/CITATION.cff +48 -0
  260. modules/cmvk/CONTRIBUTING.md +229 -0
  261. modules/cmvk/Dockerfile +87 -0
  262. modules/cmvk/HF_MODEL_CARD.md +185 -0
  263. modules/cmvk/LICENSE +21 -0
  264. modules/cmvk/README.md +149 -0
  265. modules/cmvk/SECURITY.md +114 -0
  266. modules/cmvk/config/prompts/generator_v1.txt +23 -0
  267. modules/cmvk/config/prompts/verifier_hostile.txt +32 -0
  268. modules/cmvk/config/settings.yaml +40 -0
  269. modules/cmvk/coverage_html/.gitignore +2 -0
  270. modules/cmvk/coverage_html/class_index.html +658 -0
  271. modules/cmvk/coverage_html/coverage_html_cb_188fc9a4.js +735 -0
  272. modules/cmvk/coverage_html/favicon_32_cb_c827f16f.png +0 -0
  273. modules/cmvk/coverage_html/function_index.html +1978 -0
  274. modules/cmvk/coverage_html/index.html +255 -0
  275. modules/cmvk/coverage_html/keybd_closed_cb_900cfef5.png +0 -0
  276. modules/cmvk/coverage_html/status.json +1 -0
  277. modules/cmvk/coverage_html/style_cb_5c747636.css +389 -0
  278. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38___init___py.html +315 -0
  279. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_audit_py.html +499 -0
  280. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_benchmarks_py.html +575 -0
  281. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_constitutional_py.html +1001 -0
  282. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_hf_utils_py.html +398 -0
  283. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_metrics_py.html +570 -0
  284. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_profiles_py.html +397 -0
  285. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_types_py.html +109 -0
  286. modules/cmvk/coverage_html/z_2c49bd2ed3e01e38_verification_py.html +1053 -0
  287. modules/cmvk/docs/DIAGRAMS.md +325 -0
  288. modules/cmvk/docs/architecture.md +345 -0
  289. modules/cmvk/docs/features.md +308 -0
  290. modules/cmvk/docs/getting_started.md +279 -0
  291. modules/cmvk/docs/innovation_layer.md +377 -0
  292. modules/cmvk/docs/safety.md +281 -0
  293. modules/cmvk/docs/traceability.md +150 -0
  294. modules/cmvk/examples/basic_example.py +62 -0
  295. modules/cmvk/examples/demo_complete_pipeline.py +209 -0
  296. modules/cmvk/examples/demo_innovation_layer.py +197 -0
  297. modules/cmvk/examples/example.py +112 -0
  298. modules/cmvk/examples/model_diversity_comparison.py +110 -0
  299. modules/cmvk/examples/real_api_integration.py +121 -0
  300. modules/cmvk/examples/test_full_pipeline.py +303 -0
  301. modules/cmvk/experiments/FEATURE_2_LATERAL_THINKING.md +187 -0
  302. modules/cmvk/experiments/README.md +216 -0
  303. modules/cmvk/experiments/ablation_runner.py +666 -0
  304. modules/cmvk/experiments/baseline_runner.py +158 -0
  305. modules/cmvk/experiments/blind_spot_benchmark.py +364 -0
  306. modules/cmvk/experiments/datasets/README.md +85 -0
  307. modules/cmvk/experiments/datasets/humaneval_50.json +352 -0
  308. modules/cmvk/experiments/datasets/humaneval_full.json +1150 -0
  309. modules/cmvk/experiments/datasets/humaneval_sample.json +32 -0
  310. modules/cmvk/experiments/datasets/sabotage.json +262 -0
  311. modules/cmvk/experiments/datasets/sample.json +40 -0
  312. modules/cmvk/experiments/demo_with_traces.py +110 -0
  313. modules/cmvk/experiments/efficiency_curve.py +259 -0
  314. modules/cmvk/experiments/experiment_runner.py +243 -0
  315. modules/cmvk/experiments/paper_data_generator.py +183 -0
  316. modules/cmvk/experiments/reproduce_results.py +407 -0
  317. modules/cmvk/experiments/reproducible_runner.py +352 -0
  318. modules/cmvk/experiments/sabotage_stress_test.py +311 -0
  319. modules/cmvk/experiments/test_lateral_thinking.py +116 -0
  320. modules/cmvk/experiments/test_prosecutor.py +41 -0
  321. modules/cmvk/experiments/visualize_results.py +735 -0
  322. modules/cmvk/logs/traces/demo_HumanEval_0_20260121-204900.json +36 -0
  323. modules/cmvk/notebooks/analysis.ipynb +124 -0
  324. modules/cmvk/paper/PAPER.md +561 -0
  325. modules/cmvk/paper/arxiv_checklist.md +230 -0
  326. modules/cmvk/paper/cmvk_neurips.aux +77 -0
  327. modules/cmvk/paper/cmvk_neurips.bbl +81 -0
  328. modules/cmvk/paper/cmvk_neurips.blg +48 -0
  329. modules/cmvk/paper/cmvk_neurips.out +16 -0
  330. modules/cmvk/paper/cmvk_neurips.pdf +0 -0
  331. modules/cmvk/paper/cmvk_neurips.tex +309 -0
  332. modules/cmvk/paper/figures/ablation.png +0 -0
  333. modules/cmvk/paper/figures/ablation.svg +39 -0
  334. modules/cmvk/paper/figures/architecture.png +0 -0
  335. modules/cmvk/paper/figures/architecture.svg +115 -0
  336. modules/cmvk/paper/figures/results_bar.png +0 -0
  337. modules/cmvk/paper/figures/results_bar.svg +70 -0
  338. modules/cmvk/paper/generate_figures.py +383 -0
  339. modules/cmvk/paper/neurips_2024.sty +101 -0
  340. modules/cmvk/paper/references.bib +98 -0
  341. modules/cmvk/paper/structure.tex +200 -0
  342. modules/cmvk/pyproject.toml +189 -0
  343. modules/cmvk/requirements-dev.txt +19 -0
  344. modules/cmvk/requirements.txt +14 -0
  345. modules/cmvk/src/cmvk/__init__.py +216 -0
  346. modules/cmvk/src/cmvk/audit.py +400 -0
  347. modules/cmvk/src/cmvk/benchmarks.py +476 -0
  348. modules/cmvk/src/cmvk/constitutional.py +902 -0
  349. modules/cmvk/src/cmvk/hf_utils.py +299 -0
  350. modules/cmvk/src/cmvk/metrics.py +471 -0
  351. modules/cmvk/src/cmvk/profiles.py +298 -0
  352. modules/cmvk/src/cmvk/py.typed +0 -0
  353. modules/cmvk/src/cmvk/types.py +10 -0
  354. modules/cmvk/src/cmvk/verification.py +954 -0
  355. modules/cmvk/src/cross_model_verification_kernel/__init__.py +91 -0
  356. modules/cmvk/src/cross_model_verification_kernel/__main__.py +10 -0
  357. modules/cmvk/src/cross_model_verification_kernel/agents/__init__.py +16 -0
  358. modules/cmvk/src/cross_model_verification_kernel/agents/base_agent.py +142 -0
  359. modules/cmvk/src/cross_model_verification_kernel/agents/generator_openai.py +223 -0
  360. modules/cmvk/src/cross_model_verification_kernel/agents/verifier_anthropic.py +448 -0
  361. modules/cmvk/src/cross_model_verification_kernel/agents/verifier_gemini.py +481 -0
  362. modules/cmvk/src/cross_model_verification_kernel/cli.py +570 -0
  363. modules/cmvk/src/cross_model_verification_kernel/core/__init__.py +26 -0
  364. modules/cmvk/src/cross_model_verification_kernel/core/graph_memory.py +308 -0
  365. modules/cmvk/src/cross_model_verification_kernel/core/kernel.py +413 -0
  366. modules/cmvk/src/cross_model_verification_kernel/core/trace_logger.py +75 -0
  367. modules/cmvk/src/cross_model_verification_kernel/core/types.py +121 -0
  368. modules/cmvk/src/cross_model_verification_kernel/datasets/__init__.py +20 -0
  369. modules/cmvk/src/cross_model_verification_kernel/datasets/humaneval_loader.py +271 -0
  370. modules/cmvk/src/cross_model_verification_kernel/generator.py +118 -0
  371. modules/cmvk/src/cross_model_verification_kernel/kernel.py +292 -0
  372. modules/cmvk/src/cross_model_verification_kernel/models.py +111 -0
  373. modules/cmvk/src/cross_model_verification_kernel/py.typed +1 -0
  374. modules/cmvk/src/cross_model_verification_kernel/simple_kernel.py +185 -0
  375. modules/cmvk/src/cross_model_verification_kernel/tools/__init__.py +94 -0
  376. modules/cmvk/src/cross_model_verification_kernel/tools/huggingface_upload.py +394 -0
  377. modules/cmvk/src/cross_model_verification_kernel/tools/sandbox.py +159 -0
  378. modules/cmvk/src/cross_model_verification_kernel/tools/statistics.py +468 -0
  379. modules/cmvk/src/cross_model_verification_kernel/tools/visualizer.py +312 -0
  380. modules/cmvk/src/cross_model_verification_kernel/tools/web_search.py +86 -0
  381. modules/cmvk/src/cross_model_verification_kernel/verifier.py +257 -0
  382. modules/cmvk/tests/__init__.py +3 -0
  383. modules/cmvk/tests/conftest.py +61 -0
  384. modules/cmvk/tests/integration/__init__.py +1 -0
  385. modules/cmvk/tests/integration/test_anthropic_verifier.py +269 -0
  386. modules/cmvk/tests/integration/test_integration.py +53 -0
  387. modules/cmvk/tests/integration/test_lateral_thinking_integration.py +199 -0
  388. modules/cmvk/tests/integration/test_lateral_thinking_witness.py +208 -0
  389. modules/cmvk/tests/integration/test_prosecutor_mode.py +131 -0
  390. modules/cmvk/tests/test_constitutional.py +611 -0
  391. modules/cmvk/tests/test_enhanced_features.py +603 -0
  392. modules/cmvk/tests/test_verification.py +255 -0
  393. modules/cmvk/tests/unit/__init__.py +1 -0
  394. modules/cmvk/tests/unit/test_agents.py +64 -0
  395. modules/cmvk/tests/unit/test_cli.py +224 -0
  396. modules/cmvk/tests/unit/test_core.py +126 -0
  397. modules/cmvk/tests/unit/test_humaneval_loader.py +197 -0
  398. modules/cmvk/tests/unit/test_kernel.py +255 -0
  399. modules/cmvk/tests/unit/test_reproducibility.py +160 -0
  400. modules/cmvk/tests/unit/test_trace_logger.py +115 -0
  401. modules/cmvk/tests/unit/test_visualizer.py +218 -0
  402. modules/control-plane/.github/ISSUE_TEMPLATE/bug_report.yml +82 -0
  403. modules/control-plane/.github/ISSUE_TEMPLATE/config.yml +11 -0
  404. modules/control-plane/.github/ISSUE_TEMPLATE/feature_request.yml +104 -0
  405. modules/control-plane/.github/ISSUE_TEMPLATE/question.yml +70 -0
  406. modules/control-plane/.github/ISSUE_TEMPLATE/security_vulnerability.yml +84 -0
  407. modules/control-plane/.github/discussions.yml +73 -0
  408. modules/control-plane/.github/pull_request_template.md +82 -0
  409. modules/control-plane/.github/workflows/publish.yml +146 -0
  410. modules/control-plane/.github/workflows/release.yml +39 -0
  411. modules/control-plane/.github/workflows/tests.yml +58 -0
  412. modules/control-plane/.gitignore +55 -0
  413. modules/control-plane/CHANGELOG.md +203 -0
  414. modules/control-plane/CONTRIBUTING.md +311 -0
  415. modules/control-plane/CONTRIBUTORS.md +88 -0
  416. modules/control-plane/Dockerfile +82 -0
  417. modules/control-plane/LICENSE +21 -0
  418. modules/control-plane/MANIFEST.in +17 -0
  419. modules/control-plane/README.md +1264 -0
  420. modules/control-plane/ROADMAP.md +228 -0
  421. modules/control-plane/SECURITY.md +210 -0
  422. modules/control-plane/SUPPORT.md +106 -0
  423. modules/control-plane/acp-cli.py +212 -0
  424. modules/control-plane/benchmark/README.md +257 -0
  425. modules/control-plane/benchmark/__init__.py +19 -0
  426. modules/control-plane/benchmark/red_team_dataset.py +517 -0
  427. modules/control-plane/benchmark.py +563 -0
  428. modules/control-plane/build_and_publish.sh +130 -0
  429. modules/control-plane/docker-compose.yml +74 -0
  430. modules/control-plane/docs/ABLATION_STUDIES.md +528 -0
  431. modules/control-plane/docs/ADAPTER_GUIDE.md +544 -0
  432. modules/control-plane/docs/ADVANCED_FEATURES.md +543 -0
  433. modules/control-plane/docs/AIOS_COMPARISON.md +296 -0
  434. modules/control-plane/docs/BIBLIOGRAPHY.md +367 -0
  435. modules/control-plane/docs/CASE_STUDIES.md +645 -0
  436. modules/control-plane/docs/DOCKER_DEPLOYMENT.md +184 -0
  437. modules/control-plane/docs/ECOSYSTEM_STATUS.md +98 -0
  438. modules/control-plane/docs/HF_MODEL_CARD.md +168 -0
  439. modules/control-plane/docs/KERNEL_V1_RELEASE.md +454 -0
  440. modules/control-plane/docs/LAYER3_FRAMEWORK.md +227 -0
  441. modules/control-plane/docs/LIMITATIONS.md +523 -0
  442. modules/control-plane/docs/PYPI_PUBLISHING.md +195 -0
  443. modules/control-plane/docs/README.md +58 -0
  444. modules/control-plane/docs/RELATED_WORK.md +319 -0
  445. modules/control-plane/docs/RELEASE_v1.1.0.md +252 -0
  446. modules/control-plane/docs/REPRODUCIBILITY.md +540 -0
  447. modules/control-plane/docs/RESEARCH_FOUNDATION.md +197 -0
  448. modules/control-plane/docs/api/CORE.md +270 -0
  449. modules/control-plane/docs/architecture/architecture.md +120 -0
  450. modules/control-plane/docs/community/ANNOUNCEMENT_TEMPLATES.md +52 -0
  451. modules/control-plane/docs/guides/IMPLEMENTATION.md +225 -0
  452. modules/control-plane/docs/guides/PHILOSOPHY.md +354 -0
  453. modules/control-plane/docs/guides/QUICKSTART.md +217 -0
  454. modules/control-plane/examples/README.md +138 -0
  455. modules/control-plane/examples/a2a_demo.py +410 -0
  456. modules/control-plane/examples/adapter_demo.py +347 -0
  457. modules/control-plane/examples/advanced_features.py +403 -0
  458. modules/control-plane/examples/basic_usage.py +261 -0
  459. modules/control-plane/examples/benchmark_demo.py +186 -0
  460. modules/control-plane/examples/compliance_demo.py +333 -0
  461. modules/control-plane/examples/configuration.py +265 -0
  462. modules/control-plane/examples/getting_started.py +178 -0
  463. modules/control-plane/examples/hibernation_and_time_travel_demo.py +406 -0
  464. modules/control-plane/examples/interactive_tutorial.ipynb +497 -0
  465. modules/control-plane/examples/kernel_interceptor_demo.py +202 -0
  466. modules/control-plane/examples/kernel_v1_demo.py +273 -0
  467. modules/control-plane/examples/langchain_demo.py +281 -0
  468. modules/control-plane/examples/lifecycle_demo.py +724 -0
  469. modules/control-plane/examples/mcp_demo.py +378 -0
  470. modules/control-plane/examples/ml_safety_demo.py +157 -0
  471. modules/control-plane/examples/multimodal_demo.py +347 -0
  472. modules/control-plane/examples/observability_demo.py +370 -0
  473. modules/control-plane/examples/use_cases.py +336 -0
  474. modules/control-plane/experiments/long_horizon_purge.py +235 -0
  475. modules/control-plane/experiments/multi_agent_rag.py +165 -0
  476. modules/control-plane/experiments/reproduce_results.py +667 -0
  477. modules/control-plane/paper/ARXIV_SUBMISSION_INFO.txt +122 -0
  478. modules/control-plane/paper/ETHICS_STATEMENT.md +248 -0
  479. modules/control-plane/paper/PAPER_CHECKLIST.md +72 -0
  480. modules/control-plane/paper/Paper.pdf +0 -0
  481. modules/control-plane/paper/README.md +71 -0
  482. modules/control-plane/paper/appendix.md +152 -0
  483. modules/control-plane/paper/architecture.md +15 -0
  484. modules/control-plane/paper/arxiv/figures/ablation_chart.png +0 -0
  485. modules/control-plane/paper/arxiv/figures/architecture.png +0 -0
  486. modules/control-plane/paper/arxiv/figures/constraint_graphs.png +0 -0
  487. modules/control-plane/paper/arxiv/figures/results_chart.png +0 -0
  488. modules/control-plane/paper/arxiv/main.aux +97 -0
  489. modules/control-plane/paper/arxiv/main.bbl +112 -0
  490. modules/control-plane/paper/arxiv/main.blg +48 -0
  491. modules/control-plane/paper/arxiv/main.out +33 -0
  492. modules/control-plane/paper/arxiv/main.pdf +0 -0
  493. modules/control-plane/paper/arxiv/main.tex +479 -0
  494. modules/control-plane/paper/arxiv/references.bib +234 -0
  495. modules/control-plane/paper/arxiv_submission.tar +0 -0
  496. modules/control-plane/paper/arxiv_submission.zip +0 -0
  497. modules/control-plane/paper/build.sh +68 -0
  498. modules/control-plane/paper/figures/README.md +47 -0
  499. modules/control-plane/paper/figures/ablation_chart.pdf +0 -0
  500. modules/control-plane/paper/figures/ablation_chart.png +0 -0
  501. modules/control-plane/paper/figures/architecture.pdf +0 -0
  502. modules/control-plane/paper/figures/architecture.png +0 -0
  503. modules/control-plane/paper/figures/constraint_graphs.pdf +0 -0
  504. modules/control-plane/paper/figures/constraint_graphs.png +0 -0
  505. modules/control-plane/paper/figures/generate_figures.py +252 -0
  506. modules/control-plane/paper/figures/results_chart.pdf +0 -0
  507. modules/control-plane/paper/figures/results_chart.png +0 -0
  508. modules/control-plane/paper/main.md +273 -0
  509. modules/control-plane/paper/main.tex +214 -0
  510. modules/control-plane/paper/main_arxiv.aux +53 -0
  511. modules/control-plane/paper/main_arxiv.out +17 -0
  512. modules/control-plane/paper/main_arxiv.pdf +0 -0
  513. modules/control-plane/paper/main_arxiv.tex +264 -0
  514. modules/control-plane/paper/references.bib +234 -0
  515. modules/control-plane/pyproject.toml +124 -0
  516. modules/control-plane/reproducibility/ABLATIONS.md +136 -0
  517. modules/control-plane/reproducibility/README.md +288 -0
  518. modules/control-plane/reproducibility/commands.md +467 -0
  519. modules/control-plane/reproducibility/docker_config/Dockerfile +39 -0
  520. modules/control-plane/reproducibility/experiment_configs/purge_config.json +46 -0
  521. modules/control-plane/reproducibility/experiment_configs/rag_config.json +36 -0
  522. modules/control-plane/reproducibility/hardware_specs.md +317 -0
  523. modules/control-plane/reproducibility/requirements_frozen.txt +0 -0
  524. modules/control-plane/reproducibility/run_all_experiments.sh +45 -0
  525. modules/control-plane/reproducibility/seeds.json +106 -0
  526. modules/control-plane/scripts/prepare_pypi.py +46 -0
  527. modules/control-plane/scripts/prepare_release.py +176 -0
  528. modules/control-plane/scripts/upload_dataset_to_hf.py +316 -0
  529. modules/control-plane/setup.py +69 -0
  530. modules/control-plane/src/agent_control_plane/__init__.py +639 -0
  531. modules/control-plane/src/agent_control_plane/a2a_adapter.py +541 -0
  532. modules/control-plane/src/agent_control_plane/adapter.py +415 -0
  533. modules/control-plane/src/agent_control_plane/agent_hibernation.py +364 -0
  534. modules/control-plane/src/agent_control_plane/agent_kernel.py +464 -0
  535. modules/control-plane/src/agent_control_plane/compliance.py +718 -0
  536. modules/control-plane/src/agent_control_plane/constraint_graphs.py +475 -0
  537. modules/control-plane/src/agent_control_plane/control_plane.py +848 -0
  538. modules/control-plane/src/agent_control_plane/example_executors.py +193 -0
  539. modules/control-plane/src/agent_control_plane/execution_engine.py +229 -0
  540. modules/control-plane/src/agent_control_plane/flight_recorder.py +600 -0
  541. modules/control-plane/src/agent_control_plane/governance_layer.py +432 -0
  542. modules/control-plane/src/agent_control_plane/hf_utils.py +561 -0
  543. modules/control-plane/src/agent_control_plane/interfaces/__init__.py +53 -0
  544. modules/control-plane/src/agent_control_plane/interfaces/kernel_interface.py +359 -0
  545. modules/control-plane/src/agent_control_plane/interfaces/plugin_interface.py +495 -0
  546. modules/control-plane/src/agent_control_plane/interfaces/protocol_interfaces.py +385 -0
  547. modules/control-plane/src/agent_control_plane/kernel_space.py +707 -0
  548. modules/control-plane/src/agent_control_plane/langchain_adapter.py +422 -0
  549. modules/control-plane/src/agent_control_plane/lifecycle.py +3111 -0
  550. modules/control-plane/src/agent_control_plane/mcp_adapter.py +517 -0
  551. modules/control-plane/src/agent_control_plane/ml_safety.py +560 -0
  552. modules/control-plane/src/agent_control_plane/multimodal.py +724 -0
  553. modules/control-plane/src/agent_control_plane/mute_agent.py +419 -0
  554. modules/control-plane/src/agent_control_plane/observability.py +785 -0
  555. modules/control-plane/src/agent_control_plane/orchestrator.py +480 -0
  556. modules/control-plane/src/agent_control_plane/plugin_registry.py +748 -0
  557. modules/control-plane/src/agent_control_plane/policy_engine.py +525 -0
  558. modules/control-plane/src/agent_control_plane/shadow_mode.py +307 -0
  559. modules/control-plane/src/agent_control_plane/signals.py +491 -0
  560. modules/control-plane/src/agent_control_plane/supervisor_agents.py +427 -0
  561. modules/control-plane/src/agent_control_plane/time_travel_debugger.py +554 -0
  562. modules/control-plane/src/agent_control_plane/tool_registry.py +350 -0
  563. modules/control-plane/src/agent_control_plane/vfs.py +695 -0
  564. modules/control-plane/tests/README.md +33 -0
  565. modules/control-plane/tests/test_a2a_adapter.py +336 -0
  566. modules/control-plane/tests/test_adapter.py +422 -0
  567. modules/control-plane/tests/test_advanced_features.py +389 -0
  568. modules/control-plane/tests/test_benchmark.py +223 -0
  569. modules/control-plane/tests/test_compliance.py +214 -0
  570. modules/control-plane/tests/test_control_plane.py +295 -0
  571. modules/control-plane/tests/test_hibernation.py +274 -0
  572. modules/control-plane/tests/test_kernel_interception.py +284 -0
  573. modules/control-plane/tests/test_langchain_adapter.py +258 -0
  574. modules/control-plane/tests/test_lifecycle.py +1174 -0
  575. modules/control-plane/tests/test_mcp_adapter.py +293 -0
  576. modules/control-plane/tests/test_ml_safety.py +142 -0
  577. modules/control-plane/tests/test_multimodal.py +317 -0
  578. modules/control-plane/tests/test_new_features.py +435 -0
  579. modules/control-plane/tests/test_observability.py +338 -0
  580. modules/control-plane/tests/test_time_travel.py +387 -0
  581. modules/emk/.github/workflows/ci.yml +105 -0
  582. modules/emk/.github/workflows/publish.yml +144 -0
  583. modules/emk/.gitignore +74 -0
  584. modules/emk/CHANGELOG.md +41 -0
  585. modules/emk/CONTRIBUTING.md +295 -0
  586. modules/emk/IMPLEMENTATION.md +174 -0
  587. modules/emk/LICENSE +21 -0
  588. modules/emk/MANIFEST.in +8 -0
  589. modules/emk/README.md +135 -0
  590. modules/emk/RELEASE_NOTES.md +82 -0
  591. modules/emk/SECURITY.md +52 -0
  592. modules/emk/codecov.yml +39 -0
  593. modules/emk/docs/MEMORY_MANAGEMENT.md +285 -0
  594. modules/emk/emk/__init__.py +106 -0
  595. modules/emk/emk/hf_utils.py +419 -0
  596. modules/emk/emk/indexer.py +144 -0
  597. modules/emk/emk/py.typed +0 -0
  598. modules/emk/emk/schema.py +204 -0
  599. modules/emk/emk/sleep_cycle.py +345 -0
  600. modules/emk/emk/store.py +479 -0
  601. modules/emk/examples/basic_usage.py +123 -0
  602. modules/emk/examples/memory_features_demo.py +154 -0
  603. modules/emk/experiments/README.md +59 -0
  604. modules/emk/experiments/reproduce_results.py +461 -0
  605. modules/emk/experiments/results.json +61 -0
  606. modules/emk/paper/structure.tex +192 -0
  607. modules/emk/paper/whitepaper.md +273 -0
  608. modules/emk/pyproject.toml +91 -0
  609. modules/emk/setup.py +5 -0
  610. modules/emk/tests/test_file_adapter.py +195 -0
  611. modules/emk/tests/test_indexer.py +174 -0
  612. modules/emk/tests/test_init.py +55 -0
  613. modules/emk/tests/test_negative_memory.py +83 -0
  614. modules/emk/tests/test_schema.py +150 -0
  615. modules/emk/tests/test_semantic_rules.py +175 -0
  616. modules/emk/tests/test_sleep_cycle.py +335 -0
  617. modules/emk/tests/test_store_anti_patterns.py +239 -0
  618. modules/iatp/.github/workflows/docker-build.yml +124 -0
  619. modules/iatp/.github/workflows/publish.yml +174 -0
  620. modules/iatp/.github/workflows/python-package.yml +121 -0
  621. modules/iatp/.gitignore +67 -0
  622. modules/iatp/.pre-commit-config.yaml +64 -0
  623. modules/iatp/CHANGELOG.md +120 -0
  624. modules/iatp/Dockerfile +91 -0
  625. modules/iatp/IMPLEMENTATION_SUMMARY.md +218 -0
  626. modules/iatp/MANIFEST.in +9 -0
  627. modules/iatp/README.md +180 -0
  628. modules/iatp/docker/Dockerfile.agent +27 -0
  629. modules/iatp/docker/Dockerfile.sidecar-python +86 -0
  630. modules/iatp/docker/README.md +258 -0
  631. modules/iatp/docker-compose.yml +194 -0
  632. modules/iatp/docs/ARCHITECTURE.md +243 -0
  633. modules/iatp/docs/CLI_GUIDE.md +220 -0
  634. modules/iatp/docs/DEPLOYMENT.md +304 -0
  635. modules/iatp/examples/README.md +132 -0
  636. modules/iatp/examples/backend_agent.py +39 -0
  637. modules/iatp/examples/client.py +168 -0
  638. modules/iatp/examples/demo_attestation_reputation.py +274 -0
  639. modules/iatp/examples/demo_client.py +240 -0
  640. modules/iatp/examples/demo_rbac.py +143 -0
  641. modules/iatp/examples/integration_demo.py +245 -0
  642. modules/iatp/examples/manifests/coder_agent.json +20 -0
  643. modules/iatp/examples/manifests/reviewer_agent.json +19 -0
  644. modules/iatp/examples/manifests/secure_bank.json +14 -0
  645. modules/iatp/examples/manifests/standard_agent.json +14 -0
  646. modules/iatp/examples/manifests/untrusted_honeypot.json +14 -0
  647. modules/iatp/examples/run_secure_bank_sidecar.py +85 -0
  648. modules/iatp/examples/run_sidecar.py +105 -0
  649. modules/iatp/examples/run_untrusted_sidecar.py +77 -0
  650. modules/iatp/examples/secure_bank_agent.py +138 -0
  651. modules/iatp/examples/test_untrusted.py +82 -0
  652. modules/iatp/examples/untrusted_agent.py +119 -0
  653. modules/iatp/experiments/README.md +58 -0
  654. modules/iatp/experiments/cascading_hallucination/README.md +149 -0
  655. modules/iatp/experiments/cascading_hallucination/agent_a_user.py +41 -0
  656. modules/iatp/experiments/cascading_hallucination/agent_b_summarizer.py +54 -0
  657. modules/iatp/experiments/cascading_hallucination/agent_c_database.py +47 -0
  658. modules/iatp/experiments/cascading_hallucination/proof_of_concept.py +290 -0
  659. modules/iatp/experiments/cascading_hallucination/run_experiment.py +226 -0
  660. modules/iatp/experiments/cascading_hallucination/sidecar_c.py +61 -0
  661. modules/iatp/experiments/reproduce_results.py +574 -0
  662. modules/iatp/experiments/results.json +2336 -0
  663. modules/iatp/iatp/__init__.py +164 -0
  664. modules/iatp/iatp/attestation.py +401 -0
  665. modules/iatp/iatp/cli.py +253 -0
  666. modules/iatp/iatp/hf_utils.py +469 -0
  667. modules/iatp/iatp/ipc_pipes.py +578 -0
  668. modules/iatp/iatp/main.py +410 -0
  669. modules/iatp/iatp/models/__init__.py +445 -0
  670. modules/iatp/iatp/policy_engine.py +335 -0
  671. modules/iatp/iatp/py.typed +2 -0
  672. modules/iatp/iatp/recovery.py +319 -0
  673. modules/iatp/iatp/security/__init__.py +268 -0
  674. modules/iatp/iatp/sidecar/__init__.py +517 -0
  675. modules/iatp/iatp/telemetry/__init__.py +162 -0
  676. modules/iatp/iatp/tests/__init__.py +1 -0
  677. modules/iatp/iatp/tests/test_attestation.py +368 -0
  678. modules/iatp/iatp/tests/test_cli.py +129 -0
  679. modules/iatp/iatp/tests/test_models.py +128 -0
  680. modules/iatp/iatp/tests/test_policy_engine.py +345 -0
  681. modules/iatp/iatp/tests/test_recovery.py +279 -0
  682. modules/iatp/iatp/tests/test_security.py +220 -0
  683. modules/iatp/iatp/tests/test_sidecar.py +165 -0
  684. modules/iatp/iatp/tests/test_telemetry.py +173 -0
  685. modules/iatp/paper/BLOG.md +307 -0
  686. modules/iatp/paper/PAPER.md +236 -0
  687. modules/iatp/paper/RFC_SUBMISSION.md +299 -0
  688. modules/iatp/paper/whitepaper.md +369 -0
  689. modules/iatp/proto/README.md +200 -0
  690. modules/iatp/proto/generate_stubs.py +81 -0
  691. modules/iatp/proto/iatp.proto +552 -0
  692. modules/iatp/pyproject.toml +180 -0
  693. modules/iatp/requirements-dev.txt +2 -0
  694. modules/iatp/requirements.txt +6 -0
  695. modules/iatp/setup.py +60 -0
  696. modules/iatp/sidecar/README.md +487 -0
  697. modules/iatp/sidecar/go/Dockerfile +32 -0
  698. modules/iatp/sidecar/go/README.md +237 -0
  699. modules/iatp/sidecar/go/go.mod +8 -0
  700. modules/iatp/sidecar/go/main.go +488 -0
  701. modules/iatp/spec/001-handshake.md +436 -0
  702. modules/iatp/spec/002-reversibility.md +394 -0
  703. modules/iatp/spec/schema/capability_manifest.json +266 -0
  704. modules/iatp/test_integration.py +310 -0
  705. modules/mcp-kernel-server/README.md +261 -0
  706. modules/mcp-kernel-server/pyproject.toml +60 -0
  707. modules/mcp-kernel-server/src/mcp_kernel_server/__init__.py +26 -0
  708. modules/mcp-kernel-server/src/mcp_kernel_server/cli.py +229 -0
  709. modules/mcp-kernel-server/src/mcp_kernel_server/resources.py +215 -0
  710. modules/mcp-kernel-server/src/mcp_kernel_server/server.py +562 -0
  711. modules/mcp-kernel-server/src/mcp_kernel_server/tools.py +1172 -0
  712. modules/mute-agent/.github/workflows/safety_check.yml +45 -0
  713. modules/mute-agent/.gitignore +53 -0
  714. modules/mute-agent/ARCHITECTURE.md +531 -0
  715. modules/mute-agent/BENCHMARK_GUIDE.md +384 -0
  716. modules/mute-agent/COMPLETION_SUMMARY.md +293 -0
  717. modules/mute-agent/EXPERIMENT_SUMMARY.md +318 -0
  718. modules/mute-agent/IMPLEMENTATION_SUMMARY.md +212 -0
  719. modules/mute-agent/LICENSE +21 -0
  720. modules/mute-agent/PHASE3_SUMMARY.md +297 -0
  721. modules/mute-agent/README.md +360 -0
  722. modules/mute-agent/STEEL_MAN_RESULTS.md +353 -0
  723. modules/mute-agent/USAGE.md +505 -0
  724. modules/mute-agent/V2_IMPLEMENTATION_SUMMARY.md +253 -0
  725. modules/mute-agent/V2_STEEL_MAN_IMPLEMENTATION.md +274 -0
  726. modules/mute-agent/VERIFICATION_REPORT.md +435 -0
  727. modules/mute-agent/charts/cost_comparison.png +0 -0
  728. modules/mute-agent/charts/cost_vs_ambiguity.png +0 -0
  729. modules/mute-agent/charts/metrics_comparison.png +0 -0
  730. modules/mute-agent/charts/scenario_breakdown.png +0 -0
  731. modules/mute-agent/charts/trace_attack_blocked.html +140 -0
  732. modules/mute-agent/charts/trace_attack_blocked.png +0 -0
  733. modules/mute-agent/charts/trace_failure.html +140 -0
  734. modules/mute-agent/charts/trace_failure.png +0 -0
  735. modules/mute-agent/charts/trace_success.html +140 -0
  736. modules/mute-agent/charts/trace_success.png +0 -0
  737. modules/mute-agent/examples/__init__.py +1 -0
  738. modules/mute-agent/examples/advanced_example.py +384 -0
  739. modules/mute-agent/examples/graph_debugger_demo.py +241 -0
  740. modules/mute-agent/examples/listener_example.py +297 -0
  741. modules/mute-agent/examples/simple_example.py +242 -0
  742. modules/mute-agent/examples/steel_man_demo.py +297 -0
  743. modules/mute-agent/experiments/README.md +135 -0
  744. modules/mute-agent/experiments/__init__.py +3 -0
  745. modules/mute-agent/experiments/agent_comparison.csv +6 -0
  746. modules/mute-agent/experiments/agent_comparison_50runs.csv +6 -0
  747. modules/mute-agent/experiments/ambiguity_test.py +335 -0
  748. modules/mute-agent/experiments/ambiguity_test_results.csv +31 -0
  749. modules/mute-agent/experiments/ambiguity_test_results_50runs.csv +51 -0
  750. modules/mute-agent/experiments/baseline_agent.py +189 -0
  751. modules/mute-agent/experiments/benchmark.py +402 -0
  752. modules/mute-agent/experiments/demo.py +172 -0
  753. modules/mute-agent/experiments/generate_cost_curve.py +474 -0
  754. modules/mute-agent/experiments/jailbreak_test.py +137 -0
  755. modules/mute-agent/experiments/latent_state_scenario.py +361 -0
  756. modules/mute-agent/experiments/mute_agent_experiment.py +349 -0
  757. modules/mute-agent/experiments/run_extended_experiment.py +40 -0
  758. modules/mute-agent/experiments/run_v2_experiments.py +266 -0
  759. modules/mute-agent/experiments/run_v2_experiments_auto.py +247 -0
  760. modules/mute-agent/experiments/v2_scenarios/README.md +214 -0
  761. modules/mute-agent/experiments/v2_scenarios/__init__.py +4 -0
  762. modules/mute-agent/experiments/v2_scenarios/scenario_1_deep_dependency.py +325 -0
  763. modules/mute-agent/experiments/v2_scenarios/scenario_2_adversarial.py +328 -0
  764. modules/mute-agent/experiments/v2_scenarios/scenario_3_false_positive.py +303 -0
  765. modules/mute-agent/experiments/v2_scenarios/scenario_4_performance.py +319 -0
  766. modules/mute-agent/experiments/visualize.py +400 -0
  767. modules/mute-agent/mute_agent/__init__.py +66 -0
  768. modules/mute-agent/mute_agent/core/__init__.py +1 -0
  769. modules/mute-agent/mute_agent/core/execution_agent.py +164 -0
  770. modules/mute-agent/mute_agent/core/handshake_protocol.py +199 -0
  771. modules/mute-agent/mute_agent/core/reasoning_agent.py +236 -0
  772. modules/mute-agent/mute_agent/knowledge_graph/__init__.py +1 -0
  773. modules/mute-agent/mute_agent/knowledge_graph/graph_elements.py +63 -0
  774. modules/mute-agent/mute_agent/knowledge_graph/multidimensional_graph.py +168 -0
  775. modules/mute-agent/mute_agent/knowledge_graph/subgraph.py +222 -0
  776. modules/mute-agent/mute_agent/listener/__init__.py +41 -0
  777. modules/mute-agent/mute_agent/listener/adapters/__init__.py +29 -0
  778. modules/mute-agent/mute_agent/listener/adapters/base_adapter.py +187 -0
  779. modules/mute-agent/mute_agent/listener/adapters/caas_adapter.py +342 -0
  780. modules/mute-agent/mute_agent/listener/adapters/control_plane_adapter.py +434 -0
  781. modules/mute-agent/mute_agent/listener/adapters/iatp_adapter.py +330 -0
  782. modules/mute-agent/mute_agent/listener/adapters/scak_adapter.py +249 -0
  783. modules/mute-agent/mute_agent/listener/listener.py +608 -0
  784. modules/mute-agent/mute_agent/listener/state_observer.py +434 -0
  785. modules/mute-agent/mute_agent/listener/threshold_config.py +311 -0
  786. modules/mute-agent/mute_agent/super_system/__init__.py +1 -0
  787. modules/mute-agent/mute_agent/super_system/router.py +202 -0
  788. modules/mute-agent/mute_agent/visualization/__init__.py +8 -0
  789. modules/mute-agent/mute_agent/visualization/graph_debugger.py +495 -0
  790. modules/mute-agent/requirements-dev.txt +6 -0
  791. modules/mute-agent/requirements.txt +9 -0
  792. modules/mute-agent/setup.py +64 -0
  793. modules/mute-agent/src/__init__.py +0 -0
  794. modules/mute-agent/src/agents/__init__.py +0 -0
  795. modules/mute-agent/src/agents/baseline_agent.py +524 -0
  796. modules/mute-agent/src/agents/interactive_agent.py +113 -0
  797. modules/mute-agent/src/agents/mute_agent.py +622 -0
  798. modules/mute-agent/src/benchmarks/__init__.py +0 -0
  799. modules/mute-agent/src/benchmarks/evaluator.py +481 -0
  800. modules/mute-agent/src/benchmarks/scenarios.json +985 -0
  801. modules/mute-agent/src/core/__init__.py +0 -0
  802. modules/mute-agent/src/core/mock_state.py +320 -0
  803. modules/mute-agent/src/core/tools.py +441 -0
  804. modules/nexus/__init__.py +49 -0
  805. modules/nexus/arbiter.py +357 -0
  806. modules/nexus/client.py +464 -0
  807. modules/nexus/dmz.py +417 -0
  808. modules/nexus/escrow.py +428 -0
  809. modules/nexus/exceptions.py +284 -0
  810. modules/nexus/registry.py +391 -0
  811. modules/nexus/reputation.py +423 -0
  812. modules/nexus/schemas/__init__.py +49 -0
  813. modules/nexus/schemas/compliance.py +274 -0
  814. modules/nexus/schemas/escrow.py +249 -0
  815. modules/nexus/schemas/manifest.py +223 -0
  816. modules/nexus/schemas/receipt.py +206 -0
  817. modules/observability/README.md +192 -0
  818. modules/observability/alertmanager/alertmanager.yml +116 -0
  819. modules/observability/alerts/agent-os-alerts.yaml +197 -0
  820. modules/observability/docker-compose.yml +128 -0
  821. modules/observability/grafana/dashboards/agent-os-amb.json +448 -0
  822. modules/observability/grafana/dashboards/agent-os-cmvk.json +441 -0
  823. modules/observability/grafana/dashboards/agent-os-overview.json +268 -0
  824. modules/observability/grafana/dashboards/agent-os-performance.json +15 -0
  825. modules/observability/grafana/dashboards/agent-os-safety.json +50 -0
  826. modules/observability/grafana/provisioning/dashboards/dashboards.yml +15 -0
  827. modules/observability/grafana/provisioning/datasources/datasources.yml +33 -0
  828. modules/observability/otel/otel-collector-config.yml +61 -0
  829. modules/observability/prometheus/prometheus.yml +63 -0
  830. modules/observability/pyproject.toml +53 -0
  831. modules/observability/scripts/export_dashboards.py +55 -0
  832. modules/observability/src/agent_os_observability/__init__.py +25 -0
  833. modules/observability/src/agent_os_observability/dashboards.py +896 -0
  834. modules/observability/src/agent_os_observability/metrics.py +396 -0
  835. modules/observability/src/agent_os_observability/server.py +221 -0
  836. modules/observability/src/agent_os_observability/tracer.py +226 -0
  837. modules/primitives/.gitignore +8 -0
  838. modules/primitives/README.md +62 -0
  839. modules/primitives/agent_primitives/__init__.py +22 -0
  840. modules/primitives/agent_primitives/failures.py +82 -0
  841. modules/primitives/agent_primitives/py.typed +0 -0
  842. modules/primitives/pyproject.toml +68 -0
  843. modules/scak/.github/copilot-instructions.md +396 -0
  844. modules/scak/.github/workflows/release.yml +117 -0
  845. modules/scak/.gitignore +32 -0
  846. modules/scak/CHANGELOG.md +173 -0
  847. modules/scak/CITATION.cff +62 -0
  848. modules/scak/CONTRIBUTING.md +429 -0
  849. modules/scak/Dockerfile +58 -0
  850. modules/scak/ENTERPRISE_FEATURES.md +518 -0
  851. modules/scak/IMPLEMENTATION_SUMMARY.md +206 -0
  852. modules/scak/LIMITATIONS.md +565 -0
  853. modules/scak/MANIFEST.in +16 -0
  854. modules/scak/NOVELTY.md +535 -0
  855. modules/scak/README.md +928 -0
  856. modules/scak/RESEARCH.md +670 -0
  857. modules/scak/agent_kernel/__init__.py +66 -0
  858. modules/scak/agent_kernel/analyzer.py +432 -0
  859. modules/scak/agent_kernel/auditor.py +31 -0
  860. modules/scak/agent_kernel/completeness_auditor.py +234 -0
  861. modules/scak/agent_kernel/detector.py +200 -0
  862. modules/scak/agent_kernel/kernel.py +741 -0
  863. modules/scak/agent_kernel/memory_manager.py +82 -0
  864. modules/scak/agent_kernel/models.py +372 -0
  865. modules/scak/agent_kernel/nudge_mechanism.py +260 -0
  866. modules/scak/agent_kernel/outcome_analyzer.py +335 -0
  867. modules/scak/agent_kernel/patcher.py +579 -0
  868. modules/scak/agent_kernel/semantic_analyzer.py +313 -0
  869. modules/scak/agent_kernel/semantic_purge.py +346 -0
  870. modules/scak/agent_kernel/simulator.py +447 -0
  871. modules/scak/agent_kernel/teacher.py +82 -0
  872. modules/scak/agent_kernel/triage.py +149 -0
  873. modules/scak/build_and_publish.ps1 +74 -0
  874. modules/scak/build_and_publish.sh +74 -0
  875. modules/scak/cli.py +471 -0
  876. modules/scak/dashboard.py +462 -0
  877. modules/scak/datasets/DATASET_CARD.md +219 -0
  878. modules/scak/datasets/README.md +143 -0
  879. modules/scak/datasets/gaia_vague_queries/vague_queries.json +262 -0
  880. modules/scak/datasets/hf_upload/README.md +219 -0
  881. modules/scak/datasets/hf_upload/scak_gaia_laziness.jsonl +50 -0
  882. modules/scak/datasets/prepare_hf_datasets.py +145 -0
  883. modules/scak/datasets/red_team/jailbreak_patterns.json +202 -0
  884. modules/scak/docker-compose.yml +99 -0
  885. modules/scak/docs/Adaptive-Memory-Hierarchy.md +319 -0
  886. modules/scak/docs/Data-Contracts-and-Schemas.md +285 -0
  887. modules/scak/docs/Dual-Loop-Architecture.md +344 -0
  888. modules/scak/docs/Enhanced-Features.md +612 -0
  889. modules/scak/docs/LANGCHAIN_INTEGRATION.md +572 -0
  890. modules/scak/docs/README.md +128 -0
  891. modules/scak/docs/Reference-Implementations.md +163 -0
  892. modules/scak/docs/SCAK_V2.md +374 -0
  893. modules/scak/docs/Three-Failure-Types.md +178 -0
  894. modules/scak/examples/basic_example.py +155 -0
  895. modules/scak/examples/circuit_breaker_lazy_eval_demo.py +243 -0
  896. modules/scak/examples/langchain_integration_example.py +339 -0
  897. modules/scak/examples/layer4_demo.py +243 -0
  898. modules/scak/examples/production_features_demo.py +353 -0
  899. modules/scak/examples/quick_demo.py +79 -0
  900. modules/scak/examples/scak_v2_demo.py +252 -0
  901. modules/scak/experiments/README.md +438 -0
  902. modules/scak/experiments/ablation_studies/README.md +192 -0
  903. modules/scak/experiments/ablation_studies/ablation_no_audit.py +116 -0
  904. modules/scak/experiments/ablation_studies/ablation_no_purge.py +133 -0
  905. modules/scak/experiments/chaos_engineering/README.md +332 -0
  906. modules/scak/experiments/context_efficiency_test.py +328 -0
  907. modules/scak/experiments/gaia_benchmark/README.md +208 -0
  908. modules/scak/experiments/laziness_benchmark.py +179 -0
  909. modules/scak/experiments/long_horizon_task_experiment.py +252 -0
  910. modules/scak/experiments/multi_agent_rag_experiment.py +284 -0
  911. modules/scak/experiments/results/ablation_table.md +12 -0
  912. modules/scak/experiments/results/long_horizon.json +36 -0
  913. modules/scak/experiments/results/multi_agent_rag.json +66 -0
  914. modules/scak/experiments/run_comprehensive_ablations.py +332 -0
  915. modules/scak/experiments/test_auditor_patcher_integration.py +251 -0
  916. modules/scak/notebooks/getting_started.ipynb +33 -0
  917. modules/scak/paper/ARXIV_SUBMISSION_METADATA.txt +109 -0
  918. modules/scak/paper/PAPER_CHECKLIST.md +304 -0
  919. modules/scak/paper/Paper.pdf +0 -0
  920. modules/scak/paper/README.md +113 -0
  921. modules/scak/paper/appendix.md +351 -0
  922. modules/scak/paper/arxiv/bibliography.bib +284 -0
  923. modules/scak/paper/arxiv/fig1_ooda_architecture.pdf +0 -0
  924. modules/scak/paper/arxiv/fig2_memory_hierarchy.pdf +0 -0
  925. modules/scak/paper/arxiv/fig3_gaia_results.pdf +0 -0
  926. modules/scak/paper/arxiv/fig4_ablation_heatmap.pdf +0 -0
  927. modules/scak/paper/arxiv/fig5_context_reduction.pdf +0 -0
  928. modules/scak/paper/arxiv/fig6_mttr_boxplot.pdf +0 -0
  929. modules/scak/paper/arxiv/main.aux +103 -0
  930. modules/scak/paper/arxiv/main.bbl +113 -0
  931. modules/scak/paper/arxiv/main.blg +55 -0
  932. modules/scak/paper/arxiv/main.out +31 -0
  933. modules/scak/paper/arxiv/main.pdf +0 -0
  934. modules/scak/paper/arxiv/main.tex +482 -0
  935. modules/scak/paper/arxiv_submission/bibliography.bib +284 -0
  936. modules/scak/paper/arxiv_submission/fig1_ooda_architecture.pdf +0 -0
  937. modules/scak/paper/arxiv_submission/fig2_memory_hierarchy.pdf +0 -0
  938. modules/scak/paper/arxiv_submission/fig3_gaia_results.pdf +0 -0
  939. modules/scak/paper/arxiv_submission/fig4_ablation_heatmap.pdf +0 -0
  940. modules/scak/paper/arxiv_submission/fig5_context_reduction.pdf +0 -0
  941. modules/scak/paper/arxiv_submission/fig6_mttr_boxplot.pdf +0 -0
  942. modules/scak/paper/arxiv_submission/main.aux +103 -0
  943. modules/scak/paper/arxiv_submission/main.bbl +113 -0
  944. modules/scak/paper/arxiv_submission/main.blg +55 -0
  945. modules/scak/paper/arxiv_submission/main.out +31 -0
  946. modules/scak/paper/arxiv_submission/main.pdf +0 -0
  947. modules/scak/paper/arxiv_submission/main.tex +482 -0
  948. modules/scak/paper/arxiv_submission.tar.gz +0 -0
  949. modules/scak/paper/bibliography.bib +284 -0
  950. modules/scak/paper/build.sh +55 -0
  951. modules/scak/paper/figures/README.md +32 -0
  952. modules/scak/paper/figures/fig1_ooda_architecture.md +75 -0
  953. modules/scak/paper/figures/fig1_ooda_architecture.pdf +0 -0
  954. modules/scak/paper/figures/fig1_ooda_architecture.png +0 -0
  955. modules/scak/paper/figures/fig2_memory_hierarchy.md +83 -0
  956. modules/scak/paper/figures/fig2_memory_hierarchy.pdf +0 -0
  957. modules/scak/paper/figures/fig2_memory_hierarchy.png +0 -0
  958. modules/scak/paper/figures/fig3_gaia_results.md +64 -0
  959. modules/scak/paper/figures/fig3_gaia_results.pdf +0 -0
  960. modules/scak/paper/figures/fig3_gaia_results.png +0 -0
  961. modules/scak/paper/figures/fig4_ablation_heatmap.md +64 -0
  962. modules/scak/paper/figures/fig4_ablation_heatmap.pdf +0 -0
  963. modules/scak/paper/figures/fig4_ablation_heatmap.png +0 -0
  964. modules/scak/paper/figures/fig5_context_reduction.md +71 -0
  965. modules/scak/paper/figures/fig5_context_reduction.pdf +0 -0
  966. modules/scak/paper/figures/fig5_context_reduction.png +0 -0
  967. modules/scak/paper/figures/fig6_mttr_boxplot.md +80 -0
  968. modules/scak/paper/figures/fig6_mttr_boxplot.pdf +0 -0
  969. modules/scak/paper/figures/fig6_mttr_boxplot.png +0 -0
  970. modules/scak/paper/figures/generate_figures.py +463 -0
  971. modules/scak/paper/main.aux +103 -0
  972. modules/scak/paper/main.bbl +113 -0
  973. modules/scak/paper/main.blg +55 -0
  974. modules/scak/paper/main.md +192 -0
  975. modules/scak/paper/main.out +31 -0
  976. modules/scak/paper/main.pdf +0 -0
  977. modules/scak/paper/main.tex +482 -0
  978. modules/scak/reproducibility/ABLATIONS.md +225 -0
  979. modules/scak/reproducibility/Dockerfile.reproducibility +34 -0
  980. modules/scak/reproducibility/README.md +421 -0
  981. modules/scak/reproducibility/requirements-pinned.txt +32 -0
  982. modules/scak/reproducibility/run_all_experiments.py +395 -0
  983. modules/scak/reproducibility/seed_control.py +53 -0
  984. modules/scak/reproducibility/statistical_analysis.py +302 -0
  985. modules/scak/requirements.txt +50 -0
  986. modules/scak/setup.py +93 -0
  987. modules/scak/src/__init__.py +124 -0
  988. modules/scak/src/agents/__init__.py +13 -0
  989. modules/scak/src/agents/conflict_resolution.py +732 -0
  990. modules/scak/src/agents/orchestrator.py +761 -0
  991. modules/scak/src/agents/pubsub.py +484 -0
  992. modules/scak/src/agents/shadow_teacher.py +344 -0
  993. modules/scak/src/agents/swarm.py +661 -0
  994. modules/scak/src/agents/worker.py +357 -0
  995. modules/scak/src/integrations/__init__.py +81 -0
  996. modules/scak/src/integrations/cmvk_adapter.py +430 -0
  997. modules/scak/src/integrations/control_plane_adapter.py +601 -0
  998. modules/scak/src/integrations/langchain_integration.py +902 -0
  999. modules/scak/src/interfaces/__init__.py +59 -0
  1000. modules/scak/src/interfaces/llm_clients.py +505 -0
  1001. modules/scak/src/interfaces/openapi_tools.py +611 -0
  1002. modules/scak/src/interfaces/plugin_system.py +605 -0
  1003. modules/scak/src/interfaces/protocols.py +365 -0
  1004. modules/scak/src/interfaces/telemetry.py +464 -0
  1005. modules/scak/src/interfaces/tool_registry.py +547 -0
  1006. modules/scak/src/kernel/__init__.py +100 -0
  1007. modules/scak/src/kernel/auditor.py +305 -0
  1008. modules/scak/src/kernel/circuit_breaker.py +398 -0
  1009. modules/scak/src/kernel/core.py +724 -0
  1010. modules/scak/src/kernel/distributed.py +667 -0
  1011. modules/scak/src/kernel/evolution.py +455 -0
  1012. modules/scak/src/kernel/failover.py +621 -0
  1013. modules/scak/src/kernel/governance.py +710 -0
  1014. modules/scak/src/kernel/governance_v2.py +603 -0
  1015. modules/scak/src/kernel/lazy_evaluator.py +514 -0
  1016. modules/scak/src/kernel/load_testing.py +633 -0
  1017. modules/scak/src/kernel/memory.py +945 -0
  1018. modules/scak/src/kernel/patcher.py +581 -0
  1019. modules/scak/src/kernel/rubric.py +419 -0
  1020. modules/scak/src/kernel/schemas.py +390 -0
  1021. modules/scak/src/kernel/skill_mapper.py +309 -0
  1022. modules/scak/src/kernel/triage.py +149 -0
  1023. modules/scak/src/mocks/__init__.py +99 -0
  1024. modules/scak/tests/__init__.py +1 -0
  1025. modules/scak/tests/test_circuit_breaker.py +403 -0
  1026. modules/scak/tests/test_conflict_resolution.py +287 -0
  1027. modules/scak/tests/test_dual_loop.py +463 -0
  1028. modules/scak/tests/test_enhanced_features.py +421 -0
  1029. modules/scak/tests/test_failover_and_load.py +438 -0
  1030. modules/scak/tests/test_governance.py +185 -0
  1031. modules/scak/tests/test_kernel.py +359 -0
  1032. modules/scak/tests/test_langchain_integration.py +451 -0
  1033. modules/scak/tests/test_lazy_evaluator.py +465 -0
  1034. modules/scak/tests/test_llm_clients.py +122 -0
  1035. modules/scak/tests/test_memory_controller.py +528 -0
  1036. modules/scak/tests/test_orchestrator.py +181 -0
  1037. modules/scak/tests/test_phase3_integration.py +265 -0
  1038. modules/scak/tests/test_pubsub_swarm.py +203 -0
  1039. modules/scak/tests/test_reference_implementations.py +240 -0
  1040. modules/scak/tests/test_rubric.py +363 -0
  1041. modules/scak/tests/test_scak_v2.py +651 -0
  1042. modules/scak/tests/test_skill_mapper.py +217 -0
  1043. modules/scak/tests/test_specific_failures.py +393 -0
  1044. modules/scak/tests/test_tool_registry.py +264 -0
  1045. modules/scak/tests/test_tools_and_plugins.py +303 -0
  1046. modules/scak/tests/test_triage.py +596 -0
  1047. modules/scak/tests/test_write_through.py +319 -0
  1048. agent_os_kernel-1.1.0.dist-info/METADATA +0 -400
  1049. agent_os_kernel-1.1.0.dist-info/RECORD +0 -12
  1050. {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/WHEEL +0 -0
  1051. {agent_os_kernel-1.1.0.dist-info → agent_os_kernel-1.2.0.dist-info}/licenses/LICENSE +0 -0
@@ -0,0 +1,284 @@
1
+ % Self-Correcting Agent Kernel - Bibliography
2
+ % Generated: 2026-01-18
3
+ % For use in academic paper submission
4
+
5
+ % ===== Core Inspirations =====
6
+
7
+ @inproceedings{shinn2023reflexion,
8
+ title={Reflexion: Language Agents with Verbal Reinforcement Learning},
9
+ author={Shinn, Noah and Cassano, Federico and Berman, Edward and Gopinath, Ashwin and Narasimhan, Karthik and Yao, Shunyu},
10
+ booktitle={Advances in Neural Information Processing Systems (NeurIPS)},
11
+ year={2023},
12
+ url={https://arxiv.org/abs/2303.11366}
13
+ }
14
+
15
+ @article{madaan2023self,
16
+ title={Self-Refine: Iterative Refinement with Self-Feedback},
17
+ author={Madaan, Aman and Tandon, Niket and Gupta, Prakhar and others},
18
+ journal={Advances in Neural Information Processing Systems (NeurIPS)},
19
+ year={2023},
20
+ url={https://arxiv.org/abs/2303.17651}
21
+ }
22
+
23
+ @misc{wang2023voyager,
24
+ title={Voyager: An Open-Ended Embodied Agent with Large Language Models},
25
+ author={Wang, Guanzhi and Xie, Yuqi and Jiang, Yunfan and others},
26
+ year={2023},
27
+ url={https://arxiv.org/abs/2305.16291}
28
+ }
29
+
30
+ @article{bai2022constitutional,
31
+ title={Constitutional {AI}: Harmlessness from {AI} Feedback},
32
+ author={Bai, Yuntao and Kadavath, Saurav and Kundu, Sandipan and others},
33
+ journal={arXiv preprint arXiv:2212.08073},
34
+ year={2022},
35
+ publisher={Anthropic}
36
+ }
37
+
38
+ % ===== Reinforcement Learning from Human Feedback =====
39
+
40
+ @inproceedings{christiano2017deep,
41
+ title={Deep Reinforcement Learning from Human Preferences},
42
+ author={Christiano, Paul F and Leike, Jan and Brown, Tom and others},
43
+ booktitle={Advances in Neural Information Processing Systems (NeurIPS)},
44
+ year={2017},
45
+ url={https://arxiv.org/abs/1706.03741}
46
+ }
47
+
48
+ @article{ouyang2022training,
49
+ title={Training language models to follow instructions with human feedback},
50
+ author={Ouyang, Long and Wu, Jeffrey and Jiang, Xu and others},
51
+ journal={arXiv preprint arXiv:2203.02155},
52
+ year={2022},
53
+ publisher={OpenAI}
54
+ }
55
+
56
+ @inproceedings{stiennon2020learning,
57
+ title={Learning to summarize with human feedback},
58
+ author={Stiennon, Nisan and Ouyang, Long and Wu, Jeffrey and others},
59
+ booktitle={Advances in Neural Information Processing Systems (NeurIPS)},
60
+ year={2020},
61
+ url={https://arxiv.org/abs/2009.01325}
62
+ }
63
+
64
+ % ===== Multi-Agent Systems =====
65
+
66
+ @article{wu2023autogen,
67
+ title={{AutoGen}: Enabling Next-Gen {LLM} Applications via Multi-Agent Conversation},
68
+ author={Wu, Qingyun and Bansal, Gagan and Zhang, Jieyu and others},
69
+ journal={arXiv preprint arXiv:2308.08155},
70
+ year={2023},
71
+ publisher={Microsoft Research}
72
+ }
73
+
74
+ @article{park2023generative,
75
+ title={Generative Agents: Interactive Simulacra of Human Behavior},
76
+ author={Park, Joon Sung and O'Brien, Joseph C and Cai, Carrie J and others},
77
+ year={2023},
78
+ url={https://arxiv.org/abs/2304.03442}
79
+ }
80
+
81
+ @misc{hong2023metagpt,
82
+ title={{MetaGPT}: Meta Programming for A Multi-Agent Collaborative Framework},
83
+ author={Hong, Sirui and Zhuge, Mingchen and Chen, Jiaqi and Zheng, Xiawu and Cheng, Yuheng and Zhang, Ceyao and others},
84
+ year={2023},
85
+ url={https://arxiv.org/abs/2308.00352}
86
+ }
87
+
88
+ % ===== Tool Use and Grounding =====
89
+
90
+ @article{schick2023toolformer,
91
+ title={Toolformer: Language Models Can Teach Themselves to Use Tools},
92
+ author={Schick, Timo and Dwivedi-Yu, Jane and Dessi, Roberto and others},
93
+ year={2023},
94
+ url={https://arxiv.org/abs/2302.04761}
95
+ }
96
+
97
+ @inproceedings{yao2023react,
98
+ title={ReAct: Synergizing Reasoning and Acting in Language Models},
99
+ author={Yao, Shunyu and Zhao, Jeffrey and Yu, Dian and others},
100
+ booktitle={International Conference on Learning Representations (ICLR)},
101
+ year={2023},
102
+ url={https://arxiv.org/abs/2210.03629}
103
+ }
104
+
105
+ @article{qin2023toolllm,
106
+ title={ToolLLM: Facilitating Large Language Models to Master 16000+ Real-world APIs},
107
+ author={Qin, Yujia and Liang, Shihao and Ye, Yining and others},
108
+ year={2023},
109
+ url={https://arxiv.org/abs/2307.16789}
110
+ }
111
+
112
+ % ===== Context Management =====
113
+
114
+ @misc{liu2023lost,
115
+ title={Lost in the Middle: How Language Models Use Long Contexts},
116
+ author={Liu, Nelson F and Lin, Kevin and Hewitt, John and others},
117
+ year={2023},
118
+ url={https://arxiv.org/abs/2307.03172}
119
+ }
120
+
121
+ @misc{mohtashami2023landmark,
122
+ title={Landmark Attention: Random-Access Infinite Context Length for Transformers},
123
+ author={Mohtashami, Amirkeivan and Jaggi, Martin},
124
+ year={2023},
125
+ url={https://arxiv.org/abs/2305.16300}
126
+ }
127
+
128
+ @inproceedings{lewis2020retrieval,
129
+ title={Retrieval-Augmented Generation for Knowledge-Intensive {NLP} Tasks},
130
+ author={Lewis, Patrick and Perez, Ethan and Piktus, Aleksandra and others},
131
+ booktitle={Advances in Neural Information Processing Systems (NeurIPS)},
132
+ year={2020},
133
+ url={https://arxiv.org/abs/2005.11401}
134
+ }
135
+
136
+ % ===== Safety and Alignment (2024-2025) =====
137
+
138
+ @misc{meta2024llamaguard2,
139
+ title={{LlamaGuard} 2: Safety Classification for {LLM} Interactions},
140
+ author={{Meta AI}},
141
+ year={2024},
142
+ howpublished={Meta Research Blog},
143
+ note={Technical report on improved safety classification}
144
+ }
145
+
146
+ @article{han2024wildguard,
147
+ title={{WildGuard}: Open One-Stop Moderation Tools for Safety Risks, Jailbreaks, and Refusals of {LLMs}},
148
+ author={Han, Seungju and Rao, Kavel and Ettinger, Allyson and Jiang, Liwei and Lin, Bill Yuchen and Lambert, Nathan and Choi, Yejin and Dziri, Nouha},
149
+ journal={Advances in Neural Information Processing Systems (NeurIPS)},
150
+ year={2024},
151
+ url={https://arxiv.org/abs/2406.18495}
152
+ }
153
+
154
+ @article{zou2023universal,
155
+ title={Universal and Transferable Adversarial Attacks on Aligned Language Models},
156
+ author={Zou, Andy and Wang, Zifan and Carlini, Nicholas and Nasr, Milad and Kolter, J. Zico and Fredrikson, Matt},
157
+ year={2023},
158
+ url={https://arxiv.org/abs/2307.15043}
159
+ }
160
+
161
+ % ===== Benchmarks =====
162
+
163
+ @article{mialon2023gaia,
164
+ title={GAIA: a benchmark for General AI Assistants},
165
+ author={Mialon, Gr{\'e}goire and Fourrier, Cl{\'e}mentine and Swift, Craig and Wolf, Thomas and LeCun, Yann and Scialom, Thomas},
166
+ year={2023},
167
+ url={https://arxiv.org/abs/2311.12983}
168
+ }
169
+
170
+ @article{liu2023agentbench,
171
+ title={AgentBench: Evaluating LLMs as Agents},
172
+ author={Liu, Xiao and Yu, Hao and Zhang, Hanchen and others},
173
+ year={2023},
174
+ url={https://arxiv.org/abs/2308.03688}
175
+ }
176
+
177
+ % ===== Production ML =====
178
+
179
+ @inproceedings{sculley2015hidden,
180
+ title={Hidden Technical Debt in Machine Learning Systems},
181
+ author={Sculley, David and Holt, Gary and Golovin, Daniel and others},
182
+ booktitle={Advances in Neural Information Processing Systems (NeurIPS)},
183
+ year={2015}
184
+ }
185
+
186
+ @inproceedings{breck2019data,
187
+ title={Data Validation for Machine Learning},
188
+ author={Breck, Eric and Polyzotis, Neoklis and Roy, Sudip and others},
189
+ booktitle={MLSys},
190
+ year={2019}
191
+ }
192
+
193
+ % ===== Cognitive Science Foundations =====
194
+
195
+ @book{kahneman2011thinking,
196
+ title={Thinking, Fast and Slow},
197
+ author={Kahneman, Daniel},
198
+ year={2011},
199
+ publisher={Farrar, Straus and Giroux}
200
+ }
201
+
202
+ @book{boyd1987discourse,
203
+ title={A Discourse on Winning and Losing},
204
+ author={Boyd, John R},
205
+ year={1987},
206
+ publisher={Air University Press}
207
+ }
208
+
209
+ % ===== Governance and Policy (2025) =====
210
+
211
+ @misc{wef2025governance,
212
+ title={{AI} Agents in the Workplace: Governance Framework and Risk Mitigation},
213
+ author={{World Economic Forum}},
214
+ year={2025},
215
+ howpublished={WEF Whitepaper},
216
+ month={January}
217
+ }
218
+
219
+ @misc{euai2024,
220
+ title={Regulation ({EU}) 2024/1689 - {Artificial Intelligence Act}},
221
+ author={{European Parliament}},
222
+ year={2024},
223
+ howpublished={Official Journal of the European Union}
224
+ }
225
+
226
+ % ===== LLM Models Referenced =====
227
+
228
+ @misc{openai2023gpt4,
229
+ title={GPT-4 Technical Report},
230
+ author={{OpenAI}},
231
+ year={2023},
232
+ url={https://arxiv.org/abs/2303.08774}
233
+ }
234
+
235
+ @misc{openai2024o1,
236
+ title={Learning to Reason with LLMs},
237
+ author={{OpenAI}},
238
+ year={2024},
239
+ howpublished={OpenAI Blog},
240
+ month={September}
241
+ }
242
+
243
+ @misc{anthropic2024claude,
244
+ title={Claude 3.5 Sonnet: Extended Context and Reasoning},
245
+ author={{Anthropic}},
246
+ year={2024},
247
+ howpublished={Anthropic Release Notes},
248
+ month={June}
249
+ }
250
+
251
+ % ===== Additional References =====
252
+
253
+ @article{chen2023teaching,
254
+ title={Teaching Large Language Models to Self-Debug},
255
+ author={Chen, Xinyun and Lin, Maxwell and Sch{\"a}rli, Nathanael and Zhou, Denny},
256
+ year={2023},
257
+ url={https://arxiv.org/abs/2304.05128}
258
+ }
259
+
260
+ @article{zhang2023multimodal,
261
+ title={Multimodal Chain-of-Thought Reasoning in Language Models},
262
+ author={Zhang, Zhuosheng and Zhang, Aston and Li, Mu and others},
263
+ year={2023},
264
+ url={https://arxiv.org/abs/2302.00923}
265
+ }
266
+
267
+ @article{basiri2016chaos,
268
+ title={Chaos Engineering},
269
+ author={Basiri, Ali and Behnam, Niosha and de Rooij, Ruud and others},
270
+ journal={IEEE Software},
271
+ year={2016},
272
+ publisher={IEEE}
273
+ }
274
+
275
+ % ===== Our Work =====
276
+
277
+ @misc{scak2026,
278
+ title={Self-Correcting Agent Kernel: Automated Alignment via Differential Auditing and Semantic Memory Hygiene},
279
+ author={{Self-Correcting Agent Team}},
280
+ year={2026},
281
+ version={1.1.0},
282
+ url={https://github.com/imran-siddique/self-correcting-agent-kernel},
283
+ note={Research foundations: Reflexion (NeurIPS 2023), Constitutional AI (Anthropic 2022), Voyager (arXiv:2305.16291)}
284
+ }
@@ -0,0 +1,103 @@
1
+ \relax
2
+ \providecommand\hyper@newdestlabel[2]{}
3
+ \providecommand\HyField@AuxAddToFields[1]{}
4
+ \providecommand\HyField@AuxAddToCoFields[2]{}
5
+ \citation{liu2023lost}
6
+ \providecommand \oddpage@label [2]{}
7
+ \@writefile{toc}{\contentsline {section}{\numberline {1}Introduction}{1}{section.1}\protected@file@percent }
8
+ \@writefile{toc}{\contentsline {subsection}{\numberline {1.1}The Accumulation Paradox}{1}{subsection.1.1}\protected@file@percent }
9
+ \citation{bai2022constitutional}
10
+ \citation{scak2026}
11
+ \citation{basiri2016chaos}
12
+ \citation{shinn2023reflexion}
13
+ \citation{madaan2023self}
14
+ \citation{bai2022constitutional}
15
+ \citation{wu2023autogen}
16
+ \citation{hong2023metagpt}
17
+ \citation{wang2023voyager}
18
+ \citation{liu2023lost}
19
+ \citation{mohtashami2023landmark}
20
+ \citation{lewis2020retrieval}
21
+ \@writefile{toc}{\contentsline {subsection}{\numberline {1.2}The ``Scale by Subtraction'' Philosophy}{2}{subsection.1.2}\protected@file@percent }
22
+ \@writefile{toc}{\contentsline {section}{\numberline {2}Related Work}{2}{section.2}\protected@file@percent }
23
+ \@writefile{toc}{\contentsline {subsection}{\numberline {2.1}The OODA Loop: Attack Surface or Defense?}{2}{subsection.2.1}\protected@file@percent }
24
+ \@writefile{toc}{\contentsline {subsection}{\numberline {2.2}Self-Correction and Feedback}{2}{subsection.2.2}\protected@file@percent }
25
+ \@writefile{toc}{\contentsline {subsection}{\numberline {2.3}Multi-Agent Systems}{2}{subsection.2.3}\protected@file@percent }
26
+ \citation{euai2024}
27
+ \citation{wef2025governance}
28
+ \citation{meta2024llamaguard2}
29
+ \citation{han2024wildguard}
30
+ \citation{boyd1987discourse}
31
+ \@writefile{toc}{\contentsline {subsection}{\numberline {2.4}Context Management}{3}{subsection.2.4}\protected@file@percent }
32
+ \@writefile{toc}{\contentsline {subsection}{\numberline {2.5}Recent Advances in Agent Alignment (2024--2026)}{3}{subsection.2.5}\protected@file@percent }
33
+ \@writefile{toc}{\contentsline {section}{\numberline {3}System Design}{3}{section.3}\protected@file@percent }
34
+ \@writefile{toc}{\contentsline {subsection}{\numberline {3.1}Problem Formulation}{3}{subsection.3.1}\protected@file@percent }
35
+ \@writefile{toc}{\contentsline {subsection}{\numberline {3.2}Dual-Loop Architecture}{3}{subsection.3.2}\protected@file@percent }
36
+ \@writefile{toc}{\contentsline {subsection}{\numberline {3.3}Differential Auditing Algorithm}{3}{subsection.3.3}\protected@file@percent }
37
+ \@writefile{lof}{\contentsline {figure}{\numberline {1}{\ignorespaces \textbf {\textsc {SCAK}{} Dual-Loop Architecture.} Loop 1 (Runtime) handles user queries with minimal latency. Loop 2 (Alignment) triggers asynchronously on give-up signals, using differential auditing to detect laziness and generate competence patches.}}{4}{figure.caption.1}\protected@file@percent }
38
+ \providecommand*\caption@xref[2]{\@setref\relax\@undefined{#1}}
39
+ \newlabel{fig:architecture}{{1}{4}{\textbf {\scak {} Dual-Loop Architecture.} Loop 1 (Runtime) handles user queries with minimal latency. Loop 2 (Alignment) triggers asynchronously on give-up signals, using differential auditing to detect laziness and generate competence patches}{figure.caption.1}{}}
40
+ \@writefile{toc}{\contentsline {subsection}{\numberline {3.4}Semantic Purge (Formalizing Decay)}{4}{subsection.3.4}\protected@file@percent }
41
+ \@writefile{toc}{\contentsline {subsection}{\numberline {3.5}Three-Tier Memory Hierarchy}{4}{subsection.3.5}\protected@file@percent }
42
+ \citation{wu2023autogen}
43
+ \@writefile{loa}{\contentsline {algorithm}{\numberline {1}{\ignorespaces Differential Auditing}}{5}{algorithm.1}\protected@file@percent }
44
+ \newlabel{alg:audit}{{1}{5}{Differential Auditing}{algorithm.1}{}}
45
+ \@writefile{loa}{\contentsline {algorithm}{\numberline {2}{\ignorespaces Semantic Purge (Model Upgrade)}}{5}{algorithm.2}\protected@file@percent }
46
+ \newlabel{alg:purge}{{2}{5}{Semantic Purge (Model Upgrade)}{algorithm.2}{}}
47
+ \@writefile{toc}{\contentsline {section}{\numberline {4}Experiments}{5}{section.4}\protected@file@percent }
48
+ \@writefile{toc}{\contentsline {subsection}{\numberline {4.1}Experimental Setup}{5}{subsection.4.1}\protected@file@percent }
49
+ \@writefile{toc}{\contentsline {subsection}{\numberline {4.2}GAIA Laziness Benchmark}{5}{subsection.4.2}\protected@file@percent }
50
+ \@writefile{lof}{\contentsline {figure}{\numberline {2}{\ignorespaces \textbf {Three-Tier Memory Hierarchy.} Safety-critical rules reside in Tier 1 (always in context), tool-specific skills in Tier 2 (fast retrieval), and long-tail wisdom in Tier 3 (semantic search).}}{6}{figure.caption.2}\protected@file@percent }
51
+ \newlabel{fig:memory}{{2}{6}{\textbf {Three-Tier Memory Hierarchy.} Safety-critical rules reside in Tier 1 (always in context), tool-specific skills in Tier 2 (fast retrieval), and long-tail wisdom in Tier 3 (semantic search)}{figure.caption.2}{}}
52
+ \@writefile{toc}{\contentsline {subsection}{\numberline {4.3}Amnesia Test (Context Efficiency)}{6}{subsection.4.3}\protected@file@percent }
53
+ \@writefile{toc}{\contentsline {subsection}{\numberline {4.4}Chaos Engineering (Robustness)}{6}{subsection.4.4}\protected@file@percent }
54
+ \@writefile{toc}{\contentsline {subsection}{\numberline {4.5}Ablation Studies}{6}{subsection.4.5}\protected@file@percent }
55
+ \@writefile{toc}{\contentsline {subsection}{\numberline {4.6}Cost Analysis}{6}{subsection.4.6}\protected@file@percent }
56
+ \@writefile{lot}{\contentsline {table}{\numberline {1}{\ignorespaces \textbf {GAIA Laziness Benchmark Results.} Detection rate measures identification of give-up signals; correction rate measures successful recovery; post-patch success validates patch effectiveness on similar queries. Results show mean $\pm $ std over 5 runs. Statistical significance: $^{***}p<0.001$ vs. baseline.}}{7}{table.caption.3}\protected@file@percent }
57
+ \newlabel{tab:gaia}{{1}{7}{\textbf {GAIA Laziness Benchmark Results.} Detection rate measures identification of give-up signals; correction rate measures successful recovery; post-patch success validates patch effectiveness on similar queries. Results show mean $\pm $ std over 5 runs. Statistical significance: $^{***}p<0.001$ vs. baseline}{table.caption.3}{}}
58
+ \@writefile{lot}{\contentsline {table}{\numberline {2}{\ignorespaces \textbf {Context Reduction via Semantic Purge.} \textsc {SCAK}{} achieves 45\% context reduction on model upgrade while retaining 100\% of business rules (10/10 Type~B{} patches preserved).}}{7}{table.caption.5}\protected@file@percent }
59
+ \newlabel{tab:amnesia}{{2}{7}{\textbf {Context Reduction via Semantic Purge.} \scak {} achieves 45\% context reduction on model upgrade while retaining 100\% of business rules (10/10 \typeb {} patches preserved)}{table.caption.5}{}}
60
+ \@writefile{toc}{\contentsline {section}{\numberline {5}Discussion}{7}{section.5}\protected@file@percent }
61
+ \@writefile{toc}{\contentsline {subsection}{\numberline {5.1}The Virtue of Forgetting}{7}{subsection.5.1}\protected@file@percent }
62
+ \@writefile{toc}{\contentsline {subsection}{\numberline {5.2}Why External Teachers Outperform Self-Critique}{7}{subsection.5.2}\protected@file@percent }
63
+ \@writefile{toc}{\contentsline {subsection}{\numberline {5.3}Limitations}{7}{subsection.5.3}\protected@file@percent }
64
+ \citation{wef2025governance,euai2024}
65
+ \@writefile{lof}{\contentsline {figure}{\numberline {3}{\ignorespaces \textbf {GAIA Laziness Benchmark: Correction Rates.} \textsc {SCAK}{} achieves 72\% correction rate, outperforming both self-critique (40\%) and the stronger o1-preview model used alone (40\%).}}{8}{figure.caption.4}\protected@file@percent }
66
+ \newlabel{fig:gaia}{{3}{8}{\textbf {GAIA Laziness Benchmark: Correction Rates.} \scak {} achieves 72\% correction rate, outperforming both self-critique (40\%) and the stronger o1-preview model used alone (40\%)}{figure.caption.4}{}}
67
+ \@writefile{lot}{\contentsline {table}{\numberline {3}{\ignorespaces \textbf {Chaos Engineering Results.} MTTR measures seconds to recover from injected failures. \textsc {SCAK}{} recovers from all scenarios; baselines require manual intervention.}}{8}{table.caption.7}\protected@file@percent }
68
+ \newlabel{tab:chaos}{{3}{8}{\textbf {Chaos Engineering Results.} MTTR measures seconds to recover from injected failures. \scak {} recovers from all scenarios; baselines require manual intervention}{table.caption.7}{}}
69
+ \@writefile{toc}{\contentsline {subsection}{\numberline {5.4}Broader Impact}{8}{subsection.5.4}\protected@file@percent }
70
+ \@writefile{lof}{\contentsline {figure}{\numberline {4}{\ignorespaces \textbf {Context Efficiency: Semantic Purge Effect.} Without purge, context grows monotonically. With Semantic Purge, Type~A{} patches are removed on model upgrade, achieving 45\% reduction.}}{9}{figure.caption.6}\protected@file@percent }
71
+ \newlabel{fig:context}{{4}{9}{\textbf {Context Efficiency: Semantic Purge Effect.} Without purge, context grows monotonically. With Semantic Purge, \typea {} patches are removed on model upgrade, achieving 45\% reduction}{figure.caption.6}{}}
72
+ \@writefile{toc}{\contentsline {section}{\numberline {6}Conclusion}{9}{section.6}\protected@file@percent }
73
+ \bibstyle{plainnat}
74
+ \bibdata{bibliography}
75
+ \bibcite{bai2022constitutional}{{1}{2022}{{Bai et~al.}}{{Bai, Kadavath, Kundu, et~al.}}}
76
+ \bibcite{basiri2016chaos}{{2}{2016}{{Basiri et~al.}}{{Basiri, Behnam, de~Rooij, et~al.}}}
77
+ \@writefile{lof}{\contentsline {figure}{\numberline {5}{\ignorespaces \textbf {Mean Time To Recovery (MTTR).} \textsc {SCAK}{} achieves consistent recovery in under 30 seconds across all failure scenarios.}}{10}{figure.caption.8}\protected@file@percent }
78
+ \newlabel{fig:mttr}{{5}{10}{\textbf {Mean Time To Recovery (MTTR).} \scak {} achieves consistent recovery in under 30 seconds across all failure scenarios}{figure.caption.8}{}}
79
+ \@writefile{toc}{\contentsline {paragraph}{LLM Disclosure.}{10}{section*.12}\protected@file@percent }
80
+ \bibcite{boyd1987discourse}{{3}{1987}{{Boyd}}{{}}}
81
+ \bibcite{euai2024}{{4}{2024}{{European Parliament}}{{}}}
82
+ \bibcite{han2024wildguard}{{5}{2024}{{Han et~al.}}{{Han, Rao, Ettinger, Jiang, Lin, Lambert, Choi, and Dziri}}}
83
+ \bibcite{hong2023metagpt}{{6}{2023}{{Hong et~al.}}{{Hong, Zhuge, Chen, Zheng, Cheng, Zhang, et~al.}}}
84
+ \bibcite{lewis2020retrieval}{{7}{2020}{{Lewis et~al.}}{{Lewis, Perez, Piktus, et~al.}}}
85
+ \@writefile{lot}{\contentsline {table}{\numberline {4}{\ignorespaces \textbf {Ablation Study.} Each row removes one component from the full \textsc {SCAK}{} system. Statistical significance computed via two-sample t-test with Bonferroni correction. $^{***}p<0.001$, $^{**}p<0.01$, $^{*}p<0.05$.}}{11}{table.caption.9}\protected@file@percent }
86
+ \newlabel{tab:ablation}{{4}{11}{\textbf {Ablation Study.} Each row removes one component from the full \scak {} system. Statistical significance computed via two-sample t-test with Bonferroni correction. $^{***}p<0.001$, $^{**}p<0.01$, $^{*}p<0.05$}{table.caption.9}{}}
87
+ \@writefile{lof}{\contentsline {figure}{\numberline {6}{\ignorespaces \textbf {Ablation Study: Component Contributions.} Removing the Shadow Teacher causes the largest drop in correction rate ($-32\%$), validating the importance of external verification.}}{11}{figure.caption.10}\protected@file@percent }
88
+ \newlabel{fig:ablation}{{6}{11}{\textbf {Ablation Study: Component Contributions.} Removing the Shadow Teacher causes the largest drop in correction rate ($-32\%$), validating the importance of external verification}{figure.caption.10}{}}
89
+ \bibcite{liu2023lost}{{8}{2023}{{Liu et~al.}}{{Liu, Lin, Hewitt, et~al.}}}
90
+ \bibcite{madaan2023self}{{9}{2023}{{Madaan et~al.}}{{Madaan, Tandon, Gupta, et~al.}}}
91
+ \bibcite{meta2024llamaguard2}{{10}{2024}{{Meta AI}}{{}}}
92
+ \bibcite{mohtashami2023landmark}{{11}{2023}{{Mohtashami and Jaggi}}{{}}}
93
+ \bibcite{scak2026}{{12}{2026}{{Self-Correcting Agent Team}}{{}}}
94
+ \bibcite{shinn2023reflexion}{{13}{2023}{{Shinn et~al.}}{{Shinn, Cassano, Berman, Gopinath, Narasimhan, and Yao}}}
95
+ \bibcite{wang2023voyager}{{14}{2023}{{Wang et~al.}}{{Wang, Xie, Jiang, et~al.}}}
96
+ \bibcite{wef2025governance}{{15}{2025}{{World Economic Forum}}{{}}}
97
+ \bibcite{wu2023autogen}{{16}{2023}{{Wu et~al.}}{{Wu, Bansal, Zhang, et~al.}}}
98
+ \@writefile{lot}{\contentsline {table}{\numberline {5}{\ignorespaces \textbf {Cost Efficiency.} Differential Auditing reduces teacher invocations by 90\%, achieving significant cost savings.}}{12}{table.caption.11}\protected@file@percent }
99
+ \newlabel{tab:cost}{{5}{12}{\textbf {Cost Efficiency.} Differential Auditing reduces teacher invocations by 90\%, achieving significant cost savings}{table.caption.11}{}}
100
+ \@writefile{toc}{\contentsline {section}{\numberline {A}Reproducibility Details}{12}{appendix.A}\protected@file@percent }
101
+ \@writefile{toc}{\contentsline {section}{\numberline {B}Extended Ablation Results}{13}{appendix.B}\protected@file@percent }
102
+ \@writefile{toc}{\contentsline {section}{\numberline {C}Patch Examples}{13}{appendix.C}\protected@file@percent }
103
+ \gdef \@abspage@last{13}
@@ -0,0 +1,113 @@
1
+ \begin{thebibliography}{16}
2
+ \providecommand{\natexlab}[1]{#1}
3
+ \providecommand{\url}[1]{\texttt{#1}}
4
+ \expandafter\ifx\csname urlstyle\endcsname\relax
5
+ \providecommand{\doi}[1]{doi: #1}\else
6
+ \providecommand{\doi}{doi: \begingroup \urlstyle{rm}\Url}\fi
7
+
8
+ \bibitem[Bai et~al.(2022)Bai, Kadavath, Kundu, et~al.]{bai2022constitutional}
9
+ Yuntao Bai, Saurav Kadavath, Sandipan Kundu, et~al.
10
+ \newblock Constitutional ai: Harmlessness from ai feedback.
11
+ \newblock \emph{arXiv preprint arXiv:2212.08073}, 2022.
12
+
13
+ \bibitem[Basiri et~al.(2016)Basiri, Behnam, de~Rooij, et~al.]{basiri2016chaos}
14
+ Ali Basiri, Niosha Behnam, Ruud de~Rooij, et~al.
15
+ \newblock Chaos engineering, 2016.
16
+
17
+ \bibitem[Boyd(1987)]{boyd1987discourse}
18
+ John~R Boyd.
19
+ \newblock \emph{A Discourse on Winning and Losing}.
20
+ \newblock Air University Press, 1987.
21
+
22
+ \bibitem[{European Parliament}(2024)]{euai2024}
23
+ {European Parliament}.
24
+ \newblock Regulation (eu) 2024/1689 - artificial intelligence act.
25
+ \newblock Official Journal of the European Union, 2024.
26
+
27
+ \bibitem[Han et~al.(2024)Han, Rao, Ettinger, Jiang, Lin, Lambert, Choi, and
28
+ Dziri]{han2024wildguard}
29
+ Seungju Han, Kavel Rao, Allyson Ettinger, Liwei Jiang, Bill~Yuchen Lin, Nathan
30
+ Lambert, Yejin Choi, and Nouha Dziri.
31
+ \newblock Wildguard: Open one-stop moderation tools for safety risks,
32
+ jailbreaks, and refusals of llms.
33
+ \newblock \emph{Advances in Neural Information Processing Systems (NeurIPS)},
34
+ 2024.
35
+ \newblock URL \url{https://arxiv.org/abs/2406.18495}.
36
+
37
+ \bibitem[Hong et~al.(2023)Hong, Zhuge, Chen, Zheng, Cheng, Zhang,
38
+ et~al.]{hong2023metagpt}
39
+ Sirui Hong, Mingchen Zhuge, Jiaqi Chen, Xiawu Zheng, Yuheng Cheng, Ceyao Zhang,
40
+ et~al.
41
+ \newblock Metagpt: Meta programming for a multi-agent collaborative framework.
42
+ \newblock 2023.
43
+ \newblock URL \url{https://arxiv.org/abs/2308.00352}.
44
+
45
+ \bibitem[Lewis et~al.(2020)Lewis, Perez, Piktus, et~al.]{lewis2020retrieval}
46
+ Patrick Lewis, Ethan Perez, Aleksandra Piktus, et~al.
47
+ \newblock Retrieval-augmented generation for knowledge-intensive nlp tasks.
48
+ \newblock In \emph{Advances in Neural Information Processing Systems
49
+ (NeurIPS)}, 2020.
50
+ \newblock URL \url{https://arxiv.org/abs/2005.11401}.
51
+
52
+ \bibitem[Liu et~al.(2023)Liu, Lin, Hewitt, et~al.]{liu2023lost}
53
+ Nelson~F Liu, Kevin Lin, John Hewitt, et~al.
54
+ \newblock Lost in the middle: How language models use long contexts.
55
+ \newblock 2023.
56
+ \newblock URL \url{https://arxiv.org/abs/2307.03172}.
57
+
58
+ \bibitem[Madaan et~al.(2023)Madaan, Tandon, Gupta, et~al.]{madaan2023self}
59
+ Aman Madaan, Niket Tandon, Prakhar Gupta, et~al.
60
+ \newblock Self-refine: Iterative refinement with self-feedback.
61
+ \newblock \emph{Advances in Neural Information Processing Systems (NeurIPS)},
62
+ 2023.
63
+ \newblock URL \url{https://arxiv.org/abs/2303.17651}.
64
+
65
+ \bibitem[{Meta AI}(2024)]{meta2024llamaguard2}
66
+ {Meta AI}.
67
+ \newblock Llamaguard 2: Safety classification for llm interactions.
68
+ \newblock Meta Research Blog, 2024.
69
+ \newblock Technical report on improved safety classification.
70
+
71
+ \bibitem[Mohtashami and Jaggi(2023)]{mohtashami2023landmark}
72
+ Amirkeivan Mohtashami and Martin Jaggi.
73
+ \newblock Landmark attention: Random-access infinite context length for
74
+ transformers.
75
+ \newblock 2023.
76
+ \newblock URL \url{https://arxiv.org/abs/2305.16300}.
77
+
78
+ \bibitem[{Self-Correcting Agent Team}(2026)]{scak2026}
79
+ {Self-Correcting Agent Team}.
80
+ \newblock Self-correcting agent kernel: Automated alignment via differential
81
+ auditing and semantic memory hygiene, 2026.
82
+ \newblock URL
83
+ \url{https://github.com/imran-siddique/self-correcting-agent-kernel}.
84
+ \newblock Research foundations: Reflexion (NeurIPS 2023), Constitutional AI
85
+ (Anthropic 2022), Voyager (arXiv:2305.16291).
86
+
87
+ \bibitem[Shinn et~al.(2023)Shinn, Cassano, Berman, Gopinath, Narasimhan, and
88
+ Yao]{shinn2023reflexion}
89
+ Noah Shinn, Federico Cassano, Edward Berman, Ashwin Gopinath, Karthik
90
+ Narasimhan, and Shunyu Yao.
91
+ \newblock Reflexion: Language agents with verbal reinforcement learning.
92
+ \newblock In \emph{Advances in Neural Information Processing Systems
93
+ (NeurIPS)}, 2023.
94
+ \newblock URL \url{https://arxiv.org/abs/2303.11366}.
95
+
96
+ \bibitem[Wang et~al.(2023)Wang, Xie, Jiang, et~al.]{wang2023voyager}
97
+ Guanzhi Wang, Yuqi Xie, Yunfan Jiang, et~al.
98
+ \newblock Voyager: An open-ended embodied agent with large language models.
99
+ \newblock 2023.
100
+ \newblock URL \url{https://arxiv.org/abs/2305.16291}.
101
+
102
+ \bibitem[{World Economic Forum}(2025)]{wef2025governance}
103
+ {World Economic Forum}.
104
+ \newblock Ai agents in the workplace: Governance framework and risk mitigation.
105
+ \newblock WEF Whitepaper, January 2025.
106
+
107
+ \bibitem[Wu et~al.(2023)Wu, Bansal, Zhang, et~al.]{wu2023autogen}
108
+ Qingyun Wu, Gagan Bansal, Jieyu Zhang, et~al.
109
+ \newblock Autogen: Enabling next-gen llm applications via multi-agent
110
+ conversation.
111
+ \newblock \emph{arXiv preprint arXiv:2308.08155}, 2023.
112
+
113
+ \end{thebibliography}
@@ -0,0 +1,55 @@
1
+ This is BibTeX, Version 0.99e
2
+ Capacity: max_strings=200000, hash_size=200000, hash_prime=170003
3
+ The top-level auxiliary file: main.aux
4
+ Reallocating 'name_of_file' (item size: 1) to 9 items.
5
+ The style file: plainnat.bst
6
+ Reallocating 'name_of_file' (item size: 1) to 13 items.
7
+ Database file #1: bibliography.bib
8
+ Warning--entry type for "scak2026" isn't style-file defined
9
+ --line 553 of file bibliography.bib
10
+ Warning--empty journal in hong2023metagpt
11
+ Warning--empty journal in liu2023lost
12
+ Warning--empty journal in mohtashami2023landmark
13
+ Warning--empty journal in wang2023voyager
14
+ You've used 16 entries,
15
+ 2773 wiz_defined-function locations,
16
+ 670 strings with 7739 characters,
17
+ and the built_in function-call counts, 7040 in all, are:
18
+ = -- 568
19
+ > -- 534
20
+ < -- 6
21
+ + -- 184
22
+ - -- 168
23
+ * -- 550
24
+ := -- 1154
25
+ add.period$ -- 57
26
+ call.type$ -- 16
27
+ change.case$ -- 95
28
+ chr.to.int$ -- 16
29
+ cite$ -- 36
30
+ duplicate$ -- 303
31
+ empty$ -- 523
32
+ format.name$ -- 186
33
+ if$ -- 1432
34
+ int.to.chr$ -- 1
35
+ int.to.str$ -- 1
36
+ missing$ -- 12
37
+ newline$ -- 97
38
+ num.names$ -- 64
39
+ pop$ -- 224
40
+ preamble$ -- 1
41
+ purify$ -- 80
42
+ quote$ -- 0
43
+ skip$ -- 249
44
+ stack$ -- 0
45
+ substring$ -- 32
46
+ swap$ -- 15
47
+ text.length$ -- 0
48
+ text.prefix$ -- 0
49
+ top$ -- 0
50
+ type$ -- 171
51
+ warning$ -- 4
52
+ while$ -- 48
53
+ width$ -- 0
54
+ write$ -- 213
55
+ (There were 5 warnings)
@@ -0,0 +1,31 @@
1
+ \BOOKMARK [1][-]{section.1}{\376\377\0001\000\040\000I\000n\000t\000r\000o\000d\000u\000c\000t\000i\000o\000n}{}% 1
2
+ \BOOKMARK [2][-]{subsection.1.1}{\376\377\0001\000.\0001\000\040\000T\000h\000e\000\040\000A\000c\000c\000u\000m\000u\000l\000a\000t\000i\000o\000n\000\040\000P\000a\000r\000a\000d\000o\000x}{section.1}% 2
3
+ \BOOKMARK [2][-]{subsection.1.2}{\376\377\0001\000.\0002\000\040\000T\000h\000e\000\040\000`\000`\000S\000c\000a\000l\000e\000\040\000b\000y\000\040\000S\000u\000b\000t\000r\000a\000c\000t\000i\000o\000n\000'\000'\000\040\000P\000h\000i\000l\000o\000s\000o\000p\000h\000y}{section.1}% 3
4
+ \BOOKMARK [1][-]{section.2}{\376\377\0002\000\040\000R\000e\000l\000a\000t\000e\000d\000\040\000W\000o\000r\000k}{}% 4
5
+ \BOOKMARK [2][-]{subsection.2.1}{\376\377\0002\000.\0001\000\040\000T\000h\000e\000\040\000O\000O\000D\000A\000\040\000L\000o\000o\000p\000:\000\040\000A\000t\000t\000a\000c\000k\000\040\000S\000u\000r\000f\000a\000c\000e\000\040\000o\000r\000\040\000D\000e\000f\000e\000n\000s\000e\000?}{section.2}% 5
6
+ \BOOKMARK [2][-]{subsection.2.2}{\376\377\0002\000.\0002\000\040\000S\000e\000l\000f\000-\000C\000o\000r\000r\000e\000c\000t\000i\000o\000n\000\040\000a\000n\000d\000\040\000F\000e\000e\000d\000b\000a\000c\000k}{section.2}% 6
7
+ \BOOKMARK [2][-]{subsection.2.3}{\376\377\0002\000.\0003\000\040\000M\000u\000l\000t\000i\000-\000A\000g\000e\000n\000t\000\040\000S\000y\000s\000t\000e\000m\000s}{section.2}% 7
8
+ \BOOKMARK [2][-]{subsection.2.4}{\376\377\0002\000.\0004\000\040\000C\000o\000n\000t\000e\000x\000t\000\040\000M\000a\000n\000a\000g\000e\000m\000e\000n\000t}{section.2}% 8
9
+ \BOOKMARK [2][-]{subsection.2.5}{\376\377\0002\000.\0005\000\040\000R\000e\000c\000e\000n\000t\000\040\000A\000d\000v\000a\000n\000c\000e\000s\000\040\000i\000n\000\040\000A\000g\000e\000n\000t\000\040\000A\000l\000i\000g\000n\000m\000e\000n\000t\000\040\000\050\0002\0000\0002\0004\040\023\0002\0000\0002\0006\000\051}{section.2}% 9
10
+ \BOOKMARK [1][-]{section.3}{\376\377\0003\000\040\000S\000y\000s\000t\000e\000m\000\040\000D\000e\000s\000i\000g\000n}{}% 10
11
+ \BOOKMARK [2][-]{subsection.3.1}{\376\377\0003\000.\0001\000\040\000P\000r\000o\000b\000l\000e\000m\000\040\000F\000o\000r\000m\000u\000l\000a\000t\000i\000o\000n}{section.3}% 11
12
+ \BOOKMARK [2][-]{subsection.3.2}{\376\377\0003\000.\0002\000\040\000D\000u\000a\000l\000-\000L\000o\000o\000p\000\040\000A\000r\000c\000h\000i\000t\000e\000c\000t\000u\000r\000e}{section.3}% 12
13
+ \BOOKMARK [2][-]{subsection.3.3}{\376\377\0003\000.\0003\000\040\000D\000i\000f\000f\000e\000r\000e\000n\000t\000i\000a\000l\000\040\000A\000u\000d\000i\000t\000i\000n\000g\000\040\000A\000l\000g\000o\000r\000i\000t\000h\000m}{section.3}% 13
14
+ \BOOKMARK [2][-]{subsection.3.4}{\376\377\0003\000.\0004\000\040\000S\000e\000m\000a\000n\000t\000i\000c\000\040\000P\000u\000r\000g\000e\000\040\000\050\000F\000o\000r\000m\000a\000l\000i\000z\000i\000n\000g\000\040\000D\000e\000c\000a\000y\000\051}{section.3}% 14
15
+ \BOOKMARK [2][-]{subsection.3.5}{\376\377\0003\000.\0005\000\040\000T\000h\000r\000e\000e\000-\000T\000i\000e\000r\000\040\000M\000e\000m\000o\000r\000y\000\040\000H\000i\000e\000r\000a\000r\000c\000h\000y}{section.3}% 15
16
+ \BOOKMARK [1][-]{section.4}{\376\377\0004\000\040\000E\000x\000p\000e\000r\000i\000m\000e\000n\000t\000s}{}% 16
17
+ \BOOKMARK [2][-]{subsection.4.1}{\376\377\0004\000.\0001\000\040\000E\000x\000p\000e\000r\000i\000m\000e\000n\000t\000a\000l\000\040\000S\000e\000t\000u\000p}{section.4}% 17
18
+ \BOOKMARK [2][-]{subsection.4.2}{\376\377\0004\000.\0002\000\040\000G\000A\000I\000A\000\040\000L\000a\000z\000i\000n\000e\000s\000s\000\040\000B\000e\000n\000c\000h\000m\000a\000r\000k}{section.4}% 18
19
+ \BOOKMARK [2][-]{subsection.4.3}{\376\377\0004\000.\0003\000\040\000A\000m\000n\000e\000s\000i\000a\000\040\000T\000e\000s\000t\000\040\000\050\000C\000o\000n\000t\000e\000x\000t\000\040\000E\000f\000f\000i\000c\000i\000e\000n\000c\000y\000\051}{section.4}% 19
20
+ \BOOKMARK [2][-]{subsection.4.4}{\376\377\0004\000.\0004\000\040\000C\000h\000a\000o\000s\000\040\000E\000n\000g\000i\000n\000e\000e\000r\000i\000n\000g\000\040\000\050\000R\000o\000b\000u\000s\000t\000n\000e\000s\000s\000\051}{section.4}% 20
21
+ \BOOKMARK [2][-]{subsection.4.5}{\376\377\0004\000.\0005\000\040\000A\000b\000l\000a\000t\000i\000o\000n\000\040\000S\000t\000u\000d\000i\000e\000s}{section.4}% 21
22
+ \BOOKMARK [2][-]{subsection.4.6}{\376\377\0004\000.\0006\000\040\000C\000o\000s\000t\000\040\000A\000n\000a\000l\000y\000s\000i\000s}{section.4}% 22
23
+ \BOOKMARK [1][-]{section.5}{\376\377\0005\000\040\000D\000i\000s\000c\000u\000s\000s\000i\000o\000n}{}% 23
24
+ \BOOKMARK [2][-]{subsection.5.1}{\376\377\0005\000.\0001\000\040\000T\000h\000e\000\040\000V\000i\000r\000t\000u\000e\000\040\000o\000f\000\040\000F\000o\000r\000g\000e\000t\000t\000i\000n\000g}{section.5}% 24
25
+ \BOOKMARK [2][-]{subsection.5.2}{\376\377\0005\000.\0002\000\040\000W\000h\000y\000\040\000E\000x\000t\000e\000r\000n\000a\000l\000\040\000T\000e\000a\000c\000h\000e\000r\000s\000\040\000O\000u\000t\000p\000e\000r\000f\000o\000r\000m\000\040\000S\000e\000l\000f\000-\000C\000r\000i\000t\000i\000q\000u\000e}{section.5}% 25
26
+ \BOOKMARK [2][-]{subsection.5.3}{\376\377\0005\000.\0003\000\040\000L\000i\000m\000i\000t\000a\000t\000i\000o\000n\000s}{section.5}% 26
27
+ \BOOKMARK [2][-]{subsection.5.4}{\376\377\0005\000.\0004\000\040\000B\000r\000o\000a\000d\000e\000r\000\040\000I\000m\000p\000a\000c\000t}{section.5}% 27
28
+ \BOOKMARK [1][-]{section.6}{\376\377\0006\000\040\000C\000o\000n\000c\000l\000u\000s\000i\000o\000n}{}% 28
29
+ \BOOKMARK [1][-]{appendix.A}{\376\377\000A\000\040\000R\000e\000p\000r\000o\000d\000u\000c\000i\000b\000i\000l\000i\000t\000y\000\040\000D\000e\000t\000a\000i\000l\000s}{}% 29
30
+ \BOOKMARK [1][-]{appendix.B}{\376\377\000B\000\040\000E\000x\000t\000e\000n\000d\000e\000d\000\040\000A\000b\000l\000a\000t\000i\000o\000n\000\040\000R\000e\000s\000u\000l\000t\000s}{}% 30
31
+ \BOOKMARK [1][-]{appendix.C}{\376\377\000C\000\040\000P\000a\000t\000c\000h\000\040\000E\000x\000a\000m\000p\000l\000e\000s}{}% 31