agent_sre 3.1.0__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (270) hide show
  1. agent_sre-3.1.0/.gitignore +456 -0
  2. agent_sre-3.1.0/AGENTS.md +86 -0
  3. agent_sre-3.1.0/ARCHITECTURE.md +562 -0
  4. agent_sre-3.1.0/CHANGELOG.md +64 -0
  5. agent_sre-3.1.0/LICENSE +21 -0
  6. agent_sre-3.1.0/PKG-INFO +754 -0
  7. agent_sre-3.1.0/README.md +678 -0
  8. agent_sre-3.1.0/SECURITY.md +17 -0
  9. agent_sre-3.1.0/benchmarks/__init__.py +1 -0
  10. agent_sre-3.1.0/benchmarks/bench_chaos.py +153 -0
  11. agent_sre-3.1.0/benchmarks/bench_delivery.py +154 -0
  12. agent_sre-3.1.0/benchmarks/bench_slo.py +154 -0
  13. agent_sre-3.1.0/benchmarks/results/BENCHMARKS.md +65 -0
  14. agent_sre-3.1.0/benchmarks/run_all.py +59 -0
  15. agent_sre-3.1.0/charts/agent-sre/Chart.yaml +20 -0
  16. agent_sre-3.1.0/charts/agent-sre/README.md +46 -0
  17. agent_sre-3.1.0/charts/agent-sre/templates/NOTES.txt +21 -0
  18. agent_sre-3.1.0/charts/agent-sre/templates/_helpers.tpl +45 -0
  19. agent_sre-3.1.0/charts/agent-sre/templates/configmap.yaml +17 -0
  20. agent_sre-3.1.0/charts/agent-sre/templates/deployments.yaml +73 -0
  21. agent_sre-3.1.0/charts/agent-sre/templates/hpa.yaml +30 -0
  22. agent_sre-3.1.0/charts/agent-sre/templates/networkpolicy.yaml +29 -0
  23. agent_sre-3.1.0/charts/agent-sre/templates/pdb.yaml +19 -0
  24. agent_sre-3.1.0/charts/agent-sre/templates/services.yaml +27 -0
  25. agent_sre-3.1.0/charts/agent-sre/values.yaml +124 -0
  26. agent_sre-3.1.0/dashboards/agent-sre-overview.json +77 -0
  27. agent_sre-3.1.0/dashboards/grafana/agent-slo-dashboard.json +412 -0
  28. agent_sre-3.1.0/dashboards/grafana/agent-sre-overview.json +415 -0
  29. agent_sre-3.1.0/deployments/helm/README.md +64 -0
  30. agent_sre-3.1.0/deployments/helm/agent-sre/Chart.yaml +18 -0
  31. agent_sre-3.1.0/deployments/helm/agent-sre/templates/_helpers.tpl +32 -0
  32. agent_sre-3.1.0/deployments/helm/agent-sre/templates/crd.yaml +138 -0
  33. agent_sre-3.1.0/deployments/helm/agent-sre/templates/deployment.yaml +59 -0
  34. agent_sre-3.1.0/deployments/helm/agent-sre/templates/service.yaml +17 -0
  35. agent_sre-3.1.0/deployments/helm/agent-sre/values.yaml +52 -0
  36. agent_sre-3.1.0/docs/api-reference.md +1332 -0
  37. agent_sre-3.1.0/docs/comparison.md +43 -0
  38. agent_sre-3.1.0/docs/concepts.md +89 -0
  39. agent_sre-3.1.0/docs/deployment.md +187 -0
  40. agent_sre-3.1.0/docs/getting-started.md +76 -0
  41. agent_sre-3.1.0/docs/integration-guide.md +69 -0
  42. agent_sre-3.1.0/docs/security.md +139 -0
  43. agent_sre-3.1.0/docs/slo-reference.md +621 -0
  44. agent_sre-3.1.0/docs/sre-concepts-for-ai-engineers.md +501 -0
  45. agent_sre-3.1.0/examples/README.md +46 -0
  46. agent_sre-3.1.0/examples/canary-model-upgrade/README.md +161 -0
  47. agent_sre-3.1.0/examples/canary-model-upgrade/demo.py +417 -0
  48. agent_sre-3.1.0/examples/canary_rollout.py +113 -0
  49. agent_sre-3.1.0/examples/chaos/schedules.yaml +59 -0
  50. agent_sre-3.1.0/examples/chaos-chatbot/README.md +149 -0
  51. agent_sre-3.1.0/examples/chaos-chatbot/chaos-scenarios.yaml +109 -0
  52. agent_sre-3.1.0/examples/chaos-chatbot/demo.py +394 -0
  53. agent_sre-3.1.0/examples/chaos_test.py +92 -0
  54. agent_sre-3.1.0/examples/cost_guard.py +74 -0
  55. agent_sre-3.1.0/examples/cost_guardrails.py +100 -0
  56. agent_sre-3.1.0/examples/dashboard/README.md +29 -0
  57. agent_sre-3.1.0/examples/dashboard/app.py +1081 -0
  58. agent_sre-3.1.0/examples/dashboard/requirements.txt +4 -0
  59. agent_sre-3.1.0/examples/docker-compose/Dockerfile +12 -0
  60. agent_sre-3.1.0/examples/docker-compose/README.md +76 -0
  61. agent_sre-3.1.0/examples/docker-compose/config/grafana-dashboards.yml +11 -0
  62. agent_sre-3.1.0/examples/docker-compose/config/grafana-datasources.yml +9 -0
  63. agent_sre-3.1.0/examples/docker-compose/config/prometheus.yml +11 -0
  64. agent_sre-3.1.0/examples/docker-compose/dashboards/agent-sre-overview.json +389 -0
  65. agent_sre-3.1.0/examples/docker-compose/docker-compose.yml +118 -0
  66. agent_sre-3.1.0/examples/langchain-monitoring/README.md +76 -0
  67. agent_sre-3.1.0/examples/langchain-monitoring/demo.py +286 -0
  68. agent_sre-3.1.0/examples/langchain_monitor.py +250 -0
  69. agent_sre-3.1.0/examples/quickstart.py +110 -0
  70. agent_sre-3.1.0/examples/slo_alerting.py +112 -0
  71. agent_sre-3.1.0/notebooks/README.md +22 -0
  72. agent_sre-3.1.0/notebooks/slo-exploration.ipynb +456 -0
  73. agent_sre-3.1.0/operator/README.md +50 -0
  74. agent_sre-3.1.0/operator/crds/agent-slo.yaml +64 -0
  75. agent_sre-3.1.0/operator/crds/cost-budget.yaml +43 -0
  76. agent_sre-3.1.0/pyproject.toml +110 -0
  77. agent_sre-3.1.0/screenshots/ss_architecture.png +0 -0
  78. agent_sre-3.1.0/screenshots/ss_by_the_numbers.png +0 -0
  79. agent_sre-3.1.0/screenshots/ss_ecosystem.png +0 -0
  80. agent_sre-3.1.0/screenshots/ss_quickstart.png +0 -0
  81. agent_sre-3.1.0/screenshots/ss_repo_hero.png +0 -0
  82. agent_sre-3.1.0/specs/coding-agent.yaml +43 -0
  83. agent_sre-3.1.0/specs/customer-support-agent.yaml +42 -0
  84. agent_sre-3.1.0/specs/data-pipeline-agent.yaml +44 -0
  85. agent_sre-3.1.0/specs/research-agent.yaml +48 -0
  86. agent_sre-3.1.0/specs/slos/base.yaml +37 -0
  87. agent_sre-3.1.0/specs/slos/batch_agent.yaml +39 -0
  88. agent_sre-3.1.0/specs/slos/critical_agent.yaml +43 -0
  89. agent_sre-3.1.0/src/agent_sre/__init__.py +49 -0
  90. agent_sre-3.1.0/src/agent_sre/__main__.py +8 -0
  91. agent_sre-3.1.0/src/agent_sre/accuracy_declaration.py +198 -0
  92. agent_sre-3.1.0/src/agent_sre/adapters/__init__.py +489 -0
  93. agent_sre-3.1.0/src/agent_sre/alerts/__init__.py +515 -0
  94. agent_sre-3.1.0/src/agent_sre/alerts/dedup.py +188 -0
  95. agent_sre-3.1.0/src/agent_sre/anomaly/__init__.py +51 -0
  96. agent_sre-3.1.0/src/agent_sre/anomaly/detector.py +368 -0
  97. agent_sre-3.1.0/src/agent_sre/anomaly/rogue_detector.py +459 -0
  98. agent_sre-3.1.0/src/agent_sre/anomaly/strategies.py +162 -0
  99. agent_sre-3.1.0/src/agent_sre/api/__init__.py +359 -0
  100. agent_sre-3.1.0/src/agent_sre/api/models.py +161 -0
  101. agent_sre-3.1.0/src/agent_sre/api/server.py +598 -0
  102. agent_sre-3.1.0/src/agent_sre/benchmarks/__init__.py +458 -0
  103. agent_sre-3.1.0/src/agent_sre/cascade/__init__.py +19 -0
  104. agent_sre-3.1.0/src/agent_sre/cascade/circuit_breaker.py +266 -0
  105. agent_sre-3.1.0/src/agent_sre/certification/__init__.py +335 -0
  106. agent_sre-3.1.0/src/agent_sre/chaos/__init__.py +47 -0
  107. agent_sre-3.1.0/src/agent_sre/chaos/adversarial.py +285 -0
  108. agent_sre-3.1.0/src/agent_sre/chaos/adversarial_policy.py +247 -0
  109. agent_sre-3.1.0/src/agent_sre/chaos/chaos_scheduler.py +125 -0
  110. agent_sre-3.1.0/src/agent_sre/chaos/engine.py +357 -0
  111. agent_sre-3.1.0/src/agent_sre/chaos/library.py +243 -0
  112. agent_sre-3.1.0/src/agent_sre/chaos/loader.py +27 -0
  113. agent_sre-3.1.0/src/agent_sre/chaos/scheduler.py +72 -0
  114. agent_sre-3.1.0/src/agent_sre/cli/__init__.py +6 -0
  115. agent_sre-3.1.0/src/agent_sre/cli/main.py +83 -0
  116. agent_sre-3.1.0/src/agent_sre/cost/__init__.py +23 -0
  117. agent_sre-3.1.0/src/agent_sre/cost/anomaly.py +159 -0
  118. agent_sre-3.1.0/src/agent_sre/cost/guard.py +386 -0
  119. agent_sre-3.1.0/src/agent_sre/cost/optimizer.py +186 -0
  120. agent_sre-3.1.0/src/agent_sre/delivery/__init__.py +31 -0
  121. agent_sre-3.1.0/src/agent_sre/delivery/blue_green.py +299 -0
  122. agent_sre-3.1.0/src/agent_sre/delivery/gitops.py +168 -0
  123. agent_sre-3.1.0/src/agent_sre/delivery/rollout.py +731 -0
  124. agent_sre-3.1.0/src/agent_sre/evals/__init__.py +456 -0
  125. agent_sre-3.1.0/src/agent_sre/experiments/__init__.py +255 -0
  126. agent_sre-3.1.0/src/agent_sre/fleet/__init__.py +420 -0
  127. agent_sre-3.1.0/src/agent_sre/incidents/__init__.py +41 -0
  128. agent_sre-3.1.0/src/agent_sre/incidents/circuit_breaker.py +187 -0
  129. agent_sre-3.1.0/src/agent_sre/incidents/detector.py +333 -0
  130. agent_sre-3.1.0/src/agent_sre/incidents/postmortem.py +339 -0
  131. agent_sre-3.1.0/src/agent_sre/incidents/runbook.py +157 -0
  132. agent_sre-3.1.0/src/agent_sre/incidents/runbook_executor.py +197 -0
  133. agent_sre-3.1.0/src/agent_sre/incidents/runbook_registry.py +107 -0
  134. agent_sre-3.1.0/src/agent_sre/incidents/runbooks/restart_agent.yaml +34 -0
  135. agent_sre-3.1.0/src/agent_sre/incidents/runbooks/revoke_trust.yaml +34 -0
  136. agent_sre-3.1.0/src/agent_sre/incidents/runbooks/rollback_version.yaml +35 -0
  137. agent_sre-3.1.0/src/agent_sre/incidents/runbooks/throttle_traffic.yaml +34 -0
  138. agent_sre-3.1.0/src/agent_sre/integrations/__init__.py +21 -0
  139. agent_sre-3.1.0/src/agent_sre/integrations/agent_mesh/__init__.py +3 -0
  140. agent_sre-3.1.0/src/agent_sre/integrations/agent_mesh/bridge.py +148 -0
  141. agent_sre-3.1.0/src/agent_sre/integrations/agent_os/__init__.py +3 -0
  142. agent_sre-3.1.0/src/agent_sre/integrations/agent_os/bridge.py +128 -0
  143. agent_sre-3.1.0/src/agent_sre/integrations/agentops/__init__.py +6 -0
  144. agent_sre-3.1.0/src/agent_sre/integrations/agentops/exporter.py +198 -0
  145. agent_sre-3.1.0/src/agent_sre/integrations/arize/__init__.py +23 -0
  146. agent_sre-3.1.0/src/agent_sre/integrations/arize/exporter.py +206 -0
  147. agent_sre-3.1.0/src/agent_sre/integrations/arize/importer.py +140 -0
  148. agent_sre-3.1.0/src/agent_sre/integrations/braintrust/__init__.py +12 -0
  149. agent_sre-3.1.0/src/agent_sre/integrations/braintrust/exporter.py +268 -0
  150. agent_sre-3.1.0/src/agent_sre/integrations/datadog/__init__.py +12 -0
  151. agent_sre-3.1.0/src/agent_sre/integrations/datadog/exporter.py +298 -0
  152. agent_sre-3.1.0/src/agent_sre/integrations/helicone/__init__.py +13 -0
  153. agent_sre-3.1.0/src/agent_sre/integrations/helicone/headers.py +249 -0
  154. agent_sre-3.1.0/src/agent_sre/integrations/langchain/__init__.py +20 -0
  155. agent_sre-3.1.0/src/agent_sre/integrations/langchain/callback.py +424 -0
  156. agent_sre-3.1.0/src/agent_sre/integrations/langfuse/__init__.py +29 -0
  157. agent_sre-3.1.0/src/agent_sre/integrations/langfuse/exporter.py +285 -0
  158. agent_sre-3.1.0/src/agent_sre/integrations/langsmith/__init__.py +12 -0
  159. agent_sre-3.1.0/src/agent_sre/integrations/langsmith/exporter.py +360 -0
  160. agent_sre-3.1.0/src/agent_sre/integrations/llamaindex/__init__.py +17 -0
  161. agent_sre-3.1.0/src/agent_sre/integrations/llamaindex/handler.py +376 -0
  162. agent_sre-3.1.0/src/agent_sre/integrations/mcp/__init__.py +342 -0
  163. agent_sre-3.1.0/src/agent_sre/integrations/mlflow/__init__.py +6 -0
  164. agent_sre-3.1.0/src/agent_sre/integrations/mlflow/exporter.py +173 -0
  165. agent_sre-3.1.0/src/agent_sre/integrations/openlit.py +211 -0
  166. agent_sre-3.1.0/src/agent_sre/integrations/otel/__init__.py +29 -0
  167. agent_sre-3.1.0/src/agent_sre/integrations/otel/conventions.py +84 -0
  168. agent_sre-3.1.0/src/agent_sre/integrations/otel/events.py +322 -0
  169. agent_sre-3.1.0/src/agent_sre/integrations/otel/metrics.py +286 -0
  170. agent_sre-3.1.0/src/agent_sre/integrations/otel/saga_sink.py +97 -0
  171. agent_sre-3.1.0/src/agent_sre/integrations/otel/traces.py +242 -0
  172. agent_sre-3.1.0/src/agent_sre/integrations/pagerduty.py +183 -0
  173. agent_sre-3.1.0/src/agent_sre/integrations/prometheus/__init__.py +14 -0
  174. agent_sre-3.1.0/src/agent_sre/integrations/prometheus/exporter.py +115 -0
  175. agent_sre-3.1.0/src/agent_sre/integrations/wandb/__init__.py +6 -0
  176. agent_sre-3.1.0/src/agent_sre/integrations/wandb/exporter.py +154 -0
  177. agent_sre-3.1.0/src/agent_sre/k8s/__init__.py +628 -0
  178. agent_sre-3.1.0/src/agent_sre/mcp/__init__.py +6 -0
  179. agent_sre-3.1.0/src/agent_sre/mcp/server.py +211 -0
  180. agent_sre-3.1.0/src/agent_sre/providers.py +116 -0
  181. agent_sre-3.1.0/src/agent_sre/py.typed +0 -0
  182. agent_sre-3.1.0/src/agent_sre/replay/__init__.py +23 -0
  183. agent_sre-3.1.0/src/agent_sre/replay/capture.py +344 -0
  184. agent_sre-3.1.0/src/agent_sre/replay/distributed.py +308 -0
  185. agent_sre-3.1.0/src/agent_sre/replay/engine.py +249 -0
  186. agent_sre-3.1.0/src/agent_sre/replay/golden.py +104 -0
  187. agent_sre-3.1.0/src/agent_sre/replay/golden_manager.py +201 -0
  188. agent_sre-3.1.0/src/agent_sre/replay/visualization.py +245 -0
  189. agent_sre-3.1.0/src/agent_sre/sbom.py +284 -0
  190. agent_sre-3.1.0/src/agent_sre/signing.py +174 -0
  191. agent_sre-3.1.0/src/agent_sre/slo/__init__.py +27 -0
  192. agent_sre-3.1.0/src/agent_sre/slo/dashboard.py +188 -0
  193. agent_sre-3.1.0/src/agent_sre/slo/indicators.py +516 -0
  194. agent_sre-3.1.0/src/agent_sre/slo/objectives.py +298 -0
  195. agent_sre-3.1.0/src/agent_sre/slo/persistence.py +266 -0
  196. agent_sre-3.1.0/src/agent_sre/slo/spec.py +143 -0
  197. agent_sre-3.1.0/src/agent_sre/slo/validator.py +150 -0
  198. agent_sre-3.1.0/src/agent_sre/specs/__init__.py +182 -0
  199. agent_sre-3.1.0/src/agent_sre/tracing/__init__.py +786 -0
  200. agent_sre-3.1.0/src/agent_sre/tracing/conventions.py +36 -0
  201. agent_sre-3.1.0/src/agent_sre/tracing/exporters.py +110 -0
  202. agent_sre-3.1.0/src/agent_sre/tracing/metrics.py +121 -0
  203. agent_sre-3.1.0/src/agent_sre/tracing/spans.py +161 -0
  204. agent_sre-3.1.0/tests/__init__.py +0 -0
  205. agent_sre-3.1.0/tests/integration/__init__.py +0 -0
  206. agent_sre-3.1.0/tests/integration/test_integration.py +490 -0
  207. agent_sre-3.1.0/tests/integration/test_scenarios.py +622 -0
  208. agent_sre-3.1.0/tests/test_adapters.py +336 -0
  209. agent_sre-3.1.0/tests/test_agentops.py +86 -0
  210. agent_sre-3.1.0/tests/test_alert_dedup.py +360 -0
  211. agent_sre-3.1.0/tests/test_alert_persistence.py +67 -0
  212. agent_sre-3.1.0/tests/test_alerts.py +467 -0
  213. agent_sre-3.1.0/tests/test_api.py +308 -0
  214. agent_sre-3.1.0/tests/test_arize.py +291 -0
  215. agent_sre-3.1.0/tests/test_benchmarks.py +290 -0
  216. agent_sre-3.1.0/tests/test_blue_green.py +214 -0
  217. agent_sre-3.1.0/tests/test_braintrust.py +149 -0
  218. agent_sre-3.1.0/tests/test_cascade.py +242 -0
  219. agent_sre-3.1.0/tests/test_certification.py +290 -0
  220. agent_sre-3.1.0/tests/test_chaos_scheduler.py +306 -0
  221. agent_sre-3.1.0/tests/test_cli.py +35 -0
  222. agent_sre-3.1.0/tests/test_cost_optimizer.py +271 -0
  223. agent_sre-3.1.0/tests/test_datadog.py +149 -0
  224. agent_sre-3.1.0/tests/test_evals.py +583 -0
  225. agent_sre-3.1.0/tests/test_experiments.py +195 -0
  226. agent_sre-3.1.0/tests/test_fleet.py +320 -0
  227. agent_sre-3.1.0/tests/test_golden_traces.py +211 -0
  228. agent_sre-3.1.0/tests/test_helicone.py +140 -0
  229. agent_sre-3.1.0/tests/test_k8s.py +321 -0
  230. agent_sre-3.1.0/tests/test_langchain_callback.py +354 -0
  231. agent_sre-3.1.0/tests/test_langfuse.py +345 -0
  232. agent_sre-3.1.0/tests/test_langsmith.py +182 -0
  233. agent_sre-3.1.0/tests/test_llamaindex.py +287 -0
  234. agent_sre-3.1.0/tests/test_mcp_drift.py +282 -0
  235. agent_sre-3.1.0/tests/test_mcp_server.py +140 -0
  236. agent_sre-3.1.0/tests/test_openlit_integration.py +160 -0
  237. agent_sre-3.1.0/tests/test_otel.py +692 -0
  238. agent_sre-3.1.0/tests/test_otel_saga_sink.py +110 -0
  239. agent_sre-3.1.0/tests/test_pagerduty_slo.py +208 -0
  240. agent_sre-3.1.0/tests/test_prometheus.py +87 -0
  241. agent_sre-3.1.0/tests/test_protocol_tracing.py +571 -0
  242. agent_sre-3.1.0/tests/test_runbooks.py +379 -0
  243. agent_sre-3.1.0/tests/test_sbom.py +323 -0
  244. agent_sre-3.1.0/tests/test_slo_spec.py +257 -0
  245. agent_sre-3.1.0/tests/test_slo_templates.py +147 -0
  246. agent_sre-3.1.0/tests/test_tracing.py +340 -0
  247. agent_sre-3.1.0/tests/test_wandb_mlflow.py +146 -0
  248. agent_sre-3.1.0/tests/unit/__init__.py +0 -0
  249. agent_sre-3.1.0/tests/unit/test_accuracy_declaration.py +124 -0
  250. agent_sre-3.1.0/tests/unit/test_adversarial_chaos.py +334 -0
  251. agent_sre-3.1.0/tests/unit/test_anomaly_detection.py +348 -0
  252. agent_sre-3.1.0/tests/unit/test_capture.py +232 -0
  253. agent_sre-3.1.0/tests/unit/test_chaos.py +308 -0
  254. agent_sre-3.1.0/tests/unit/test_circuit_breaker.py +142 -0
  255. agent_sre-3.1.0/tests/unit/test_cost.py +348 -0
  256. agent_sre-3.1.0/tests/unit/test_dashboard.py +88 -0
  257. agent_sre-3.1.0/tests/unit/test_delivery.py +212 -0
  258. agent_sre-3.1.0/tests/unit/test_engine.py +223 -0
  259. agent_sre-3.1.0/tests/unit/test_hallucination.py +60 -0
  260. agent_sre-3.1.0/tests/unit/test_incidents.py +127 -0
  261. agent_sre-3.1.0/tests/unit/test_indicators.py +210 -0
  262. agent_sre-3.1.0/tests/unit/test_integrations.py +223 -0
  263. agent_sre-3.1.0/tests/unit/test_objectives.py +169 -0
  264. agent_sre-3.1.0/tests/unit/test_p2_features.py +320 -0
  265. agent_sre-3.1.0/tests/unit/test_rogue_detector.py +561 -0
  266. agent_sre-3.1.0/tests/unit/test_sli_persistence.py +313 -0
  267. agent_sre-3.1.0/tests/unit/test_visualization.py +93 -0
  268. agent_sre-3.1.0/tutorials/langchain-slo-setup/README.md +234 -0
  269. agent_sre-3.1.0/tutorials/langchain-slo-setup/demo.py +269 -0
  270. agent_sre-3.1.0/tutorials/langchain-slo-setup/slo-config.yaml +79 -0
@@ -0,0 +1,456 @@
1
+ # Generated artifacts
2
+ sbom/
3
+
4
+ # Python
5
+ __pycache__/
6
+ *.py[cod]
7
+ *$py.class
8
+ *.egg-info/
9
+ dist/
10
+ build/
11
+ *.egg
12
+ .eggs/
13
+ .venv/
14
+ venv/
15
+ .pytest_cache/
16
+ .mypy_cache/
17
+ .ruff_cache/
18
+ .hypothesis/
19
+ .tox/
20
+ htmlcov/
21
+ .coverage
22
+ *.cover
23
+
24
+ # Node
25
+ node_modules/
26
+
27
+ # IDE
28
+ .vscode/
29
+ .idea/
30
+ *.swp
31
+ *.swo
32
+ .claude/
33
+
34
+ ## Ignore Visual Studio temporary files, build results, and
35
+ ## files generated by popular Visual Studio add-ons.
36
+ ##
37
+ ## Get latest from https://github.com/github/gitignore/blob/main/VisualStudio.gitignore
38
+
39
+ # User-specific files
40
+ *.rsuser
41
+ *.suo
42
+ *.user
43
+ *.userosscache
44
+ *.sln.docstates
45
+ *.env
46
+
47
+ # User-specific files (MonoDevelop/Xamarin Studio)
48
+ *.userprefs
49
+
50
+ # Mono auto generated files
51
+ mono_crash.*
52
+
53
+ # Build results
54
+ [Dd]ebug/
55
+ [Dd]ebugPublic/
56
+ [Rr]elease/
57
+ [Rr]eleases/
58
+ x64/
59
+ x86/
60
+ [Ww][Ii][Nn]32/
61
+ [Aa][Rr][Mm]/
62
+ [Aa][Rr][Mm]64/
63
+ [Aa][Rr][Mm]64[Ee][Cc]/
64
+ bld/
65
+ [Oo]bj/
66
+ [Oo]ut/
67
+ [Ll]og/
68
+ [Ll]ogs/
69
+
70
+ # Build results on 'Bin' directories
71
+ **/[Bb]in/*
72
+ # Uncomment if you have tasks that rely on *.refresh files to move binaries
73
+ # (https://github.com/github/gitignore/pull/3736)
74
+ #!**/[Bb]in/*.refresh
75
+
76
+ # Visual Studio 2015/2017 cache/options directory
77
+ .vs/
78
+ # Uncomment if you have tasks that create the project's static files in wwwroot
79
+ #wwwroot/
80
+
81
+ # Visual Studio 2017 auto generated files
82
+ Generated\ Files/
83
+
84
+ # MSTest test Results
85
+ [Tt]est[Rr]esult*/
86
+ [Bb]uild[Ll]og.*
87
+ *.trx
88
+
89
+ # NUnit
90
+ *.VisualState.xml
91
+ TestResult.xml
92
+ nunit-*.xml
93
+
94
+ # Approval Tests result files
95
+ *.received.*
96
+
97
+ # Build Results of an ATL Project
98
+ [Dd]ebugPS/
99
+ [Rr]eleasePS/
100
+ dlldata.c
101
+
102
+ # Benchmark Results
103
+ BenchmarkDotNet.Artifacts/
104
+
105
+ # .NET Core
106
+ project.lock.json
107
+ project.fragment.lock.json
108
+ artifacts/
109
+
110
+ # ASP.NET Scaffolding
111
+ ScaffoldingReadMe.txt
112
+
113
+ # StyleCop
114
+ StyleCopReport.xml
115
+
116
+ # Files built by Visual Studio
117
+ *_i.c
118
+ *_p.c
119
+ *_h.h
120
+ *.ilk
121
+ *.meta
122
+ *.obj
123
+ *.idb
124
+ *.iobj
125
+ *.pch
126
+ *.pdb
127
+ *.ipdb
128
+ *.pgc
129
+ *.pgd
130
+ *.rsp
131
+ # but not Directory.Build.rsp, as it configures directory-level build defaults
132
+ !Directory.Build.rsp
133
+ *.sbr
134
+ *.tlb
135
+ *.tli
136
+ *.tlh
137
+ *.tmp
138
+ *.tmp_proj
139
+ *_wpftmp.csproj
140
+ *.log
141
+ *.tlog
142
+ *.vspscc
143
+ *.vssscc
144
+ .builds
145
+ *.pidb
146
+ *.svclog
147
+ *.scc
148
+
149
+ # Chutzpah Test files
150
+ _Chutzpah*
151
+
152
+ # Visual C++ cache files
153
+ ipch/
154
+ *.aps
155
+ *.ncb
156
+ *.opendb
157
+ *.opensdf
158
+ *.sdf
159
+ *.cachefile
160
+ *.VC.db
161
+ *.VC.VC.opendb
162
+
163
+ # Visual Studio profiler
164
+ *.psess
165
+ *.vsp
166
+ *.vspx
167
+ *.sap
168
+
169
+ # Visual Studio Trace Files
170
+ *.e2e
171
+
172
+ # TFS 2012 Local Workspace
173
+ $tf/
174
+
175
+ # Guidance Automation Toolkit
176
+ *.gpState
177
+
178
+ # ReSharper is a .NET coding add-in
179
+ _ReSharper*/
180
+ *.[Rr]e[Ss]harper
181
+ *.DotSettings.user
182
+
183
+ # TeamCity is a build add-in
184
+ _TeamCity*
185
+
186
+ # DotCover is a Code Coverage Tool
187
+ *.dotCover
188
+
189
+ # AxoCover is a Code Coverage Tool
190
+ .axoCover/*
191
+ !.axoCover/settings.json
192
+
193
+ # Coverlet is a free, cross platform Code Coverage Tool
194
+ coverage*.json
195
+ coverage*.xml
196
+ coverage*.info
197
+
198
+ # Visual Studio code coverage results
199
+ *.coverage
200
+ *.coveragexml
201
+
202
+ # NCrunch
203
+ _NCrunch_*
204
+ .NCrunch_*
205
+ .*crunch*.local.xml
206
+ nCrunchTemp_*
207
+
208
+ # MightyMoose
209
+ *.mm.*
210
+ AutoTest.Net/
211
+
212
+ # Web workbench (sass)
213
+ .sass-cache/
214
+
215
+ # Installshield output folder
216
+ [Ee]xpress/
217
+
218
+ # DocProject is a documentation generator add-in
219
+ DocProject/buildhelp/
220
+ DocProject/Help/*.HxT
221
+ DocProject/Help/*.HxC
222
+ DocProject/Help/*.hhc
223
+ DocProject/Help/*.hhk
224
+ DocProject/Help/*.hhp
225
+ DocProject/Help/Html2
226
+ DocProject/Help/html
227
+
228
+ # Click-Once directory
229
+ publish/
230
+
231
+ # Publish Web Output
232
+ *.[Pp]ublish.xml
233
+ *.azurePubxml
234
+ # Note: Comment out the next line if you want to check in your web deploy settings,
235
+ # but database connection strings (with potential passwords) will be unencrypted
236
+ *.pubxml
237
+ *.publishproj
238
+
239
+ # Microsoft Azure Web App publish settings. Comment out the next line if you want to
240
+ # check in your Azure Web App publish settings, but sensitive information contained
241
+ # in these scripts will be unencrypted
242
+ PublishScripts/
243
+
244
+ # NuGet Packages
245
+ *.nupkg
246
+ # NuGet Symbol Packages
247
+ *.snupkg
248
+ # The packages folder can be ignored because of Package Restore
249
+ # DISABLED: mono-repo uses /packages/ for source code
250
+ # **/[Pp]ackages/*
251
+ # !**/[Pp]ackages/build/
252
+ # #!**/[Pp]ackages/repositories.config
253
+ # NuGet v3's project.json files produce more ignorable files
254
+ *.nuget.props
255
+ *.nuget.targets
256
+
257
+ # Microsoft Azure Build Output
258
+ csx/
259
+ *.build.csdef
260
+
261
+ # Microsoft Azure Emulator
262
+ ecf/
263
+ rcf/
264
+
265
+ # Windows Store app package directories and files
266
+ AppPackages/
267
+ BundleArtifacts/
268
+ Package.StoreAssociation.xml
269
+ _pkginfo.txt
270
+ *.appx
271
+ *.appxbundle
272
+ *.appxupload
273
+
274
+ # Visual Studio cache files
275
+ # files ending in .cache can be ignored
276
+ *.[Cc]ache
277
+ # but keep track of directories ending in .cache
278
+ !?*.[Cc]ache/
279
+
280
+ # Others
281
+ ClientBin/
282
+ ~$*
283
+ *~
284
+ *.dbmdl
285
+ *.dbproj.schemaview
286
+ *.jfm
287
+ *.pfx
288
+ *.publishsettings
289
+ orleans.codegen.cs
290
+
291
+ # Including strong name files can present a security risk
292
+ # (https://github.com/github/gitignore/pull/2483#issue-259490424)
293
+ #*.snk
294
+
295
+ # Since there are multiple workflows, uncomment next line to ignore bower_components
296
+ # (https://github.com/github/gitignore/pull/1529#issuecomment-104372622)
297
+ #bower_components/
298
+
299
+ # RIA/Silverlight projects
300
+ Generated_Code/
301
+
302
+ # Backup & report files from converting an old project file
303
+ # to a newer Visual Studio version. Backup files are not needed,
304
+ # because we have git ;-)
305
+ _UpgradeReport_Files/
306
+ Backup*/
307
+ UpgradeLog*.XML
308
+ UpgradeLog*.htm
309
+ ServiceFabricBackup/
310
+ *.rptproj.bak
311
+
312
+ # SQL Server files
313
+ *.mdf
314
+ *.ldf
315
+ *.ndf
316
+
317
+ # Business Intelligence projects
318
+ *.rdl.data
319
+ *.bim.layout
320
+ *.bim_*.settings
321
+ *.rptproj.rsuser
322
+ *- [Bb]ackup.rdl
323
+ *- [Bb]ackup ([0-9]).rdl
324
+ *- [Bb]ackup ([0-9][0-9]).rdl
325
+
326
+ # Microsoft Fakes
327
+ FakesAssemblies/
328
+
329
+ # GhostDoc plugin setting file
330
+ *.GhostDoc.xml
331
+
332
+ # Node.js Tools for Visual Studio
333
+ .ntvs_analysis.dat
334
+ node_modules/
335
+
336
+ # Visual Studio 6 build log
337
+ *.plg
338
+
339
+ # Visual Studio 6 workspace options file
340
+ *.opt
341
+
342
+ # Visual Studio 6 auto-generated workspace file (contains which files were open etc.)
343
+ *.vbw
344
+
345
+ # Visual Studio 6 auto-generated project file (contains which files were open etc.)
346
+ *.vbp
347
+
348
+ # Visual Studio 6 workspace and project file (working project files containing files to include in project)
349
+ *.dsw
350
+ *.dsp
351
+
352
+ # Visual Studio 6 technical files
353
+ *.ncb
354
+ *.aps
355
+
356
+ # Visual Studio LightSwitch build output
357
+ **/*.HTMLClient/GeneratedArtifacts
358
+ **/*.DesktopClient/GeneratedArtifacts
359
+ **/*.DesktopClient/ModelManifest.xml
360
+ **/*.Server/GeneratedArtifacts
361
+ **/*.Server/ModelManifest.xml
362
+ _Pvt_Extensions
363
+
364
+ # Paket dependency manager
365
+ **/.paket/paket.exe
366
+ paket-files/
367
+
368
+ # FAKE - F# Make
369
+ **/.fake/
370
+
371
+ # CodeRush personal settings
372
+ **/.cr/personal
373
+
374
+ # Python Tools for Visual Studio (PTVS)
375
+ **/__pycache__/
376
+ *.pyc
377
+
378
+ # Cake - Uncomment if you are using it
379
+ #tools/**
380
+ #!tools/packages.config
381
+
382
+ # Tabs Studio
383
+ *.tss
384
+
385
+ # Telerik's JustMock configuration file
386
+ *.jmconfig
387
+
388
+ # BizTalk build output
389
+ *.btp.cs
390
+ *.btm.cs
391
+ *.odx.cs
392
+ *.xsd.cs
393
+
394
+ # OpenCover UI analysis results
395
+ OpenCover/
396
+
397
+ # Azure Stream Analytics local run output
398
+ ASALocalRun/
399
+
400
+ # MSBuild Binary and Structured Log
401
+ *.binlog
402
+ MSBuild_Logs/
403
+
404
+ # AWS SAM Build and Temporary Artifacts folder
405
+ .aws-sam
406
+
407
+ # NVIDIA Nsight GPU debugger configuration file
408
+ *.nvuser
409
+
410
+ # MFractors (Xamarin productivity tool) working folder
411
+ **/.mfractor/
412
+
413
+ # Local History for Visual Studio
414
+ **/.localhistory/
415
+
416
+ # Visual Studio History (VSHistory) files
417
+ .vshistory/
418
+
419
+ # BeatPulse healthcheck temp database
420
+ healthchecksdb
421
+
422
+ # Backup folder for Package Reference Convert tool in Visual Studio 2017
423
+ MigrationBackup/
424
+
425
+ # Ionide (cross platform F# VS Code tools) working folder
426
+ **/.ionide/
427
+
428
+ # Fody - auto-generated XML schema
429
+ FodyWeavers.xsd
430
+
431
+ # VS Code files for those working on multiple tools
432
+ .vscode/*
433
+ !.vscode/settings.json
434
+ !.vscode/tasks.json
435
+ !.vscode/launch.json
436
+ !.vscode/extensions.json
437
+ !.vscode/*.code-snippets
438
+
439
+ # Local History for Visual Studio Code
440
+ .history/
441
+
442
+ # Built Visual Studio Code Extensions
443
+ *.vsix
444
+
445
+ # Windows Installer files from build outputs
446
+ *.cab
447
+ *.msi
448
+ *.msix
449
+ *.msm
450
+ *.msp
451
+
452
+ # Token/secret files
453
+ .mcpregistry_*
454
+ *.token
455
+ .env
456
+ .env.*
@@ -0,0 +1,86 @@
1
+ # Agent-SRE — Coding Agent Instructions
2
+
3
+ ## Project Overview
4
+
5
+ Agent-SRE is an **SRE toolkit for AI agent reliability** — providing SLO management, error budgets, chaos engineering, progressive delivery, cost guardrails, incident management, and observability for autonomous AI agents.
6
+
7
+ **Key engines:**
8
+
9
+ - **SLO Engine:** Define and track Service Level Objectives for agent operations
10
+ - **Error Budget Engine:** SRE-style reliability tracking with burn rate alerts
11
+ - **Chaos Engine:** Fault injection and resilience testing for agents
12
+ - **Cost Guard:** Token/API cost tracking and budget enforcement
13
+ - **Progressive Delivery:** Canary deployments, A/B testing for agent versions
14
+ - **Incident Manager:** Automated incident detection, classification, and response
15
+ - **Replay Engine:** Capture and replay agent execution traces
16
+ - **Tracing:** OpenTelemetry semantic conventions for AI agents
17
+
18
+ ## Build & Test Commands
19
+
20
+ ```bash
21
+ # Install dependencies (development mode)
22
+ pip install -e ".[dev]"
23
+
24
+ # Run all tests
25
+ pytest tests/
26
+
27
+ # Run tests with coverage
28
+ pytest tests/ --cov=src/agent_sre --cov-report=html
29
+
30
+ # Type checking
31
+ mypy src/
32
+
33
+ # Lint and format
34
+ ruff check .
35
+ ruff format .
36
+ ```
37
+
38
+ ## Code Style
39
+
40
+ - **Linter:** Ruff (line-length: 100, rules: E, F, W, I, N, UP, B, SIM, TCH)
41
+ - **Type checker:** mypy strict mode (Python 3.10)
42
+ - **Python:** >=3.10
43
+ - **Docstrings:** Google-style
44
+
45
+ ## Key Files
46
+
47
+ | Path | Purpose |
48
+ |------|---------|
49
+ | `src/agent_sre/slo/` | SLO definitions, tracking, burn rate calculation |
50
+ | `src/agent_sre/cost/` | Cost guardrails, token budget tracking |
51
+ | `src/agent_sre/chaos/` | Chaos experiments, fault injection |
52
+ | `src/agent_sre/delivery/` | Canary/progressive delivery |
53
+ | `src/agent_sre/incidents/` | Incident detection and response |
54
+ | `src/agent_sre/replay/` | Trace capture and replay |
55
+ | `src/agent_sre/tracing/` | OpenTelemetry agent conventions |
56
+ | `src/agent_sre/alerts/` | Alert rules and notifications |
57
+ | `src/agent_sre/fleet/` | Fleet-wide agent management |
58
+ | `src/agent_sre/certification/` | Agent certification framework |
59
+ | `deployments/` | Helm charts, Kubernetes manifests |
60
+ | `operator/` | Kubernetes operator for agent-sre |
61
+
62
+ ## Coding Conventions
63
+
64
+ - Error budgets: pure SRE math — availability windows, burn rates, exhaustion forecasting
65
+ - SLOs: YAML/TOML definitions, version-controlled
66
+ - OTEL conventions: custom attributes like `agent.did`, `agent.trust_score`, `agent.task.success`
67
+ - Span kinds: `AGENT_TASK`, `TOOL_CALL`, `LLM_INFERENCE`, `DELEGATION`, `POLICY_CHECK`
68
+ - All metrics follow Prometheus naming conventions
69
+ - Use `dataclass` or Pydantic `BaseModel` for structured data
70
+
71
+ ## Boundaries
72
+
73
+ - **Never commit** secrets, API keys, or cloud credentials
74
+ - **Never modify** deployment configs without testing locally first
75
+ - **Never lower** SLO targets — only raise them
76
+ - Keep backward compatibility with existing metric names and OTEL attributes
77
+
78
+ ## Testing Requirements
79
+
80
+ - All new features must include tests
81
+ - Run `pytest tests/` before committing
82
+ - Use `pytest-asyncio` for async tests (asyncio_mode = "auto")
83
+
84
+ ## Commit Style
85
+
86
+ Use conventional commits: `feat:`, `fix:`, `docs:`, `test:`, `refactor:`, `chore:`