synth-ai 0.2.8.dev2__py3-none-any.whl → 0.4.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (740)
  1. synth_ai/__init__.py +44 -24
  2. synth_ai/__main__.py +30 -3
  3. synth_ai/cli/__init__.py +103 -48
  4. synth_ai/cli/__main__.py +42 -0
  5. synth_ai/cli/_internal/__init__.py +5 -0
  6. synth_ai/cli/_internal/modal_wrapper.py +31 -0
  7. synth_ai/cli/_internal/storage.py +20 -0
  8. synth_ai/cli/_internal/typer_patch.py +47 -0
  9. synth_ai/cli/_internal/validate_task_app.py +29 -0
  10. synth_ai/cli/agents/__init__.py +17 -0
  11. synth_ai/cli/agents/claude.py +77 -0
  12. synth_ai/cli/agents/codex.py +265 -0
  13. synth_ai/cli/agents/opencode.py +253 -0
  14. synth_ai/cli/commands/__init__.py +18 -0
  15. synth_ai/cli/commands/artifacts/__init__.py +13 -0
  16. synth_ai/cli/commands/artifacts/client.py +119 -0
  17. synth_ai/cli/commands/artifacts/config.py +57 -0
  18. synth_ai/cli/commands/artifacts/core.py +24 -0
  19. synth_ai/cli/commands/artifacts/download.py +188 -0
  20. synth_ai/cli/commands/artifacts/export.py +186 -0
  21. synth_ai/cli/commands/artifacts/list.py +156 -0
  22. synth_ai/cli/commands/artifacts/parsing.py +250 -0
  23. synth_ai/cli/commands/artifacts/show.py +336 -0
  24. synth_ai/cli/commands/demo/__init__.py +3 -0
  25. synth_ai/cli/commands/demo/core.py +153 -0
  26. synth_ai/cli/commands/eval/__init__.py +10 -0
  27. synth_ai/cli/commands/eval/config.py +338 -0
  28. synth_ai/cli/commands/eval/core.py +256 -0
  29. synth_ai/cli/commands/eval/runner.py +704 -0
  30. synth_ai/cli/commands/eval/validation.py +60 -0
  31. synth_ai/cli/commands/filter/__init__.py +12 -0
  32. synth_ai/cli/commands/filter/core.py +424 -0
  33. synth_ai/cli/commands/filter/errors.py +55 -0
  34. synth_ai/cli/commands/filter/validation.py +77 -0
  35. synth_ai/cli/commands/help/__init__.py +185 -0
  36. synth_ai/cli/commands/help/core.py +72 -0
  37. synth_ai/cli/commands/scan/__init__.py +19 -0
  38. synth_ai/cli/commands/scan/cloudflare_scanner.py +403 -0
  39. synth_ai/cli/commands/scan/core.py +344 -0
  40. synth_ai/cli/commands/scan/health_checker.py +242 -0
  41. synth_ai/cli/commands/scan/local_scanner.py +278 -0
  42. synth_ai/cli/commands/scan/models.py +83 -0
  43. synth_ai/cli/commands/smoke/__init__.py +7 -0
  44. synth_ai/cli/commands/smoke/core.py +1428 -0
  45. synth_ai/cli/commands/status/__init__.py +3 -0
  46. synth_ai/cli/commands/status/client.py +91 -0
  47. synth_ai/cli/commands/status/config.py +12 -0
  48. synth_ai/cli/commands/status/errors.py +11 -0
  49. synth_ai/cli/commands/status/subcommands/__init__.py +3 -0
  50. synth_ai/cli/commands/status/subcommands/config.py +13 -0
  51. synth_ai/cli/commands/status/subcommands/files.py +34 -0
  52. synth_ai/cli/commands/status/subcommands/jobs.py +51 -0
  53. synth_ai/cli/commands/status/subcommands/models.py +35 -0
  54. synth_ai/cli/commands/status/subcommands/runs.py +34 -0
  55. synth_ai/cli/commands/status/subcommands/session.py +77 -0
  56. synth_ai/cli/commands/status/subcommands/summary.py +39 -0
  57. synth_ai/cli/commands/status/subcommands/utils.py +41 -0
  58. synth_ai/cli/commands/status/utils.py +23 -0
  59. synth_ai/cli/commands/train/__init__.py +53 -0
  60. synth_ai/cli/commands/train/core.py +22 -0
  61. synth_ai/cli/commands/train/errors.py +117 -0
  62. synth_ai/cli/commands/train/judge_schemas.py +201 -0
  63. synth_ai/cli/commands/train/judge_validation.py +305 -0
  64. synth_ai/cli/commands/train/prompt_learning_validation.py +633 -0
  65. synth_ai/cli/commands/train/validation.py +392 -0
  66. synth_ai/cli/demo_apps/__init__.py +10 -0
  67. synth_ai/cli/demo_apps/core/__init__.py +28 -0
  68. synth_ai/{demos → cli/demo_apps}/core/cli.py +783 -441
  69. synth_ai/cli/demo_apps/crafter/__init__.py +1 -0
  70. synth_ai/cli/demo_apps/crafter/crafter_fft_4b.toml +55 -0
  71. synth_ai/cli/demo_apps/crafter/grpo_crafter_task_app.py +186 -0
  72. synth_ai/cli/demo_apps/crafter/rl_from_base_qwen4b.toml +74 -0
  73. synth_ai/cli/demo_apps/demo_registry.py +176 -0
  74. synth_ai/cli/demo_apps/demo_task_apps/__init__.py +7 -0
  75. synth_ai/{demos → cli/demo_apps}/demo_task_apps/core.py +75 -37
  76. synth_ai/cli/demo_apps/demo_task_apps/crafter/__init__.py +1 -0
  77. synth_ai/cli/demo_apps/demo_task_apps/crafter/configs/crafter_fft_4b.toml +53 -0
  78. synth_ai/cli/demo_apps/demo_task_apps/crafter/configs/rl_from_base_qwen4b.toml +73 -0
  79. synth_ai/cli/demo_apps/demo_task_apps/crafter/grpo_crafter_task_app.py +185 -0
  80. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/_common.py +1 -2
  81. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/app.py +2 -1
  82. synth_ai/cli/demo_apps/demo_task_apps/math/config.toml +73 -0
  83. synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/deploy_modal.py +3 -6
  84. synth_ai/cli/demo_apps/demo_task_apps/math/modal_task_app.py +738 -0
  85. synth_ai/cli/demo_apps/demo_task_apps/math/task_app_entry.py +39 -0
  86. synth_ai/cli/demo_apps/math/__init__.py +1 -0
  87. synth_ai/cli/demo_apps/math/_common.py +16 -0
  88. synth_ai/cli/demo_apps/math/app.py +38 -0
  89. synth_ai/cli/demo_apps/math/config.toml +75 -0
  90. synth_ai/cli/demo_apps/math/deploy_modal.py +54 -0
  91. synth_ai/cli/demo_apps/math/modal_task_app.py +698 -0
  92. synth_ai/cli/demo_apps/math/task_app_entry.py +53 -0
  93. synth_ai/cli/demo_apps/mipro/main.py +271 -0
  94. synth_ai/cli/demo_apps/mipro/task_app.py +922 -0
  95. synth_ai/cli/demo_apps/mipro/train_cfg.toml +92 -0
  96. synth_ai/cli/demos/__init__.py +12 -0
  97. synth_ai/cli/demos/demo.py +32 -0
  98. synth_ai/cli/demos/rl_demo.py +254 -0
  99. synth_ai/cli/deploy.py +216 -0
  100. synth_ai/cli/infra/__init__.py +14 -0
  101. synth_ai/cli/{balance.py → infra/balance.py} +16 -4
  102. synth_ai/cli/infra/mcp.py +35 -0
  103. synth_ai/cli/infra/modal_app.py +36 -0
  104. synth_ai/cli/infra/setup.py +69 -0
  105. synth_ai/cli/infra/status.py +16 -0
  106. synth_ai/cli/infra/turso.py +77 -0
  107. synth_ai/cli/lib/__init__.py +10 -0
  108. synth_ai/cli/lib/agents.py +76 -0
  109. synth_ai/cli/lib/apps/modal_app.py +101 -0
  110. synth_ai/cli/lib/apps/task_app.py +642 -0
  111. synth_ai/cli/lib/bin.py +39 -0
  112. synth_ai/cli/lib/env.py +375 -0
  113. synth_ai/cli/lib/errors.py +85 -0
  114. synth_ai/cli/lib/modal.py +315 -0
  115. synth_ai/cli/lib/plotting.py +126 -0
  116. synth_ai/cli/lib/prompt_args.py +39 -0
  117. synth_ai/cli/lib/prompts.py +284 -0
  118. synth_ai/cli/lib/sqld.py +122 -0
  119. synth_ai/cli/lib/task_app_discovery.py +884 -0
  120. synth_ai/cli/lib/task_app_env.py +295 -0
  121. synth_ai/cli/lib/train_cfgs.py +300 -0
  122. synth_ai/cli/lib/tunnel_records.py +207 -0
  123. synth_ai/cli/local/__init__.py +14 -0
  124. synth_ai/cli/local/experiment_queue/__init__.py +72 -0
  125. synth_ai/cli/local/experiment_queue/api_schemas.py +221 -0
  126. synth_ai/cli/local/experiment_queue/celery_app.py +208 -0
  127. synth_ai/cli/local/experiment_queue/config.py +128 -0
  128. synth_ai/cli/local/experiment_queue/config_utils.py +272 -0
  129. synth_ai/cli/local/experiment_queue/database.py +175 -0
  130. synth_ai/cli/local/experiment_queue/dispatcher.py +119 -0
  131. synth_ai/cli/local/experiment_queue/models.py +231 -0
  132. synth_ai/cli/local/experiment_queue/progress_info.py +160 -0
  133. synth_ai/cli/local/experiment_queue/results.py +373 -0
  134. synth_ai/cli/local/experiment_queue/schemas.py +131 -0
  135. synth_ai/cli/local/experiment_queue/service.py +344 -0
  136. synth_ai/cli/local/experiment_queue/status.py +372 -0
  137. synth_ai/cli/local/experiment_queue/status_tracker.py +360 -0
  138. synth_ai/cli/local/experiment_queue/tasks.py +1984 -0
  139. synth_ai/cli/local/experiment_queue/trace_storage.py +65 -0
  140. synth_ai/cli/local/experiment_queue/validation.py +157 -0
  141. synth_ai/cli/local/session/__init__.py +92 -0
  142. synth_ai/cli/local/session/client.py +383 -0
  143. synth_ai/cli/local/session/constants.py +63 -0
  144. synth_ai/cli/local/session/exceptions.py +105 -0
  145. synth_ai/cli/local/session/manager.py +139 -0
  146. synth_ai/cli/local/session/models.py +89 -0
  147. synth_ai/cli/local/session/query.py +110 -0
  148. synth_ai/cli/root.py +150 -108
  149. synth_ai/cli/task_apps/__init__.py +37 -0
  150. synth_ai/cli/task_apps/commands.py +3145 -0
  151. synth_ai/cli/task_apps/deploy.py +7 -0
  152. synth_ai/cli/task_apps/list.py +26 -0
  153. synth_ai/cli/task_apps/main.py +36 -0
  154. synth_ai/cli/task_apps/modal_serve.py +11 -0
  155. synth_ai/cli/task_apps/serve.py +11 -0
  156. synth_ai/cli/training/__init__.py +8 -0
  157. synth_ai/cli/training/train.py +5 -0
  158. synth_ai/cli/training/train_cfg.py +34 -0
  159. synth_ai/cli/{watch.py → training/watch.py} +13 -18
  160. synth_ai/cli/turso.py +52 -0
  161. synth_ai/cli/utils/__init__.py +8 -0
  162. synth_ai/cli/utils/experiments.py +235 -0
  163. synth_ai/cli/utils/queue.py +504 -0
  164. synth_ai/cli/{recent.py → utils/recent.py} +13 -7
  165. synth_ai/cli/{traces.py → utils/traces.py} +9 -5
  166. synth_ai/contracts/__init__.py +67 -0
  167. synth_ai/core/__init__.py +100 -0
  168. synth_ai/core/_utils/__init__.py +54 -0
  169. synth_ai/core/_utils/base_url.py +10 -0
  170. synth_ai/core/_utils/http.py +10 -0
  171. synth_ai/core/_utils/prompts.py +14 -0
  172. synth_ai/core/_utils/task_app_state.py +12 -0
  173. synth_ai/core/_utils/user_config.py +10 -0
  174. synth_ai/core/apps/common.py +116 -0
  175. synth_ai/core/auth.py +95 -0
  176. synth_ai/core/cfgs.py +240 -0
  177. synth_ai/core/config/__init__.py +16 -0
  178. synth_ai/core/config/base.py +168 -0
  179. synth_ai/core/config/resolver.py +89 -0
  180. synth_ai/core/env.py +231 -0
  181. synth_ai/core/errors.py +126 -0
  182. synth_ai/core/http.py +230 -0
  183. synth_ai/core/integrations/__init__.py +11 -0
  184. synth_ai/core/integrations/cloudflare.py +1710 -0
  185. synth_ai/core/integrations/mcp/__init__.py +6 -0
  186. synth_ai/core/integrations/mcp/__main__.py +8 -0
  187. synth_ai/core/integrations/mcp/claude.py +36 -0
  188. synth_ai/core/integrations/mcp/main.py +254 -0
  189. synth_ai/core/integrations/mcp/setup.py +100 -0
  190. synth_ai/core/integrations/modal.py +277 -0
  191. synth_ai/core/json.py +72 -0
  192. synth_ai/core/log_filter.py +99 -0
  193. synth_ai/core/logging.py +82 -0
  194. synth_ai/core/paths.py +107 -0
  195. synth_ai/core/pricing.py +109 -0
  196. synth_ai/core/process.py +233 -0
  197. synth_ai/core/ssl.py +25 -0
  198. synth_ai/core/storage/__init__.py +71 -0
  199. synth_ai/core/task_app_state.py +318 -0
  200. synth_ai/core/telemetry.py +282 -0
  201. synth_ai/{tracing_v3 → core/tracing_v3}/__init__.py +5 -1
  202. synth_ai/{tracing_v3 → core/tracing_v3}/abstractions.py +21 -4
  203. synth_ai/core/tracing_v3/config.py +229 -0
  204. synth_ai/core/tracing_v3/constants.py +21 -0
  205. synth_ai/{tracing_v3 → core/tracing_v3}/db_config.py +42 -29
  206. synth_ai/{tracing_v3 → core/tracing_v3}/decorators.py +80 -45
  207. synth_ai/{tracing_v3 → core/tracing_v3}/examples/basic_usage.py +15 -9
  208. synth_ai/{tracing_v3 → core/tracing_v3}/hooks.py +6 -4
  209. synth_ai/{tracing_v3 → core/tracing_v3}/llm_call_record_helpers.py +161 -61
  210. synth_ai/{tracing_v3 → core/tracing_v3}/migration_helper.py +1 -2
  211. synth_ai/{tracing_v3 → core/tracing_v3}/replica_sync.py +12 -7
  212. synth_ai/core/tracing_v3/serialization.py +130 -0
  213. synth_ai/{tracing_v3 → core/tracing_v3}/session_tracer.py +88 -21
  214. synth_ai/{tracing_v3 → core/tracing_v3}/storage/base.py +99 -12
  215. synth_ai/core/tracing_v3/storage/config.py +109 -0
  216. synth_ai/{tracing_v3 → core/tracing_v3}/storage/factory.py +11 -9
  217. synth_ai/{tracing_v3 → core/tracing_v3}/storage/utils.py +15 -11
  218. synth_ai/core/tracing_v3/trace_utils.py +326 -0
  219. synth_ai/core/tracing_v3/turso/__init__.py +12 -0
  220. synth_ai/core/tracing_v3/turso/daemon.py +278 -0
  221. synth_ai/{tracing_v3 → core/tracing_v3}/turso/models.py +7 -3
  222. synth_ai/core/tracing_v3/turso/native_manager.py +1385 -0
  223. synth_ai/{tracing_v3 → core/tracing_v3}/utils.py +5 -4
  224. synth_ai/core/urls.py +18 -0
  225. synth_ai/core/user_config.py +137 -0
  226. synth_ai/core/uvicorn.py +222 -0
  227. synth_ai/data/__init__.py +83 -0
  228. synth_ai/data/enums.py +123 -0
  229. synth_ai/data/rewards.py +152 -0
  230. synth_ai/data/traces.py +35 -0
  231. synth_ai/products/__init__.py +6 -0
  232. synth_ai/products/graph_evolve/__init__.py +46 -0
  233. synth_ai/products/graph_evolve/client.py +226 -0
  234. synth_ai/products/graph_evolve/config.py +591 -0
  235. synth_ai/products/graph_evolve/converters/__init__.py +42 -0
  236. synth_ai/products/graph_evolve/converters/openai_sft.py +484 -0
  237. synth_ai/products/graph_evolve/examples/hotpotqa/config.toml +109 -0
  238. synth_ai/products/graph_evolve/run.py +222 -0
  239. synth_ai/products/graph_gepa/__init__.py +23 -0
  240. synth_ai/products/graph_gepa/converters/__init__.py +19 -0
  241. synth_ai/products/graph_gepa/converters/openai_sft.py +29 -0
  242. synth_ai/sdk/__init__.py +123 -0
  243. synth_ai/sdk/api/__init__.py +1 -0
  244. synth_ai/sdk/api/models/supported.py +514 -0
  245. synth_ai/sdk/api/research_agent/__init__.py +296 -0
  246. synth_ai/sdk/api/train/__init__.py +85 -0
  247. synth_ai/sdk/api/train/builders.py +895 -0
  248. synth_ai/sdk/api/train/cli.py +2199 -0
  249. synth_ai/sdk/api/train/config_finder.py +267 -0
  250. synth_ai/sdk/api/train/configs/__init__.py +65 -0
  251. synth_ai/sdk/api/train/configs/prompt_learning.py +1706 -0
  252. synth_ai/sdk/api/train/configs/rl.py +187 -0
  253. synth_ai/sdk/api/train/configs/sft.py +99 -0
  254. synth_ai/sdk/api/train/configs/shared.py +81 -0
  255. synth_ai/sdk/api/train/context_learning.py +312 -0
  256. synth_ai/sdk/api/train/env_resolver.py +418 -0
  257. synth_ai/sdk/api/train/graph_validators.py +216 -0
  258. synth_ai/sdk/api/train/graphgen.py +984 -0
  259. synth_ai/sdk/api/train/graphgen_models.py +823 -0
  260. synth_ai/sdk/api/train/graphgen_validators.py +109 -0
  261. synth_ai/sdk/api/train/local_api.py +10 -0
  262. synth_ai/sdk/api/train/pollers.py +124 -0
  263. synth_ai/sdk/api/train/progress/__init__.py +97 -0
  264. synth_ai/sdk/api/train/progress/dataclasses.py +569 -0
  265. synth_ai/sdk/api/train/progress/events.py +326 -0
  266. synth_ai/sdk/api/train/progress/results.py +428 -0
  267. synth_ai/sdk/api/train/progress/tracker.py +641 -0
  268. synth_ai/sdk/api/train/prompt_learning.py +469 -0
  269. synth_ai/sdk/api/train/rl.py +441 -0
  270. synth_ai/sdk/api/train/sft.py +396 -0
  271. synth_ai/sdk/api/train/summary.py +522 -0
  272. synth_ai/sdk/api/train/supported_algos.py +147 -0
  273. synth_ai/sdk/api/train/task_app.py +351 -0
  274. synth_ai/sdk/api/train/utils.py +279 -0
  275. synth_ai/sdk/api/train/validators.py +2424 -0
  276. synth_ai/sdk/graphs/__init__.py +15 -0
  277. synth_ai/sdk/graphs/completions.py +570 -0
  278. synth_ai/{inference → sdk/inference}/__init__.py +0 -1
  279. synth_ai/sdk/inference/client.py +128 -0
  280. synth_ai/sdk/jobs/__init__.py +16 -0
  281. synth_ai/sdk/jobs/client.py +371 -0
  282. synth_ai/sdk/judging/__init__.py +14 -0
  283. synth_ai/sdk/judging/base.py +24 -0
  284. synth_ai/sdk/judging/client.py +40 -0
  285. synth_ai/sdk/judging/schemas.py +222 -0
  286. synth_ai/sdk/judging/types.py +42 -0
  287. synth_ai/sdk/learning/__init__.py +99 -0
  288. synth_ai/sdk/learning/algorithms.py +14 -0
  289. synth_ai/{learning → sdk/learning}/client.py +121 -30
  290. synth_ai/sdk/learning/config.py +5 -0
  291. synth_ai/{learning → sdk/learning}/constants.py +0 -2
  292. synth_ai/sdk/learning/context_learning_client.py +531 -0
  293. synth_ai/sdk/learning/context_learning_types.py +292 -0
  294. synth_ai/sdk/learning/ft_client.py +7 -0
  295. synth_ai/{learning → sdk/learning}/health.py +15 -9
  296. synth_ai/{learning → sdk/learning}/jobs.py +44 -47
  297. synth_ai/sdk/learning/prompt_extraction.py +334 -0
  298. synth_ai/sdk/learning/prompt_learning_client.py +455 -0
  299. synth_ai/sdk/learning/prompt_learning_types.py +186 -0
  300. synth_ai/{rl → sdk/learning/rl}/__init__.py +13 -8
  301. synth_ai/{learning/rl_client.py → sdk/learning/rl/client.py} +89 -77
  302. synth_ai/sdk/learning/rl/config.py +31 -0
  303. synth_ai/{rl → sdk/learning/rl}/contracts.py +5 -14
  304. synth_ai/{rl → sdk/learning/rl}/env_keys.py +45 -16
  305. synth_ai/sdk/learning/rl/secrets.py +13 -0
  306. synth_ai/sdk/learning/rl_client.py +5 -0
  307. synth_ai/sdk/learning/sft/__init__.py +29 -0
  308. synth_ai/sdk/learning/sft/client.py +95 -0
  309. synth_ai/sdk/learning/sft/config.py +270 -0
  310. synth_ai/sdk/learning/sft/data.py +698 -0
  311. synth_ai/sdk/learning/sse.py +57 -0
  312. synth_ai/sdk/learning/validators.py +52 -0
  313. synth_ai/sdk/localapi/__init__.py +40 -0
  314. synth_ai/sdk/localapi/apps/__init__.py +28 -0
  315. synth_ai/sdk/localapi/client.py +10 -0
  316. synth_ai/sdk/localapi/contracts.py +10 -0
  317. synth_ai/sdk/localapi/helpers.py +519 -0
  318. synth_ai/sdk/localapi/rollouts.py +87 -0
  319. synth_ai/sdk/localapi/server.py +29 -0
  320. synth_ai/sdk/localapi/template.py +70 -0
  321. synth_ai/sdk/streaming/__init__.py +35 -0
  322. synth_ai/sdk/streaming/config.py +94 -0
  323. synth_ai/sdk/streaming/handlers.py +1997 -0
  324. synth_ai/sdk/streaming/streamer.py +713 -0
  325. synth_ai/sdk/streaming/types.py +112 -0
  326. synth_ai/sdk/task/__init__.py +164 -0
  327. synth_ai/sdk/task/apps/__init__.py +169 -0
  328. synth_ai/sdk/task/auth.py +165 -0
  329. synth_ai/sdk/task/client.py +175 -0
  330. synth_ai/sdk/task/config.py +257 -0
  331. synth_ai/sdk/task/contracts.py +219 -0
  332. synth_ai/sdk/task/datasets.py +108 -0
  333. synth_ai/sdk/task/errors.py +50 -0
  334. synth_ai/sdk/task/health.py +34 -0
  335. synth_ai/sdk/task/in_process.py +1190 -0
  336. synth_ai/sdk/task/in_process_runner.py +314 -0
  337. synth_ai/sdk/task/inference_api.py +299 -0
  338. synth_ai/sdk/task/json.py +111 -0
  339. synth_ai/sdk/task/proxy.py +287 -0
  340. synth_ai/sdk/task/rubrics/__init__.py +55 -0
  341. synth_ai/sdk/task/rubrics/loaders.py +156 -0
  342. synth_ai/sdk/task/rubrics/models.py +57 -0
  343. synth_ai/sdk/task/rubrics/scoring.py +116 -0
  344. synth_ai/sdk/task/rubrics/strict.py +149 -0
  345. synth_ai/sdk/task/rubrics.py +219 -0
  346. synth_ai/sdk/task/server.py +631 -0
  347. synth_ai/sdk/task/trace_correlation_helpers.py +539 -0
  348. synth_ai/sdk/task/tracing_utils.py +95 -0
  349. synth_ai/sdk/task/validators.py +441 -0
  350. synth_ai/sdk/task/vendors.py +59 -0
  351. synth_ai/sdk/training/__init__.py +102 -0
  352. synth_ai/sdk/tunnels/__init__.py +83 -0
  353. synth_ai/sdk/tunnels/cleanup.py +83 -0
  354. synth_ai/sdk/tunnels/ports.py +120 -0
  355. synth_ai/utils/__init__.py +213 -0
  356. synth_ai-0.4.3.dist-info/METADATA +262 -0
  357. synth_ai-0.4.3.dist-info/RECORD +370 -0
  358. {synth_ai-0.2.8.dev2.dist-info → synth_ai-0.4.3.dist-info}/entry_points.txt +0 -1
  359. synth_ai/cli/calc.py +0 -69
  360. synth_ai/cli/demo.py +0 -144
  361. synth_ai/cli/legacy_root_backup.py +0 -470
  362. synth_ai/cli/man.py +0 -106
  363. synth_ai/cli/rl_demo.py +0 -202
  364. synth_ai/cli/status.py +0 -133
  365. synth_ai/config/base_url.py +0 -107
  366. synth_ai/core/experiment.py +0 -15
  367. synth_ai/core/system.py +0 -15
  368. synth_ai/demos/core/__init__.py +0 -1
  369. synth_ai/demos/demo_task_apps/__init__.py +0 -1
  370. synth_ai/demos/demo_task_apps/math/config.toml +0 -129
  371. synth_ai/demos/demo_task_apps/math/deploy_task_app.sh +0 -22
  372. synth_ai/demos/demo_task_apps/math/modal_task_app.py +0 -415
  373. synth_ai/environments/__init__.py +0 -31
  374. synth_ai/environments/environment/__init__.py +0 -1
  375. synth_ai/environments/environment/artifacts/__init__.py +0 -1
  376. synth_ai/environments/environment/artifacts/base.py +0 -52
  377. synth_ai/environments/environment/core.py +0 -67
  378. synth_ai/environments/environment/db/__init__.py +0 -1
  379. synth_ai/environments/environment/db/sqlite.py +0 -45
  380. synth_ai/environments/environment/registry.py +0 -233
  381. synth_ai/environments/environment/resources/sqlite.py +0 -45
  382. synth_ai/environments/environment/results.py +0 -1
  383. synth_ai/environments/environment/rewards/__init__.py +0 -1
  384. synth_ai/environments/environment/rewards/core.py +0 -29
  385. synth_ai/environments/environment/shared_engine.py +0 -26
  386. synth_ai/environments/environment/tools/__init__.py +0 -200
  387. synth_ai/environments/examples/__init__.py +0 -1
  388. synth_ai/environments/examples/bandit/__init__.py +0 -33
  389. synth_ai/environments/examples/bandit/engine.py +0 -294
  390. synth_ai/environments/examples/bandit/environment.py +0 -194
  391. synth_ai/environments/examples/bandit/taskset.py +0 -200
  392. synth_ai/environments/examples/crafter_classic/__init__.py +0 -8
  393. synth_ai/environments/examples/crafter_classic/agent_demos/analyze_semantic_words_markdown.py +0 -250
  394. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_comprehensive_evaluation.py +0 -59
  395. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_browser.py +0 -152
  396. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_config.toml +0 -24
  397. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_evaluation_framework.py +0 -1194
  398. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/crafter_synth_config.toml +0 -56
  399. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_config_modal.toml +0 -32
  400. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/filter_traces_sft_turso.py +0 -738
  401. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/kick_off_ft_modal.py +0 -384
  402. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_action_results.py +0 -53
  403. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_agent_actions.py +0 -178
  404. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_latest_run.py +0 -222
  405. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_lm_traces.py +0 -183
  406. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_no_rewards.py +0 -210
  407. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/analyze_trace_issue.py +0 -206
  408. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_db_schema.py +0 -49
  409. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/check_latest_results.py +0 -64
  410. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/debug_agent_responses.py +0 -88
  411. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_modal_ft/old/quick_trace_check.py +0 -77
  412. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/compare_experiments.py +0 -324
  413. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/filter_traces_sft_turso.py +0 -580
  414. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/kick_off_ft_oai.py +0 -362
  415. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/multi_model_config.toml +0 -49
  416. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_enhanced_hooks.py +0 -332
  417. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_events.py +0 -97
  418. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/analyze_hook_results.py +0 -217
  419. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_hook_storage.py +0 -87
  420. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/check_seeds.py +0 -88
  421. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/compare_seed_performance.py +0 -195
  422. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/custom_eval_pipelines.py +0 -400
  423. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/plot_hook_frequency.py +0 -195
  424. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/old/seed_analysis_summary.py +0 -56
  425. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_openai_ft/run_rollouts_for_models_and_compare_v3.py +0 -858
  426. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_quick_evaluation.py +0 -52
  427. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_react_agent.py +0 -874
  428. synth_ai/environments/examples/crafter_classic/agent_demos/crafter_trace_evaluation.py +0 -1412
  429. synth_ai/environments/examples/crafter_classic/agent_demos/example_v3_usage.py +0 -216
  430. synth_ai/environments/examples/crafter_classic/agent_demos/old/compare_traces.py +0 -296
  431. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_comprehensive_evaluation.py +0 -58
  432. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_env_serialization.py +0 -464
  433. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_evaluation_browser.py +0 -152
  434. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_quick_evaluation.py +0 -51
  435. synth_ai/environments/examples/crafter_classic/agent_demos/old/crafter_trace_evaluation.py +0 -1412
  436. synth_ai/environments/examples/crafter_classic/agent_demos/old/debug_player_loss.py +0 -112
  437. synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_service.py +0 -203
  438. synth_ai/environments/examples/crafter_classic/agent_demos/old/diagnose_slowness.py +0 -305
  439. synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_by_difficulty.py +0 -126
  440. synth_ai/environments/examples/crafter_classic/agent_demos/old/eval_example.py +0 -94
  441. synth_ai/environments/examples/crafter_classic/agent_demos/old/explore_saved_states.py +0 -142
  442. synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft.py +0 -26
  443. synth_ai/environments/examples/crafter_classic/agent_demos/old/filter_traces_sft_OLD.py +0 -984
  444. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_gemini.py +0 -724
  445. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_data_modal.py +0 -386
  446. synth_ai/environments/examples/crafter_classic/agent_demos/old/generate_ft_metadata.py +0 -205
  447. synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_gemini.py +0 -150
  448. synth_ai/environments/examples/crafter_classic/agent_demos/old/kick_off_ft_modal.py +0 -283
  449. synth_ai/environments/examples/crafter_classic/agent_demos/old/prepare_vertex_ft.py +0 -280
  450. synth_ai/environments/examples/crafter_classic/agent_demos/old/profile_env_slowness.py +0 -456
  451. synth_ai/environments/examples/crafter_classic/agent_demos/old/replicate_issue.py +0 -166
  452. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_and_eval.py +0 -102
  453. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_comparison.py +0 -128
  454. synth_ai/environments/examples/crafter_classic/agent_demos/old/run_qwen_rollouts.py +0 -655
  455. synth_ai/environments/examples/crafter_classic/agent_demos/old/trace_eval_OLD.py +0 -202
  456. synth_ai/environments/examples/crafter_classic/agent_demos/old/validate_openai_format.py +0 -166
  457. synth_ai/environments/examples/crafter_classic/config_logging.py +0 -111
  458. synth_ai/environments/examples/crafter_classic/debug_translation.py +0 -0
  459. synth_ai/environments/examples/crafter_classic/engine.py +0 -579
  460. synth_ai/environments/examples/crafter_classic/engine_deterministic_patch.py +0 -64
  461. synth_ai/environments/examples/crafter_classic/engine_helpers/action_map.py +0 -6
  462. synth_ai/environments/examples/crafter_classic/engine_helpers/serialization.py +0 -75
  463. synth_ai/environments/examples/crafter_classic/engine_serialization_patch_v3.py +0 -267
  464. synth_ai/environments/examples/crafter_classic/environment.py +0 -404
  465. synth_ai/environments/examples/crafter_classic/taskset.py +0 -233
  466. synth_ai/environments/examples/crafter_classic/trace_hooks_v3.py +0 -228
  467. synth_ai/environments/examples/crafter_classic/world_config_patch_simple.py +0 -299
  468. synth_ai/environments/examples/crafter_custom/__init__.py +0 -4
  469. synth_ai/environments/examples/crafter_custom/agent_demos/__init__.py +0 -1
  470. synth_ai/environments/examples/crafter_custom/agent_demos/trace_eval.py +0 -202
  471. synth_ai/environments/examples/crafter_custom/crafter/__init__.py +0 -7
  472. synth_ai/environments/examples/crafter_custom/crafter/config.py +0 -182
  473. synth_ai/environments/examples/crafter_custom/crafter/constants.py +0 -8
  474. synth_ai/environments/examples/crafter_custom/crafter/engine.py +0 -269
  475. synth_ai/environments/examples/crafter_custom/crafter/env.py +0 -262
  476. synth_ai/environments/examples/crafter_custom/crafter/objects.py +0 -417
  477. synth_ai/environments/examples/crafter_custom/crafter/recorder.py +0 -187
  478. synth_ai/environments/examples/crafter_custom/crafter/worldgen.py +0 -118
  479. synth_ai/environments/examples/crafter_custom/dataset_builder.py +0 -373
  480. synth_ai/environments/examples/crafter_custom/environment.py +0 -312
  481. synth_ai/environments/examples/crafter_custom/old/analyze_diamond_issue.py +0 -159
  482. synth_ai/environments/examples/crafter_custom/old/analyze_diamond_spawning.py +0 -158
  483. synth_ai/environments/examples/crafter_custom/old/compare_worlds.py +0 -71
  484. synth_ai/environments/examples/crafter_custom/old/dataset_stats.py +0 -105
  485. synth_ai/environments/examples/crafter_custom/old/diamond_spawning_summary.py +0 -119
  486. synth_ai/environments/examples/crafter_custom/old/example_dataset_usage.py +0 -52
  487. synth_ai/environments/examples/crafter_custom/run_dataset.py +0 -305
  488. synth_ai/environments/examples/enron/art_helpers/email_search_tools.py +0 -156
  489. synth_ai/environments/examples/enron/art_helpers/local_email_db.py +0 -281
  490. synth_ai/environments/examples/enron/art_helpers/types_enron.py +0 -25
  491. synth_ai/environments/examples/enron/engine.py +0 -295
  492. synth_ai/environments/examples/enron/environment.py +0 -166
  493. synth_ai/environments/examples/enron/taskset.py +0 -112
  494. synth_ai/environments/examples/enron/units/keyword_stats.py +0 -112
  495. synth_ai/environments/examples/minigrid/__init__.py +0 -48
  496. synth_ai/environments/examples/minigrid/agent_demos/minigrid_evaluation_framework.py +0 -1188
  497. synth_ai/environments/examples/minigrid/agent_demos/minigrid_quick_evaluation.py +0 -48
  498. synth_ai/environments/examples/minigrid/agent_demos/minigrid_react_agent.py +0 -562
  499. synth_ai/environments/examples/minigrid/agent_demos/minigrid_trace_evaluation.py +0 -221
  500. synth_ai/environments/examples/minigrid/engine.py +0 -589
  501. synth_ai/environments/examples/minigrid/environment.py +0 -274
  502. synth_ai/environments/examples/minigrid/environment_mapping.py +0 -242
  503. synth_ai/environments/examples/minigrid/puzzle_loader.py +0 -417
  504. synth_ai/environments/examples/minigrid/taskset.py +0 -583
  505. synth_ai/environments/examples/nethack/__init__.py +0 -7
  506. synth_ai/environments/examples/nethack/achievements.py +0 -337
  507. synth_ai/environments/examples/nethack/agent_demos/nethack_evaluation_framework.py +0 -981
  508. synth_ai/environments/examples/nethack/agent_demos/nethack_quick_evaluation.py +0 -74
  509. synth_ai/environments/examples/nethack/agent_demos/nethack_react_agent.py +0 -831
  510. synth_ai/environments/examples/nethack/engine.py +0 -739
  511. synth_ai/environments/examples/nethack/environment.py +0 -256
  512. synth_ai/environments/examples/nethack/helpers/__init__.py +0 -41
  513. synth_ai/environments/examples/nethack/helpers/action_mapping.py +0 -301
  514. synth_ai/environments/examples/nethack/helpers/nle_wrapper.py +0 -402
  515. synth_ai/environments/examples/nethack/helpers/observation_utils.py +0 -433
  516. synth_ai/environments/examples/nethack/helpers/recording_wrapper.py +0 -200
  517. synth_ai/environments/examples/nethack/helpers/trajectory_recorder.py +0 -269
  518. synth_ai/environments/examples/nethack/helpers/visualization/replay_viewer.py +0 -308
  519. synth_ai/environments/examples/nethack/helpers/visualization/visualizer.py +0 -431
  520. synth_ai/environments/examples/nethack/taskset.py +0 -323
  521. synth_ai/environments/examples/red/__init__.py +0 -7
  522. synth_ai/environments/examples/red/agent_demos/__init__.py +0 -1
  523. synth_ai/environments/examples/red/config_logging.py +0 -110
  524. synth_ai/environments/examples/red/engine.py +0 -694
  525. synth_ai/environments/examples/red/engine_helpers/__init__.py +0 -1
  526. synth_ai/environments/examples/red/engine_helpers/memory_map.py +0 -28
  527. synth_ai/environments/examples/red/engine_helpers/reward_components.py +0 -276
  528. synth_ai/environments/examples/red/engine_helpers/reward_library/__init__.py +0 -142
  529. synth_ai/environments/examples/red/engine_helpers/reward_library/adaptive_rewards.py +0 -57
  530. synth_ai/environments/examples/red/engine_helpers/reward_library/battle_rewards.py +0 -284
  531. synth_ai/environments/examples/red/engine_helpers/reward_library/composite_rewards.py +0 -150
  532. synth_ai/environments/examples/red/engine_helpers/reward_library/economy_rewards.py +0 -138
  533. synth_ai/environments/examples/red/engine_helpers/reward_library/efficiency_rewards.py +0 -57
  534. synth_ai/environments/examples/red/engine_helpers/reward_library/exploration_rewards.py +0 -331
  535. synth_ai/environments/examples/red/engine_helpers/reward_library/novelty_rewards.py +0 -121
  536. synth_ai/environments/examples/red/engine_helpers/reward_library/pallet_town_rewards.py +0 -559
  537. synth_ai/environments/examples/red/engine_helpers/reward_library/pokemon_rewards.py +0 -313
  538. synth_ai/environments/examples/red/engine_helpers/reward_library/social_rewards.py +0 -148
  539. synth_ai/environments/examples/red/engine_helpers/reward_library/story_rewards.py +0 -247
  540. synth_ai/environments/examples/red/engine_helpers/screen_analysis.py +0 -368
  541. synth_ai/environments/examples/red/engine_helpers/state_extraction.py +0 -140
  542. synth_ai/environments/examples/red/environment.py +0 -238
  543. synth_ai/environments/examples/red/taskset.py +0 -79
  544. synth_ai/environments/examples/red/units/__init__.py +0 -1
  545. synth_ai/environments/examples/sokoban/__init__.py +0 -1
  546. synth_ai/environments/examples/sokoban/agent_demos/sokoban_full_eval.py +0 -899
  547. synth_ai/environments/examples/sokoban/engine.py +0 -678
  548. synth_ai/environments/examples/sokoban/engine_helpers/__init__.py +0 -1
  549. synth_ai/environments/examples/sokoban/engine_helpers/room_utils.py +0 -657
  550. synth_ai/environments/examples/sokoban/engine_helpers/vendored/__init__.py +0 -18
  551. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/__init__.py +0 -3
  552. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/boxoban_env.py +0 -131
  553. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/render_utils.py +0 -370
  554. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/room_utils.py +0 -332
  555. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env.py +0 -306
  556. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_fixed_targets.py +0 -67
  557. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_pull.py +0 -115
  558. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_two_player.py +0 -123
  559. synth_ai/environments/examples/sokoban/engine_helpers/vendored/envs/sokoban_env_variations.py +0 -394
  560. synth_ai/environments/examples/sokoban/environment.py +0 -229
  561. synth_ai/environments/examples/sokoban/generate_verified_puzzles.py +0 -440
  562. synth_ai/environments/examples/sokoban/puzzle_loader.py +0 -312
  563. synth_ai/environments/examples/sokoban/taskset.py +0 -428
  564. synth_ai/environments/examples/sokoban/units/astar_common.py +0 -95
  565. synth_ai/environments/examples/tictactoe/__init__.py +0 -1
  566. synth_ai/environments/examples/tictactoe/engine.py +0 -368
  567. synth_ai/environments/examples/tictactoe/environment.py +0 -240
  568. synth_ai/environments/examples/tictactoe/taskset.py +0 -215
  569. synth_ai/environments/examples/verilog/__init__.py +0 -10
  570. synth_ai/environments/examples/verilog/engine.py +0 -329
  571. synth_ai/environments/examples/verilog/environment.py +0 -350
  572. synth_ai/environments/examples/verilog/taskset.py +0 -420
  573. synth_ai/environments/examples/wordle/__init__.py +0 -29
  574. synth_ai/environments/examples/wordle/engine.py +0 -398
  575. synth_ai/environments/examples/wordle/environment.py +0 -159
  576. synth_ai/environments/examples/wordle/helpers/generate_instances_wordfreq.py +0 -75
  577. synth_ai/environments/examples/wordle/taskset.py +0 -230
  578. synth_ai/environments/reproducibility/core.py +0 -42
  579. synth_ai/environments/reproducibility/helpers.py +0 -0
  580. synth_ai/environments/reproducibility/tree.py +0 -364
  581. synth_ai/environments/service/app.py +0 -98
  582. synth_ai/environments/service/core_routes.py +0 -1020
  583. synth_ai/environments/service/external_registry.py +0 -56
  584. synth_ai/environments/service/registry.py +0 -9
  585. synth_ai/environments/stateful/__init__.py +0 -1
  586. synth_ai/environments/stateful/core.py +0 -163
  587. synth_ai/environments/stateful/engine.py +0 -21
  588. synth_ai/environments/stateful/state.py +0 -7
  589. synth_ai/environments/tasks/api.py +0 -19
  590. synth_ai/environments/tasks/core.py +0 -80
  591. synth_ai/environments/tasks/filters.py +0 -41
  592. synth_ai/environments/tasks/utils.py +0 -91
  593. synth_ai/environments/v0_observability/history.py +0 -3
  594. synth_ai/environments/v0_observability/log.py +0 -2
  595. synth_ai/evals/base.py +0 -15
  596. synth_ai/experimental/synth_oss.py +0 -446
  597. synth_ai/handshake.py +0 -63
  598. synth_ai/http.py +0 -26
  599. synth_ai/http_client.py +0 -104
  600. synth_ai/inference/client.py +0 -20
  601. synth_ai/install_sqld.sh +0 -40
  602. synth_ai/jobs/client.py +0 -246
  603. synth_ai/learning/__init__.py +0 -24
  604. synth_ai/learning/config.py +0 -43
  605. synth_ai/learning/filtering.py +0 -0
  606. synth_ai/learning/ft_client.py +0 -59
  607. synth_ai/learning/offline/dpo.py +0 -0
  608. synth_ai/learning/offline/providers.py +0 -7
  609. synth_ai/learning/offline/sft.py +0 -0
  610. synth_ai/learning/offline/shared.py +0 -0
  611. synth_ai/learning/online/grpo.py +0 -0
  612. synth_ai/learning/online/irft.py +0 -0
  613. synth_ai/learning/prompts/banking77_injection_eval.py +0 -168
  614. synth_ai/learning/prompts/gepa.py +0 -0
  615. synth_ai/learning/prompts/hello_world_in_context_injection_ex.py +0 -213
  616. synth_ai/learning/prompts/mipro.py +0 -289
  617. synth_ai/learning/prompts/random_search.py +0 -246
  618. synth_ai/learning/prompts/run_mipro_banking77.py +0 -172
  619. synth_ai/learning/prompts/run_random_search_banking77.py +0 -324
  620. synth_ai/learning/sse.py +0 -58
  621. synth_ai/learning/validators.py +0 -48
  622. synth_ai/lm/__init__.py +0 -51
  623. synth_ai/lm/caching/constants.py +0 -6
  624. synth_ai/lm/caching/dbs.py +0 -0
  625. synth_ai/lm/caching/ephemeral.py +0 -102
  626. synth_ai/lm/caching/handler.py +0 -137
  627. synth_ai/lm/caching/initialize.py +0 -11
  628. synth_ai/lm/caching/persistent.py +0 -114
  629. synth_ai/lm/config.py +0 -110
  630. synth_ai/lm/constants.py +0 -32
  631. synth_ai/lm/core/__init__.py +0 -8
  632. synth_ai/lm/core/all.py +0 -73
  633. synth_ai/lm/core/exceptions.py +0 -7
  634. synth_ai/lm/core/main.py +0 -319
  635. synth_ai/lm/core/main_v3.py +0 -594
  636. synth_ai/lm/core/synth_models.py +0 -48
  637. synth_ai/lm/core/vendor_clients.py +0 -188
  638. synth_ai/lm/cost/__init__.py +0 -0
  639. synth_ai/lm/cost/monitor.py +0 -1
  640. synth_ai/lm/cost/statefulness.py +0 -1
  641. synth_ai/lm/injection.py +0 -80
  642. synth_ai/lm/overrides.py +0 -206
  643. synth_ai/lm/provider_support/__init__.py +0 -8
  644. synth_ai/lm/provider_support/anthropic.py +0 -972
  645. synth_ai/lm/provider_support/openai.py +0 -1139
  646. synth_ai/lm/provider_support/suppress_logging.py +0 -31
  647. synth_ai/lm/structured_outputs/__init__.py +0 -0
  648. synth_ai/lm/structured_outputs/handler.py +0 -440
  649. synth_ai/lm/structured_outputs/inject.py +0 -297
  650. synth_ai/lm/structured_outputs/rehabilitate.py +0 -185
  651. synth_ai/lm/tools/__init__.py +0 -3
  652. synth_ai/lm/tools/base.py +0 -172
  653. synth_ai/lm/unified_interface.py +0 -202
  654. synth_ai/lm/vendors/__init__.py +0 -0
  655. synth_ai/lm/vendors/base.py +0 -81
  656. synth_ai/lm/vendors/core/__init__.py +0 -0
  657. synth_ai/lm/vendors/core/anthropic_api.py +0 -387
  658. synth_ai/lm/vendors/core/gemini_api.py +0 -292
  659. synth_ai/lm/vendors/core/mistral_api.py +0 -322
  660. synth_ai/lm/vendors/core/openai_api.py +0 -225
  661. synth_ai/lm/vendors/core/synth_dev_api.py +0 -0
  662. synth_ai/lm/vendors/local/__init__.py +0 -0
  663. synth_ai/lm/vendors/local/ollama.py +0 -0
  664. synth_ai/lm/vendors/openai_standard.py +0 -780
  665. synth_ai/lm/vendors/openai_standard_responses.py +0 -256
  666. synth_ai/lm/vendors/retries.py +0 -22
  667. synth_ai/lm/vendors/supported/__init__.py +0 -0
  668. synth_ai/lm/vendors/supported/custom_endpoint.py +0 -417
  669. synth_ai/lm/vendors/supported/deepseek.py +0 -69
  670. synth_ai/lm/vendors/supported/grok.py +0 -75
  671. synth_ai/lm/vendors/supported/groq.py +0 -16
  672. synth_ai/lm/vendors/supported/ollama.py +0 -15
  673. synth_ai/lm/vendors/supported/openrouter.py +0 -74
  674. synth_ai/lm/vendors/supported/together.py +0 -11
  675. synth_ai/lm/vendors/synth_client.py +0 -808
  676. synth_ai/lm/warmup.py +0 -186
  677. synth_ai/rl/secrets.py +0 -19
  678. synth_ai/scripts/verify_rewards.py +0 -100
  679. synth_ai/task/__init__.py +0 -10
  680. synth_ai/task/contracts.py +0 -120
  681. synth_ai/task/health.py +0 -28
  682. synth_ai/task/validators.py +0 -12
  683. synth_ai/tracing/__init__.py +0 -30
  684. synth_ai/tracing_v1/__init__.py +0 -33
  685. synth_ai/tracing_v3/config.py +0 -84
  686. synth_ai/tracing_v3/storage/config.py +0 -62
  687. synth_ai/tracing_v3/turso/__init__.py +0 -25
  688. synth_ai/tracing_v3/turso/daemon.py +0 -144
  689. synth_ai/tracing_v3/turso/manager.py +0 -760
  690. synth_ai/v0/tracing/__init__.py +0 -0
  691. synth_ai/v0/tracing/abstractions.py +0 -224
  692. synth_ai/v0/tracing/base_client.py +0 -91
  693. synth_ai/v0/tracing/client_manager.py +0 -131
  694. synth_ai/v0/tracing/config.py +0 -142
  695. synth_ai/v0/tracing/context.py +0 -146
  696. synth_ai/v0/tracing/decorators.py +0 -682
  697. synth_ai/v0/tracing/events/__init__.py +0 -0
  698. synth_ai/v0/tracing/events/manage.py +0 -147
  699. synth_ai/v0/tracing/events/scope.py +0 -86
  700. synth_ai/v0/tracing/events/store.py +0 -228
  701. synth_ai/v0/tracing/immediate_client.py +0 -151
  702. synth_ai/v0/tracing/local.py +0 -18
  703. synth_ai/v0/tracing/log_client_base.py +0 -73
  704. synth_ai/v0/tracing/retry_queue.py +0 -186
  705. synth_ai/v0/tracing/trackers.py +0 -515
  706. synth_ai/v0/tracing/upload.py +0 -512
  707. synth_ai/v0/tracing/utils.py +0 -9
  708. synth_ai/v0/tracing_v1/__init__.py +0 -16
  709. synth_ai/v0/tracing_v1/abstractions.py +0 -224
  710. synth_ai/v0/tracing_v1/base_client.py +0 -91
  711. synth_ai/v0/tracing_v1/client_manager.py +0 -131
  712. synth_ai/v0/tracing_v1/config.py +0 -142
  713. synth_ai/v0/tracing_v1/context.py +0 -146
  714. synth_ai/v0/tracing_v1/decorators.py +0 -703
  715. synth_ai/v0/tracing_v1/events/__init__.py +0 -0
  716. synth_ai/v0/tracing_v1/events/manage.py +0 -147
  717. synth_ai/v0/tracing_v1/events/scope.py +0 -86
  718. synth_ai/v0/tracing_v1/events/store.py +0 -228
  719. synth_ai/v0/tracing_v1/immediate_client.py +0 -151
  720. synth_ai/v0/tracing_v1/local.py +0 -18
  721. synth_ai/v0/tracing_v1/log_client_base.py +0 -73
  722. synth_ai/v0/tracing_v1/retry_queue.py +0 -186
  723. synth_ai/v0/tracing_v1/trackers.py +0 -515
  724. synth_ai/v0/tracing_v1/upload.py +0 -527
  725. synth_ai/v0/tracing_v1/utils.py +0 -9
  726. synth_ai/zyk/__init__.py +0 -30
  727. synth_ai-0.2.8.dev2.dist-info/METADATA +0 -129
  728. synth_ai-0.2.8.dev2.dist-info/RECORD +0 -420
  729. /synth_ai/{demos → cli/demo_apps}/demo_task_apps/math/__init__.py +0 -0
  730. /synth_ai/{lm/caching → core/apps}/__init__.py +0 -0
  731. /synth_ai/{tracing_v3 → core/tracing_v3}/lm_call_record_abstractions.py +0 -0
  732. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/__init__.py +0 -0
  733. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/exceptions.py +0 -0
  734. /synth_ai/{tracing_v3 → core/tracing_v3}/storage/types.py +0 -0
  735. /synth_ai/{compound/cais.py → py.typed} +0 -0
  736. /synth_ai/{learning → sdk/learning}/core.py +0 -0
  737. /synth_ai/{learning → sdk/learning}/gateway.py +0 -0
  738. {synth_ai-0.2.8.dev2.dist-info → synth_ai-0.4.3.dist-info}/WHEEL +0 -0
  739. {synth_ai-0.2.8.dev2.dist-info → synth_ai-0.4.3.dist-info}/licenses/LICENSE +0 -0
  740. {synth_ai-0.2.8.dev2.dist-info → synth_ai-0.4.3.dist-info}/top_level.txt +0 -0
@@ -1,1139 +0,0 @@
1
- import copy
2
- import logging
3
- import types
4
- from collections import defaultdict
5
- from dataclasses import dataclass
6
- from inspect import isclass
7
-
8
- import openai.resources
9
- from langfuse import Langfuse
10
- from langfuse.client import StatefulGenerationClient
11
- from langfuse.decorators import langfuse_context
12
- from langfuse.utils import _get_timestamp
13
- from langfuse.utils.langfuse_singleton import LangfuseSingleton
14
- from packaging.version import Version
15
- from pydantic import BaseModel
16
- from wrapt import wrap_function_wrapper
17
-
18
- from synth_ai.lm.overrides import (
19
- apply_injection as apply_injection_overrides,
20
- )
21
- from synth_ai.lm.overrides import (
22
- apply_param_overrides,
23
- apply_tool_overrides,
24
- use_overrides_for_messages,
25
- )
26
- from synth_ai.lm.provider_support.suppress_logging import *
27
- from synth_ai.tracing_v1.abstractions import MessageInputs
28
- from synth_ai.tracing_v1.trackers import synth_tracker_async, synth_tracker_sync
29
-
30
- try:
31
- import openai
32
- except ImportError as err:
33
- raise ModuleNotFoundError(
34
- "Please install OpenAI to use this feature: 'pip install openai'"
35
- ) from err
36
-
37
- # CREDIT TO LANGFUSE FOR OPEN-SOURCING THE CODE THAT THIS IS BASED ON
38
- # USING WITH MIT LICENSE PERMISSION
39
- # https://langfuse.com
40
-
41
- try:
42
- from openai import AsyncAzureOpenAI, AsyncOpenAI, AzureOpenAI, OpenAI # noqa: F401
43
- except ImportError:
44
- AsyncAzureOpenAI = None
45
- AsyncOpenAI = None
46
- AzureOpenAI = None
47
- OpenAI = None
48
-
49
-
50
- # log = logging.getLogger("langfuse")
51
-
52
- # Add logger configuration
53
- logger = logging.getLogger(__name__)
54
- logger.setLevel(logging.DEBUG) # Set to DEBUG to see all messages
55
-
56
-
57
- @dataclass
58
- class OpenAiDefinition:
59
- module: str
60
- object: str
61
- method: str
62
- type: str
63
- sync: bool
64
- min_version: str | None = None
65
-
66
-
67
- OPENAI_METHODS_V0 = [
68
- OpenAiDefinition(
69
- module="openai",
70
- object="ChatCompletion",
71
- method="create",
72
- type="chat",
73
- sync=True,
74
- ),
75
- OpenAiDefinition(
76
- module="openai",
77
- object="Completion",
78
- method="create",
79
- type="completion",
80
- sync=True,
81
- ),
82
- ]
83
-
84
-
85
- OPENAI_METHODS_V1 = [
86
- OpenAiDefinition(
87
- module="openai.resources.chat.completions",
88
- object="Completions",
89
- method="create",
90
- type="chat",
91
- sync=True,
92
- ),
93
- OpenAiDefinition(
94
- module="openai.resources.completions",
95
- object="Completions",
96
- method="create",
97
- type="completion",
98
- sync=True,
99
- ),
100
- OpenAiDefinition(
101
- module="openai.resources.chat.completions",
102
- object="AsyncCompletions",
103
- method="create",
104
- type="chat",
105
- sync=False,
106
- ),
107
- OpenAiDefinition(
108
- module="openai.resources.completions",
109
- object="AsyncCompletions",
110
- method="create",
111
- type="completion",
112
- sync=False,
113
- ),
114
- OpenAiDefinition(
115
- module="openai.resources.chat.completions",
116
- object="Completions",
117
- method="parse",
118
- type="chat",
119
- sync=True,
120
- min_version="1.50.0",
121
- ),
122
- OpenAiDefinition(
123
- module="openai.resources.chat.completions",
124
- object="AsyncCompletions",
125
- method="parse",
126
- type="chat",
127
- sync=False,
128
- min_version="1.50.0",
129
- ),
130
- ]
131
-
132
-
133
- class OpenAiArgsExtractor:
134
- def __init__(
135
- self,
136
- name=None,
137
- metadata=None,
138
- trace_id=None,
139
- session_id=None,
140
- user_id=None,
141
- tags=None,
142
- parent_observation_id=None,
143
- langfuse_prompt=None, # we cannot use prompt because it's an argument of the old OpenAI completions API
144
- **kwargs,
145
- ):
146
- # logger.debug(f"OpenAiArgsExtractor initialized with kwargs: {kwargs}")
147
- # raise NotImplementedError("This method is not implemented yet")
148
- self.args = {}
149
- self.args["name"] = name
150
- self.args["metadata"] = (
151
- metadata
152
- if "response_format" not in kwargs
153
- else {
154
- **(metadata or {}),
155
- "response_format": kwargs["response_format"].model_json_schema()
156
- if isclass(kwargs["response_format"])
157
- and issubclass(kwargs["response_format"], BaseModel)
158
- else kwargs["response_format"],
159
- }
160
- )
161
- self.args["trace_id"] = trace_id
162
- self.args["session_id"] = session_id
163
- self.args["user_id"] = user_id
164
- self.args["tags"] = tags
165
- self.args["parent_observation_id"] = parent_observation_id
166
- self.args["langfuse_prompt"] = langfuse_prompt
167
- self.kwargs = kwargs
168
-
169
- def get_langfuse_args(self):
170
- return {**self.args, **self.kwargs}
171
-
172
- def get_openai_args(self):
173
- return self.kwargs
174
-
175
-
176
- def _langfuse_wrapper(func):
177
- def _with_langfuse(open_ai_definitions, initialize):
178
- def wrapper(wrapped, instance, args, kwargs):
179
- return func(open_ai_definitions, initialize, wrapped, args, kwargs)
180
-
181
- return wrapper
182
-
183
- return _with_langfuse
184
-
185
-
186
- def _extract_chat_prompt(kwargs: dict):
187
- """
188
- Extracts the user input from prompts. Returns an array of messages or a dict with messages and functions.
189
- """
190
- prompt = {}
191
-
192
- if kwargs.get("functions") is not None:
193
- prompt.update({"functions": kwargs["functions"]})
194
-
195
- if kwargs.get("function_call") is not None:
196
- prompt.update({"function_call": kwargs["function_call"]})
197
-
198
- if kwargs.get("tools") is not None:
199
- prompt.update({"tools": kwargs["tools"]})
200
-
201
- # existing logic to handle the case when prompt is not empty
202
- if prompt:
203
- messages = _filter_image_data(kwargs.get("messages", []))
204
- prompt.update({"messages": messages})
205
- return prompt
206
- else:
207
- # fallback: just return filtered messages
208
- messages = _filter_image_data(kwargs.get("messages", []))
209
- return messages
210
-
211
-
212
- def _extract_chat_response(kwargs: dict):
213
- """
214
- Extracts the LLM output from the response.
215
- """
216
- response = {
217
- "role": kwargs.get("role"),
218
- }
219
-
220
- if kwargs.get("function_call") is not None:
221
- response.update({"function_call": kwargs["function_call"]})
222
-
223
- if kwargs.get("tool_calls") is not None:
224
- response.update({"tool_calls": kwargs["tool_calls"]})
225
-
226
- response["content"] = kwargs.get("content")
227
- return response
228
-
229
-
230
- def _get_langfuse_data_from_kwargs(
231
- resource: OpenAiDefinition, langfuse: Langfuse, start_time, kwargs
232
- ):
233
- # print("DEBUG: Entering _get_langfuse_data_from_kwargs")
234
- # print("DEBUG: kwargs received:", kwargs)
235
-
236
- name = kwargs.get("name", "OpenAI-generation")
237
- # print("DEBUG: name =", name)
238
- if name is None:
239
- name = "OpenAI-generation"
240
-
241
- if name is not None and not isinstance(name, str):
242
- raise TypeError("name must be a string")
243
-
244
- decorator_context_observation_id = langfuse_context.get_current_observation_id()
245
- decorator_context_trace_id = langfuse_context.get_current_trace_id()
246
- # print("DEBUG: decorator_context_observation_id =", decorator_context_observation_id)
247
- # print("DEBUG: decorator_context_trace_id =", decorator_context_trace_id)
248
-
249
- trace_id = kwargs.get("trace_id", None) or decorator_context_trace_id
250
- # print("DEBUG: trace_id =", trace_id)
251
- if trace_id is not None and not isinstance(trace_id, str):
252
- raise TypeError("trace_id must be a string")
253
-
254
- session_id = kwargs.get("session_id", None)
255
- # print("DEBUG: session_id =", session_id)
256
- if session_id is not None and not isinstance(session_id, str):
257
- raise TypeError("session_id must be a string")
258
-
259
- user_id = kwargs.get("user_id", None)
260
- # print("DEBUG: user_id =", user_id)
261
- if user_id is not None and not isinstance(user_id, str):
262
- raise TypeError("user_id must be a string")
263
-
264
- tags = kwargs.get("tags", None)
265
- # print("DEBUG: tags =", tags)
266
- if tags is not None and (
267
- not isinstance(tags, list) or not all(isinstance(tag, str) for tag in tags)
268
- ):
269
- raise TypeError("tags must be a list of strings")
270
-
271
- if decorator_context_trace_id:
272
- langfuse_context.update_current_trace(session_id=session_id, user_id=user_id, tags=tags)
273
-
274
- parent_observation_id = kwargs.get("parent_observation_id", None) or (
275
- decorator_context_observation_id
276
- if decorator_context_observation_id != decorator_context_trace_id
277
- else None
278
- )
279
- # print("DEBUG: parent_observation_id =", parent_observation_id)
280
- if parent_observation_id is not None and not isinstance(parent_observation_id, str):
281
- raise TypeError("parent_observation_id must be a string")
282
- if parent_observation_id is not None and trace_id is None:
283
- raise ValueError("parent_observation_id requires trace_id to be set")
284
-
285
- metadata = kwargs.get("metadata", {})
286
- # print("DEBUG: metadata =", metadata)
287
- if metadata is not None and not isinstance(metadata, dict):
288
- raise TypeError("metadata must be a dictionary")
289
-
290
- prompt = None
291
- if resource.type == "completion":
292
- prompt = kwargs.get("prompt", None)
293
- elif resource.type == "chat":
294
- prompt = _extract_chat_prompt(kwargs)
295
- # Extract model: first check top-level, then check inside 'inputs'
296
- model = kwargs.get("model", None)
297
- inputs = kwargs.get("inputs", {}) if kwargs.get("inputs", {}) else {}
298
- if isinstance(inputs, dict):
299
- # print("DEBUG: inputs =", inputs)
300
- if "model_name" in inputs:
301
- detailed_model = inputs["model_name"]
302
- print("DEBUG: detailed_model =", detailed_model)
303
- # If a detailed_model exists and is different from the top-level model, use it.
304
- if detailed_model and (not model or model != detailed_model):
305
- print("DEBUG: Upgrading model value from", model, "to", detailed_model)
306
- model = detailed_model
307
- # print("DEBUG: final model =", model)
308
-
309
- # Extract model hyperparameters and add them to the new field 'model_params'
310
- model_params = {
311
- "temperature": kwargs.get("temperature", 1),
312
- "max_tokens": kwargs.get("max_tokens", float("inf")),
313
- "top_p": kwargs.get("top_p", 1),
314
- "frequency_penalty": kwargs.get("frequency_penalty", 0),
315
- "presence_penalty": kwargs.get("presence_penalty", 0),
316
- }
317
- if kwargs.get("seed", None) is not None:
318
- model_params["seed"] = kwargs.get("seed", None)
319
-
320
- is_nested_trace = False
321
- if trace_id:
322
- is_nested_trace = True
323
- langfuse.trace(id=trace_id, session_id=session_id, user_id=user_id, tags=tags)
324
- else:
325
- trace_instance = langfuse.trace(
326
- session_id=session_id,
327
- user_id=user_id,
328
- tags=tags,
329
- name=name,
330
- input=prompt,
331
- metadata=metadata,
332
- )
333
- trace_id = trace_instance.id
334
- # print("DEBUG: Generated new trace_id =", trace_id)
335
-
336
- langfuse_prompt = kwargs.get("langfuse_prompt", None)
337
-
338
- extracted_data = {
339
- "name": name,
340
- "metadata": metadata,
341
- "trace_id": trace_id,
342
- "parent_observation_id": parent_observation_id,
343
- "user_id": user_id,
344
- "start_time": start_time,
345
- "input": prompt,
346
- "model_params": {
347
- "model_name": model or None,
348
- "temperature": kwargs.get("temperature", 1),
349
- "max_tokens": kwargs.get("max_tokens", float("inf")),
350
- "top_p": kwargs.get("top_p", 1),
351
- "frequency_penalty": kwargs.get("frequency_penalty", 0),
352
- "presence_penalty": kwargs.get("presence_penalty", 0),
353
- },
354
- "prompt": langfuse_prompt,
355
- }
356
-
357
- # Add seed to model_params if present
358
- if kwargs.get("seed", None) is not None:
359
- extracted_data["model_params"]["seed"] = kwargs.get("seed", None)
360
-
361
- # print("DEBUG: Exiting _get_langfuse_data_from_kwargs with extracted_data:")
362
- # print(extracted_data)
363
- # print("DEBUG: is_nested_trace =", is_nested_trace)
364
-
365
- return extracted_data, is_nested_trace
366
-
367
-
368
- def _create_langfuse_update(
369
- completion,
370
- generation: StatefulGenerationClient,
371
- completion_start_time,
372
- model=None,
373
- usage=None,
374
- model_params=None,
375
- ):
376
- update = {
377
- "end_time": _get_timestamp(),
378
- "output": completion,
379
- "completion_start_time": completion_start_time,
380
- }
381
-
382
- # Create model_params dictionary
383
- model_params = {
384
- "model_name": model or None,
385
- }
386
-
387
- # Add hyperparameters if provided
388
- if model_params:
389
- model_params.update(model_params)
390
-
391
- # Add model_params to update
392
- update["model_params"] = model_params
393
-
394
- if usage is not None:
395
- update["usage"] = usage
396
-
397
- generation.update(**update)
398
-
399
-
400
- def _extract_streamed_openai_response(resource, chunks):
401
- # logger.debug(f"Extracting streamed response for resource type: {resource.type}")
402
- # logger.debug(f"Number of chunks: {len(chunks)}")
403
- completion = defaultdict(str) if resource.type == "chat" else ""
404
- model = None
405
- usage = None
406
-
407
- for chunk in chunks:
408
- if _is_openai_v1():
409
- chunk = chunk.__dict__
410
- # logger.debug(f"Processing chunk: {chunk}")
411
-
412
- # Extract model name from chunk
413
- model = model or chunk.get("model", None) or None
414
-
415
- # Extract usage information
416
- chunk_usage = chunk.get("usage", None)
417
- if chunk_usage is not None:
418
- if _is_openai_v1():
419
- chunk_usage = chunk_usage.__dict__
420
- usage = chunk_usage
421
-
422
- # Process choices
423
- choices = chunk.get("choices", []) # noqa: F841
424
- # logger.debug(f"Extracted - model: {model}, choices: {choices}")
425
-
426
- # logger.debug(f"Final completion: {completion}")
427
- return model, completion, usage
428
-
429
-
430
- def _get_langfuse_data_from_default_response(resource: OpenAiDefinition, response):
431
- if response is None:
432
- return None, "<NoneType response returned from OpenAI>", None
433
-
434
- # Extract model name from response
435
- model = response.get("model", None) or None
436
-
437
- # Extract completion based on resource type
438
- completion = None
439
- if resource.type == "completion":
440
- choices = response.get("choices", [])
441
- if len(choices) > 0:
442
- choice = choices[-1]
443
- completion = choice.text if _is_openai_v1() else choice.get("text", None)
444
- elif resource.type == "chat":
445
- choices = response.get("choices", [])
446
- if len(choices) > 0:
447
- choice = choices[-1]
448
- completion = (
449
- _extract_chat_response(choice.message.__dict__)
450
- if _is_openai_v1()
451
- else choice.get("message", None)
452
- )
453
-
454
- # Extract usage information
455
- usage = response.get("usage", None)
456
- if _is_openai_v1() and usage is not None:
457
- usage = usage.__dict__
458
-
459
- return model, completion, usage
460
-
461
-
462
- def _is_openai_v1():
463
- return Version(openai.__version__) >= Version("1.0.0")
464
-
465
-
466
- def _is_streaming_response(response):
467
- return (
468
- isinstance(response, types.GeneratorType)
469
- or isinstance(response, types.AsyncGeneratorType)
470
- or (_is_openai_v1() and isinstance(response, openai.Stream))
471
- or (_is_openai_v1() and isinstance(response, openai.AsyncStream))
472
- )
473
-
474
-
475
- @_langfuse_wrapper
476
- def _wrap(open_ai_resource: OpenAiDefinition, initialize, wrapped, args, kwargs):
477
- new_langfuse: Langfuse = initialize()
478
-
479
- start_time = _get_timestamp()
480
- arg_extractor = OpenAiArgsExtractor(*args, **kwargs)
481
-
482
- generation, is_nested_trace = _get_langfuse_data_from_kwargs(
483
- open_ai_resource, new_langfuse, start_time, arg_extractor.get_langfuse_args()
484
- )
485
- generation = new_langfuse.generation(**generation)
486
- try:
487
- openai_args = arg_extractor.get_openai_args()
488
- # Apply context-scoped injection to chat messages if present
489
- if isinstance(openai_args, dict) and "messages" in openai_args:
490
- try:
491
- with use_overrides_for_messages(openai_args["messages"]): # type: ignore[arg-type]
492
- openai_args["messages"] = apply_injection_overrides(openai_args["messages"]) # type: ignore[arg-type]
493
- openai_args = apply_tool_overrides(openai_args)
494
- openai_args = apply_param_overrides(openai_args)
495
- except Exception:
496
- pass
497
- openai_response = wrapped(**openai_args)
498
-
499
- if _is_streaming_response(openai_response):
500
- return LangfuseResponseGeneratorSync(
501
- resource=open_ai_resource,
502
- response=openai_response,
503
- generation=generation,
504
- langfuse=new_langfuse,
505
- is_nested_trace=is_nested_trace,
506
- kwargs=arg_extractor.get_openai_args(),
507
- )
508
-
509
- else:
510
- model, completion, usage = _get_langfuse_data_from_default_response(
511
- open_ai_resource,
512
- (openai_response and openai_response.__dict__)
513
- if _is_openai_v1()
514
- else openai_response,
515
- )
516
- model_params = {
517
- "model_name": model or None,
518
- "temperature": kwargs.get("temperature", 1),
519
- "max_tokens": kwargs.get("max_tokens", float("inf")),
520
- "top_p": kwargs.get("top_p", 1),
521
- "frequency_penalty": kwargs.get("frequency_penalty", 0),
522
- "presence_penalty": kwargs.get("presence_penalty", 0),
523
- }
524
-
525
- # Collect messages
526
- if open_ai_resource.type == "completion":
527
- user_prompt = arg_extractor.get_openai_args().get("prompt", "")
528
- messages = [{"role": "user", "content": user_prompt}]
529
- message_input = MessageInputs(messages=messages)
530
-
531
- # Track user input
532
- synth_tracker_sync.track_lm(
533
- messages=message_input.messages,
534
- model_name=model,
535
- model_params=model_params,
536
- finetune=False,
537
- )
538
-
539
- # Track assistant output separately
540
- assistant_message = [{"role": "assistant", "content": completion}]
541
- synth_tracker_sync.track_lm_output(
542
- messages=assistant_message,
543
- model_name=model,
544
- model_params=model_params,
545
- finetune=False,
546
- )
547
-
548
- elif open_ai_resource.type == "chat":
549
- messages = openai_args.get("messages", [])
550
- message_input = MessageInputs(messages=messages)
551
-
552
- # Track user input
553
- synth_tracker_sync.track_lm(
554
- messages=message_input.messages,
555
- model_name=model,
556
- model_params=model_params,
557
- finetune=False,
558
- )
559
-
560
- # Track assistant output separately
561
- assistant_message = [{"role": "assistant", "content": completion["content"]}]
562
- synth_tracker_sync.track_lm_output(
563
- messages=assistant_message, model_name=model, finetune=False
564
- )
565
-
566
- else:
567
- message_input = MessageInputs(messages=[])
568
-
569
- # Use track_lm
570
- # synth_tracker_sync.track_lm(
571
- # messages=message_input.messages,
572
- # model_name=model,
573
- # model_params=model_params,finetune=False,
574
- # )
575
-
576
- if kwargs.get("seed", None) is not None:
577
- model_params["seed"] = kwargs.get("seed", None)
578
-
579
- generation.update(
580
- model_params=model_params,
581
- output=completion,
582
- end_time=_get_timestamp(),
583
- usage=usage,
584
- )
585
-
586
- # Avoiding the trace-update if trace-id is provided by user.
587
- if not is_nested_trace:
588
- new_langfuse.trace(id=generation.trace_id, output=completion)
589
-
590
- return openai_response
591
- except Exception as ex:
592
- # log.warning(ex)
593
- model = kwargs.get("model", None) or None
594
- model_params = {
595
- "model_name": model or None,
596
- "temperature": kwargs.get("temperature", 1),
597
- "max_tokens": kwargs.get("max_tokens", float("inf")),
598
- "top_p": kwargs.get("top_p", 1),
599
- "frequency_penalty": kwargs.get("frequency_penalty", 0),
600
- "presence_penalty": kwargs.get("presence_penalty", 0),
601
- }
602
- if kwargs.get("seed", None) is not None:
603
- model_params["seed"] = kwargs.get("seed", None)
604
-
605
- generation.update(
606
- end_time=_get_timestamp(),
607
- status_message=str(ex),
608
- level="ERROR",
609
- model_params=model_params,
610
- usage={"input_cost": 0, "output_cost": 0, "total_cost": 0},
611
- )
612
- raise ex
613
-
614
-
615
def _async_model_params(model, kwargs):
    """Build the hyperparameter dict reported for one request.

    Args:
        model: Model name to report; falsy values are normalised to ``None``.
        kwargs: The keyword arguments the caller passed to the OpenAI method.

    Returns:
        A dict with ``model_name`` and the sampling parameters (falling back
        to the same defaults the rest of this module uses), plus ``seed``
        when the caller supplied one.
    """
    params = {
        "model_name": model or None,
        "temperature": kwargs.get("temperature", 1),
        "max_tokens": kwargs.get("max_tokens", float("inf")),
        "top_p": kwargs.get("top_p", 1),
        "frequency_penalty": kwargs.get("frequency_penalty", 0),
        "presence_penalty": kwargs.get("presence_penalty", 0),
    }
    seed = kwargs.get("seed")
    if seed is not None:
        params["seed"] = seed
    return params


@_langfuse_wrapper
async def _wrap_async(open_ai_resource: OpenAiDefinition, initialize, wrapped, args, kwargs):
    """Trace one awaited OpenAI call and forward its response.

    A generation is opened before the call. Streaming responses are handed
    back wrapped in ``LangfuseResponseGeneratorAsync`` (which finishes the
    bookkeeping once the stream is consumed); non-streaming responses are
    recorded here and returned unchanged.

    Args:
        open_ai_resource: Definition of the OpenAI method being wrapped; its
            ``type`` ("completion" / "chat") selects how messages are tracked.
        initialize: Zero-argument callable returning the Langfuse client.
        wrapped: The original coroutine function being traced.
        args: Positional arguments of the intercepted call.
        kwargs: Keyword arguments of the intercepted call.

    Returns:
        The OpenAI response, or a ``LangfuseResponseGeneratorAsync`` wrapping
        it when the response is a stream.

    Raises:
        Exception: Whatever the wrapped call (or the tracking code inside the
            ``try``) raises; the generation is marked ``ERROR`` first and the
            exception is then re-raised unchanged.
    """
    new_langfuse = initialize()
    start_time = _get_timestamp()
    arg_extractor = OpenAiArgsExtractor(*args, **kwargs)

    generation, is_nested_trace = _get_langfuse_data_from_kwargs(
        open_ai_resource, new_langfuse, start_time, arg_extractor.get_langfuse_args()
    )
    generation = new_langfuse.generation(**generation)

    try:
        openai_args = arg_extractor.get_openai_args()
        # Apply context-scoped injection to chat messages if present
        if isinstance(openai_args, dict) and "messages" in openai_args:
            try:
                with use_overrides_for_messages(openai_args["messages"]):  # type: ignore[arg-type]
                    openai_args["messages"] = apply_injection_overrides(openai_args["messages"])  # type: ignore[arg-type]
                    openai_args = apply_tool_overrides(openai_args)
                    openai_args = apply_param_overrides(openai_args)
            except Exception:
                # Overrides are best-effort: the request still goes out, but
                # the failure is left visible in debug logs instead of vanishing.
                logger.debug("Failed to apply request overrides", exc_info=True)
        openai_response = await wrapped(**openai_args)

        if _is_streaming_response(openai_response):
            return LangfuseResponseGeneratorAsync(
                resource=open_ai_resource,
                response=openai_response,
                generation=generation,
                langfuse=new_langfuse,
                is_nested_trace=is_nested_trace,
                kwargs=arg_extractor.get_openai_args(),
            )

        model, completion, usage = _get_langfuse_data_from_default_response(
            open_ai_resource,
            (openai_response and openai_response.__dict__)
            if _is_openai_v1()
            else openai_response,
        )
        # Built once and reused for tracking and for the generation update.
        model_params = _async_model_params(model, kwargs)

        if open_ai_resource.type == "completion":
            user_prompt = arg_extractor.get_openai_args().get("prompt", "")
            message_input = MessageInputs(messages=[{"role": "user", "content": user_prompt}])

            # Track user input
            synth_tracker_async.track_lm(
                messages=message_input.messages,
                model_name=model,
                model_params=model_params,
                finetune=False,
            )

            # Track assistant output separately
            synth_tracker_async.track_lm_output(
                messages=[{"role": "assistant", "content": completion}],
                model_name=model,
                finetune=False,
            )

        elif open_ai_resource.type == "chat":
            message_input = MessageInputs(messages=openai_args.get("messages", []))

            # Track user input
            synth_tracker_async.track_lm(
                messages=message_input.messages,
                model_name=model,
                model_params=model_params,
                finetune=False,
            )

            # Track assistant output separately. The completion is only
            # subscripted when it is a dict, mirroring the guard used by the
            # streaming finalizers in this module.
            if isinstance(completion, dict):
                assistant_content = completion.get("content")
            else:
                assistant_content = completion
            synth_tracker_async.track_lm_output(
                messages=[{"role": "assistant", "content": assistant_content}],
                model_name=model,
                finetune=False,
            )

        generation.update(
            model_params=model_params,
            output=completion,
            end_time=_get_timestamp(),
            usage=usage,
        )
        # Avoiding the trace-update if trace-id is provided by user.
        if not is_nested_trace:
            new_langfuse.trace(id=generation.trace_id, output=completion)

        return openai_response
    except Exception as ex:
        model = kwargs.get("model", None) or None
        generation.update(
            end_time=_get_timestamp(),
            status_message=str(ex),
            level="ERROR",
            model_params=_async_model_params(model, kwargs),
            usage={"input_cost": 0, "output_cost": 0, "total_cost": 0},
        )
        # Bare raise keeps the original exception and traceback intact.
        raise
757
-
758
async def close(self) -> None:
    """Close the underlying response so its connection is released.

    Called automatically once the response body has been read to completion.
    """
    # NOTE(review): this definition follows `_wrap_async` without a visible
    # enclosing class; it looks like a stray copy of
    # `LangfuseResponseGeneratorAsync.close` - confirm before relying on it.
    underlying = self.response
    await underlying.close()
764
-
765
-
766
class OpenAILangfuse:
    """Installs Langfuse tracing wrappers around the OpenAI SDK methods.

    The Langfuse client is created on demand from the ``openai.langfuse_*``
    module attributes, which ``register_tracing`` seeds with defaults.
    """

    # Client returned by the last `initialize()` call; None until then.
    _langfuse: Langfuse | None = None

    def initialize(self):
        """Fetch the Langfuse client configured via ``openai.langfuse_*``.

        Returns:
            The client obtained from ``LangfuseSingleton().get(...)``; it is
            also stored on ``self._langfuse``.
        """
        self._langfuse = LangfuseSingleton().get(
            public_key=openai.langfuse_public_key,
            secret_key=openai.langfuse_secret_key,
            host=openai.langfuse_host,
            debug=openai.langfuse_debug,
            enabled=openai.langfuse_enabled,
            sdk_integration="openai",
            sample_rate=openai.langfuse_sample_rate,
        )

        return self._langfuse

    def flush(self):
        """Flush the Langfuse client, if one has been created.

        Calling this before any client exists is a no-op rather than an
        ``AttributeError`` on ``None``.
        """
        if self._langfuse is not None:
            self._langfuse.flush()

    def langfuse_auth_check(self):
        """Check if the provided Langfuse credentials (public and secret key) are valid.

        Raises:
            Exception: If no projects were found for the provided credentials.

        Note:
            This method is blocking. It is discouraged to use it in prod code.
        """
        if self._langfuse is None:
            self.initialize()

        return self._langfuse.auth_check()

    def register_tracing(self):
        """Wrap every supported OpenAI method and expose the config attributes.

        Resources that need a newer OpenAI SDK than the installed one, or whose
        module, object or method cannot be found, are skipped. Afterwards the
        ``openai.langfuse_*`` settings are reset to their defaults and the
        ``langfuse_auth_check`` / ``flush_langfuse`` helpers are attached to
        the ``openai`` module.
        """
        resources = OPENAI_METHODS_V1 if _is_openai_v1() else OPENAI_METHODS_V0

        for resource in resources:
            if resource.min_version is not None and Version(openai.__version__) < Version(
                resource.min_version
            ):
                continue

            # Check if the method actually exists before trying to wrap it
            try:
                module = __import__(resource.module, fromlist=[resource.object])
                obj = getattr(module, resource.object, None)
            except (ImportError, AttributeError):
                continue  # Skip if module or object doesn't exist

            # A missing object must be skipped as well; otherwise the wrap
            # call below would be pointed at an attribute that does not exist.
            if obj is None or not hasattr(obj, resource.method):
                continue

            wrap_function_wrapper(
                resource.module,
                f"{resource.object}.{resource.method}",
                _wrap(resource, self.initialize)
                if resource.sync
                else _wrap_async(resource, self.initialize),
            )

        openai.langfuse_public_key = None
        openai.langfuse_secret_key = None
        openai.langfuse_host = None
        openai.langfuse_debug = None
        openai.langfuse_enabled = True
        openai.langfuse_sample_rate = None
        openai.langfuse_mask = None
        openai.langfuse_auth_check = self.langfuse_auth_check
        openai.flush_langfuse = self.flush
834
-
835
-
836
# Module-level side effect: create the integration object and install the
# tracing wrappers as soon as this module is imported.
modifier = OpenAILangfuse()
modifier.register_tracing()
838
-
839
-
840
# DEPRECATED: Use `openai.langfuse_auth_check()` instead
def auth_check():
    """Run the Langfuse credential check on the module-level ``modifier``.

    The client is initialized first if ``modifier`` does not hold one yet.

    Returns:
        Whatever the client's ``auth_check()`` returns.
    """
    client_missing = modifier._langfuse is None
    if client_missing:
        modifier.initialize()

    langfuse_client = modifier._langfuse
    return langfuse_client.auth_check()
846
-
847
-
848
- def _filter_image_data(messages: list[dict]):
849
- """https://platform.openai.com/docs/guides/vision?lang=python
850
-
851
- The messages array remains the same, but the 'image_url' is removed from the 'content' array.
852
- It should only be removed if the value starts with 'data:image/jpeg;base64,'
853
-
854
- """
855
- output_messages = copy.deepcopy(messages)
856
-
857
- for message in output_messages:
858
- content = (
859
- message.get("content", None)
860
- if isinstance(message, dict)
861
- else getattr(message, "content", None)
862
- )
863
-
864
- if content is not None:
865
- for index, item in enumerate(content):
866
- if isinstance(item, dict) and item.get("image_url", None) is not None:
867
- url = item["image_url"]["url"]
868
- if url.startswith("data:image/"):
869
- del content[index]["image_url"]
870
-
871
- return output_messages
872
-
873
-
874
class LangfuseResponseGeneratorSync:
    """Iterator wrapper around a streaming OpenAI response.

    Every streamed item is buffered in ``items`` and passed through to the
    consumer. The time of the first item is recorded, and once the stream ends
    (or the generator returned by ``__iter__`` is closed) ``_finalize`` reports
    the assembled completion to the tracker and to Langfuse.
    """

    def __init__(
        self,
        *,
        resource,
        response,
        generation,
        langfuse,
        is_nested_trace,
        kwargs,
    ):
        """Store the stream and the tracing context needed to finalize it.

        Args:
            resource: Definition of the wrapped OpenAI method; its ``type`` is
                read in ``_finalize``.
            response: The streaming response to iterate.
            generation: Langfuse generation opened for this call.
            langfuse: Langfuse client used for the trace update.
            is_nested_trace: When true, the trace itself is not updated.
            kwargs: Request arguments (prompt / messages / sampling params).
        """
        self.items = []
        self.resource = resource
        self.response = response
        self.generation = generation
        self.langfuse = langfuse
        self.is_nested_trace = is_nested_trace
        self.kwargs = kwargs
        self.completion_start_time = None

    def __iter__(self):
        """Yield each streamed item, finalizing when iteration stops."""
        try:
            for i in self.response:
                self.items.append(i)

                if self.completion_start_time is None:
                    self.completion_start_time = _get_timestamp()

                yield i
        finally:
            self._finalize()

    def __next__(self):
        """Return the next streamed item; finalize when the stream is exhausted."""
        try:
            item = self.response.__next__()
            self.items.append(item)

            if self.completion_start_time is None:
                self.completion_start_time = _get_timestamp()

            return item

        except StopIteration:
            self._finalize()

            raise

    def __enter__(self):
        """Return the item generator so ``with ... as stream`` can iterate it."""
        return self.__iter__()

    def __exit__(self, exc_type, exc_value, traceback):
        """No cleanup is performed on exit."""
        pass

    def _finalize(self):
        """Report the fully streamed completion to the tracker and Langfuse."""
        logger.debug("Entering _finalize() in LangfuseResponseGeneratorSync...")
        # First, extract values from the streamed response items
        model, completion, usage = _extract_streamed_openai_response(self.resource, self.items)
        logger.debug("Extracted model=%s, completion=%s, usage=%s", model, completion, usage)

        # Look through the streamed items for a detailed model in the additional "inputs"
        for item in self.items:
            if isinstance(item, dict):
                inputs = item.get("inputs")
                if isinstance(inputs, dict):
                    detailed = inputs.get("model_name")
                    if detailed and detailed != model:
                        logger.debug(
                            "Upgrading model value from %s to %s based on streamed inputs",
                            model,
                            detailed,
                        )
                        model = detailed
                        break
        logger.debug("Final model after _finalize check: %s", model)

        # Create model hyperparameters dictionary
        model_params = {
            "temperature": self.kwargs.get("temperature", 1),
            "max_tokens": self.kwargs.get("max_tokens", float("inf")),
            "top_p": self.kwargs.get("top_p", 1),
            "frequency_penalty": self.kwargs.get("frequency_penalty", 0),
            "presence_penalty": self.kwargs.get("presence_penalty", 0),
        }
        if self.kwargs.get("seed") is not None:
            model_params["seed"] = self.kwargs.get("seed")

        if self.resource.type == "completion":
            user_prompt = self.kwargs.get("prompt", "")
            messages = [
                {"role": "user", "content": user_prompt},
                {"role": "assistant", "content": completion},
            ]
            message_input = MessageInputs(messages=messages)
        elif self.resource.type == "chat":
            # Work on a copy: appending to the list stored in the request
            # kwargs would add the assistant reply to a list this object does
            # not own (possibly the caller's own conversation history).
            messages = list(self.kwargs.get("messages") or [])
            logger.debug("Existing 'messages' from kwargs before appending: %s", messages)
            if isinstance(completion, dict) and "content" in completion:
                messages.append({"role": "assistant", "content": completion["content"]})
            message_input = MessageInputs(messages=messages)
            logger.debug("Final 'messages': %s", message_input.messages)
        else:
            message_input = MessageInputs(messages=[])

        logger.debug(
            "Calling track_lm (sync) with messages: %s, model: %s",
            message_input.messages,
            model,
        )
        synth_tracker_sync.track_lm(
            messages=message_input.messages,
            model_name=model,
            model_params=model_params,
            finetune=False,
        )

        # Avoid the trace update if a trace-id was provided by the user.
        if not self.is_nested_trace:
            self.langfuse.trace(id=self.generation.trace_id, output=completion)

        # Pass the updated model and hyperparameters downstream in the update event.
        _create_langfuse_update(
            completion,
            self.generation,
            self.completion_start_time,
            model=model,
            usage=usage,
            model_params=model_params,
        )
1002
-
1003
-
1004
class LangfuseResponseGeneratorAsync:
    """Async iterator wrapper around a streaming OpenAI response.

    Every streamed item is buffered in ``items`` and passed through to the
    consumer. The time of the first item is recorded, and once the stream ends
    (or the async generator returned by ``__aiter__`` is closed) ``_finalize``
    reports the assembled completion to the tracker and to Langfuse.
    """

    def __init__(
        self,
        *,
        resource,
        response,
        generation,
        langfuse,
        is_nested_trace,
        kwargs,
    ):
        """Store the stream and the tracing context needed to finalize it.

        Args:
            resource: Definition of the wrapped OpenAI method; its ``type`` is
                read in ``_finalize``.
            response: The async streaming response to iterate.
            generation: Langfuse generation opened for this call.
            langfuse: Langfuse client used for the trace update.
            is_nested_trace: When true, the trace itself is not updated.
            kwargs: Request arguments (prompt / messages / sampling params).
        """
        self.items = []
        self.resource = resource
        self.response = response
        self.generation = generation
        self.langfuse = langfuse
        self.is_nested_trace = is_nested_trace
        self.kwargs = kwargs
        self.completion_start_time = None

    async def __aiter__(self):
        """Yield each streamed item, finalizing when iteration stops."""
        try:
            async for i in self.response:
                self.items.append(i)

                if self.completion_start_time is None:
                    self.completion_start_time = _get_timestamp()

                yield i
        finally:
            await self._finalize()

    async def __anext__(self):
        """Return the next streamed item; finalize when the stream is exhausted."""
        try:
            item = await self.response.__anext__()
            self.items.append(item)

            if self.completion_start_time is None:
                self.completion_start_time = _get_timestamp()

            return item

        except StopAsyncIteration:
            await self._finalize()

            raise

    async def __aenter__(self):
        """Return the item generator so ``async with ... as stream`` can iterate it."""
        return self.__aiter__()

    async def __aexit__(self, exc_type, exc_value, traceback):
        """No cleanup is performed on exit."""
        pass

    async def _finalize(self):
        """Report the fully streamed completion to the tracker and Langfuse."""
        logger.debug("Entering _finalize() in LangfuseResponseGeneratorAsync...")
        model, completion, usage = _extract_streamed_openai_response(self.resource, self.items)
        logger.debug("Extracted model=%s, completion=%s, usage=%s", model, completion, usage)

        # Look through the streamed items for a detailed model in the additional "inputs"
        for item in self.items:
            if isinstance(item, dict):
                inputs = item.get("inputs")
                if isinstance(inputs, dict):
                    detailed = inputs.get("model_name")
                    if detailed and detailed != model:
                        logger.debug(
                            "Upgrading model value from %s to %s based on streamed inputs",
                            model,
                            detailed,
                        )
                        model = detailed
                        break
        logger.debug("Final model after _finalize check: %s", model)

        # Create model hyperparameters dictionary
        model_params = {
            "temperature": self.kwargs.get("temperature", 1),
            "max_tokens": self.kwargs.get("max_tokens", float("inf")),
            "top_p": self.kwargs.get("top_p", 1),
            "frequency_penalty": self.kwargs.get("frequency_penalty", 0),
            "presence_penalty": self.kwargs.get("presence_penalty", 0),
        }
        if self.kwargs.get("seed") is not None:
            model_params["seed"] = self.kwargs.get("seed")

        if self.resource.type == "completion":
            user_prompt = self.kwargs.get("prompt", "")
            messages = [
                {"role": "user", "content": user_prompt},
                {"role": "assistant", "content": completion},
            ]
            message_input = MessageInputs(messages=messages)
        elif self.resource.type == "chat":
            # Work on a copy: appending to the list stored in the request
            # kwargs would add the assistant reply to a list this object does
            # not own (possibly the caller's own conversation history).
            messages = list(self.kwargs.get("messages") or [])
            logger.debug("Existing 'messages' from kwargs before appending: %s", messages)
            # If completion is a dict, ensure we extract 'content' safely
            if isinstance(completion, dict) and "content" in completion:
                messages.append({"role": "assistant", "content": completion["content"]})
            message_input = MessageInputs(messages=messages)
            logger.debug("Final 'messages': %s", message_input.messages)
        else:
            message_input = MessageInputs(messages=[])

        logger.debug(
            "Calling track_lm (async) with messages: %s, model: %s",
            message_input.messages,
            model,
        )
        synth_tracker_async.track_lm(
            messages=message_input.messages,
            model_name=model,
            model_params=model_params,
            finetune=False,
        )

        # Avoiding the trace-update if trace-id is provided by user.
        if not self.is_nested_trace:
            self.langfuse.trace(id=self.generation.trace_id, output=completion)

        _create_langfuse_update(
            completion,
            self.generation,
            self.completion_start_time,
            model=model,
            usage=usage,
            model_params=model_params,
        )

    async def close(self) -> None:
        """Close the response and release the connection.

        Automatically called if the response body is read to completion.
        """
        await self.response.close()