openadapt-ml 0.2.0__tar.gz → 0.2.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (344) hide show
  1. openadapt_ml-0.2.2/.github/workflows/release.yml +48 -0
  2. openadapt_ml-0.2.2/.github/workflows/test.yml +41 -0
  3. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/.gitignore +33 -1
  4. openadapt_ml-0.2.2/CHANGELOG.md +1060 -0
  5. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/CLAUDE.md +599 -94
  6. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/PKG-INFO +215 -14
  7. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/README.md +207 -12
  8. openadapt_ml-0.2.2/deprecated/Dockerfile.simple +26 -0
  9. openadapt_ml-0.2.2/deprecated/README.md +7 -0
  10. openadapt_ml-0.2.2/deprecated/docs/WAA_ACR_DESIGN.md +87 -0
  11. openadapt_ml-0.2.2/deprecated/docs/WAA_APPROACH_REVIEW.md +440 -0
  12. openadapt_ml-0.2.2/deprecated/docs/WAA_EVAL_ATTEMPTS.md +443 -0
  13. openadapt_ml-0.2.2/deprecated/docs/WAA_RELIABILITY_ANALYSIS.md +514 -0
  14. openadapt_ml-0.2.2/deprecated/docs/WINDOWS_PRODUCT_KEY_RCA.md +345 -0
  15. openadapt_ml-0.2.2/deprecated/docs/waa_setup.md +330 -0
  16. openadapt_ml-0.2.2/deprecated/tmp_dockerfile_winarena.txt +64 -0
  17. openadapt_ml-0.2.2/deprecated/waa_deploy/Dockerfile +138 -0
  18. openadapt_ml-0.2.2/deprecated/waa_deploy/Dockerfile.backup +289 -0
  19. openadapt_ml-0.2.2/deprecated/waa_deploy/Dockerfile.simplified +139 -0
  20. {openadapt_ml-0.2.0/openadapt_ml/benchmarks → openadapt_ml-0.2.2/deprecated}/waa_deploy/api_agent.py +21 -20
  21. openadapt_ml-0.2.2/docs/ARCHITECTURE_DECISIONS.md +325 -0
  22. openadapt_ml-0.2.2/docs/AZURE_DASHBOARD_SPEC.md +403 -0
  23. openadapt_ml-0.2.2/docs/CLEANUP_NOTES.md +277 -0
  24. openadapt_ml-0.2.2/docs/REPOSITORY_HISTORY.md +70 -0
  25. openadapt_ml-0.2.2/docs/REPO_CONSOLIDATION_PLAN.md +1076 -0
  26. openadapt_ml-0.2.2/docs/SEGMENTATION_TEST_PLAN.md +298 -0
  27. openadapt_ml-0.2.2/docs/SEGMENTATION_TEST_RESULTS.md +292 -0
  28. openadapt_ml-0.2.2/docs/VM_MONITOR_SCREENSHOT_IMPLEMENTATION.md +410 -0
  29. openadapt_ml-0.2.2/docs/WAA_PARALLELIZATION_DESIGN.md +331 -0
  30. openadapt_ml-0.2.2/docs/WAA_UNATTENDED_SCALABLE.md +298 -0
  31. openadapt_ml-0.2.2/docs/analysis_jan2026.md +491 -0
  32. openadapt_ml-0.2.2/docs/architecture_diagram.md +496 -0
  33. openadapt_ml-0.2.2/docs/desktop_app_plan.md +389 -0
  34. openadapt_ml-0.2.2/docs/enterprise/COORDS_VS_MARKS_ABLATION.md +99 -0
  35. openadapt_ml-0.2.2/docs/enterprise/README.md +44 -0
  36. openadapt_ml-0.2.2/docs/experiments/representation_shootout_design.md +396 -0
  37. openadapt_ml-0.2.2/docs/experiments/waa_benchmark_results_jan2026.md +148 -0
  38. openadapt_ml-0.2.2/docs/github_org_profile_content.md +266 -0
  39. openadapt_ml-0.2.2/docs/github_org_update_plan.md +492 -0
  40. openadapt_ml-0.2.2/docs/grpo_training_report.md +997 -0
  41. openadapt_ml-0.2.2/docs/live_benchmark_monitoring_fix.md +265 -0
  42. openadapt_ml-0.2.2/docs/new_openadapt_architecture.md +849 -0
  43. openadapt_ml-0.2.2/docs/openadapt_integration_plan.md +594 -0
  44. openadapt_ml-0.2.2/docs/perception_integration.md +175 -0
  45. openadapt_ml-0.2.2/docs/qwen3_vl_embedding_design.md +2420 -0
  46. openadapt_ml-0.2.2/docs/qwen3_vl_embedding_literature_review.md +892 -0
  47. openadapt_ml-0.2.2/docs/qwen3_vl_embedding_research.md +569 -0
  48. openadapt_ml-0.2.2/docs/research/cua_waa_comparison.md +607 -0
  49. openadapt_ml-0.2.2/docs/safety_gate_design.md +376 -0
  50. openadapt_ml-0.2.2/docs/screenshots/vm_monitor_dashboard_full.png +0 -0
  51. openadapt_ml-0.2.2/docs/screenshots/vm_monitor_details.png +0 -0
  52. openadapt_ml-0.2.2/docs/screenshots/vm_monitor_terminal.png +0 -0
  53. openadapt_ml-0.2.2/docs/trl_unsloth_integration_analysis.md +1188 -0
  54. openadapt_ml-0.2.2/docs/viewer_architecture_survey.md +610 -0
  55. openadapt_ml-0.2.2/docs/viewer_consolidation_design.md +501 -0
  56. openadapt_ml-0.2.2/docs/viewer_redesign_proposal.md +780 -0
  57. openadapt_ml-0.2.2/docs/vm_monitor_screenshot_analysis.md +609 -0
  58. openadapt_ml-0.2.2/docs/waa_speedup_options.md +94 -0
  59. openadapt_ml-0.2.2/docs/waa_vanilla_automation.md +73 -0
  60. openadapt_ml-0.2.2/docs/website_redesign_plan.md +592 -0
  61. openadapt_ml-0.2.2/experiment_results/representation_shootout/results_20260116_142335.json +96 -0
  62. openadapt_ml-0.2.2/experiments/qwen_login/2b_dev_fixed/plots/qwen_base_vs_ft.png +0 -0
  63. openadapt_ml-0.2.2/experiments/qwen_login/registration_som_eval.json +20 -0
  64. openadapt_ml-0.2.2/openadapt_ml/baselines/__init__.py +121 -0
  65. openadapt_ml-0.2.2/openadapt_ml/baselines/adapter.py +185 -0
  66. openadapt_ml-0.2.2/openadapt_ml/baselines/cli.py +314 -0
  67. openadapt_ml-0.2.2/openadapt_ml/baselines/config.py +448 -0
  68. openadapt_ml-0.2.2/openadapt_ml/baselines/parser.py +922 -0
  69. openadapt_ml-0.2.2/openadapt_ml/baselines/prompts.py +787 -0
  70. openadapt_ml-0.2.2/openadapt_ml/benchmarks/__init__.py +31 -0
  71. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/benchmarks/agent.py +265 -421
  72. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/benchmarks/azure.py +28 -19
  73. openadapt_ml-0.2.2/openadapt_ml/benchmarks/azure_ops_tracker.py +521 -0
  74. openadapt_ml-0.2.2/openadapt_ml/benchmarks/cli.py +2007 -0
  75. openadapt_ml-0.2.2/openadapt_ml/benchmarks/trace_export.py +631 -0
  76. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/benchmarks/viewer.py +22 -5
  77. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/benchmarks/vm_monitor.py +530 -29
  78. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/benchmarks/waa_deploy/Dockerfile +47 -53
  79. openadapt_ml-0.2.2/openadapt_ml/benchmarks/waa_deploy/__init__.py +10 -0
  80. openadapt_ml-0.2.2/openadapt_ml/benchmarks/waa_deploy/api_agent.py +540 -0
  81. openadapt_ml-0.2.2/openadapt_ml/benchmarks/waa_deploy/start_waa_server.bat +53 -0
  82. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/cloud/azure_inference.py +3 -5
  83. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/cloud/lambda_labs.py +722 -307
  84. openadapt_ml-0.2.2/openadapt_ml/cloud/local.py +3895 -0
  85. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/cloud/ssh_tunnel.py +68 -26
  86. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/datasets/next_action.py +40 -30
  87. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/evals/grounding.py +8 -3
  88. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/evals/plot_eval_metrics.py +15 -13
  89. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/evals/trajectory_matching.py +41 -26
  90. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/demo_prompt/format_demo.py +16 -6
  91. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/demo_prompt/run_experiment.py +26 -16
  92. openadapt_ml-0.2.2/openadapt_ml/experiments/representation_shootout/__init__.py +70 -0
  93. openadapt_ml-0.2.2/openadapt_ml/experiments/representation_shootout/conditions.py +708 -0
  94. openadapt_ml-0.2.2/openadapt_ml/experiments/representation_shootout/config.py +390 -0
  95. openadapt_ml-0.2.2/openadapt_ml/experiments/representation_shootout/evaluator.py +659 -0
  96. openadapt_ml-0.2.2/openadapt_ml/experiments/representation_shootout/runner.py +687 -0
  97. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/waa_demo/runner.py +29 -14
  98. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/export/parquet.py +36 -24
  99. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/grounding/detector.py +18 -14
  100. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/ingest/__init__.py +8 -6
  101. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/ingest/capture.py +25 -22
  102. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/ingest/loader.py +7 -4
  103. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/ingest/synthetic.py +189 -100
  104. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/models/api_adapter.py +14 -4
  105. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/models/base_adapter.py +10 -2
  106. openadapt_ml-0.2.2/openadapt_ml/models/providers/__init__.py +288 -0
  107. openadapt_ml-0.2.2/openadapt_ml/models/providers/anthropic.py +266 -0
  108. openadapt_ml-0.2.2/openadapt_ml/models/providers/base.py +299 -0
  109. openadapt_ml-0.2.2/openadapt_ml/models/providers/google.py +376 -0
  110. openadapt_ml-0.2.2/openadapt_ml/models/providers/openai.py +342 -0
  111. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/models/qwen_vl.py +46 -19
  112. openadapt_ml-0.2.2/openadapt_ml/perception/__init__.py +35 -0
  113. openadapt_ml-0.2.2/openadapt_ml/perception/integration.py +399 -0
  114. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/demo_retriever.py +50 -24
  115. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/embeddings.py +9 -8
  116. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/retriever.py +3 -1
  117. openadapt_ml-0.2.2/openadapt_ml/runtime/__init__.py +50 -0
  118. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/runtime/policy.py +18 -5
  119. openadapt_ml-0.2.2/openadapt_ml/runtime/safety_gate.py +471 -0
  120. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/schema/__init__.py +9 -0
  121. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/schema/converters.py +74 -27
  122. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/schema/episode.py +31 -18
  123. openadapt_ml-0.2.2/openadapt_ml/scripts/capture_screenshots.py +530 -0
  124. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/compare.py +85 -54
  125. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/demo_policy.py +4 -1
  126. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/eval_policy.py +15 -9
  127. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/make_gif.py +1 -1
  128. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/prepare_synthetic.py +3 -1
  129. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/train.py +21 -9
  130. openadapt_ml-0.2.2/openadapt_ml/segmentation/README.md +920 -0
  131. openadapt_ml-0.2.2/openadapt_ml/segmentation/__init__.py +97 -0
  132. openadapt_ml-0.2.2/openadapt_ml/segmentation/adapters/__init__.py +5 -0
  133. openadapt_ml-0.2.2/openadapt_ml/segmentation/adapters/capture_adapter.py +420 -0
  134. openadapt_ml-0.2.2/openadapt_ml/segmentation/annotator.py +610 -0
  135. openadapt_ml-0.2.2/openadapt_ml/segmentation/cache.py +290 -0
  136. openadapt_ml-0.2.2/openadapt_ml/segmentation/cli.py +674 -0
  137. openadapt_ml-0.2.2/openadapt_ml/segmentation/deduplicator.py +656 -0
  138. openadapt_ml-0.2.2/openadapt_ml/segmentation/frame_describer.py +788 -0
  139. openadapt_ml-0.2.2/openadapt_ml/segmentation/pipeline.py +340 -0
  140. openadapt_ml-0.2.2/openadapt_ml/segmentation/schemas.py +622 -0
  141. openadapt_ml-0.2.2/openadapt_ml/segmentation/segment_extractor.py +634 -0
  142. openadapt_ml-0.2.2/openadapt_ml/training/azure_ops_viewer.py +1097 -0
  143. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/training/benchmark_viewer.py +52 -41
  144. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/training/shared_ui.py +7 -7
  145. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/training/stub_provider.py +57 -35
  146. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/training/trainer.py +143 -86
  147. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/training/trl_trainer.py +70 -21
  148. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/training/viewer.py +323 -108
  149. openadapt_ml-0.2.2/openadapt_ml/training/viewer_components.py +180 -0
  150. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/pyproject.toml +21 -3
  151. openadapt_ml-0.2.2/scripts/generate_vm_screenshots.py +193 -0
  152. openadapt_ml-0.2.2/scripts/generate_vm_screenshots_simple.py +190 -0
  153. openadapt_ml-0.2.2/scripts/p1_episode_success_ab_test.py +967 -0
  154. openadapt_ml-0.2.2/scripts/waa_bootstrap_helper.sh +85 -0
  155. openadapt_ml-0.2.2/scripts/waa_bootstrap_local.sh +132 -0
  156. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/benchmarks/test_api_agent.py +2 -2
  157. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/benchmarks/test_waa.py +9 -7
  158. openadapt_ml-0.2.2/tests/integration/test_benchmark_viewer.py +61 -0
  159. openadapt_ml-0.2.2/tests/integration/test_data_collection.py +170 -0
  160. openadapt_ml-0.2.2/tests/integration/test_live_eval.py +79 -0
  161. openadapt_ml-0.2.2/tests/integration/test_sse_endpoint.py +88 -0
  162. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_api_adapter.py +8 -0
  163. openadapt_ml-0.2.2/tests/test_baselines.py +619 -0
  164. openadapt_ml-0.2.2/tests/test_batching.py +54 -0
  165. openadapt_ml-0.2.2/tests/test_capture_adapter.py +48 -0
  166. openadapt_ml-0.2.2/tests/test_demo_persistence.py +400 -0
  167. openadapt_ml-0.2.2/tests/test_gemini_grounding_imports.py +190 -0
  168. openadapt_ml-0.2.2/tests/test_mock_labeling.py +85 -0
  169. openadapt_ml-0.2.2/tests/test_negative_control.py +265 -0
  170. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_parquet_export.py +3 -3
  171. openadapt_ml-0.2.2/tests/test_providers.py +492 -0
  172. openadapt_ml-0.2.2/tests/test_segmentation_pipeline.py +293 -0
  173. openadapt_ml-0.2.2/tests/test_terminal_output.py +28 -0
  174. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_trl_trainer.py +116 -0
  175. openadapt_ml-0.2.2/tests/test_viewer_screenshots.py +40 -0
  176. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/uv.lock +1157 -43
  177. openadapt_ml-0.2.0/.github/workflows/publish.yml +0 -30
  178. openadapt_ml-0.2.0/docs/azure_acr_authentication.md +0 -159
  179. openadapt_ml-0.2.0/docs/waa_setup.md +0 -315
  180. openadapt_ml-0.2.0/openadapt_ml/benchmarks/__init__.py +0 -133
  181. openadapt_ml-0.2.0/openadapt_ml/benchmarks/base.py +0 -366
  182. openadapt_ml-0.2.0/openadapt_ml/benchmarks/cli.py +0 -5132
  183. openadapt_ml-0.2.0/openadapt_ml/benchmarks/data_collection.py +0 -432
  184. openadapt_ml-0.2.0/openadapt_ml/benchmarks/live_tracker.py +0 -180
  185. openadapt_ml-0.2.0/openadapt_ml/benchmarks/runner.py +0 -418
  186. openadapt_ml-0.2.0/openadapt_ml/benchmarks/waa.py +0 -761
  187. openadapt_ml-0.2.0/openadapt_ml/benchmarks/waa_live.py +0 -619
  188. openadapt_ml-0.2.0/openadapt_ml/cloud/local.py +0 -2344
  189. openadapt_ml-0.2.0/scripts/fix_acr_auth.py +0 -212
  190. openadapt_ml-0.2.0/tests/test_waa_live.py +0 -314
  191. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/.env.example +0 -0
  192. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/.gitmodules +0 -0
  193. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/.python-version +0 -0
  194. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/LICENSE +0 -0
  195. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/RETRIEVAL_QUICKSTART.md +0 -0
  196. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen2_5vl_synthetic.yaml +0 -0
  197. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_capture.yaml +0 -0
  198. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_capture_4bit.yaml +0 -0
  199. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_capture_batched.yaml +0 -0
  200. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_synthetic.yaml +0 -0
  201. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_synthetic_coord_v2.yaml +0 -0
  202. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_synthetic_dev.yaml +0 -0
  203. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_synthetic_registration_som.yaml +0 -0
  204. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/configs/qwen3vl_synthetic_som.yaml +0 -0
  205. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2/deprecated}/docs/azure_waa_setup.md +0 -0
  206. {openadapt_ml-0.2.0/openadapt_ml/benchmarks → openadapt_ml-0.2.2/deprecated}/waa_deploy/__init__.py +0 -0
  207. {openadapt_ml-0.2.0/openadapt_ml/benchmarks → openadapt_ml-0.2.2/deprecated}/waa_deploy/start_waa_server.bat +0 -0
  208. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/GEMINI_GROUNDING_QUICKSTART.md +0 -0
  209. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/IMPLEMENTATION_SUMMARY_GEMINI_GROUNDING.md +0 -0
  210. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/NEXT_STEPS_GROUNDING_ARCHITECTURE.md +0 -0
  211. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/PRIORITY_2_COMPLETION_SUMMARY.md +0 -0
  212. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/PRIVACY_IMPLEMENTATION_PLAN.md +0 -0
  213. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/RECORD_IMPLEMENTATION_PLAN.md +0 -0
  214. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/auto_shutoff_design.md +0 -0
  215. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/background_task_visibility.md +0 -0
  216. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/batching_and_schedulers.md +0 -0
  217. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/benchmark_integration_plan.md +0 -0
  218. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/benchmark_next_steps.md +0 -0
  219. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/benchmark_run_ui_design.md +0 -0
  220. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/benchmark_viewer_integration.md +0 -0
  221. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/benchmark_viewer_phase2.md +0 -0
  222. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/benchmark_viewer_ux_improvements.md +0 -0
  223. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/capture_format_decision.md +0 -0
  224. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/chrome_extension_design.md +0 -0
  225. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/cloud_gpu_training.md +0 -0
  226. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/current_state_dec2024.md +0 -0
  227. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/dashboard_architecture.md +0 -0
  228. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/demo_prompt_experiment.md +0 -0
  229. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/demo_retrieval_design.md +0 -0
  230. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/design.md +0 -0
  231. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/early_termination.md +0 -0
  232. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/enterprise_integration.md +0 -0
  233. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/eval_json_schema.md +0 -0
  234. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/experiments/demo_conditioned_prompting_results.md +0 -0
  235. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/experiments/multi_step_experiment_design.md +0 -0
  236. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/experiments/waa_demo_experiment_design.md +0 -0
  237. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/gemini_grounding.md +0 -0
  238. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/gui_actor_integration.md +0 -0
  239. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/benchmark_viewer.png +0 -0
  240. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/dashboard/training_bottom.png +0 -0
  241. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/dashboard/training_top.png +0 -0
  242. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/dashboard/viewer_bottom.png +0 -0
  243. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/dashboard/viewer_top.png +0 -0
  244. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/grounding_demo.png +0 -0
  245. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/grounding_demo_full.png +0 -0
  246. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/training-dashboard.png +0 -0
  247. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/images/viewer-comparison.png +0 -0
  248. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/infra_refactor_design.md +0 -0
  249. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/live_inference_design.md +0 -0
  250. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/mock_adapter_evaluation_fix.md +0 -0
  251. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/openadapt_capture_migration_detailed.md +0 -0
  252. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/openadapt_capture_migration_plan.md +0 -0
  253. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/opencua_integration.md +0 -0
  254. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/output_artifacts_and_media.md +0 -0
  255. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/parallelization_implementation.md +0 -0
  256. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/parquet_export_design.md +0 -0
  257. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/prediction_loading_architecture.md +0 -0
  258. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/qwen_login_experiment.md +0 -0
  259. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/research_thesis.md +0 -0
  260. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/roadmap.md +0 -0
  261. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/schema/README.md +0 -0
  262. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/schema/episode.schema.json +0 -0
  263. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/schema_consolidation_plan.md +0 -0
  264. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/semantic_element_capture.md +0 -0
  265. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/set_of_marks_implementation.md +0 -0
  266. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/smart_mock_agent_design.md +0 -0
  267. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/som_implementation_verification.md +0 -0
  268. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/sse_architecture.md +0 -0
  269. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/sse_benchmark_endpoint.md +0 -0
  270. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/sse_frontend_integration.md +0 -0
  271. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/sse_quick_reference.md +0 -0
  272. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/sse_usage_examples.md +0 -0
  273. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/state_and_next_steps_qwen_login.md +0 -0
  274. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/stub_training_adapter.md +0 -0
  275. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/synthetic_login_jitter_and_ablation.md +0 -0
  276. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/training_feedback_ux.md +0 -0
  277. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/unified_compute_architecture.md +0 -0
  278. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/viewer_eval_integration.md +0 -0
  279. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/viewer_layout_redesign.md +0 -0
  280. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/vision.md +0 -0
  281. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/waa_demo_recording_guide.md +0 -0
  282. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/waa_live_adapter_design.md +0 -0
  283. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/waa_network_architecture.md +0 -0
  284. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/waa_parallelization_plan.md +0 -0
  285. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/docs/wandb_integration.md +0 -0
  286. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/examples/README.md +0 -0
  287. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/examples/demo_retrieval_example.py +0 -0
  288. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/examples/retrieval_with_capture.py +0 -0
  289. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/examples/sample_data.json +0 -0
  290. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/examples/test_gemini_grounding.py +0 -0
  291. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/examples/train_from_json.py +0 -0
  292. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/2b_dev/media/qwen3_2b_login_demo.gif +0 -0
  293. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/2b_dev/media/qwen3_2b_login_demo_session_0001.gif +0 -0
  294. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/2b_dev/plots/base_vs_ft.png +0 -0
  295. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/2b_dev/plots/qwen3_2b_base_vs_ft_hardened_v2.png +0 -0
  296. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/2b_dev/plots/qwen_vs_apis.png +0 -0
  297. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/8b_hero/plots/qwen3_8b_base_vs_ft_hardened_v2.png +0 -0
  298. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/SOM_INVESTIGATION_REPORT.md +0 -0
  299. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/comprehensive_comparison.png +0 -0
  300. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/login_demo.gif +0 -0
  301. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/experiments/qwen_login/registration_demo.gif +0 -0
  302. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/negative_control_results/NEGATIVE_CONTROL_REPORT.md +0 -0
  303. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/negative_control_results/RESULTS_SUMMARY.txt +0 -0
  304. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/negative_control_results/negative_control_20251231_005135.json +0 -0
  305. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/__init__.py +0 -0
  306. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/cloud/__init__.py +0 -0
  307. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/config.py +0 -0
  308. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/datasets/__init__.py +0 -0
  309. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/evals/__init__.py +0 -0
  310. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/demo_prompt/__init__.py +0 -0
  311. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/demo_prompt/results/experiment_20251231_002125.json +0 -0
  312. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/demo_prompt/results/experiment_n30_20251231_165958.json +0 -0
  313. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/demo_prompt/results/multistep_20251231_025051.json +0 -0
  314. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/waa_demo/__init__.py +0 -0
  315. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/waa_demo/demos.py +0 -0
  316. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/experiments/waa_demo/tasks.py +0 -0
  317. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/export/__init__.py +0 -0
  318. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/export/__main__.py +0 -0
  319. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/export/cli.py +0 -0
  320. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/grounding/__init__.py +0 -0
  321. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/grounding/base.py +0 -0
  322. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/models/__init__.py +0 -0
  323. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/models/dummy_adapter.py +0 -0
  324. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/README.md +0 -0
  325. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/USAGE.md +0 -0
  326. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/__init__.py +0 -0
  327. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/retrieval/index.py +0 -0
  328. {openadapt_ml-0.2.0/openadapt_ml/runtime → openadapt_ml-0.2.2/openadapt_ml/scripts}/__init__.py +0 -0
  329. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/openadapt_ml/scripts/run_qwen_login_benchmark.py +0 -0
  330. {openadapt_ml-0.2.0/openadapt_ml/scripts → openadapt_ml-0.2.2/openadapt_ml/training}/__init__.py +0 -0
  331. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/scripts/p0_validate_demo_persistence.py +0 -0
  332. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/scripts/run_demo_experiment.py +0 -0
  333. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/scripts/run_demo_experiment_n30.py +0 -0
  334. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/scripts/run_multistep_experiment.py +0 -0
  335. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/scripts/setup_azure.py +0 -0
  336. {openadapt_ml-0.2.0/openadapt_ml/training → openadapt_ml-0.2.2/tests}/__init__.py +0 -0
  337. {openadapt_ml-0.2.0/tests → openadapt_ml-0.2.2/tests/benchmarks}/__init__.py +0 -0
  338. {openadapt_ml-0.2.0/tests/benchmarks → openadapt_ml-0.2.2/tests/integration}/__init__.py +0 -0
  339. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_action_parsing.py +0 -0
  340. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_demo_retrieval.py +0 -0
  341. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_local_cli.py +0 -0
  342. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_retrieval.py +0 -0
  343. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_training_dummy.py +0 -0
  344. {openadapt_ml-0.2.0 → openadapt_ml-0.2.2}/tests/test_waa_demo.py +0 -0
@@ -0,0 +1,48 @@
1
+ name: Release and PyPI Publish
2
+
3
+ on:
4
+ push:
5
+ branches:
6
+ - main
7
+
8
+ jobs:
9
+ release:
10
+ runs-on: ubuntu-latest
11
+ concurrency: release
12
+ permissions:
13
+ id-token: write
14
+ contents: write
15
+
16
+ steps:
17
+ - name: Checkout repository
18
+ uses: actions/checkout@v4
19
+ with:
20
+ fetch-depth: 0
21
+
22
+ - name: Set up Python
23
+ uses: actions/setup-python@v5
24
+ with:
25
+ python-version: '3.12'
26
+
27
+ - name: Install uv
28
+ uses: astral-sh/setup-uv@v4
29
+
30
+ - name: Python Semantic Release
31
+ id: release
32
+ uses: python-semantic-release/python-semantic-release@v9.15.2
33
+ with:
34
+ github_token: ${{ secrets.GITHUB_TOKEN }}
35
+
36
+ - name: Build package
37
+ if: steps.release.outputs.released == 'true'
38
+ run: uv build
39
+
40
+ - name: Publish to PyPI
41
+ if: steps.release.outputs.released == 'true'
42
+ uses: pypa/gh-action-pypi-publish@release/v1
43
+
44
+ - name: Publish to GitHub Releases
45
+ if: steps.release.outputs.released == 'true'
46
+ uses: python-semantic-release/publish-action@v9.15.2
47
+ with:
48
+ github_token: ${{ secrets.GITHUB_TOKEN }}
@@ -0,0 +1,41 @@
1
+ name: Test
2
+
3
+ on:
4
+ pull_request:
5
+ branches:
6
+ - '**'
7
+ push:
8
+ branches:
9
+ - main
10
+
11
+ jobs:
12
+ test:
13
+ runs-on: ${{ matrix.os }}
14
+ strategy:
15
+ matrix:
16
+ os: [ubuntu-latest, macos-latest]
17
+ python-version: ['3.10', '3.11']
18
+
19
+ steps:
20
+ - name: Checkout code
21
+ uses: actions/checkout@v4
22
+
23
+ - name: Install uv
24
+ uses: astral-sh/setup-uv@v4
25
+ with:
26
+ version: "latest"
27
+
28
+ - name: Set up Python ${{ matrix.python-version }}
29
+ run: uv python install ${{ matrix.python-version }}
30
+
31
+ - name: Install dependencies
32
+ run: uv sync --all-extras
33
+
34
+ - name: Run ruff linter (check)
35
+ run: uv run ruff check openadapt_ml/
36
+
37
+ - name: Run ruff formatter (check)
38
+ run: uv run ruff format --check openadapt_ml/
39
+
40
+ - name: Run pytest
41
+ run: uv run pytest tests/ -v
@@ -1,6 +1,7 @@
1
1
  # Python-generated files
2
2
  __pycache__/
3
3
  *.py[oc]
4
+ *.pyc
4
5
  build/
5
6
  dist/
6
7
  wheels/
@@ -17,6 +18,7 @@ local_context_openadapt_ml_internal.md
17
18
  synthetic/
18
19
  synthetic_train/
19
20
  synthetic_train_dev/
21
+ synthetic_*/
20
22
 
21
23
  # Local OS cruft
22
24
  .DS_Store
@@ -36,7 +38,37 @@ checkpoints_*/
36
38
  eval_*.json
37
39
  benchmark_results/
38
40
  debug_*/
41
+ training_output*/
42
+
43
+ # JSONL data files (generated during experiments)
44
+ *.jsonl
45
+
46
+ # Live benchmark tracking
47
+ benchmark_live.json
48
+
49
+ # Experiment results directories
50
+ p0_results/
51
+ p1_results/
52
+
53
+ # External dependencies (cloned repos, vendored code)
54
+ external/
55
+
56
+ # Demo recordings
57
+ demos/
58
+
59
+ # Pytest cache
60
+ .pytest_cache/
61
+
62
+ # Coverage files
63
+ .coverage
64
+ .coverage.*
65
+ htmlcov/
66
+
67
+ # Analysis/debug artifacts
68
+ cli_analysis.json
69
+ dead_code_candidates.json
70
+ segmentation_output/
39
71
 
40
72
  # Internal documentation (not for public repo)
41
73
  docs/internal/
42
- docs/internal/
74
+ docs/private/