verifiers 0.1.15.dev15__tar.gz → 0.1.15.dev16__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (312) hide show
  1. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/PKG-INFO +1 -1
  2. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_init_script.py +10 -7
  3. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/__init__.py +1 -1
  4. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/init.py +42 -32
  5. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/.gitignore +0 -0
  6. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/LICENSE +0 -0
  7. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/README.md +0 -0
  8. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/pyproject.toml +0 -0
  9. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/AGENTS.md +0 -0
  10. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/README.md +0 -0
  11. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/__init__.py +0 -0
  12. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/conftest.py +0 -0
  13. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_browser_env.py +0 -0
  14. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_build_script.py +0 -0
  15. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_cli_agent_env.py +0 -0
  16. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_client_auth_errors.py +0 -0
  17. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_client_config.py +0 -0
  18. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_client_multimodal_types.py +0 -0
  19. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_composable_env.py +0 -0
  20. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_context_token_metrics.py +0 -0
  21. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_decorator_ranks.py +0 -0
  22. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_endpoint_registry.py +0 -0
  23. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_env_group.py +0 -0
  24. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_env_server.py +0 -0
  25. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_environment.py +0 -0
  26. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_environment_extra.py +0 -0
  27. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_envs.py +0 -0
  28. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_error_chain.py +0 -0
  29. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_eval_cli.py +0 -0
  30. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_eval_display.py +0 -0
  31. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_eval_utils.py +0 -0
  32. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_gepa_cli.py +0 -0
  33. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_gepa_utils.py +0 -0
  34. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_gym_env.py +0 -0
  35. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_harbor_env_mcp.py +0 -0
  36. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_imports.py +0 -0
  37. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_install_utils.py +0 -0
  38. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_interception_utils.py +0 -0
  39. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_langchain_deep_agents_wikispeedia.py +0 -0
  40. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_lean_task.py +0 -0
  41. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_logging.py +0 -0
  42. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_math_rubric.py +0 -0
  43. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_maybe_think_parser.py +0 -0
  44. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_mcp_search_env.py +0 -0
  45. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_message_utils.py +0 -0
  46. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_message_utils_multimodal.py +0 -0
  47. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_multiturn_env.py +0 -0
  48. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_nemorl_client.py +0 -0
  49. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openai_chat_completions_token_client.py +0 -0
  50. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openai_responses_client.py +0 -0
  51. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_opencode_harbor.py +0 -0
  52. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_opencode_rlm_env.py +0 -0
  53. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openenv_client.py +0 -0
  54. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_parser.py +0 -0
  55. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_path_utils.py +0 -0
  56. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_per_turn_timing.py +0 -0
  57. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_pricing_utils.py +0 -0
  58. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_prime_plugin.py +0 -0
  59. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_renderer_client.py +0 -0
  60. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_renderer_e2e.py +0 -0
  61. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rlm_composable_env.py +0 -0
  62. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rlm_env.py +0 -0
  63. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rubric.py +0 -0
  64. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rubric_group.py +0 -0
  65. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_sandbox_env.py +0 -0
  66. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_sandbox_mixin.py +0 -0
  67. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_save_utils.py +0 -0
  68. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_setup_script.py +0 -0
  69. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_singleturn_env.py +0 -0
  70. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_stateful_tool_env.py +0 -0
  71. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_think_parser.py +0 -0
  72. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_tool_env.py +0 -0
  73. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_tool_utils.py +0 -0
  74. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_trajectory_processing.py +0 -0
  75. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_tui_info_formatting.py +0 -0
  76. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_types.py +0 -0
  77. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_bfcl.py +0 -0
  78. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_config_extension.py +0 -0
  79. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_empty_completions.py +0 -0
  80. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_endpoint_protocols.py +0 -0
  81. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_example_counts.py +0 -0
  82. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_group_reward_env.py +0 -0
  83. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_harbor_cli.py +0 -0
  84. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_mini_swe_agent.py +0 -0
  85. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_nemo_gym_harness.py +0 -0
  86. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_openenv_taskset.py +0 -0
  87. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_openreward_taskset.py +0 -0
  88. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_rlm_swe.py +0 -0
  89. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_runtime_lifecycle.py +0 -0
  90. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_scoring_functions.py +0 -0
  91. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_taskset_bindings.py +0 -0
  92. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_textarena_taskset.py +0 -0
  93. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_wiki_search_v1.py +0 -0
  94. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_wordle_env.py +0 -0
  95. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_wordle_v1_env.py +0 -0
  96. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_xml_parser.py +0 -0
  97. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/AGENTS.md +0 -0
  98. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/__init__.py +0 -0
  99. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/__init__.py +0 -0
  100. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/build.py +0 -0
  101. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/eval.py +0 -0
  102. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/gepa.py +0 -0
  103. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/init.py +0 -0
  104. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/install.py +0 -0
  105. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/setup.py +0 -0
  106. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/plugins/__init__.py +0 -0
  107. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/plugins/prime.py +0 -0
  108. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/tui.py +0 -0
  109. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/__init__.py +0 -0
  110. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/anthropic_messages_client.py +0 -0
  111. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/client.py +0 -0
  112. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/nemorl_chat_completions_client.py +0 -0
  113. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_chat_completions_client.py +0 -0
  114. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_chat_completions_token_client.py +0 -0
  115. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_completions_client.py +0 -0
  116. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_responses_client.py +0 -0
  117. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/renderer_client.py +0 -0
  118. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/decorators.py +0 -0
  119. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/AGENTS.md +0 -0
  120. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/__init__.py +0 -0
  121. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/env_group.py +0 -0
  122. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/environment.py +0 -0
  123. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/README.md +0 -0
  124. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/__init__.py +0 -0
  125. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/cli_agent_env.py +0 -0
  126. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/README.md +0 -0
  127. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/__init__.py +0 -0
  128. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/_filter.py +0 -0
  129. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/composable_env.py +0 -0
  130. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harness.py +0 -0
  131. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/__init__.py +0 -0
  132. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/mini_swe_agent.py +0 -0
  133. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/opencode.py +0 -0
  134. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/prompt.txt +0 -0
  135. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/rlm.py +0 -0
  136. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/swe_debug_env.py +0 -0
  137. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/task.py +0 -0
  138. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/__init__.py +0 -0
  139. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/cp/__init__.py +0 -0
  140. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/cp/cp_task.py +0 -0
  141. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/cp/test_utils.py +0 -0
  142. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/harbor/__init__.py +0 -0
  143. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/harbor/harbor.py +0 -0
  144. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/lean/__init__.py +0 -0
  145. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/lean/lean_task.py +0 -0
  146. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/math/__init__.py +0 -0
  147. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/math/math_task.py +0 -0
  148. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/__init__.py +0 -0
  149. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/_test_patch.py +0 -0
  150. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/create_fix_patch.sh +0 -0
  151. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/log_parser.py +0 -0
  152. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/multi_swe.py +0 -0
  153. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/openswe.py +0 -0
  154. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/r2e_gym.py +0 -0
  155. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_bench.py +0 -0
  156. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_lego.py +0 -0
  157. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_rebench_v2.py +0 -0
  158. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_rebench_v2_log_parsers.py +0 -0
  159. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_smith.py +0 -0
  160. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_tasksets.py +0 -0
  161. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/gym_env.py +0 -0
  162. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/__init__.py +0 -0
  163. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/env.py +0 -0
  164. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/mcp.py +0 -0
  165. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/mcp_env.py +0 -0
  166. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/opencode_env.py +0 -0
  167. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/opencode_qa_env.py +0 -0
  168. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/opencode_rlm_env.py +0 -0
  169. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/rlm_env.py +0 -0
  170. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/sandbox_mixin.py +0 -0
  171. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/utils/__init__.py +0 -0
  172. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/utils/file_locks.py +0 -0
  173. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/utils/git_checkout_cache.py +0 -0
  174. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/README.md +0 -0
  175. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/__init__.py +0 -0
  176. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/README.md +0 -0
  177. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/__init__.py +0 -0
  178. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/browser_env.py +0 -0
  179. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/__init__.py +0 -0
  180. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/base.py +0 -0
  181. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/cua_mode.py +0 -0
  182. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/dom_mode.py +0 -0
  183. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/openenv_env.py +0 -0
  184. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/reasoninggym_env.py +0 -0
  185. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/textarena_env.py +0 -0
  186. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/multiturn_env.py +0 -0
  187. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/python_env.py +0 -0
  188. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/sandbox_env.py +0 -0
  189. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/singleturn_env.py +0 -0
  190. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/stateful_tool_env.py +0 -0
  191. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/tool_env.py +0 -0
  192. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/errors.py +0 -0
  193. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/__init__.py +0 -0
  194. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/adapter.py +0 -0
  195. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/config.py +0 -0
  196. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/display.py +0 -0
  197. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/gepa_utils.py +0 -0
  198. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/__init__.py +0 -0
  199. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/maybe_think_parser.py +0 -0
  200. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/parser.py +0 -0
  201. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/think_parser.py +0 -0
  202. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/xml_parser.py +0 -0
  203. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/README.md +0 -0
  204. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/__init__.py +0 -0
  205. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/inference/__init__.py +0 -0
  206. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/inference/client.py +0 -0
  207. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/inference/server.py +0 -0
  208. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/__init__.py +0 -0
  209. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/config.py +0 -0
  210. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/orchestrator.py +0 -0
  211. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/trainer.py +0 -0
  212. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/utils.py +0 -0
  213. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/__init__.py +0 -0
  214. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/experimental/hybrid_math_rubric.py +0 -0
  215. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/judge_rubric.py +0 -0
  216. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/math_rubric.py +0 -0
  217. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/rubric.py +0 -0
  218. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/rubric_group.py +0 -0
  219. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/__init__.py +0 -0
  220. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/build.py +0 -0
  221. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/eval.py +0 -0
  222. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/gepa.py +0 -0
  223. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/install.py +0 -0
  224. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/rl.py +0 -0
  225. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/setup.py +0 -0
  226. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/train.py +0 -0
  227. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/tui.py +0 -0
  228. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/vllm.py +0 -0
  229. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/__init__.py +0 -0
  230. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/client/env_client.py +0 -0
  231. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/client/zmq_env_client.py +0 -0
  232. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/__init__.py +0 -0
  233. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/env_router.py +0 -0
  234. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/env_server.py +0 -0
  235. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/env_worker.py +0 -0
  236. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/zmq_env_server.py +0 -0
  237. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/types.py +0 -0
  238. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/types.py +0 -0
  239. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/__init__.py +0 -0
  240. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/async_utils.py +0 -0
  241. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/client_utils.py +0 -0
  242. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/config_utils.py +0 -0
  243. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/data_utils.py +0 -0
  244. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/display_utils.py +0 -0
  245. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/env_config_utils.py +0 -0
  246. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/env_utils.py +0 -0
  247. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/error_utils.py +0 -0
  248. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/eval_display.py +0 -0
  249. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/eval_utils.py +0 -0
  250. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/heartbeat.py +0 -0
  251. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/import_utils.py +0 -0
  252. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/install_utils.py +0 -0
  253. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/interception_utils.py +0 -0
  254. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/logging_utils.py +0 -0
  255. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/message_utils.py +0 -0
  256. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/metric_utils.py +0 -0
  257. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/path_utils.py +0 -0
  258. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/pricing_utils.py +0 -0
  259. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/process_utils.py +0 -0
  260. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/response_utils.py +0 -0
  261. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/save_utils.py +0 -0
  262. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/serve_utils.py +0 -0
  263. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/thread_utils.py +0 -0
  264. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/threaded_sandbox_client.py +0 -0
  265. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/tool_utils.py +0 -0
  266. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/usage_utils.py +0 -0
  267. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/version_utils.py +0 -0
  268. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/ENVIRONMENT_BEST_PRACTICES.md +0 -0
  269. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/README.md +0 -0
  270. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/RE_MIGRATION.md +0 -0
  271. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/__init__.py +0 -0
  272. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/artifact.py +0 -0
  273. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/config.py +0 -0
  274. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/env.py +0 -0
  275. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/harness.py +0 -0
  276. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/model.py +0 -0
  277. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/program.py +0 -0
  278. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/runtime.py +0 -0
  279. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/runtime_handles.py +0 -0
  280. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/sandbox.py +0 -0
  281. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/state.py +0 -0
  282. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/task.py +0 -0
  283. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/taskset.py +0 -0
  284. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/toolset.py +0 -0
  285. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/types.py +0 -0
  286. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/user.py +0 -0
  287. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/__init__.py +0 -0
  288. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/binding_utils.py +0 -0
  289. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/config_callable_utils.py +0 -0
  290. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/config_utils.py +0 -0
  291. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/endpoint_utils.py +0 -0
  292. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/json_utils.py +0 -0
  293. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/judge_utils.py +0 -0
  294. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/lifecycle_utils.py +0 -0
  295. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/mcp_proxy_utils.py +0 -0
  296. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/mcp_utils.py +0 -0
  297. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/object_utils.py +0 -0
  298. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/program_utils.py +0 -0
  299. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/prompt_utils.py +0 -0
  300. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/runtime_owner_utils.py +0 -0
  301. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/runtime_registry.py +0 -0
  302. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/sandbox_program_utils.py +0 -0
  303. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/sandbox_python_utils.py +0 -0
  304. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/sandbox_utils.py +0 -0
  305. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/scoring_utils.py +0 -0
  306. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/serialization_utils.py +0 -0
  307. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/task_freeze_utils.py +0 -0
  308. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/taskset_utils.py +0 -0
  309. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/tool_utils.py +0 -0
  310. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/toolset_utils.py +0 -0
  311. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/trajectory_utils.py +0 -0
  312. {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/usage_utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: verifiers
3
- Version: 0.1.15.dev15
3
+ Version: 0.1.15.dev16
4
4
  Summary: Verifiers: Environments for LLM Reinforcement Learning
5
5
  Project-URL: Homepage, https://github.com/primeintellect-ai/verifiers
6
6
  Project-URL: Documentation, https://github.com/primeintellect-ai/verifiers
@@ -1,6 +1,4 @@
1
1
  from pathlib import Path
2
-
3
- import pytest
4
2
  import verifiers as vf
5
3
  from verifiers.scripts.init import init_environment
6
4
 
@@ -21,20 +19,23 @@ def test_init_default_writes_v0_stub(tmp_path: Path) -> None:
21
19
  assert "EnvTaskset" not in content
22
20
 
23
21
 
24
- def test_init_v1_writes_thin_taskset_template(tmp_path: Path) -> None:
22
+ def test_init_v1_writes_taskset_template(tmp_path: Path) -> None:
25
23
  init_environment("bar", path=str(tmp_path), v1=True)
26
24
  content = read_env_file(tmp_path, "bar")
27
25
 
28
26
  assert "class BarTasksetConfig(vf.TasksetConfig):" in content
29
27
  assert "class BarTaskset(vf.Taskset[BarTasksetConfig]):" in content
28
+ assert 'system_prompt: vf.SystemPrompt = "Answer exactly."' in content
29
+ assert '"""Taskset implementation for bar.' in content
30
+ assert 'def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:' in content
30
31
  assert (
31
- 'system_prompt: vf.SystemPrompt = "Replace this with the system prompt for bar."'
32
+ '"""Return serializable task records as a list, generator, or Dataset."""'
32
33
  in content
33
34
  )
34
- assert 'def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:' in content
35
35
  assert "def load_system_prompt" not in content
36
36
  assert "async def correct_answer(self, task: vf.Task, state: vf.State)" in content
37
37
  assert "def load_taskset(config: BarTasksetConfig) -> BarTaskset:" in content
38
+ assert '"""Typed taskset loader used by vf.load_taskset."""' in content
38
39
  assert "return BarTaskset(config=config)" in content
39
40
  assert "taskset=vf.load_taskset(config=config.taskset)" in content
40
41
  assert '"""Loader pattern for all Taskset/Harness environments."""' in content
@@ -53,8 +54,10 @@ def test_init_v1_template_loads_with_vf_load_environment(
53
54
 
54
55
  env = vf.load_environment("loadable-v1")
55
56
 
56
- with pytest.raises(RuntimeError, match="Load tasks"):
57
- env.get_dataset()
57
+ dataset = env.get_dataset()
58
+
59
+ assert len(dataset) == 1
60
+ assert dataset[0]["answer"] == "cba"
58
61
 
59
62
 
60
63
  def test_init_v1_with_harness_writes_harness_stub(tmp_path: Path) -> None:
@@ -1,4 +1,4 @@
1
- __version__ = "0.1.15.dev15"
1
+ __version__ = "0.1.15.dev16"
2
2
 
3
3
  import importlib
4
4
  import os
@@ -155,67 +155,72 @@ def load_environment(**kwargs) -> vf.Environment:
155
155
  raise NotImplementedError("Implement load_environment here.")
156
156
  """
157
157
 
158
- V1_ENVIRONMENT_TEMPLATE = """\
158
+ V1_TASKSET_TEMPLATE = """\
159
159
  import verifiers as vf
160
160
 
161
161
 
162
162
  class {taskset_config_name}(vf.TasksetConfig):
163
- system_prompt: vf.SystemPrompt = "Replace this with the system prompt for {env_id_dash}."
163
+ \"\"\"User-facing task settings for {env_id_dash}.\"\"\"
164
+
165
+ system_prompt: vf.SystemPrompt = "Answer exactly."
164
166
 
165
167
 
166
168
  class {taskset_name}(vf.Taskset[{taskset_config_name}]):
169
+ \"\"\"Taskset implementation for {env_id_dash}.
170
+
171
+ Add task loading, task-owned toolsets, user behavior, lifecycle hooks,
172
+ metrics, rewards, and advantages on this class.
173
+ \"\"\"
174
+
167
175
  def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:
168
- raise NotImplementedError("Load tasks for {env_id_dash}.")
176
+ \"\"\"Return serializable task records as a list, generator, or Dataset.\"\"\"
177
+ if split == "eval":
178
+ return []
179
+ return [
180
+ {
181
+ "prompt": [{"role": "user", "content": "Reverse abc."}],
182
+ "answer": "cba",
183
+ "max_turns": 1,
184
+ }
185
+ ]
169
186
 
170
187
  @vf.reward(weight=1.0)
171
188
  async def correct_answer(self, task: vf.Task, state: vf.State) -> float:
172
- raise NotImplementedError("Score a completed rollout for {env_id_dash}.")
189
+ \"\"\"Score the final assistant response for one rollout.\"\"\"
190
+ messages = vf.get_messages(state.get("completion") or [], role="assistant")
191
+ if not messages:
192
+ return 0.0
193
+ response = str(messages[-1].content or "").strip()
194
+ return float(response == task["answer"])
173
195
 
174
196
 
175
197
  def load_taskset(config: {taskset_config_name}) -> {taskset_name}:
198
+ \"\"\"Typed taskset loader used by vf.load_taskset.\"\"\"
176
199
  return {taskset_name}(config=config)
177
-
178
-
179
- def load_environment(config: vf.EnvConfig) -> vf.Env:
180
- \"\"\"Loader pattern for all Taskset/Harness environments.\"\"\"
181
- return vf.Env(
182
- taskset=vf.load_taskset(config=config.taskset),
183
- harness=vf.load_harness(config=config.harness),
184
- )
185
200
  """
186
201
 
187
- V1_HARNESS_ENVIRONMENT_TEMPLATE = """\
188
- import verifiers as vf
189
-
190
-
191
- class {taskset_config_name}(vf.TasksetConfig):
192
- system_prompt: vf.SystemPrompt = "Replace this with the system prompt for {env_id_dash}."
193
-
194
-
195
- class {taskset_name}(vf.Taskset[{taskset_config_name}]):
196
- def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:
197
- raise NotImplementedError("Load tasks for {env_id_dash}.")
198
-
199
- @vf.reward(weight=1.0)
200
- async def correct_answer(self, task: vf.Task, state: vf.State) -> float:
201
- raise NotImplementedError("Score a completed rollout for {env_id_dash}.")
202
202
 
203
+ V1_HARNESS_TEMPLATE = """\
203
204
 
204
205
  class {harness_config_name}(vf.HarnessConfig):
205
- pass
206
+ \"\"\"Execution settings for {env_id_dash}.\"\"\"
206
207
 
207
208
 
208
209
  class {harness_name}(vf.Harness[{harness_config_name}]):
209
- pass
210
+ \"\"\"Reusable execution behavior for {env_id_dash}.
210
211
 
211
-
212
- def load_taskset(config: {taskset_config_name}) -> {taskset_name}:
213
- return {taskset_name}(config=config)
212
+ Add harness-owned program, sandbox, endpoint, model, toolset, or lifecycle
213
+ behavior here when this environment owns a custom execution mechanism.
214
+ \"\"\"
214
215
 
215
216
 
216
217
  def load_harness(config: {harness_config_name}) -> {harness_name}:
218
+ \"\"\"Typed harness loader used by vf.load_harness.\"\"\"
217
219
  return {harness_name}(config=config)
220
+ """
221
+
218
222
 
223
+ V1_ENV_LOADER_TEMPLATE = """\
219
224
 
220
225
  def load_environment(config: vf.EnvConfig) -> vf.Env:
221
226
  \"\"\"Loader pattern for all Taskset/Harness environments.\"\"\"
@@ -225,6 +230,11 @@ def load_environment(config: vf.EnvConfig) -> vf.Env:
225
230
  )
226
231
  """
227
232
 
233
+ V1_ENVIRONMENT_TEMPLATE = V1_TASKSET_TEMPLATE + V1_ENV_LOADER_TEMPLATE
234
+ V1_HARNESS_ENVIRONMENT_TEMPLATE = (
235
+ V1_TASKSET_TEMPLATE + V1_HARNESS_TEMPLATE + V1_ENV_LOADER_TEMPLATE
236
+ )
237
+
228
238
  OPENENV_ENVIRONMENT_TEMPLATE = """\
229
239
  import verifiers as vf
230
240
  from tasksets import OpenEnvTaskset, OpenEnvTasksetConfig