verifiers 0.1.15.dev15__tar.gz → 0.1.15.dev16__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/PKG-INFO +1 -1
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_init_script.py +10 -7
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/__init__.py +1 -1
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/init.py +42 -32
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/.gitignore +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/LICENSE +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/pyproject.toml +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/AGENTS.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/conftest.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_browser_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_build_script.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_cli_agent_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_client_auth_errors.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_client_config.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_client_multimodal_types.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_composable_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_context_token_metrics.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_decorator_ranks.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_endpoint_registry.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_env_group.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_env_server.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_environment.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_environment_extra.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_envs.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_error_chain.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_eval_cli.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_eval_display.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_eval_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_gepa_cli.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_gepa_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_gym_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_harbor_env_mcp.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_imports.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_install_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_interception_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_langchain_deep_agents_wikispeedia.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_lean_task.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_logging.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_math_rubric.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_maybe_think_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_mcp_search_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_message_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_message_utils_multimodal.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_multiturn_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_nemorl_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openai_chat_completions_token_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openai_responses_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_opencode_harbor.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_opencode_rlm_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openenv_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_path_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_per_turn_timing.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_pricing_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_prime_plugin.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_renderer_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_renderer_e2e.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rlm_composable_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rlm_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rubric.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_rubric_group.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_sandbox_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_sandbox_mixin.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_save_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_setup_script.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_singleturn_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_stateful_tool_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_think_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_tool_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_tool_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_trajectory_processing.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_tui_info_formatting.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_types.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_bfcl.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_config_extension.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_empty_completions.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_endpoint_protocols.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_example_counts.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_group_reward_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_harbor_cli.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_mini_swe_agent.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_nemo_gym_harness.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_openenv_taskset.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_openreward_taskset.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_rlm_swe.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_runtime_lifecycle.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_scoring_functions.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_taskset_bindings.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_v1_textarena_taskset.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_wiki_search_v1.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_wordle_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_wordle_v1_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_xml_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/AGENTS.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/build.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/eval.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/gepa.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/init.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/install.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/commands/setup.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/plugins/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/plugins/prime.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/cli/tui.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/anthropic_messages_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/nemorl_chat_completions_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_chat_completions_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_chat_completions_token_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_completions_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_responses_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/renderer_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/decorators.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/AGENTS.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/env_group.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/environment.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/cli_agent_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/_filter.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/composable_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harness.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/mini_swe_agent.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/opencode.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/prompt.txt +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harnesses/rlm.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/swe_debug_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/task.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/cp/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/cp/cp_task.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/cp/test_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/harbor/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/harbor/harbor.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/lean/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/lean/lean_task.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/math/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/math/math_task.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/_test_patch.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/create_fix_patch.sh +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/log_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/multi_swe.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/openswe.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/r2e_gym.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_bench.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_lego.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_rebench_v2.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_rebench_v2_log_parsers.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_smith.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/tasksets/swe/swe_tasksets.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/gym_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/mcp.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/mcp_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/opencode_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/opencode_qa_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/opencode_rlm_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/rlm_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/sandbox_mixin.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/utils/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/utils/file_locks.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/utils/git_checkout_cache.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/browser_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/base.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/cua_mode.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/browser_env/modes/dom_mode.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/openenv_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/reasoninggym_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/integrations/textarena_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/multiturn_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/python_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/sandbox_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/singleturn_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/stateful_tool_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/tool_env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/errors.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/adapter.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/config.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/display.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/gepa/gepa_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/maybe_think_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/think_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/parsers/xml_parser.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/inference/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/inference/client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/inference/server.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/config.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/orchestrator.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/trainer.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rl/trainer/utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/experimental/hybrid_math_rubric.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/judge_rubric.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/math_rubric.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/rubric.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/rubrics/rubric_group.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/build.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/eval.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/gepa.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/install.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/rl.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/setup.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/train.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/tui.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/scripts/vllm.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/client/env_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/client/zmq_env_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/env_router.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/env_server.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/env_worker.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/server/zmq_env_server.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/serve/types.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/types.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/async_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/client_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/config_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/data_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/display_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/env_config_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/env_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/error_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/eval_display.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/eval_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/heartbeat.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/import_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/install_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/interception_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/logging_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/message_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/metric_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/path_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/pricing_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/process_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/response_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/save_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/serve_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/thread_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/threaded_sandbox_client.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/tool_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/usage_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/utils/version_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/ENVIRONMENT_BEST_PRACTICES.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/README.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/RE_MIGRATION.md +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/artifact.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/config.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/env.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/harness.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/model.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/program.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/runtime.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/runtime_handles.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/sandbox.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/state.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/task.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/taskset.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/toolset.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/types.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/user.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/__init__.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/binding_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/config_callable_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/config_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/endpoint_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/json_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/judge_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/lifecycle_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/mcp_proxy_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/mcp_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/object_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/program_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/prompt_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/runtime_owner_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/runtime_registry.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/sandbox_program_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/sandbox_python_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/sandbox_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/scoring_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/serialization_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/task_freeze_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/taskset_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/tool_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/toolset_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/trajectory_utils.py +0 -0
- {verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/v1/utils/usage_utils.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: verifiers
|
|
3
|
-
Version: 0.1.15.
|
|
3
|
+
Version: 0.1.15.dev16
|
|
4
4
|
Summary: Verifiers: Environments for LLM Reinforcement Learning
|
|
5
5
|
Project-URL: Homepage, https://github.com/primeintellect-ai/verifiers
|
|
6
6
|
Project-URL: Documentation, https://github.com/primeintellect-ai/verifiers
|
|
@@ -1,6 +1,4 @@
|
|
|
1
1
|
from pathlib import Path
|
|
2
|
-
|
|
3
|
-
import pytest
|
|
4
2
|
import verifiers as vf
|
|
5
3
|
from verifiers.scripts.init import init_environment
|
|
6
4
|
|
|
@@ -21,20 +19,23 @@ def test_init_default_writes_v0_stub(tmp_path: Path) -> None:
|
|
|
21
19
|
assert "EnvTaskset" not in content
|
|
22
20
|
|
|
23
21
|
|
|
24
|
-
def
|
|
22
|
+
def test_init_v1_writes_taskset_template(tmp_path: Path) -> None:
|
|
25
23
|
init_environment("bar", path=str(tmp_path), v1=True)
|
|
26
24
|
content = read_env_file(tmp_path, "bar")
|
|
27
25
|
|
|
28
26
|
assert "class BarTasksetConfig(vf.TasksetConfig):" in content
|
|
29
27
|
assert "class BarTaskset(vf.Taskset[BarTasksetConfig]):" in content
|
|
28
|
+
assert 'system_prompt: vf.SystemPrompt = "Answer exactly."' in content
|
|
29
|
+
assert '"""Taskset implementation for bar.' in content
|
|
30
|
+
assert 'def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:' in content
|
|
30
31
|
assert (
|
|
31
|
-
'
|
|
32
|
+
'"""Return serializable task records as a list, generator, or Dataset."""'
|
|
32
33
|
in content
|
|
33
34
|
)
|
|
34
|
-
assert 'def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:' in content
|
|
35
35
|
assert "def load_system_prompt" not in content
|
|
36
36
|
assert "async def correct_answer(self, task: vf.Task, state: vf.State)" in content
|
|
37
37
|
assert "def load_taskset(config: BarTasksetConfig) -> BarTaskset:" in content
|
|
38
|
+
assert '"""Typed taskset loader used by vf.load_taskset."""' in content
|
|
38
39
|
assert "return BarTaskset(config=config)" in content
|
|
39
40
|
assert "taskset=vf.load_taskset(config=config.taskset)" in content
|
|
40
41
|
assert '"""Loader pattern for all Taskset/Harness environments."""' in content
|
|
@@ -53,8 +54,10 @@ def test_init_v1_template_loads_with_vf_load_environment(
|
|
|
53
54
|
|
|
54
55
|
env = vf.load_environment("loadable-v1")
|
|
55
56
|
|
|
56
|
-
|
|
57
|
-
|
|
57
|
+
dataset = env.get_dataset()
|
|
58
|
+
|
|
59
|
+
assert len(dataset) == 1
|
|
60
|
+
assert dataset[0]["answer"] == "cba"
|
|
58
61
|
|
|
59
62
|
|
|
60
63
|
def test_init_v1_with_harness_writes_harness_stub(tmp_path: Path) -> None:
|
|
@@ -155,67 +155,72 @@ def load_environment(**kwargs) -> vf.Environment:
|
|
|
155
155
|
raise NotImplementedError("Implement load_environment here.")
|
|
156
156
|
"""
|
|
157
157
|
|
|
158
|
-
|
|
158
|
+
V1_TASKSET_TEMPLATE = """\
|
|
159
159
|
import verifiers as vf
|
|
160
160
|
|
|
161
161
|
|
|
162
162
|
class {taskset_config_name}(vf.TasksetConfig):
|
|
163
|
-
|
|
163
|
+
\"\"\"User-facing task settings for {env_id_dash}.\"\"\"
|
|
164
|
+
|
|
165
|
+
system_prompt: vf.SystemPrompt = "Answer exactly."
|
|
164
166
|
|
|
165
167
|
|
|
166
168
|
class {taskset_name}(vf.Taskset[{taskset_config_name}]):
|
|
169
|
+
\"\"\"Taskset implementation for {env_id_dash}.
|
|
170
|
+
|
|
171
|
+
Add task loading, task-owned toolsets, user behavior, lifecycle hooks,
|
|
172
|
+
metrics, rewards, and advantages on this class.
|
|
173
|
+
\"\"\"
|
|
174
|
+
|
|
167
175
|
def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:
|
|
168
|
-
|
|
176
|
+
\"\"\"Return serializable task records as a list, generator, or Dataset.\"\"\"
|
|
177
|
+
if split == "eval":
|
|
178
|
+
return []
|
|
179
|
+
return [
|
|
180
|
+
{
|
|
181
|
+
"prompt": [{"role": "user", "content": "Reverse abc."}],
|
|
182
|
+
"answer": "cba",
|
|
183
|
+
"max_turns": 1,
|
|
184
|
+
}
|
|
185
|
+
]
|
|
169
186
|
|
|
170
187
|
@vf.reward(weight=1.0)
|
|
171
188
|
async def correct_answer(self, task: vf.Task, state: vf.State) -> float:
|
|
172
|
-
|
|
189
|
+
\"\"\"Score the final assistant response for one rollout.\"\"\"
|
|
190
|
+
messages = vf.get_messages(state.get("completion") or [], role="assistant")
|
|
191
|
+
if not messages:
|
|
192
|
+
return 0.0
|
|
193
|
+
response = str(messages[-1].content or "").strip()
|
|
194
|
+
return float(response == task["answer"])
|
|
173
195
|
|
|
174
196
|
|
|
175
197
|
def load_taskset(config: {taskset_config_name}) -> {taskset_name}:
|
|
198
|
+
\"\"\"Typed taskset loader used by vf.load_taskset.\"\"\"
|
|
176
199
|
return {taskset_name}(config=config)
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
def load_environment(config: vf.EnvConfig) -> vf.Env:
|
|
180
|
-
\"\"\"Loader pattern for all Taskset/Harness environments.\"\"\"
|
|
181
|
-
return vf.Env(
|
|
182
|
-
taskset=vf.load_taskset(config=config.taskset),
|
|
183
|
-
harness=vf.load_harness(config=config.harness),
|
|
184
|
-
)
|
|
185
200
|
"""
|
|
186
201
|
|
|
187
|
-
V1_HARNESS_ENVIRONMENT_TEMPLATE = """\
|
|
188
|
-
import verifiers as vf
|
|
189
|
-
|
|
190
|
-
|
|
191
|
-
class {taskset_config_name}(vf.TasksetConfig):
|
|
192
|
-
system_prompt: vf.SystemPrompt = "Replace this with the system prompt for {env_id_dash}."
|
|
193
|
-
|
|
194
|
-
|
|
195
|
-
class {taskset_name}(vf.Taskset[{taskset_config_name}]):
|
|
196
|
-
def load_tasks(self, split: vf.TaskSplit = "train") -> vf.Tasks:
|
|
197
|
-
raise NotImplementedError("Load tasks for {env_id_dash}.")
|
|
198
|
-
|
|
199
|
-
@vf.reward(weight=1.0)
|
|
200
|
-
async def correct_answer(self, task: vf.Task, state: vf.State) -> float:
|
|
201
|
-
raise NotImplementedError("Score a completed rollout for {env_id_dash}.")
|
|
202
202
|
|
|
203
|
+
V1_HARNESS_TEMPLATE = """\
|
|
203
204
|
|
|
204
205
|
class {harness_config_name}(vf.HarnessConfig):
|
|
205
|
-
|
|
206
|
+
\"\"\"Execution settings for {env_id_dash}.\"\"\"
|
|
206
207
|
|
|
207
208
|
|
|
208
209
|
class {harness_name}(vf.Harness[{harness_config_name}]):
|
|
209
|
-
|
|
210
|
+
\"\"\"Reusable execution behavior for {env_id_dash}.
|
|
210
211
|
|
|
211
|
-
|
|
212
|
-
|
|
213
|
-
|
|
212
|
+
Add harness-owned program, sandbox, endpoint, model, toolset, or lifecycle
|
|
213
|
+
behavior here when this environment owns a custom execution mechanism.
|
|
214
|
+
\"\"\"
|
|
214
215
|
|
|
215
216
|
|
|
216
217
|
def load_harness(config: {harness_config_name}) -> {harness_name}:
|
|
218
|
+
\"\"\"Typed harness loader used by vf.load_harness.\"\"\"
|
|
217
219
|
return {harness_name}(config=config)
|
|
220
|
+
"""
|
|
221
|
+
|
|
218
222
|
|
|
223
|
+
V1_ENV_LOADER_TEMPLATE = """\
|
|
219
224
|
|
|
220
225
|
def load_environment(config: vf.EnvConfig) -> vf.Env:
|
|
221
226
|
\"\"\"Loader pattern for all Taskset/Harness environments.\"\"\"
|
|
@@ -225,6 +230,11 @@ def load_environment(config: vf.EnvConfig) -> vf.Env:
|
|
|
225
230
|
)
|
|
226
231
|
"""
|
|
227
232
|
|
|
233
|
+
V1_ENVIRONMENT_TEMPLATE = V1_TASKSET_TEMPLATE + V1_ENV_LOADER_TEMPLATE
|
|
234
|
+
V1_HARNESS_ENVIRONMENT_TEMPLATE = (
|
|
235
|
+
V1_TASKSET_TEMPLATE + V1_HARNESS_TEMPLATE + V1_ENV_LOADER_TEMPLATE
|
|
236
|
+
)
|
|
237
|
+
|
|
228
238
|
OPENENV_ENVIRONMENT_TEMPLATE = """\
|
|
229
239
|
import verifiers as vf
|
|
230
240
|
from tasksets import OpenEnvTaskset, OpenEnvTasksetConfig
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_langchain_deep_agents_wikispeedia.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/tests/test_openai_chat_completions_token_client.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/anthropic_messages_client.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_completions_client.py
RENAMED
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/clients/openai_responses_client.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/cli_agent_env.py
RENAMED
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/README.md
RENAMED
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/__init__.py
RENAMED
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/_filter.py
RENAMED
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/harness.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/composable/task.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/__init__.py
RENAMED
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/env.py
RENAMED
|
File without changes
|
{verifiers-0.1.15.dev15 → verifiers-0.1.15.dev16}/verifiers/envs/experimental/harbor_env/mcp.py
RENAMED
|
File without changes
|
|
File without changes
|