rnow 0.3.1__tar.gz → 0.3.12__tar.gz
This diff shows the changes between two publicly released versions of the package as they appear in their public registry. It is provided for informational purposes only.
- {rnow-0.3.1/rnow.egg-info → rnow-0.3.12}/PKG-INFO +3 -1
- {rnow-0.3.1 → rnow-0.3.12}/pyproject.toml +6 -3
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/commands.py +209 -83
- rnow-0.3.12/rnow/cli/test.py +856 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/core/__init__.py +4 -1
- {rnow-0.3.1 → rnow-0.3.12}/rnow/core/reward.py +34 -3
- {rnow-0.3.1 → rnow-0.3.12}/rnow/core/tool.py +29 -7
- {rnow-0.3.1 → rnow-0.3.12}/rnow/models.py +57 -1
- rnow-0.3.12/rnow/templates/finqa/README.md +60 -0
- rnow-0.3.12/rnow/templates/finqa/config.yml +23 -0
- rnow-0.3.12/rnow/templates/finqa/rewards.py +34 -0
- rnow-0.3.12/rnow/templates/finqa/train.jsonl +6251 -0
- rnow-0.3.12/rnow/templates/tutorial-reward/requirements.txt +1 -0
- {rnow-0.3.1 → rnow-0.3.12/rnow.egg-info}/PKG-INFO +3 -1
- {rnow-0.3.1 → rnow-0.3.12}/rnow.egg-info/SOURCES.txt +7 -2
- {rnow-0.3.1 → rnow-0.3.12}/rnow.egg-info/requires.txt +2 -0
- rnow-0.3.1/rnow/cli/test.py +0 -712
- {rnow-0.3.1 → rnow-0.3.12}/LICENSE +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/README.md +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/__init__.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/__main__.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/__init__.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/auth.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/blob.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/common.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/cube.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/main.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/cli/token_count.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/deepseek-aha/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/deepseek-aha/rewards.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/deepseek-aha/train.jsonl +0 -0
- {rnow-0.3.1/rnow/templates/rl-single → rnow-0.3.12/rnow/templates/finqa}/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/mcp-tavily/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/mcp-tavily/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/mcp-tavily/rewards.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/mcp-tavily/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/new/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/new/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/new/rewards.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/new/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-nextjs/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-nextjs/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-nextjs/rewards.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-nextjs/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-single/config.yml +0 -0
- {rnow-0.3.1/rnow/templates/tutorial-reward → rnow-0.3.12/rnow/templates/rl-single}/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-single/rewards.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-single/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-tools/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-tools/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-tools/rewards.py +0 -0
- /rnow-0.3.1/rnow/templates/rl-tools/env.py → /rnow-0.3.12/rnow/templates/rl-tools/tools.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/rl-tools/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/sft/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/sft/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-reward/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-reward/rewards.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-reward/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-tool/config.yml +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-tool/requirements.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-tool/rewards.py +0 -0
- /rnow-0.3.1/rnow/templates/tutorial-tool/env.py → /rnow-0.3.12/rnow/templates/tutorial-tool/tools.py +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow/templates/tutorial-tool/train.jsonl +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow.egg-info/dependency_links.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow.egg-info/entry_points.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/rnow.egg-info/top_level.txt +0 -0
- {rnow-0.3.1 → rnow-0.3.12}/setup.cfg +0 -0
PKG-INFO:

```diff
@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: rnow
-Version: 0.3.1
+Version: 0.3.12
 Summary: ReinforceNow CLI - Reinforcement Learning platform command-line interface
 Requires-Python: <3.15,>=3.10
 Description-Content-Type: text/markdown
@@ -16,6 +16,7 @@ Requires-Dist: tokenizers>=0.15.0
 Requires-Dist: openai-harmony>=0.0.8
 Provides-Extra: test
 Requires-Dist: tinker-cookbook>=0.1.0; extra == "test"
+Requires-Dist: transformers>=4.40.0; extra == "test"
 Provides-Extra: api
 Requires-Dist: fastapi>=0.68.0; extra == "api"
 Requires-Dist: uvicorn>=0.15.0; extra == "api"
@@ -23,6 +24,7 @@ Provides-Extra: mcp
 Requires-Dist: fastmcp>=0.1.0; extra == "mcp"
 Provides-Extra: all
 Requires-Dist: tinker-cookbook>=0.1.0; extra == "all"
+Requires-Dist: transformers>=4.40.0; extra == "all"
 Requires-Dist: fastapi>=0.68.0; extra == "all"
 Requires-Dist: uvicorn>=0.15.0; extra == "all"
 Requires-Dist: fastmcp>=0.1.0; extra == "all"
```
pyproject.toml:

```diff
@@ -11,7 +11,7 @@ rnow = ["templates/**/*"]
 
 [project]
 name = "rnow"
-version = "0.3.1"
+version = "0.3.12"
 description = "ReinforceNow CLI - Reinforcement Learning platform command-line interface"
 readme = "README.md"
 requires-python = ">=3.10,<3.15"
@@ -31,13 +31,16 @@ dependencies = [
 
 [project.optional-dependencies]
 # Local testing with ML inference (requires torch)
-test = [
+test = [
+    "tinker-cookbook>=0.1.0",
+    "transformers>=4.40.0",  # Ensure modern version (2.x is incompatible)
+]
 # API server mode
 api = ["fastapi>=0.68.0", "uvicorn>=0.15.0"]
 # MCP server support (for fetching tool schemas)
 mcp = ["fastmcp>=0.1.0"]
 # All optional features
-all = ["tinker-cookbook>=0.1.0", "fastapi>=0.68.0", "uvicorn>=0.15.0", "fastmcp>=0.1.0"]
+all = ["tinker-cookbook>=0.1.0", "transformers>=4.40.0", "fastapi>=0.68.0", "uvicorn>=0.15.0", "fastmcp>=0.1.0"]
 
 [project.scripts]
 rnow = "rnow.cli.main:main"
```
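The new `transformers>=4.40.0` floor in the `test` and `all` extras is annotated with "2.x is incompatible". A quick runtime check along the following lines can surface a stale install before local testing starts; this is an illustrative sketch, not part of rnow (the helper name and the naive version parse are assumptions).

```python
# Illustrative guard (not shipped with rnow): confirm the installed transformers
# satisfies the ">=4.40.0" floor added to the test/all extras.
from importlib.metadata import PackageNotFoundError, version


def transformers_is_recent_enough(minimum: tuple[int, int] = (4, 40)) -> bool:
    """Return True if transformers is installed and at least `minimum` (naive parse)."""
    try:
        installed = version("transformers")
    except PackageNotFoundError:
        print("transformers is not installed; the rnow[test] extra pulls it in.")
        return False

    major, minor = (int(p) for p in installed.split(".")[:2])  # use packaging.version for rigor
    ok = (major, minor) >= minimum
    print(f"transformers {installed} {'meets' if ok else 'is below'} the 4.40 floor")
    return ok


if __name__ == "__main__":
    transformers_is_recent_enough()
```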
rnow/cli/commands.py (the `-` side of several hunks is truncated in the source diff view; truncated lines are kept as captured):

```diff
@@ -221,18 +221,18 @@ def validate_max_tokens_for_context(
     return None, available
 
 
-def
+def get_tools_from_tools_py(tools_path: Path) -> list[dict]:
     """
-    Extract tool definitions from
+    Extract tool definitions from tools.py as structured data.
     Returns list of tool dicts with name, description, and schema.
     """
     import ast
 
-    if not
+    if not tools_path.exists():
         return []
 
     try:
-        source =
+        source = tools_path.read_text()
         tree = ast.parse(source)
     except (SyntaxError, OSError):
         return []
```
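The renamed helper above reads the project's tools.py with `ast` instead of importing it; its full body is not shown in this diff, so the sketch below only mirrors the visible idea — collect the name and docstring of every `@tool`-decorated function from source text. The sample tools.py content, and the assumption that the real helper also derives a parameter schema, are illustrative.

```python
# Sketch of AST-based tool discovery (illustrative; the real helper also builds a
# parameter schema, which this diff does not show). Parsing means the user's
# tools.py is never imported or executed during validation.
import ast

SAMPLE_TOOLS_PY = '''
@tool(sandbox=True)
def run_tests(repo_path: str) -> str:
    """Run the project's test suite inside the sandbox and return the summary."""
    ...

@tool()
def add(a: int, b: int) -> int:
    """Add two integers."""
    return a + b
'''


def extract_tool_stubs(source: str) -> list[dict]:
    """Return name/description pairs for every function decorated with @tool."""
    tools = []
    for node in ast.walk(ast.parse(source)):
        if not isinstance(node, (ast.FunctionDef, ast.AsyncFunctionDef)):
            continue
        for dec in node.decorator_list:
            func = dec.func if isinstance(dec, ast.Call) else dec
            if isinstance(func, ast.Name) and func.id == "tool":
                tools.append({"name": node.name, "description": ast.get_docstring(node) or ""})
    return tools


print([t["name"] for t in extract_tool_stubs(SAMPLE_TOOLS_PY)])  # ['run_tests', 'add']
```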
```diff
@@ -377,25 +377,124 @@ def fetch_mcp_tool_schemas(
     return all_tools, None
 
 
+def get_sandbox_names_from_file(filepath: Path, decorator_name: str) -> set[str]:
+    """
+    Extract function names with sandbox=True from a file.
+
+    Args:
+        filepath: Path to rewards.py or tools.py
+        decorator_name: "reward" or "tool"
+
+    Returns:
+        Set of function names that have sandbox=True
+    """
+    import ast
+
+    names = set()
+    if not filepath.exists():
+        return names
+
+    try:
+        source = filepath.read_text()
+        tree = ast.parse(source, filename=str(filepath))
+    except SyntaxError:
+        return names
+
+    for node in ast.walk(tree):
+        if isinstance(node, ast.FunctionDef | ast.AsyncFunctionDef):
+            for decorator in node.decorator_list:
+                # Check for @decorator_name(sandbox=True)
+                if (
+                    isinstance(decorator, ast.Call)
+                    and isinstance(decorator.func, ast.Name)
+                    and decorator.func.id == decorator_name
+                ):
+                    for kw in decorator.keywords:
+                        if kw.arg == "sandbox":
+                            # Check if value is True
+                            if isinstance(kw.value, ast.Constant) and kw.value.value is True:
+                                names.add(node.name)
+                            elif isinstance(kw.value, ast.NameConstant) and kw.value.value is True:
+                                names.add(node.name)  # Python 3.7 compat
+    return names
+
+
+def validate_sandbox_docker_requirement(
+    train_jsonl_path: Path, rewards_py_path: Path, tools_py_path: Path
+) -> list[str]:
+    """
+    Validate that entries using sandbox=True tools/rewards have a docker field.
+
+    Returns:
+        List of error messages (empty if valid)
+    """
+    errors = []
+
+    # Get sandbox function names
+    sandbox_rewards = get_sandbox_names_from_file(rewards_py_path, "reward")
+    sandbox_tools = get_sandbox_names_from_file(tools_py_path, "tool")
+
+    if not sandbox_rewards and not sandbox_tools:
+        return []  # No sandbox functions, nothing to validate
+
+    try:
+        with open(train_jsonl_path, encoding="utf-8") as f:
+            for line_num, line in enumerate(f, start=1):
+                stripped = line.strip()
+                if not stripped:
+                    continue
+
+                try:
+                    record = json.loads(stripped)
+                except json.JSONDecodeError:
+                    continue
+
+                # Check if entry references sandbox rewards/tools
+                entry_rewards = set(record.get("rewards", []))
+                entry_tools = set(record.get("tools", []))
+
+                uses_sandbox_reward = bool(sandbox_rewards & entry_rewards)
+                uses_sandbox_tool = bool(sandbox_tools & entry_tools)
+
+                if (uses_sandbox_reward or uses_sandbox_tool) and not record.get("docker"):
+                    used = []
+                    if uses_sandbox_reward:
+                        used.extend(f"reward:{r}" for r in sandbox_rewards & entry_rewards)
+                    if uses_sandbox_tool:
+                        used.extend(f"tool:{t}" for t in sandbox_tools & entry_tools)
+                    errors.append(
+                        f"Line {line_num}: Uses sandbox functions ({', '.join(used)}) but missing 'docker' field"
+                    )
+                    if len(errors) >= 5:
+                        errors.append("... (stopping after 5 errors)")
+                        return errors
+
+    except Exception as e:
+        errors.append(f"Failed to validate sandbox requirements: {e}")
+
+    return errors
+
+
 def validate_train_jsonl(
     path: Path, dataset_type: models.DatasetType, sample_size: int = 50
 ) -> list[str]:
     """
-    Validate train.jsonl format
+    Validate train.jsonl format using Pydantic models.
     Returns a list of error messages (empty if valid).
     """
+    from pydantic import ValidationError
+
     errors = []
+    EntryModel = models.TrainEntryRL if dataset_type == models.DatasetType.RL else models.TrainEntry
 
     try:
         with open(path, encoding="utf-8") as f:
             lines_checked = 0
             for line_num, line in enumerate(f, start=1):
-                # Skip empty lines
                 stripped = line.strip()
                 if not stripped:
                     continue
 
-                # Try to parse as JSON
                 try:
                     record = json.loads(stripped)
                 except json.JSONDecodeError as e:
```
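The two helpers added above are plain module-level functions, so they can be exercised outside the CLI. A usage sketch, assuming rnow 0.3.12 is installed and `rnow.cli.commands` is importable; the toy rewards.py and train.jsonl contents are illustrative (AST-based detection means rewards.py is only parsed, never imported):

```python
import json
import tempfile
from pathlib import Path

from rnow.cli.commands import (
    get_sandbox_names_from_file,
    validate_sandbox_docker_requirement,
)

with tempfile.TemporaryDirectory() as tmp:
    project = Path(tmp)
    # A reward flagged sandbox=True; the decorator only needs to be parsed, not resolved.
    (project / "rewards.py").write_text(
        "@reward(sandbox=True)\n"
        "def unit_tests_pass(completion, **kwargs):\n"
        "    ...\n"
    )
    (project / "tools.py").write_text("")  # no sandboxed tools in this example
    # One RL entry references the sandboxed reward but omits the "docker" field.
    (project / "train.jsonl").write_text(
        json.dumps(
            {"messages": [{"role": "user", "content": "hi"}], "rewards": ["unit_tests_pass"]}
        )
        + "\n"
    )

    print(get_sandbox_names_from_file(project / "rewards.py", "reward"))
    # {'unit_tests_pass'}
    print(
        validate_sandbox_docker_requirement(
            project / "train.jsonl",
            rewards_py_path=project / "rewards.py",
            tools_py_path=project / "tools.py",
        )
    )
    # ["Line 1: Uses sandbox functions (reward:unit_tests_pass) but missing 'docker' field"]
```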
```diff
@@ -405,63 +504,21 @@ def validate_train_jsonl(
                     return errors
                     continue
 
-
-
-
-
-
-
-
-
-
-                    errors.append(f"Line {line_num}: Missing required 'messages' field")
-                    continue
-
-                messages = record["messages"]
-                if not isinstance(messages, list):
-                    errors.append(f"Line {line_num}: 'messages' must be a list")
-                    continue
-
-                if len(messages) == 0:
-                    errors.append(f"Line {line_num}: 'messages' list is empty")
+                try:
+                    EntryModel.model_validate(record)
+                except ValidationError as e:
+                    for err in e.errors():
+                        loc = ".".join(str(x) for x in err["loc"])
+                        errors.append(f"Line {line_num}: {loc} - {err['msg']}")
+                    if len(errors) >= 5:
+                        errors.append("... (stopping after 5 errors)")
+                        return errors
                     continue
 
-                # Check each message has role and content
-                for msg_idx, msg in enumerate(messages):
-                    if not isinstance(msg, dict):
-                        errors.append(f"Line {line_num}: Message {msg_idx + 1} must be an object")
-                        break
-                    if "role" not in msg:
-                        errors.append(f"Line {line_num}: Message {msg_idx + 1} missing 'role'")
-                        break
-                    if "content" not in msg:
-                        errors.append(f"Line {line_num}: Message {msg_idx + 1} missing 'content'")
-                        break
-                    if msg["role"] not in ("system", "user", "assistant"):
-                        errors.append(
-                            f"Line {line_num}: Message {msg_idx + 1} has invalid role '{msg['role']}' (expected: system, user, assistant)"
-                        )
-                        break
-
-                # For RL, check for rewards field
-                if dataset_type == models.DatasetType.RL and "rewards" not in record:
-                    errors.append(
-                        f"Line {line_num}: Missing required 'rewards' field for RL dataset"
-                    )
-
-                # Validate optional 'tools' field if present
-                if "tools" in record:
-                    tools = record["tools"]
-                    if not isinstance(tools, list):
-                        errors.append(f"Line {line_num}: 'tools' must be a list of tool names")
-                    elif not all(isinstance(t, str) for t in tools):
-                        errors.append(f"Line {line_num}: 'tools' must contain only strings")
-
                 lines_checked += 1
                 if lines_checked >= sample_size:
                     break
 
-            # Check if file was effectively empty (only whitespace)
             if lines_checked == 0:
                 errors.append("File contains no valid JSON lines")
 
```
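validate_train_jsonl now delegates the per-line structural checks to Pydantic. The field definitions live in `models.TrainEntry` / `models.TrainEntryRL` (rnow/models.py, +57 lines in this release, not shown here), so the sketch below uses a stand-in model purely to show the `model_validate` / `e.errors()` reporting pattern from the hunk above:

```python
# Stand-in model for illustration only; rnow's real TrainEntry/TrainEntryRL fields
# are defined in rnow.models and are not part of this diff.
import json

from pydantic import BaseModel, ValidationError


class Message(BaseModel):
    role: str
    content: str


class ToyTrainEntryRL(BaseModel):
    messages: list[Message]
    rewards: list[str]
    tools: list[str] = []
    docker: str | None = None


record = json.loads('{"messages": [{"role": "user", "content": "hi"}]}')  # no "rewards"
try:
    ToyTrainEntryRL.model_validate(record)
except ValidationError as e:
    for err in e.errors():
        loc = ".".join(str(x) for x in err["loc"])
        print(f"Line 1: {loc} - {err['msg']}")
# Line 1: rewards - Field required
```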
```diff
@@ -1030,8 +1087,10 @@ def orgs(ctx, org_id: str | None):
             "rl-tools",
             "mcp-tavily",
             "deepseek-aha",
+            "dcf-sec",
             "tutorial-reward",
             "tutorial-tool",
+            "web-tasks",
         ]
     ),
     default="start",
@@ -1069,6 +1128,8 @@ def init(template: str, name: str):
         "tutorial-reward": "tutorial-reward",
         "tutorial-tool": "tutorial-tool",
         "deepseek-aha": "deepseek-aha",
+        "dcf-sec": "dcf-sec-filings",
+        "web-tasks": "web-tasks",
         "new": "new-project",
         "blank": "my-project",
     }
@@ -1099,7 +1160,7 @@ def init(template: str, name: str):
         "train.jsonl",
         "rewards.py",
         "requirements.txt",
-        "
+        "tools.py",
         "README.md",
     }
 
@@ -1213,7 +1274,7 @@ def init(template: str, name: str):
     click.echo(click.style("Next steps:", bold=True))
     click.echo(f" 1. Edit {click.style('train.jsonl', underline=True)} with your training data")
     click.echo(
-        f" 2. Edit {click.style('rewards.py', underline=True)} and {click.style('
+        f" 2. Edit {click.style('rewards.py', underline=True)} and {click.style('tools.py', underline=True)} with your reward and tool functions"
     )
     click.echo(f" 3. Run {click.style('rnow run', fg=TEAL_RGB, bold=True)} to start training")
 
@@ -1351,6 +1412,15 @@ def _submit_single_run(
     if jsonl_errors:
         raise click.ClickException(f"Invalid train.jsonl: {jsonl_errors[0]}")
 
+    # Validate sandbox=True functions require docker field in train.jsonl
+    sandbox_errors = validate_sandbox_docker_requirement(
+        train_jsonl_path,
+        rewards_py_path=dir / "rewards.py",
+        tools_py_path=dir / "tools.py",
+    )
+    if sandbox_errors:
+        raise click.ClickException(f"Sandbox validation: {sandbox_errors[0]}")
+
     # Validate rewards.py if present
     if config.dataset_type == models.DatasetType.RL:
         rewards_path = dir / "rewards.py"
@@ -1378,10 +1448,10 @@ def _submit_single_run(
     # Collect all tools
     all_tools = []
 
-    # Get tools from
-
-
-    all_tools.extend(
+    # Get tools from tools.py
+    tools_path = dir / "tools.py"
+    tools_py_tools = get_tools_from_tools_py(tools_path)
+    all_tools.extend(tools_py_tools)
 
     # Fetch MCP tools
     mcp_urls = config.rollout.mcp_url
@@ -1447,7 +1517,7 @@ def _submit_single_run(
     )
 
     # Add optional files
-    optional_files = {"
+    optional_files = {"tools.py": dir / "tools.py", "requirements.txt": dir / "requirements.txt"}
     for file_name, path in optional_files.items():
         if path.exists():
             files.append(
@@ -1457,6 +1527,17 @@ def _submit_single_run(
             )
         )
 
+    # Add Dockerfile.* files for local/ docker images
+    for dockerfile_path in dir.glob("Dockerfile.*"):
+        file_name = dockerfile_path.name
+        click.echo(f" Found Dockerfile: {file_name}")
+        files.append(
+            (
+                file_name.replace(".", "_"),
+                (file_name, open(dockerfile_path, "rb"), "application/octet-stream"),
+            )
+        )
+
     headers = auth.get_auth_headers()
     headers.pop("Content-Type", None)
 
```
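Both `_submit_single_run` (above) and `run` (further below) now pick up any `Dockerfile.*` in the project directory and attach it to the multipart upload, deriving the form-field name by replacing dots with underscores (`Dockerfile.web` is sent under `Dockerfile_web`). A sketch of the resulting payload shape; the endpoint URL is a placeholder, not rnow's API:

```python
# Payload-shape sketch (placeholder endpoint; field naming mirrors the hunk above).
from pathlib import Path

import requests

project = Path(".")
files = []
for dockerfile_path in project.glob("Dockerfile.*"):
    file_name = dockerfile_path.name
    files.append(
        (
            file_name.replace(".", "_"),  # e.g. "Dockerfile.web" -> field "Dockerfile_web"
            (file_name, open(dockerfile_path, "rb"), "application/octet-stream"),
        )
    )

# requests generates the multipart boundary itself, so no explicit Content-Type header.
# requests.post("https://example.invalid/runs", files=files, data={"debug": "true"})
```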
```diff
@@ -1732,6 +1813,36 @@ def run(
     if not config.organization_id:
         config.organization_id = get_active_organization()
 
+    # Load secrets from .env file if it exists
+    secret_values = {}
+    env_file = dir / ".env"
+    if env_file.exists():
+        try:
+            with open(env_file) as f:
+                for line in f:
+                    line = line.strip()
+                    # Skip empty lines and comments
+                    if not line or line.startswith("#"):
+                        continue
+                    # Parse KEY=value format
+                    if "=" in line:
+                        key, _, value = line.partition("=")
+                        key = key.strip()
+                        value = value.strip()
+                        # Remove quotes if present
+                        if (value.startswith('"') and value.endswith('"')) or (
+                            value.startswith("'") and value.endswith("'")
+                        ):
+                            value = value[1:-1]
+                        secret_values[key] = value
+
+            if secret_values:
+                click.echo(
+                    click.style(f"🔐 Loaded {len(secret_values)} secret(s) from .env", dim=True)
+                )
+        except Exception as e:
+            click.echo(click.style(f"⚠️ Warning: Failed to read .env file: {e}", fg="yellow"))
+
     # Validate required files (all in the same directory now)
     required_files = {
         "train.jsonl": dir / "train.jsonl",
```
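The `.env` loader added above is deliberately minimal: `KEY=value` lines, `#` comments, and optional matching single or double quotes. A standalone mirror of that logic (the sample file content is illustrative):

```python
import tempfile
from pathlib import Path


def load_dotenv_values(env_file: Path) -> dict[str, str]:
    """Parse KEY=value lines, skipping blanks/comments and stripping matching quotes."""
    secret_values: dict[str, str] = {}
    if not env_file.exists():
        return secret_values
    for raw in env_file.read_text().splitlines():
        line = raw.strip()
        if not line or line.startswith("#") or "=" not in line:
            continue
        key, _, value = line.partition("=")
        key, value = key.strip(), value.strip()
        if (value.startswith('"') and value.endswith('"')) or (
            value.startswith("'") and value.endswith("'")
        ):
            value = value[1:-1]
        secret_values[key] = value
    return secret_values


with tempfile.TemporaryDirectory() as tmp:
    env_file = Path(tmp) / ".env"
    env_file.write_text('# forwarded to the run as secrets\nTAVILY_API_KEY="tvly-123"\nDEBUG=false\n')
    print(load_dotenv_values(env_file))  # {'TAVILY_API_KEY': 'tvly-123', 'DEBUG': 'false'}
```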
```diff
@@ -1807,10 +1918,10 @@ def run(
     # Collect all tools
     all_tools = []
 
-    # Get tools from
-
-
-    all_tools.extend(
+    # Get tools from tools.py
+    tools_path = dir / "tools.py"
+    tools_py_tools = get_tools_from_tools_py(tools_path)
+    all_tools.extend(tools_py_tools)
 
     # Fetch MCP tool schemas (with progress indicator)
     mcp_urls = config.rollout.mcp_url if config.rollout else None
@@ -1925,19 +2036,19 @@ def run(
             "Please ensure reward names in train.jsonl match functions in rewards.py"
         )
 
-    # Validate
-
-
-    if
+    # Validate tools.py if present (check for docstrings on @tool functions)
+    tools_path = dir / "tools.py"
+    has_tools_py = tools_path.exists() and tools_path.stat().st_size > 0
+    if has_tools_py:
         try:
             from rnow.core.tool import validate_tools_file
 
-            errors = validate_tools_file(
+            errors = validate_tools_file(tools_path)
             if errors:
-                click.echo(click.style("✗ Invalid
+                click.echo(click.style("✗ Invalid tools.py:", fg="red", bold=True))
                 for err in errors:
                     click.echo(f" • {err}")
-                raise click.ClickException("Please fix
+                raise click.ClickException("Please fix tools.py before submitting")
         except ImportError:
             pass  # Skip validation if module not available
 
@@ -1949,7 +2060,7 @@ def run(
     mcp_url_count = len(mcp_url) if isinstance(mcp_url, list) else 1
 
     # Validate tool support for the model
-    has_tools =
+    has_tools = has_tools_py or has_mcp_url
     if has_tools and not models.supports_tool_calling(model_path):
         click.echo()
         click.echo(click.style("✗ Model does not support tool calling", fg="red", bold=True))
@@ -1961,7 +2072,7 @@ def run(
         click.echo(" Base/non-instruct models use a format that doesn't support tools.")
         click.echo()
         click.echo(click.style(" Options:", bold=True))
-        click.echo(" 1. Remove
+        click.echo(" 1. Remove tools.py and mcp_url from your project")
         click.echo(
             " 2. Use a model that supports tools (e.g., Qwen/Qwen3-8B, meta-llama/Llama-3.1-8B-Instruct)"
         )
@@ -1969,16 +2080,16 @@ def run(
         raise click.ClickException("Model does not support tool calling")
 
     # Show tool sources message
-    if
+    if has_tools_py and has_mcp_url:
         server_text = f"{mcp_url_count} server(s)" if mcp_url_count > 1 else "1 server"
         click.echo(
-            click.style("Tools: ", fg=TEAL_RGB) + f"Using MCP ({server_text}) and
+            click.style("Tools: ", fg=TEAL_RGB) + f"Using MCP ({server_text}) and tools.py tools"
        )
     elif has_mcp_url:
         server_text = f"{mcp_url_count} server(s)" if mcp_url_count > 1 else "1 server"
         click.echo(click.style("Tools: ", fg=TEAL_RGB) + f"Using MCP ({server_text})")
-    elif
-        click.echo(click.style("Tools: ", fg=TEAL_RGB) + "Using
+    elif has_tools_py:
+        click.echo(click.style("Tools: ", fg=TEAL_RGB) + "Using tools.py tools")
 
     # Start cube spinner early
     spinner = CubeSpinner()
```
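Before submission, `run` now validates tools.py through `validate_tools_file` from `rnow.core.tool` (per the comment above, it checks for docstrings on `@tool` functions) and derives `has_tools` from `has_tools_py or has_mcp_url`. A usage sketch, assuming rnow 0.3.12 is installed and the working directory is a project directory:

```python
from pathlib import Path

from rnow.core.tool import validate_tools_file

tools_path = Path("tools.py")
has_tools_py = tools_path.exists() and tools_path.stat().st_size > 0

if has_tools_py:
    for err in validate_tools_file(tools_path):  # e.g. @tool functions missing docstrings
        print(f"tools.py: {err}")
else:
    print("No tools.py (or it is empty); nothing to validate.")
```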
```diff
@@ -2022,7 +2133,7 @@ def run(
 
     # Add optional files (all in the same directory now)
     optional_files = {
-        "
+        "tools.py": dir / "tools.py",
         "requirements.txt": dir / "requirements.txt",
     }
 
@@ -2035,6 +2146,17 @@ def run(
             )
         )
 
+    # Add Dockerfile.* files for local/ docker images
+    for dockerfile_path in dir.glob("Dockerfile.*"):
+        file_name = dockerfile_path.name
+        click.echo(f" Found Dockerfile: {file_name}")
+        files.append(
+            (
+                file_name.replace(".", "_"),
+                (file_name, open(dockerfile_path, "rb"), "application/octet-stream"),
+            )
+        )
+
     # For multipart, we need to omit Content-Type so requests sets the boundary
     headers = auth.get_auth_headers()
     headers.pop("Content-Type", None)
@@ -2056,6 +2178,10 @@ def run(
     if debug:
         submit_data["debug"] = "true"
 
+    # Add secrets if provided (sent as JSON string)
+    if secret_values:
+        submit_data["secrets"] = json.dumps(secret_values)
+
     # Start cube spinner if not already running (for small files)
     if not spinner.running:
         spinner.start()
```
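Finally, the parsed `.env` secrets travel in the submit form as a single JSON string under `secrets`, next to the existing `debug` flag. A minimal sketch of that encoding (only the `debug` and `secrets` field names come from the hunk above; the values are illustrative):

```python
import json

secret_values = {"TAVILY_API_KEY": "tvly-123"}  # illustrative; loaded from .env in rnow
debug = True

submit_data: dict[str, str] = {}
if debug:
    submit_data["debug"] = "true"
if secret_values:
    submit_data["secrets"] = json.dumps(secret_values)  # one JSON string inside the form data

print(submit_data)
# {'debug': 'true', 'secrets': '{"TAVILY_API_KEY": "tvly-123"}'}
```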