PyPI - rnow - Versions diffs - 0.2.4__py3-none-any.whl - Mend

rnow 0.2.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (56) hide show

rnow/__init__.py +5 -0
rnow/__main__.py +7 -0
rnow/cli/__init__.py +6 -0
rnow/cli/auth.py +67 -0
rnow/cli/blob.py +98 -0
rnow/cli/commands.py +2311 -0
rnow/cli/common.py +28 -0
rnow/cli/cube.py +255 -0
rnow/cli/main.py +49 -0
rnow/cli/test.py +728 -0
rnow/cli/token_count.py +295 -0
rnow/core/__init__.py +33 -0
rnow/core/reward.py +333 -0
rnow/core/tool.py +494 -0
rnow/models.py +295 -0
rnow/templates/deepseek-aha/config.yml +26 -0
rnow/templates/deepseek-aha/rewards.py +36 -0
rnow/templates/deepseek-aha/train.jsonl +1000 -0
rnow/templates/mcp-tavily/config.yml +29 -0
rnow/templates/mcp-tavily/requirements.txt +1 -0
rnow/templates/mcp-tavily/rewards.py +25 -0
rnow/templates/mcp-tavily/train.jsonl +500 -0
rnow/templates/new/config.yml +26 -0
rnow/templates/new/requirements.txt +1 -0
rnow/templates/new/rewards.py +0 -0
rnow/templates/new/train.jsonl +0 -0
rnow/templates/rl-nextjs/config.yml +27 -0
rnow/templates/rl-nextjs/requirements.txt +2 -0
rnow/templates/rl-nextjs/rewards.py +446 -0
rnow/templates/rl-nextjs/train.jsonl +1000 -0
rnow/templates/rl-single/config.yml +27 -0
rnow/templates/rl-single/requirements.txt +1 -0
rnow/templates/rl-single/rewards.py +14 -0
rnow/templates/rl-single/train.jsonl +1000 -0
rnow/templates/rl-tools/config.yml +27 -0
rnow/templates/rl-tools/env.py +38 -0
rnow/templates/rl-tools/requirements.txt +3 -0
rnow/templates/rl-tools/rewards.py +25 -0
rnow/templates/rl-tools/train.jsonl +500 -0
rnow/templates/sft/config.yml +20 -0
rnow/templates/sft/train.jsonl +100 -0
rnow/templates/tutorial-reward/config.yml +27 -0
rnow/templates/tutorial-reward/requirements.txt +1 -0
rnow/templates/tutorial-reward/rewards.py +15 -0
rnow/templates/tutorial-reward/train.jsonl +1000 -0
rnow/templates/tutorial-tool/config.yml +27 -0
rnow/templates/tutorial-tool/env.py +7 -0
rnow/templates/tutorial-tool/requirements.txt +3 -0
rnow/templates/tutorial-tool/rewards.py +7 -0
rnow/templates/tutorial-tool/train.jsonl +1266 -0
rnow-0.2.4.dist-info/METADATA +135 -0
rnow-0.2.4.dist-info/RECORD +56 -0
rnow-0.2.4.dist-info/WHEEL +5 -0
rnow-0.2.4.dist-info/entry_points.txt +2 -0
rnow-0.2.4.dist-info/licenses/LICENSE +21 -0
rnow-0.2.4.dist-info/top_level.txt +1 -0

rnow/templates/new/config.yml ADDED Viewed

@@ -0,0 +1,26 @@
+project_id: ""
+project_name: "rlvr-project"
+dataset_id: ""
+dataset_name: "train"
+dataset_type: rl
+organization_id: ""
+data:
+  train_file: train.jsonl
+  batch_size: 32
+  group_size: 16
+model:
+  path: Qwen/Qwen3-8B
+  qlora_rank: 32
+  name: "My RL Model"
+  description: "Reinforcement learning fine-tuned model"
+algorithm:
+  loss_fn: ppo
+  adv_estimator: grpo
+  kl_penalty_coef: 0.01
+rollout:
+  max_turns: 1
+  max_tokens: 16384
+trainer:
+  num_epochs: 30
+  learning_rate: 0.0001
+  save_step: 20

rnow/templates/new/requirements.txt ADDED Viewed

	@@ -0,0 +1 @@
1	+ # Add your project dependencies here

rnow/templates/new/rewards.py ADDED Viewed

File without changes

rnow/templates/new/train.jsonl ADDED Viewed

File without changes

rnow/templates/rl-nextjs/config.yml ADDED Viewed

@@ -0,0 +1,27 @@
+project_id: ""
+project_name: "Next.js Code Generation"
+dataset_id: ""
+dataset_name: "nextjs-components"
+dataset_type: rl
+organization_id: ""
+data:
+  train_file: train.jsonl
+  batch_size: 32
+  group_size: 16
+model:
+  path: Qwen/Qwen3-8B
+  qlora_rank: 32
+  name: "Next.js Code Generator"
+  description: "RL model for Next.js code generation"
+algorithm:
+  loss_fn: ppo
+  adv_estimator: grpo
+  kl_penalty_coef: 0.01
+rollout:
+  max_turns: 1
+  max_tokens: 16384
+  termination_policy: max_turns
+trainer:
+  num_epochs: 10
+  learning_rate: 0.0001
+  save_step: 833

rnow/templates/rl-nextjs/requirements.txt ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ ast-grep-py>=0.29.3
2	+ pydantic>=2.0.0

rnow/templates/rl-nextjs/rewards.py ADDED Viewed

@@ -0,0 +1,446 @@
+"""
+Reward functions for Next.js ast-grep rules using ReinforceNow framework.
+Each reward function checks if the generated code matches the expected ast-grep pattern.
+"""
+import re
+from ast_grep_py import Config, SgRoot
+from rnow.core import RewardArgs, reward
+@reward(precondition=True)
+def code_block(args: RewardArgs, messages: list) -> float:
+    """Precondition: Response must contain a ```typescript/tsx code block."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    return 1.0 if match else 0.0
+@reward
+def layout_syntax_1(args: RewardArgs, messages: list) -> float:
+    """Reward for correct Next.js layout syntax with children prop."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(
+                rule={
+                    "all": [
+                        {
+                            "pattern": "function $NAME({ children }: { children: React.ReactNode }) { $$$BODY }"
+                        },
+                        {"kind": "function_declaration"},
+                        {"has": {"pattern": "children", "stopBy": "end"}},
+                    ]
+                }
+            )
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def server_dynamic_segment_1(args: RewardArgs, messages: list) -> float:
+    """Reward for correct async param extraction in dynamic segment pages."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(
+                rule={
+                    "all": [
+                        {"pattern": "function $FUNC($$$ARGS) { $$$BODY }"},
+                        {"kind": "function_declaration"},
+                        {"has": {"pattern": "const { $VAR2 } = await params", "stopBy": "end"}},
+                    ]
+                }
+            )
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def server_dynamic_segment_2(args: RewardArgs, messages: list) -> float:
+    """Reward for generateStaticParams pattern."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(
+                rule={
+                    "kind": "program",
+                    "all": [
+                        {
+                            "has": {
+                                "pattern": "function generateStaticParams() { $$$BODY }",
+                                "has": {
+                                    "pattern": "return posts.map((post) => ({ slug: post.slug, }))",
+                                    "stopBy": "end",
+                                },
+                                "stopBy": "end",
+                            }
+                        }
+                    ],
+                }
+            )
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def server_search_params(args: RewardArgs, messages: list) -> float:
+    """Reward for correct server searchParams handling."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(
+                rule={
+                    "all": [
+                        {
+                            "pattern": "async function $FUNC({ searchParams }: { searchParams: Promise<{ [key: string]: string | string[] | undefined }> }) { $$$BODY }"
+                        },
+                        {"kind": "function_declaration"},
+                        {
+                            "has": {
+                                "pattern": "const $VAR = (await searchParams).$VAR",
+                                "stopBy": "end",
+                            }
+                        },
+                    ]
+                }
+            )
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def use_client_directive(args: RewardArgs, messages: list) -> float:
+    """Reward for correct 'use client' directive placement."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(Config(rule={"kind": "string", "pattern": '"use client"'}))
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def metadata_export(args: RewardArgs, messages: list) -> float:
+    """Reward for valid metadata export."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(Config(rule={"pattern": "export const metadata = { $$$BODY }"}))
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def error_boundary(args: RewardArgs, messages: list) -> float:
+    """Reward for valid error boundary component."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(
+                rule={
+                    "all": [
+                        {
+                            "pattern": """export default function Error({
+  error,
+  reset,
+}: {
+  error: Error
+  reset: () => void
+}) {
+  $$$BODY
+}"""
+                        },
+                        {"has": {"pattern": "reset()", "stopBy": "end"}},
+                    ]
+                }
+            )
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def not_found_boundary(args: RewardArgs, messages: list) -> float:
+    """Reward for not-found boundary component."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"pattern": "export default function NotFound() { $$$BODY }"})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def loading_boundary(args: RewardArgs, messages: list) -> float:
+    """Reward for loading boundary component."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"pattern": "export default function Loading() { $$$BODY }"})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def template_component(args: RewardArgs, messages: list) -> float:
+    """Reward for template component."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(
+                rule={
+                    "all": [
+                        {
+                            "pattern": "export default function Template({ children }: { children: React.ReactNode }) { $$$BODY }"
+                        },
+                        {"has": {"pattern": "children", "stopBy": "end"}},
+                    ]
+                }
+            )
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def redirect_usage(args: RewardArgs, messages: list) -> float:
+    """Reward for usage of Next.js redirect() helper."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"kind": "program", "has": {"pattern": "redirect(", "stopBy": "end"}})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def notfound_function_usage(args: RewardArgs, messages: list) -> float:
+    """Reward for usage of Next.js notFound() function."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"kind": "program", "has": {"pattern": "notFound(", "stopBy": "end"}})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def generate_metadata_function(args: RewardArgs, messages: list) -> float:
+    """Reward for dynamic generateMetadata() function."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"pattern": "export async function generateMetadata() { $$$BODY }"})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def generate_metadata_object(args: RewardArgs, messages: list) -> float:
+    """Reward for static metadata object export."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(Config(rule={"pattern": "export const metadata = { $$$BODY }"}))
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def route_handler_get(args: RewardArgs, messages: list) -> float:
+    """Reward for GET route handler in Next.js Route Handlers."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"pattern": "export async function GET(request: Request) { $$$BODY }"})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def route_handler_post(args: RewardArgs, messages: list) -> float:
+    """Reward for POST route handler in Next.js Route Handlers."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"pattern": "export async function POST(request: Request) { $$$BODY }"})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def default_page_component(args: RewardArgs, messages: list) -> float:
+    """Reward for default page component."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"pattern": "export default function Page() { $$$BODY }"})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def client_component_detection(args: RewardArgs, messages: list) -> float:
+    """Reward for client components using 'use client' directive."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"all": [{"kind": "string"}, {"pattern": '"use client"'}]})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0
+@reward
+def server_component_detection(args: RewardArgs, messages: list) -> float:
+    """Reward for server components (without 'use client')."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        has_function = root.find_all(Config(rule={"kind": "function_declaration"}))
+        has_use_client = root.find_all(Config(rule={"kind": "string", "pattern": '"use client"'}))
+        return 1.0 if has_function and not has_use_client else 0.0
+    except Exception:
+        return 0.0
+@reward
+def parallel_route_segment(args: RewardArgs, messages: list) -> float:
+    """Reward for parallel route segments (e.g., @modal)."""
+    response = messages[-1].get("content", "")
+    match = re.search(r"```(?:typescript|tsx|ts)\n(.*?)```", response, re.DOTALL)
+    if not match:
+        return 0.0
+    try:
+        root = SgRoot(match.group(1).strip(), "tsx").root()
+        matches = root.find_all(
+            Config(rule={"kind": "program", "has": {"pattern": "@", "stopBy": "end"}})
+        )
+        return 1.0 if matches else 0.0
+    except Exception:
+        return 0.0