synkro-0.4.36-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release: this version of synkro might be problematic.
Files changed (81)
  1. synkro/__init__.py +331 -0
  2. synkro/advanced.py +184 -0
  3. synkro/cli.py +156 -0
  4. synkro/core/__init__.py +7 -0
  5. synkro/core/checkpoint.py +250 -0
  6. synkro/core/dataset.py +432 -0
  7. synkro/core/policy.py +337 -0
  8. synkro/errors.py +178 -0
  9. synkro/examples/__init__.py +148 -0
  10. synkro/factory.py +291 -0
  11. synkro/formatters/__init__.py +18 -0
  12. synkro/formatters/chatml.py +121 -0
  13. synkro/formatters/langfuse.py +98 -0
  14. synkro/formatters/langsmith.py +98 -0
  15. synkro/formatters/qa.py +112 -0
  16. synkro/formatters/sft.py +90 -0
  17. synkro/formatters/tool_call.py +127 -0
  18. synkro/generation/__init__.py +9 -0
  19. synkro/generation/follow_ups.py +134 -0
  20. synkro/generation/generator.py +314 -0
  21. synkro/generation/golden_responses.py +269 -0
  22. synkro/generation/golden_scenarios.py +333 -0
  23. synkro/generation/golden_tool_responses.py +791 -0
  24. synkro/generation/logic_extractor.py +126 -0
  25. synkro/generation/multiturn_responses.py +177 -0
  26. synkro/generation/planner.py +131 -0
  27. synkro/generation/responses.py +189 -0
  28. synkro/generation/scenarios.py +90 -0
  29. synkro/generation/tool_responses.py +625 -0
  30. synkro/generation/tool_simulator.py +114 -0
  31. synkro/interactive/__init__.py +16 -0
  32. synkro/interactive/hitl_session.py +205 -0
  33. synkro/interactive/intent_classifier.py +94 -0
  34. synkro/interactive/logic_map_editor.py +176 -0
  35. synkro/interactive/rich_ui.py +459 -0
  36. synkro/interactive/scenario_editor.py +198 -0
  37. synkro/llm/__init__.py +7 -0
  38. synkro/llm/client.py +309 -0
  39. synkro/llm/rate_limits.py +99 -0
  40. synkro/models/__init__.py +50 -0
  41. synkro/models/anthropic.py +26 -0
  42. synkro/models/google.py +19 -0
  43. synkro/models/local.py +104 -0
  44. synkro/models/openai.py +31 -0
  45. synkro/modes/__init__.py +13 -0
  46. synkro/modes/config.py +66 -0
  47. synkro/modes/conversation.py +35 -0
  48. synkro/modes/tool_call.py +18 -0
  49. synkro/parsers.py +442 -0
  50. synkro/pipeline/__init__.py +20 -0
  51. synkro/pipeline/phases.py +592 -0
  52. synkro/pipeline/runner.py +769 -0
  53. synkro/pipelines.py +136 -0
  54. synkro/prompts/__init__.py +57 -0
  55. synkro/prompts/base.py +167 -0
  56. synkro/prompts/golden_templates.py +533 -0
  57. synkro/prompts/interactive_templates.py +198 -0
  58. synkro/prompts/multiturn_templates.py +156 -0
  59. synkro/prompts/templates.py +281 -0
  60. synkro/prompts/tool_templates.py +318 -0
  61. synkro/quality/__init__.py +14 -0
  62. synkro/quality/golden_refiner.py +163 -0
  63. synkro/quality/grader.py +153 -0
  64. synkro/quality/multiturn_grader.py +150 -0
  65. synkro/quality/refiner.py +137 -0
  66. synkro/quality/tool_grader.py +126 -0
  67. synkro/quality/tool_refiner.py +128 -0
  68. synkro/quality/verifier.py +228 -0
  69. synkro/reporting.py +464 -0
  70. synkro/schemas.py +521 -0
  71. synkro/types/__init__.py +43 -0
  72. synkro/types/core.py +153 -0
  73. synkro/types/dataset_type.py +33 -0
  74. synkro/types/logic_map.py +348 -0
  75. synkro/types/tool.py +94 -0
  76. synkro-0.4.36.data/data/examples/__init__.py +148 -0
  77. synkro-0.4.36.dist-info/METADATA +507 -0
  78. synkro-0.4.36.dist-info/RECORD +81 -0
  79. synkro-0.4.36.dist-info/WHEEL +4 -0
  80. synkro-0.4.36.dist-info/entry_points.txt +2 -0
  81. synkro-0.4.36.dist-info/licenses/LICENSE +21 -0
synkro/modes/config.py ADDED
@@ -0,0 +1,66 @@
+ """Mode configuration that bundles prompts, schema, and formatter per dataset type."""
+
+ from dataclasses import dataclass
+ from typing import TYPE_CHECKING
+
+ if TYPE_CHECKING:
+     from synkro.types.dataset_type import DatasetType
+
+
+ @dataclass
+ class ModeConfig:
+     """
+     Configuration bundle for a dataset type.
+
+     Defines all the prompts, schemas, and formatters needed
+     to generate a specific type of dataset.
+     """
+
+     # Prompts
+     scenario_prompt: str
+     """Prompt for generating scenarios/questions"""
+
+     response_prompt: str
+     """Prompt for generating responses/answers"""
+
+     grade_prompt: str
+     """Prompt for grading quality"""
+
+     refine_prompt: str
+     """Prompt for refining failed responses"""
+
+     # Output configuration
+     output_description: str
+     """Human-readable description of the output format"""
+
+
+ def get_mode_config(dataset_type: "DatasetType") -> ModeConfig:
+     """
+     Get the mode configuration for a dataset type.
+
+     Args:
+         dataset_type: The type of dataset to generate
+
+     Returns:
+         ModeConfig with the appropriate prompts and settings
+
+     Example:
+         >>> from synkro import DatasetType
+         >>> config = get_mode_config(DatasetType.CONVERSATION)
+     """
+     # Imported lazily to avoid a circular import with the mode modules.
+     from synkro.modes.conversation import CONVERSATION_CONFIG, INSTRUCTION_CONFIG, EVALUATION_CONFIG
+     from synkro.modes.tool_call import TOOL_CALL_CONFIG
+
+     configs = {
+         "conversation": CONVERSATION_CONFIG,
+         "instruction": INSTRUCTION_CONFIG,
+         "evaluation": EVALUATION_CONFIG,
+         "tool_call": TOOL_CALL_CONFIG,
+     }
+
+     type_value = dataset_type.value if hasattr(dataset_type, "value") else str(dataset_type)
+
+     if type_value not in configs:
+         raise ValueError(f"Unknown dataset type: {dataset_type}")
+
+     return configs[type_value]
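To make the lookup concrete, here is a minimal usage sketch (illustrative, not part of the wheel; it relies on `DatasetType.CONVERSATION` having the value "conversation", which is what the `configs` dict keys imply):

    from synkro import DatasetType
    from synkro.modes.config import get_mode_config

    config = get_mode_config(DatasetType.CONVERSATION)
    print(config.output_description)
    # Multi-turn conversation: {messages: [{role, content}, ...]}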
synkro/modes/conversation.py ADDED
@@ -0,0 +1,35 @@
+ """Conversation mode configuration."""
+
+ from synkro.modes.config import ModeConfig
+ from synkro.prompts.templates import (
+     SCENARIO_GENERATOR_PROMPT,
+     SINGLE_RESPONSE_PROMPT,
+     SINGLE_GRADE_PROMPT,
+     BATCHED_REFINER_PROMPT,
+ )
+
+ CONVERSATION_CONFIG = ModeConfig(
+     scenario_prompt=SCENARIO_GENERATOR_PROMPT,
+     response_prompt=SINGLE_RESPONSE_PROMPT,
+     grade_prompt=SINGLE_GRADE_PROMPT,
+     refine_prompt=BATCHED_REFINER_PROMPT,
+     output_description="Multi-turn conversation: {messages: [{role, content}, ...]}",
+ )
+
+ # Instruction uses the same prompts - turns=1 is enforced in the generator
+ INSTRUCTION_CONFIG = ModeConfig(
+     scenario_prompt=SCENARIO_GENERATOR_PROMPT,
+     response_prompt=SINGLE_RESPONSE_PROMPT,
+     grade_prompt=SINGLE_GRADE_PROMPT,
+     refine_prompt=BATCHED_REFINER_PROMPT,
+     output_description="Single-turn instruction: {messages: [{role: 'user'}, {role: 'assistant'}]}",
+ )
+
+ # Evaluation uses the same prompts but outputs Q&A format with ground truth
+ EVALUATION_CONFIG = ModeConfig(
+     scenario_prompt=SCENARIO_GENERATOR_PROMPT,
+     response_prompt=SINGLE_RESPONSE_PROMPT,
+     grade_prompt=SINGLE_GRADE_PROMPT,
+     refine_prompt=BATCHED_REFINER_PROMPT,
+     output_description="Q&A evaluation: {question, answer, expected_outcome, ground_truth_rules, difficulty}",
+ )
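As the comments note, the three configs share the same prompt templates and differ only in `output_description` (plus how the generator enforces turn counts); a quick sketch of that invariant:

    from synkro.modes.conversation import CONVERSATION_CONFIG, INSTRUCTION_CONFIG

    assert CONVERSATION_CONFIG.scenario_prompt is INSTRUCTION_CONFIG.scenario_prompt
    assert CONVERSATION_CONFIG.output_description != INSTRUCTION_CONFIG.output_description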
synkro/modes/tool_call.py ADDED
@@ -0,0 +1,18 @@
+ """Tool Call mode configuration."""
+
+ from synkro.modes.config import ModeConfig
+ from synkro.prompts.tool_templates import (
+     TOOL_SCENARIO_PROMPT,
+     TOOL_RESPONSE_PROMPT,
+     TOOL_GRADE_PROMPT,
+     TOOL_REFINE_PROMPT,
+ )
+
+ TOOL_CALL_CONFIG = ModeConfig(
+     scenario_prompt=TOOL_SCENARIO_PROMPT,
+     response_prompt=TOOL_RESPONSE_PROMPT,
+     grade_prompt=TOOL_GRADE_PROMPT,
+     refine_prompt=TOOL_REFINE_PROMPT,
+     output_description="Tool calling: {messages: [system, user, {tool_calls}, {tool}, assistant]}",
+ )
+
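Expanded into an actual trace, the `output_description` shape above would look roughly like this (an illustrative sketch assuming the OpenAI-style tool-message convention; the exact field names used by synkro's formatters are not shown in this hunk):

    messages = [
        {"role": "system", "content": "You are a support agent."},
        {"role": "user", "content": "Cancel order 1234."},
        {"role": "assistant", "tool_calls": [{
            "id": "call_1",
            "type": "function",
            "function": {"name": "cancel_order", "arguments": '{"order_id": "1234"}'},
        }]},
        {"role": "tool", "tool_call_id": "call_1", "content": '{"status": "cancelled"}'},
        {"role": "assistant", "content": "Order 1234 has been cancelled."},
    ]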
synkro/parsers.py ADDED
@@ -0,0 +1,442 @@
+ """Response parsing functions for LLM outputs with robust JSON extraction."""
+
+ import json
+ import re
+ from typing import Any
+
+ from synkro.schemas import (
+     ScenarioOutput,
+     GradeOutput,
+     SingleGrade,
+     SingleResponse,
+     PolicyComplexity,
+     PolicyPlan,
+     ChatMessage,
+ )
+ from synkro.prompts.templates import SYSTEM_PROMPT
+
+
+ def strip_markdown_fences(content: str) -> str:
+     """Strip markdown code fences from content."""
+     # Remove ```json ... ``` fences, keeping just the enclosed content
+     content = re.sub(r"```json\s*", "", content)
+     content = re.sub(r"```\s*", "", content)
+     return content.strip()
+
+
+ def extract_json(content: str, start_char: str = "[") -> str | None:
+     """
+     Extract JSON from a string that may contain other text.
+
+     Args:
+         content: Raw content that may contain JSON
+         start_char: Starting character to look for ('[' for arrays, '{' for objects)
+
+     Returns:
+         Extracted JSON string, or None if not found
+     """
+     end_char = "]" if start_char == "[" else "}"
+     start = content.find(start_char)
+     if start == -1:
+         return None
+
+     # Walk the string tracking bracket depth, skipping quoted strings and
+     # escaped characters so brackets inside values are not counted.
+     depth = 0
+     in_string = False
+     escape = False
+
+     for i in range(start, len(content)):
+         char = content[i]
+
+         if escape:
+             escape = False
+             continue
+
+         if char == "\\" and in_string:
+             escape = True
+             continue
+
+         if char == '"':
+             in_string = not in_string
+             continue
+
+         if in_string:
+             continue
+
+         if char == start_char:
+             depth += 1
+         if char == end_char:
+             depth -= 1
+             if depth == 0:
+                 return content[start : i + 1]
+
+     return None
+
+
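Because the scanner tracks nesting depth and string state, it recovers the first balanced JSON value even when the model wraps it in chatter; a minimal sketch using the function above:

    from synkro.parsers import extract_json

    raw = 'Sure, here you go: [{"note": "a [bracket] inside a string"}] hope that helps!'
    print(extract_json(raw, "["))
    # [{"note": "a [bracket] inside a string"}]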
+ def extract_content(response: Any) -> str:
+     """
+     Extract text content from various LLM response formats.
+
+     Args:
+         response: Raw response from an LLM
+
+     Returns:
+         Extracted text content
+     """
+     try:
+         if isinstance(response, str):
+             return response
+
+         if isinstance(response, dict):
+             # Gemini format
+             if "candidates" in response:
+                 return response["candidates"][0]["content"]["parts"][0]["text"]
+
+             # OpenAI format
+             if "choices" in response:
+                 return response["choices"][0]["message"]["content"]
+
+             # Simple content/text/output fields
+             if "content" in response:
+                 return response["content"]
+
+             if "text" in response:
+                 return response["text"]
+
+             if "output" in response:
+                 return response["output"]
+
+         return json.dumps(response)
+     except Exception:
+         return str(response)
+
+
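The same helper flattens provider-specific payloads to plain text; for instance, with dicts shaped like the Gemini and OpenAI formats named in the comments (sketch):

    from synkro.parsers import extract_content

    openai_style = {"choices": [{"message": {"content": "hello"}}]}
    gemini_style = {"candidates": [{"content": {"parts": [{"text": "hi"}]}}]}
    print(extract_content(openai_style), extract_content(gemini_style))
    # hello hi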
+ def parse_scenarios(response: Any, expected_count: int) -> list[ScenarioOutput]:
+     """
+     Parse scenario output from an LLM response.
+
+     Args:
+         response: Raw LLM response
+         expected_count: Number of scenarios expected
+
+     Returns:
+         List of parsed scenarios
+     """
+     try:
+         content = extract_content(response)
+         json_str = extract_json(content, "[")
+
+         if json_str:
+             parsed = json.loads(json_str)
+
+             if isinstance(parsed, list):
+                 scenarios = []
+                 for s in parsed[:expected_count]:
+                     scenarios.append(
+                         ScenarioOutput(
+                             scenario=s.get("scenario", s.get("description", "")),
+                             context=s.get("context", s.get("background", "")),
+                         )
+                     )
+                 return scenarios
+     except Exception:
+         pass  # Fallback handles this
+
+     # Fallback: generate placeholder scenarios
+     return [
+         ScenarioOutput(
+             scenario=f"Policy compliance scenario {i + 1}",
+             context="General policy application context",
+         )
+         for i in range(expected_count)
+     ]
+
+
+ def parse_batched_responses(
+     response: Any, expected_count: int, scenarios: list[ScenarioOutput]
+ ) -> list[dict]:
+     """
+     Parse batched response output from the LLM.
+
+     Args:
+         response: Raw LLM response
+         expected_count: Number of responses expected
+         scenarios: Original scenarios for fallback
+
+     Returns:
+         List of response dicts with 'index' and 'messages'
+     """
+     try:
+         content = extract_content(response)
+         json_str = extract_json(content, "[")
+
+         if json_str:
+             parsed = json.loads(json_str)
+
+             if isinstance(parsed, list):
+                 results = []
+                 for r in parsed:
+                     index = r.get("index", 0)
+
+                     if isinstance(r.get("messages"), list) and len(r["messages"]) > 0:
+                         results.append(
+                             {
+                                 "index": index,
+                                 "messages": [
+                                     ChatMessage(role=m["role"], content=m.get("content", ""))
+                                     for m in r["messages"]
+                                 ],
+                             }
+                         )
+                     else:
+                         # Fallback: construct messages from the old flat format
+                         scenario = scenarios[index] if index < len(scenarios) else scenarios[0]
+                         results.append(
+                             {
+                                 "index": index,
+                                 "messages": [
+                                     ChatMessage(role="system", content=SYSTEM_PROMPT),
+                                     ChatMessage(
+                                         role="user",
+                                         content=f"Scenario: {scenario.scenario}\n\nContext: {scenario.context}",
+                                     ),
+                                     ChatMessage(role="assistant", content=r.get("response", "")),
+                                 ],
+                             }
+                         )
+                 return results
+     except Exception:
+         pass  # Fallback handles this
+
+     # Fallback
+     return [
+         {
+             "index": i,
+             "messages": [
+                 ChatMessage(role="system", content=SYSTEM_PROMPT),
+                 ChatMessage(
+                     role="user",
+                     content=f"Scenario: {scenarios[i].scenario}\n\nContext: {scenarios[i].context}",
+                 ),
+                 ChatMessage(role="assistant", content="Unable to generate response"),
+             ],
+         }
+         for i in range(min(expected_count, len(scenarios)))
+     ]
+
+
+ def parse_batched_grades(response: Any) -> list[GradeOutput]:
+     """
+     Parse grading output from an LLM response.
+
+     Args:
+         response: Raw LLM response
+
+     Returns:
+         List of parsed grades
+     """
+     try:
+         content = extract_content(response)
+         json_str = extract_json(content, "[")
+
+         if json_str:
+             parsed = json.loads(json_str)
+
+             if isinstance(parsed, list):
+                 grades = []
+                 for g in parsed:
+                     grades.append(
+                         GradeOutput(
+                             index=g.get("index", 0),
+                             passed=g.get("pass", False),
+                             policy_violations=g.get("policy_violations", []),
+                             missing_citations=g.get("missing_citations", []),
+                             incomplete_reasoning=g.get("incomplete_reasoning", []),
+                             vague_recommendations=g.get("vague_recommendations", []),
+                             feedback=g.get("feedback", ""),
+                         )
+                     )
+                 return grades
+     except Exception:
+         pass  # Return empty list below
+
+     return []
+
+
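For reference, the `g.get(...)` keys above imply the grader emits an array of objects like the following (an illustrative Python literal inferred from the parser, not quoted from the grading prompts). Note the wire key is "pass" while the schema field is `passed`:

    expected_grader_output = [
        {
            "index": 0,
            "pass": False,
            "policy_violations": ["refund issued outside the stated window"],
            "missing_citations": [],
            "incomplete_reasoning": [],
            "vague_recommendations": [],
            "feedback": "Cite the specific refund rule being applied.",
        },
    ]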
+ def parse_single_response(response: Any) -> SingleResponse | None:
+     """
+     Parse a single response from parallel generation.
+
+     Args:
+         response: Raw LLM response for a single scenario
+
+     Returns:
+         Parsed SingleResponse, or None if parsing failed
+     """
+     try:
+         content = extract_content(response)
+         # Strip markdown fences first
+         content = strip_markdown_fences(content)
+
+         # Scan for valid JSON objects that carry a messages list
+         remaining = content
+         while remaining:
+             json_str = extract_json(remaining, "{")
+             if not json_str:
+                 break
+
+             try:
+                 parsed = json.loads(json_str)
+
+                 # Validate that it has the expected structure
+                 if isinstance(parsed.get("messages"), list) and len(parsed["messages"]) >= 1:
+                     messages = []
+                     valid = True
+
+                     for m in parsed["messages"]:
+                         if not isinstance(m, dict) or "role" not in m or "content" not in m:
+                             valid = False
+                             break
+
+                         msg_content = m.get("content", "")
+                         # Reject content that leaked the refinement prompt itself
+                         if "GRADER FEEDBACK" in msg_content or "Generate an IMPROVED response" in msg_content:
+                             valid = False
+                             break
+
+                         messages.append(ChatMessage(role=m["role"], content=msg_content))
+
+                     if valid and len(messages) >= 1:
+                         return SingleResponse(messages=messages)
+
+             except json.JSONDecodeError:
+                 pass
+
+             # Move past this JSON object and look for another
+             end_pos = remaining.find(json_str) + len(json_str)
+             remaining = remaining[end_pos:]
+
+     except Exception:
+         pass  # Caller handles None with fallback
+
+     return None
+
+
+ def parse_single_grade(response: Any) -> SingleGrade | None:
+     """
+     Parse a single grade from parallel grading.
+
+     Args:
+         response: Raw LLM response for a single grade
+
+     Returns:
+         Parsed SingleGrade, or None if parsing failed
+     """
+     try:
+         content = extract_content(response)
+         json_str = extract_json(content, "{")
+
+         if json_str:
+             parsed = json.loads(json_str)
+             return SingleGrade(
+                 passed=parsed.get("pass", False),
+                 policy_violations=parsed.get("policy_violations", []),
+                 missing_citations=parsed.get("missing_citations", []),
+                 incomplete_reasoning=parsed.get("incomplete_reasoning", []),
+                 vague_recommendations=parsed.get("vague_recommendations", []),
+                 feedback=parsed.get("feedback", ""),
+             )
+     except Exception:
+         pass  # Caller handles None with fallback
+
+     return None
+
+
+ def parse_policy_complexity(response: Any) -> PolicyComplexity:
+     """
+     Parse policy complexity analysis from an LLM response.
+
+     Args:
+         response: Raw LLM response
+
+     Returns:
+         Parsed PolicyComplexity, with defaults if parsing fails
+     """
+     try:
+         content = extract_content(response)
+         json_str = extract_json(content, "{")
+
+         if json_str:
+             parsed = json.loads(json_str)
+             return PolicyComplexity(
+                 variable_count=parsed.get("variable_count", 2),
+                 complexity_level=parsed.get("complexity_level", "conditional"),
+                 recommended_turns=parsed.get("recommended_turns", 3),
+                 reasoning=parsed.get("reasoning", "Defaulting to conditional complexity"),
+             )
+     except Exception:
+         pass  # Fallback handles this
+
+     # Default fallback
+     return PolicyComplexity(
+         variable_count=2,
+         complexity_level="conditional",
+         recommended_turns=3,
+         reasoning="Unable to analyze policy, defaulting to conditional complexity with 3 turns",
+     )
+
+
+ def parse_policy_plan(response: Any, target_traces: int) -> PolicyPlan:
+     """
+     Parse policy planning output from an LLM response.
+
+     Args:
+         response: Raw LLM response
+         target_traces: Target number of traces for the fallback plan
+
+     Returns:
+         Parsed PolicyPlan, with defaults if parsing fails
+     """
+     try:
+         content = extract_content(response)
+         json_str = extract_json(content, "{")
+
+         if json_str:
+             parsed = json.loads(json_str)
+
+             categories = []
+             for cat in parsed.get("categories", []):
+                 categories.append(
+                     {
+                         "name": cat.get("name", "General"),
+                         "description": cat.get("description", "General scenarios"),
+                         "traces": cat.get("traces", target_traces // 3),
+                     }
+                 )
+
+             if categories:
+                 return PolicyPlan(
+                     categories=categories,
+                     reasoning=parsed.get("reasoning", ""),
+                 )
+     except Exception:
+         pass  # Fallback handles this
+
+     # Default fallback plan: split traces three ways, giving the remainder to Violations
+     third = target_traces // 3
+     remainder = target_traces - (third * 3)
+     return PolicyPlan(
+         categories=[
+             {"name": "Happy Path", "description": "Clear success cases", "traces": third},
+             {"name": "Edge Cases", "description": "Ambiguous situations", "traces": third},
+             {
+                 "name": "Violations",
+                 "description": "Clear failure cases",
+                 "traces": third + remainder,
+             },
+         ],
+         reasoning="Default plan - unable to parse LLM response",
+     )
+
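The fallback split always sums back to `target_traces`: with `target_traces=10`, `third = 10 // 3 = 3` and `remainder = 10 - 9 = 1`, giving Happy Path 3, Edge Cases 3, and Violations 4. A quick check (sketch; any non-JSON input triggers the fallback):

    from synkro.parsers import parse_policy_plan

    plan = parse_policy_plan("not json at all", target_traces=10)
    print([c["traces"] for c in plan.categories])  # [3, 3, 4]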
synkro/pipeline/__init__.py ADDED
@@ -0,0 +1,20 @@
+ """Pipeline module for decomposed generation phases."""
+
+ from synkro.pipeline.phases import (
+     PlanPhase,
+     ScenarioPhase,
+     ResponsePhase,
+     GradingPhase,
+     ToolCallResponsePhase,
+ )
+ from synkro.pipeline.runner import GenerationPipeline
+
+ __all__ = [
+     "PlanPhase",
+     "ScenarioPhase",
+     "ResponsePhase",
+     "GradingPhase",
+     "ToolCallResponsePhase",
+     "GenerationPipeline",
+ ]
+
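Since `__all__` re-exports both the phases and the runner, downstream code can work from a single import path (sketch; the GenerationPipeline constructor signature is not visible in this diff, so it is deliberately not instantiated here):

    from synkro.pipeline import (
        GenerationPipeline,
        PlanPhase,
        ScenarioPhase,
        ResponsePhase,
        GradingPhase,
    )

    # Phases are importable individually for custom orchestration;
    # GenerationPipeline (synkro/pipeline/runner.py) wires them together.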