PyPI - deepwork - Versions diffs - 0.1.0__py3-none-any.whl - Mend

deepwork 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (41) hide show

deepwork/__init__.py +25 -0
deepwork/cli/__init__.py +1 -0
deepwork/cli/install.py +290 -0
deepwork/cli/main.py +25 -0
deepwork/cli/sync.py +176 -0
deepwork/core/__init__.py +1 -0
deepwork/core/adapters.py +373 -0
deepwork/core/detector.py +93 -0
deepwork/core/generator.py +290 -0
deepwork/core/hooks_syncer.py +206 -0
deepwork/core/parser.py +310 -0
deepwork/core/policy_parser.py +285 -0
deepwork/hooks/__init__.py +1 -0
deepwork/hooks/evaluate_policies.py +159 -0
deepwork/schemas/__init__.py +1 -0
deepwork/schemas/job_schema.py +212 -0
deepwork/schemas/policy_schema.py +68 -0
deepwork/standard_jobs/deepwork_jobs/job.yml +102 -0
deepwork/standard_jobs/deepwork_jobs/steps/define.md +359 -0
deepwork/standard_jobs/deepwork_jobs/steps/implement.md +435 -0
deepwork/standard_jobs/deepwork_jobs/steps/refine.md +447 -0
deepwork/standard_jobs/deepwork_policy/hooks/capture_work_tree.sh +26 -0
deepwork/standard_jobs/deepwork_policy/hooks/get_changed_files.sh +30 -0
deepwork/standard_jobs/deepwork_policy/hooks/global_hooks.yml +8 -0
deepwork/standard_jobs/deepwork_policy/hooks/policy_stop_hook.sh +72 -0
deepwork/standard_jobs/deepwork_policy/hooks/user_prompt_submit.sh +17 -0
deepwork/standard_jobs/deepwork_policy/job.yml +35 -0
deepwork/standard_jobs/deepwork_policy/steps/define.md +174 -0
deepwork/templates/__init__.py +1 -0
deepwork/templates/claude/command-job-step.md.jinja +210 -0
deepwork/templates/gemini/command-job-step.toml.jinja +169 -0
deepwork/utils/__init__.py +1 -0
deepwork/utils/fs.py +128 -0
deepwork/utils/git.py +164 -0
deepwork/utils/validation.py +31 -0
deepwork/utils/yaml_utils.py +89 -0
deepwork-0.1.0.dist-info/METADATA +389 -0
deepwork-0.1.0.dist-info/RECORD +41 -0
deepwork-0.1.0.dist-info/WHEEL +4 -0
deepwork-0.1.0.dist-info/entry_points.txt +2 -0
deepwork-0.1.0.dist-info/licenses/LICENSE.md +60 -0

deepwork/core/parser.py ADDED Viewed

@@ -0,0 +1,310 @@
+"""Job definition parser."""
+from dataclasses import dataclass, field
+from pathlib import Path
+from typing import Any
+from deepwork.schemas.job_schema import JOB_SCHEMA, LIFECYCLE_HOOK_EVENTS
+from deepwork.utils.validation import ValidationError, validate_against_schema
+from deepwork.utils.yaml_utils import YAMLError, load_yaml
class ParseError(Exception):
    """Signal that a job definition could not be loaded, validated, or parsed."""
+@dataclass
+class StepInput:
+    """Represents a step input (either user parameter or file from previous step)."""
+    # User parameter input
+    name: str | None = None
+    description: str | None = None
+    # File input from previous step
+    file: str | None = None
+    from_step: str | None = None
+    def is_user_input(self) -> bool:
+        """Check if this is a user parameter input."""
+        return self.name is not None and self.description is not None
+    def is_file_input(self) -> bool:
+        """Check if this is a file input from previous step."""
+        return self.file is not None and self.from_step is not None
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "StepInput":
+        """Create StepInput from dictionary."""
+        return cls(
+            name=data.get("name"),
+            description=data.get("description"),
+            file=data.get("file"),
+            from_step=data.get("from_step"),
+        )
+@dataclass
+class HookAction:
+    """Represents a hook action configuration.
+    Hook actions define what happens when a lifecycle hook is triggered.
+    Three types are supported:
+    - prompt: Inline prompt text for validation/action
+    - prompt_file: Path to a file containing the prompt
+    - script: Path to a shell script for custom logic
+    """
+    # Inline prompt
+    prompt: str | None = None
+    # Prompt file reference (relative to job directory)
+    prompt_file: str | None = None
+    # Shell script reference (relative to job directory)
+    script: str | None = None
+    def is_prompt(self) -> bool:
+        """Check if this is an inline prompt hook."""
+        return self.prompt is not None
+    def is_prompt_file(self) -> bool:
+        """Check if this is a prompt file reference hook."""
+        return self.prompt_file is not None
+    def is_script(self) -> bool:
+        """Check if this is a shell script hook."""
+        return self.script is not None
+    @classmethod
+    def from_dict(cls, data: dict[str, Any]) -> "HookAction":
+        """Create HookAction from dictionary."""
+        return cls(
+            prompt=data.get("prompt"),
+            prompt_file=data.get("prompt_file"),
+            script=data.get("script"),
+        )
+# Backward compatibility alias
+StopHook = HookAction
@dataclass
class Step:
    """One step of a job, including its inputs, outputs, and lifecycle hooks."""

    id: str
    name: str
    description: str
    instructions_file: str
    inputs: list[StepInput] = field(default_factory=list)
    outputs: list[str] = field(default_factory=list)
    dependencies: list[str] = field(default_factory=list)
    # Maps a lifecycle event name (after_agent, before_tool, before_prompt)
    # to the actions registered for that event.
    hooks: dict[str, list[HookAction]] = field(default_factory=dict)

    @property
    def stop_hooks(self) -> list[HookAction]:
        """Legacy accessor: the actions registered for ``after_agent``.

        Returns an empty list when no such actions exist.
        """
        return self.hooks.get("after_agent", [])

    @classmethod
    def from_dict(cls, data: dict[str, Any]) -> "Step":
        """Build a Step from a mapping.

        ``id``, ``name``, ``description``, ``instructions_file`` and
        ``outputs`` are read with plain indexing, so a missing key raises
        ``KeyError``. ``inputs``, ``dependencies``, ``hooks`` and the
        deprecated ``stop_hooks`` are optional.
        """

        def to_actions(raw_actions: Any) -> list[HookAction]:
            return [HookAction.from_dict(raw) for raw in raw_actions]

        parsed_hooks: dict[str, list[HookAction]] = {}
        if "hooks" in data:
            declared = data["hooks"]
            # Only events listed in LIFECYCLE_HOOK_EVENTS are picked up.
            parsed_hooks = {
                event: to_actions(declared[event])
                for event in LIFECYCLE_HOOK_EVENTS
                if event in declared
            }

        # Deprecated stop_hooks entries are appended to after_agent.
        legacy_actions = data.get("stop_hooks")
        if legacy_actions:
            parsed_hooks.setdefault("after_agent", []).extend(to_actions(legacy_actions))

        return cls(
            id=data["id"],
            name=data["name"],
            description=data["description"],
            instructions_file=data["instructions_file"],
            inputs=[StepInput.from_dict(raw) for raw in data.get("inputs", [])],
            outputs=data["outputs"],
            dependencies=data.get("dependencies", []),
            hooks=parsed_hooks,
        )
@dataclass
class JobDefinition:
    """A complete job: metadata, its steps, and the directory it came from."""

    name: str
    version: str
    summary: str
    description: str | None
    steps: list[Step]
    job_dir: Path

    def get_step(self, step_id: str) -> Step | None:
        """Return the first step whose ``id`` equals *step_id*.

        Args:
            step_id: Step ID to look up

        Returns:
            The matching Step, or None when no step has that ID
        """
        return next((candidate for candidate in self.steps if candidate.id == step_id), None)

    def validate_dependencies(self) -> None:
        """Check that dependencies point at existing steps and form no cycle.

        Raises:
            ParseError: If a dependency names an unknown step, or the
                dependency graph contains a cycle
        """
        known_ids = {step.id for step in self.steps}

        # Every dependency must name a step of this job.
        for step in self.steps:
            for dep_id in step.dependencies:
                if dep_id not in known_ids:
                    raise ParseError(f"Step '{step.id}' depends on non-existent step '{dep_id}'")

        # Depth-first search: meeting a step that is still on the current
        # path means the dependencies loop back on themselves.
        seen = set()
        on_path = set()

        def reaches_cycle(current_id: str) -> bool:
            seen.add(current_id)
            on_path.add(current_id)
            node = self.get_step(current_id)
            if node:
                for dep_id in node.dependencies:
                    if dep_id in on_path:
                        return True
                    if dep_id not in seen and reaches_cycle(dep_id):
                        return True
            on_path.remove(current_id)
            return False

        for step in self.steps:
            if step.id not in seen and reaches_cycle(step.id):
                raise ParseError(f"Circular dependency detected involving step '{step.id}'")

    def validate_file_inputs(self) -> None:
        """Check that every file input comes from an existing, declared dependency.

        Raises:
            ParseError: If a file input names an unknown step, or a step
                that is not listed in the consuming step's dependencies
        """
        for step in self.steps:
            for inp in step.inputs:
                if not inp.is_file_input():
                    continue
                source_id = inp.from_step
                # The producing step has to exist...
                if self.get_step(source_id) is None:  # type: ignore
                    raise ParseError(
                        f"Step '{step.id}' references non-existent step "
                        f"'{source_id}' in file input"
                    )
                # ...and has to be declared as a dependency of this step.
                if source_id not in step.dependencies:
                    raise ParseError(
                        f"Step '{step.id}' has file input from '{source_id}' "
                        f"but '{source_id}' is not in dependencies"
                    )

    @classmethod
    def from_dict(cls, data: dict[str, Any], job_dir: Path) -> "JobDefinition":
        """Build a JobDefinition from parsed YAML data.

        Args:
            data: Parsed YAML data
            job_dir: Directory containing job definition

        Returns:
            JobDefinition instance
        """
        attributes = {
            "name": data["name"],
            "version": data["version"],
            "summary": data["summary"],
            "description": data.get("description"),
            "steps": [Step.from_dict(raw_step) for raw_step in data["steps"]],
            "job_dir": job_dir,
        }
        return cls(**attributes)
def parse_job_definition(job_dir: Path | str) -> JobDefinition:
    """Load, validate, and parse the ``job.yml`` found in *job_dir*.

    Args:
        job_dir: Directory containing job.yml

    Returns:
        Parsed JobDefinition

    Raises:
        ParseError: If the directory or job.yml is missing, the YAML cannot
            be loaded or is empty, schema validation fails, or the
            dependency / file-input checks fail
    """
    root = Path(job_dir)
    if not root.exists():
        raise ParseError(f"Job directory does not exist: {root}")
    if not root.is_dir():
        raise ParseError(f"Job path is not a directory: {root}")

    manifest = root / "job.yml"
    if not manifest.exists():
        raise ParseError(f"job.yml not found in {root}")

    # Read the YAML document.
    try:
        raw_job = load_yaml(manifest)
    except YAMLError as exc:
        raise ParseError(f"Failed to load job.yml: {exc}") from exc
    if raw_job is None:
        raise ParseError("job.yml is empty")

    # Check the document against the job schema before building objects.
    try:
        validate_against_schema(raw_job, JOB_SCHEMA)
    except ValidationError as exc:
        raise ParseError(f"Job definition validation failed: {exc}") from exc

    # Build the dataclasses, then run the cross-step checks.
    definition = JobDefinition.from_dict(raw_job, root)
    definition.validate_dependencies()
    definition.validate_file_inputs()
    return definition

deepwork/core/policy_parser.py ADDED Viewed

@@ -0,0 +1,285 @@
+"""Policy definition parser."""
+from dataclasses import dataclass, field
+from fnmatch import fnmatch
+from pathlib import Path
+from typing import Any
+import yaml
+from deepwork.schemas.policy_schema import POLICY_SCHEMA
+from deepwork.utils.validation import ValidationError, validate_against_schema
class PolicyParseError(Exception):
    """Signal that a policy file or policy entry could not be parsed."""
+@dataclass
+class Policy:
+    """Represents a single policy definition."""
+    name: str
+    triggers: list[str]  # Normalized to list
+    safety: list[str] = field(default_factory=list)  # Normalized to list, empty if not specified
+    instructions: str = ""  # Resolved content (either inline or from file)
+    @classmethod
+    def from_dict(cls, data: dict[str, Any], base_dir: Path | None = None) -> "Policy":
+        """
+        Create Policy from dictionary.
+        Args:
+            data: Parsed YAML data for a single policy
+            base_dir: Base directory for resolving instructions_file paths
+        Returns:
+            Policy instance
+        Raises:
+            PolicyParseError: If instructions cannot be resolved
+        """
+        # Normalize trigger to list
+        trigger = data["trigger"]
+        triggers = [trigger] if isinstance(trigger, str) else list(trigger)
+        # Normalize safety to list (empty if not present)
+        safety_data = data.get("safety", [])
+        safety = [safety_data] if isinstance(safety_data, str) else list(safety_data)
+        # Resolve instructions
+        if "instructions" in data:
+            instructions = data["instructions"]
+        elif "instructions_file" in data:
+            if base_dir is None:
+                raise PolicyParseError(
+                    f"Policy '{data['name']}' uses instructions_file but no base_dir provided"
+                )
+            instructions_path = base_dir / data["instructions_file"]
+            if not instructions_path.exists():
+                raise PolicyParseError(
+                    f"Policy '{data['name']}' instructions file not found: {instructions_path}"
+                )
+            try:
+                instructions = instructions_path.read_text()
+            except Exception as e:
+                raise PolicyParseError(
+                    f"Policy '{data['name']}' failed to read instructions file: {e}"
+                ) from e
+        else:
+            # Schema should catch this, but be defensive
+            raise PolicyParseError(
+                f"Policy '{data['name']}' must have either 'instructions' or 'instructions_file'"
+            )
+        return cls(
+            name=data["name"],
+            triggers=triggers,
+            safety=safety,
+            instructions=instructions,
+        )
def matches_pattern(file_path: str, patterns: list[str]) -> bool:
    """
    Check if a file path matches any of the given glob patterns.

    Args:
        file_path: File path to check (relative path)
        patterns: List of glob patterns to match against

    Returns:
        True if the file matches any pattern, False otherwise (including
        when ``patterns`` is empty)
    """
    return any(_matches_glob(file_path, pattern) for pattern in patterns)


def _glob_prefix_remainders(file_path: str, prefix: str) -> list[str]:
    """Return what is left of *file_path* for each way *prefix* matches its start.

    *prefix* is the part of a pattern before ``**`` with trailing slashes
    removed. An empty result means the prefix does not match at all.
    """
    remainders = []
    # Literal directory prefix: the path is the prefix or lives below it.
    if file_path == prefix or file_path.startswith(prefix + "/"):
        remainders.append(file_path[len(prefix) :].lstrip("/"))
    # Wildcard prefix (e.g. "packages/*/src"): try it against every run of
    # leading path segments.
    if any(char in prefix for char in "*?["):
        segments = file_path.split("/")
        for count in range(1, len(segments) + 1):
            if fnmatch("/".join(segments[:count]), prefix):
                remainders.append("/".join(segments[count:]))
    return remainders


def _matches_glob(file_path: str, pattern: str) -> bool:
    """
    Match a file path against a glob pattern, supporting ** for recursive matching.

    ``**`` matches zero or more directories and may appear several times in
    one pattern. Everything else is matched with ``fnmatch``, so a single
    ``*`` may also span ``/``. Backslashes in both arguments are treated as
    path separators.

    Args:
        file_path: File path to check
        pattern: Glob pattern (supports *, **, ?)

    Returns:
        True if matches
    """
    # Normalize path separators
    file_path = file_path.replace("\\", "/")
    pattern = pattern.replace("\\", "/")

    # Simple pattern without **
    if "**" not in pattern:
        return fnmatch(file_path, pattern)

    # Split on the first **; the suffix may hold further ** and is matched
    # recursively below.
    prefix, _, suffix = pattern.partition("**")
    suffix = suffix.lstrip("/")

    if prefix:
        remainders = _glob_prefix_remainders(file_path, prefix.rstrip("/"))
    else:
        remainders = [file_path]

    if not remainders:
        return False
    # If no suffix, any remaining path matches
    if not suffix:
        return True

    # ** may swallow any number of leading directories, so try the suffix
    # against every tail of the remaining path (the last tail is the bare
    # filename).
    for remaining in remainders:
        segments = remaining.split("/")
        for start in range(len(segments)):
            if _matches_glob("/".join(segments[start:]), suffix):
                return True
    return False
def evaluate_policy(policy: Policy, changed_files: list[str]) -> bool:
    """
    Decide whether a single policy fires for a set of changed files.

    The policy fires when at least one changed file matches one of its
    trigger patterns and no changed file matches one of its safety patterns.

    Args:
        policy: Policy to evaluate
        changed_files: List of changed file paths (relative)

    Returns:
        True if the policy should fire
    """
    triggered = any(matches_pattern(path, policy.triggers) for path in changed_files)
    if not triggered:
        return False

    # A changed file covered by a safety pattern cancels the policy.
    if policy.safety and any(
        matches_pattern(path, policy.safety) for path in changed_files
    ):
        return False
    return True
def evaluate_policies(
    policies: list[Policy],
    changed_files: list[str],
    promised_policies: set[str] | None = None,
) -> list[Policy]:
    """
    Select the policies that fire for a set of changed files.

    Args:
        policies: List of policies to evaluate
        changed_files: List of changed file paths (relative)
        promised_policies: Set of policy names that have been marked as addressed
                          via <promise> tags (these are skipped)

    Returns:
        Policies, in input order, that are not promised and for which
        evaluate_policy() returns True
    """
    already_addressed = set() if promised_policies is None else promised_policies
    return [
        candidate
        for candidate in policies
        if candidate.name not in already_addressed
        and evaluate_policy(candidate, changed_files)
    ]
def parse_policy_file(policy_path: Path | str, base_dir: Path | None = None) -> list[Policy]:
    """
    Parse policy definitions from a YAML file.

    Args:
        policy_path: Path to .deepwork.policy.yml file
        base_dir: Base directory for resolving instructions_file paths.
                  Defaults to the directory containing the policy file.

    Returns:
        List of parsed Policy objects (empty when the file has no content)

    Raises:
        PolicyParseError: If the file is missing, unreadable, not valid
            UTF-8 / YAML, not a list, or fails schema validation
    """
    policy_path = Path(policy_path)
    if not policy_path.exists():
        raise PolicyParseError(f"Policy file does not exist: {policy_path}")
    if not policy_path.is_file():
        raise PolicyParseError(f"Policy path is not a file: {policy_path}")

    # Default base_dir to policy file's directory
    if base_dir is None:
        base_dir = policy_path.parent

    # Load YAML (policies are stored as a list, not a dict)
    try:
        with open(policy_path, encoding="utf-8") as f:
            policy_data = yaml.safe_load(f)
    except yaml.YAMLError as e:
        raise PolicyParseError(f"Failed to parse policy YAML: {e}") from e
    except (OSError, UnicodeDecodeError) as e:
        # A file that is not valid UTF-8 fails while being read; that error
        # is a ValueError, not an OSError, so it is listed explicitly to
        # keep the documented PolicyParseError contract.
        raise PolicyParseError(f"Failed to read policy file: {e}") from e

    # Handle empty file or null content
    if policy_data is None:
        return []

    # Validate it's a list (schema expects array)
    if not isinstance(policy_data, list):
        raise PolicyParseError(
            f"Policy file must contain a list of policies, got {type(policy_data).__name__}"
        )

    # Validate against schema
    try:
        validate_against_schema(policy_data, POLICY_SCHEMA)
    except ValidationError as e:
        raise PolicyParseError(f"Policy definition validation failed: {e}") from e

    # Parse into dataclasses
    return [Policy.from_dict(policy_item, base_dir) for policy_item in policy_data]

deepwork/hooks/__init__.py ADDED Viewed

	@@ -0,0 +1 @@
1	+ """DeepWork hooks package for policy enforcement and lifecycle events."""