PyPI - tasktree - Versions diffs - 0.0.21__py3-none-any.whl → 0.0.22__py3-none-any.whl - Mend

tasktree 0.0.21__py3-none-any.whl → 0.0.22__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (14)

tasktree/cli.py +91 -31
tasktree/docker.py +24 -17
tasktree/executor.py +263 -211
tasktree/graph.py +15 -10
tasktree/hasher.py +13 -6
tasktree/parser.py +220 -121
tasktree/state.py +7 -8
tasktree/substitution.py +27 -15
tasktree/types.py +29 -12
{tasktree-0.0.21.dist-info → tasktree-0.0.22.dist-info}/METADATA +13 -15
tasktree-0.0.22.dist-info/RECORD +14 -0
tasktree-0.0.21.dist-info/RECORD +0 -14
{tasktree-0.0.21.dist-info → tasktree-0.0.22.dist-info}/WHEEL +0 -0
{tasktree-0.0.21.dist-info → tasktree-0.0.22.dist-info}/entry_points.txt +0 -0

tasktree/executor.py CHANGED Viewed

@@ -14,10 +14,16 @@ from pathlib import Path
 from typing import Any
 from tasktree import docker as docker_module
-from tasktree.graph import get_implicit_inputs, resolve_execution_order, resolve_dependency_output_references, resolve_self_references
+from tasktree.graph import (
+    get_implicit_inputs,
+    resolve_execution_order,
+    resolve_dependency_output_references,
+    resolve_self_references,
+)
 from tasktree.hasher import hash_args, hash_task, make_cache_key
 from tasktree.parser import Recipe, Task, Environment
 from tasktree.state import StateManager, TaskState
+from tasktree.hasher import hash_environment_definition
 @dataclass
@@ -47,19 +53,19 @@ class ExecutionError(Exception):
 class Executor:
     """
     Executes tasks with incremental execution logic.
-    @athena: ac1e2fc7b82b
+    @athena: 88e82151721d
     """
     # Protected environment variables that cannot be overridden by exported args
     PROTECTED_ENV_VARS = {
-        'PATH',
-        'LD_LIBRARY_PATH',
-        'LD_PRELOAD',
-        'PYTHONPATH',
-        'HOME',
-        'SHELL',
-        'USER',
-        'LOGNAME',
+        "PATH",
+        "LD_LIBRARY_PATH",
+        "LD_PRELOAD",
+        "PYTHONPATH",
+        "HOME",
+        "SHELL",
+        "USER",
+        "LOGNAME",
     }
     def __init__(self, recipe: Recipe, state_manager: StateManager):
@@ -75,7 +81,8 @@ class Executor:
         self.state = state_manager
         self.docker_manager = docker_module.DockerManager(recipe.project_root)
-    def _has_regular_args(self, task: Task) -> bool:
+    @staticmethod
+    def _has_regular_args(task: Task) -> bool:
         """
         Check if a task has any regular (non-exported) arguments.
@@ -84,7 +91,7 @@ class Executor:
         Returns:
         True if task has at least one regular (non-exported) argument, False otherwise
-        @athena: 0fc46146eed3
+        @athena: a4c7816bfe61
         """
         if not task.args:
             return False
@@ -94,18 +101,19 @@ class Executor:
             # Handle both string and dict arg specs
             if isinstance(arg_spec, str):
                 # Remove default value part if present
-                arg_name = arg_spec.split('=')[0].split(':')[0].strip()
-                if not arg_name.startswith('$'):
+                arg_name = arg_spec.split("=")[0].split(":")[0].strip()
+                if not arg_name.startswith("$"):
                     return True
             elif isinstance(arg_spec, dict):
                 # Dict format: { argname: { ... } } or { $argname: { ... } }
                 for key in arg_spec.keys():
-                    if not key.startswith('$'):
+                    if not key.startswith("$"):
                         return True
         return False
-    def _filter_regular_args(self, task: Task, task_args: dict[str, Any]) -> dict[str, Any]:
+    @staticmethod
+    def _filter_regular_args(task: Task, task_args: dict[str, Any]) -> dict[str, Any]:
         """
         Filter task_args to only include regular (non-exported) arguments.
@@ -115,7 +123,7 @@ class Executor:
         Returns:
         Dictionary containing only regular (non-exported) arguments
-        @athena: 811abd3a56f9
+        @athena: 974e5e32bbd7
         """
         if not task.args or not task_args:
             return {}
@@ -124,18 +132,20 @@ class Executor:
         exported_names = set()
         for arg_spec in task.args:
             if isinstance(arg_spec, str):
-                arg_name = arg_spec.split('=')[0].split(':')[0].strip()
-                if arg_name.startswith('$'):
+                arg_name = arg_spec.split("=")[0].split(":")[0].strip()
+                if arg_name.startswith("$"):
                     exported_names.add(arg_name[1:])  # Remove $ prefix
             elif isinstance(arg_spec, dict):
                 for key in arg_spec.keys():
-                    if key.startswith('$'):
+                    if key.startswith("$"):
                         exported_names.add(key[1:])  # Remove $ prefix
         # Filter out exported args
         return {k: v for k, v in task_args.items() if k not in exported_names}
-    def _collect_early_builtin_variables(self, task: Task, timestamp: datetime) -> dict[str, str]:
+    def _collect_early_builtin_variables(
+        self, task: Task, timestamp: datetime
+    ) -> dict[str, str]:
         """
         Collect built-in variables that don't depend on working_dir.
@@ -150,31 +160,27 @@ class Executor:
         Raises:
         ExecutionError: If any built-in variable fails to resolve
-        @athena: 0b348e67ce4c
+        @athena: 3b4c0ec70ad7
         """
         import os
-        builtin_vars = {}
-        # {{ tt.project_root }} - Absolute path to project root
-        builtin_vars['project_root'] = str(self.recipe.project_root.resolve())
-        # {{ tt.recipe_dir }} - Absolute path to directory containing the recipe file
-        builtin_vars['recipe_dir'] = str(self.recipe.recipe_path.parent.resolve())
-        # {{ tt.task_name }} - Name of currently executing task
-        builtin_vars['task_name'] = task.name
-        # {{ tt.timestamp }} - ISO8601 timestamp when task started execution
-        builtin_vars['timestamp'] = timestamp.strftime('%Y-%m-%dT%H:%M:%SZ')
-        # {{ tt.timestamp_unix }} - Unix epoch timestamp when task started
-        builtin_vars['timestamp_unix'] = str(int(timestamp.timestamp()))
+        builtin_vars = {
+            # {{ tt.project_root }} - Absolute path to project root
+            "project_root": str(self.recipe.project_root.resolve()),
+            # {{ tt.recipe_dir }} - Absolute path to directory containing the recipe file
+            "recipe_dir": str(self.recipe.recipe_path.parent.resolve()),
+            # {{ tt.task_name }} - Name of currently executing task
+            "task_name": task.name,
+            # {{ tt.timestamp }} - ISO8601 timestamp when task started execution
+            "timestamp": timestamp.strftime("%Y-%m-%dT%H:%M:%SZ"),
+            # {{ tt.timestamp_unix }} - Unix epoch timestamp when task started
+            "timestamp_unix": str(int(timestamp.timestamp())),
+        }
         # {{ tt.user_home }} - Current user's home directory (cross-platform)
         try:
             user_home = Path.home()
-            builtin_vars['user_home'] = str(user_home)
+            builtin_vars["user_home"] = str(user_home)
         except Exception as e:
             raise ExecutionError(
                 f"Failed to get user home directory for {{ tt.user_home }}: {e}"
@@ -185,12 +191,16 @@ class Executor:
             user_name = os.getlogin()
         except OSError:
             # Fallback to environment variables if os.getlogin() fails
-            user_name = os.environ.get('USER') or os.environ.get('USERNAME') or 'unknown'
-        builtin_vars['user_name'] = user_name
+            user_name = (
+                os.environ.get("USER") or os.environ.get("USERNAME") or "unknown"
+            )
+        builtin_vars["user_name"] = user_name
         return builtin_vars
-    def _collect_builtin_variables(self, task: Task, working_dir: Path, timestamp: datetime) -> dict[str, str]:
+    def _collect_builtin_variables(
+        self, task: Task, working_dir: Path, timestamp: datetime
+    ) -> dict[str, str]:
         """
         Collect built-in variables for task execution.
@@ -211,11 +221,13 @@ class Executor:
         # {{ tt.working_dir }} - Absolute path to task's effective working directory
         # This is added after working_dir is resolved to avoid circular dependency
-        builtin_vars['working_dir'] = str(working_dir.resolve())
+        builtin_vars["working_dir"] = str(working_dir.resolve())
         return builtin_vars
-    def _prepare_env_with_exports(self, exported_env_vars: dict[str, str] | None = None) -> dict[str, str]:
+    def _prepare_env_with_exports(
+        self, exported_env_vars: dict[str, str] | None = None
+    ) -> dict[str, str]:
         """
         Prepare environment with exported arguments.
@@ -241,19 +253,20 @@ class Executor:
             env.update(exported_env_vars)
         return env
-    def _get_platform_default_environment(self) -> tuple[str, list[str]]:
+    @staticmethod
+    def _get_platform_default_environment() -> tuple[str, list[str]]:
         """
         Get default shell and args for current platform.
         Returns:
         Tuple of (shell, args) for platform default
-        @athena: b67799671787
+        @athena: 8b7fa81073af
         """
         is_windows = platform.system() == "Windows"
         if is_windows:
-            return ("cmd", ["/c"])
+            return "cmd", ["/c"]
         else:
-            return ("bash", ["-c"])
+            return "bash", ["-c"]
     def _get_effective_env_name(self, task: Task) -> str:
         """
@@ -287,7 +300,7 @@ class Executor:
         # Platform default (no env name)
         return ""
-    def _resolve_environment(self, task: Task) -> tuple[str, list[str], str]:
+    def _resolve_environment(self, task: Task) -> tuple[str, str]:
         """
         Resolve which environment to use for a task.
@@ -301,8 +314,8 @@ class Executor:
         task: Task to resolve environment for
         Returns:
-        Tuple of (shell, args, preamble)
-        @athena: b919568f73fc
+        Tuple of (shell, preamble)
+        @athena: 15cad76d7c80
         """
         # Check for global override first
         env_name = self.recipe.global_env_override
@@ -319,12 +332,12 @@ class Executor:
         if env_name:
             env = self.recipe.get_environment(env_name)
             if env:
-                return (env.shell, env.args, env.preamble)
+                return env.shell, env.preamble
             # If env not found, fall through to platform default
         # Use platform default
-        shell, args = self._get_platform_default_environment()
-        return (shell, args, "")
+        shell, _ = self._get_platform_default_environment()
+        return shell, ""
     def check_task_status(
         self,
@@ -364,7 +377,14 @@ class Executor:
         # Compute hashes (include effective environment and dependencies)
         effective_env = self._get_effective_env_name(task)
-        task_hash = hash_task(task.cmd, task.outputs, task.working_dir, task.args, effective_env, task.deps)
+        task_hash = hash_task(
+            task.cmd,
+            task.outputs,
+            task.working_dir,
+            task.args,
+            effective_env,
+            task.deps,
+        )
         args_hash = hash_args(args_dict) if args_dict else None
         cache_key = make_cache_key(task_hash, args_hash)
@@ -487,13 +507,20 @@ class Executor:
             # Only include regular (non-exported) args in status key for parameterized dependencies
             # For the root task (invoked from CLI), status key is always just the task name
             # For dependencies with parameterized invocations, include the regular args
-            is_root_task = (name == task_name)
-            if not is_root_task and args_dict_for_execution and self._has_regular_args(task):
+            is_root_task = name == task_name
+            if (
+                not is_root_task
+                and args_dict_for_execution
+                and self._has_regular_args(task)
+            ):
                 import json
                 # Filter to only include regular (non-exported) args
                 regular_args = self._filter_regular_args(task, args_dict_for_execution)
                 if regular_args:
-                    args_str = json.dumps(regular_args, sort_keys=True, separators=(",", ":"))
+                    args_str = json.dumps(
+                        regular_args, sort_keys=True, separators=(",", ":")
+                    )
                     status_key = f"{name}({args_str})"
                 else:
                     status_key = name
@@ -506,6 +533,7 @@ class Executor:
                 # Warn if re-running due to missing outputs
                 if status.reason == "outputs_missing":
                     import sys
                     print(
                         f"Warning: Re-running task '{name}' because declared outputs are missing",
                         file=sys.stderr,
@@ -525,7 +553,7 @@ class Executor:
         Raises:
         ExecutionError: If task execution fails
-        @athena: 885c66658550
+        @athena: 4b49652a7afd
         """
         # Capture timestamp at task start for consistency (in UTC)
         task_start_time = datetime.now(timezone.utc)
@@ -533,6 +561,7 @@ class Executor:
         # Parse task arguments to identify exported args
         # Note: args_dict already has defaults applied by CLI (cli.py:413-424)
         from tasktree.parser import parse_arg_spec
         exported_args = set()
         regular_args = {}
         exported_env_vars = {}
@@ -551,18 +580,24 @@ class Executor:
         # Collect early built-in variables (those that don't depend on working_dir)
         # These can be used in the working_dir field itself
-        early_builtin_vars = self._collect_early_builtin_variables(task, task_start_time)
+        early_builtin_vars = self._collect_early_builtin_variables(
+            task, task_start_time
+        )
         # Resolve working directory
         # Validate that working_dir doesn't contain {{ tt.working_dir }} (circular dependency)
         self._validate_no_working_dir_circular_ref(task.working_dir)
         working_dir_str = self._substitute_builtin(task.working_dir, early_builtin_vars)
-        working_dir_str = self._substitute_args(working_dir_str, regular_args, exported_args)
+        working_dir_str = self._substitute_args(
+            working_dir_str, regular_args, exported_args
+        )
         working_dir_str = self._substitute_env(working_dir_str)
         working_dir = self.recipe.project_root / working_dir_str
         # Collect all built-in variables (including tt.working_dir now that it's resolved)
-        builtin_vars = self._collect_builtin_variables(task, working_dir, task_start_time)
+        builtin_vars = self._collect_builtin_variables(
+            task, working_dir, task_start_time
+        )
         # Substitute built-in variables, arguments, and environment variables in command
         cmd = self._substitute_builtin(task.cmd, builtin_vars)
@@ -583,64 +618,33 @@ class Executor:
             # Docker execution path
             self._run_task_in_docker(task, env, cmd, working_dir, exported_env_vars)
         else:
-            # Regular execution path
-            shell, shell_args, preamble = self._resolve_environment(task)
-            # Detect multi-line commands (ignore trailing newlines from YAML folded blocks)
-            if "\n" in cmd.rstrip():
-                self._run_multiline_command(cmd, working_dir, task.name, shell, preamble, exported_env_vars)
-            else:
-                self._run_single_line_command(cmd, working_dir, task.name, shell, shell_args, exported_env_vars)
+            # Regular execution path - use unified script-based execution
+            shell, preamble = self._resolve_environment(task)
+            self._run_command_as_script(
+                cmd, working_dir, task.name, shell, preamble, exported_env_vars
+            )
         # Update state
         self._update_state(task, args_dict)
-    def _run_single_line_command(
-        self, cmd: str, working_dir: Path, task_name: str, shell: str, shell_args: list[str],
-        exported_env_vars: dict[str, str] | None = None
+    def _run_command_as_script(
+        self,
+        cmd: str,
+        working_dir: Path,
+        task_name: str,
+        shell: str,
+        preamble: str,
+        exported_env_vars: dict[str, str] | None = None,
     ) -> None:
         """
-        Execute a single-line command via shell.
-        Args:
-        cmd: Command string
-        working_dir: Working directory
-        task_name: Task name (for error messages)
-        shell: Shell executable to use
-        shell_args: Arguments to pass to shell
-        exported_env_vars: Exported arguments to set as environment variables
-        Raises:
-        ExecutionError: If command execution fails
-        @athena: 46849e6a0bbb
-        """
-        # Prepare environment with exported args
-        env = self._prepare_env_with_exports(exported_env_vars)
+        Execute a command via temporary script file (unified execution path).
-        try:
-            # Build command: shell + args + cmd
-            full_cmd = [shell] + shell_args + [cmd]
-            subprocess.run(
-                full_cmd,
-                cwd=working_dir,
-                check=True,
-                capture_output=False,
-                env=env,
-            )
-        except subprocess.CalledProcessError as e:
-            raise ExecutionError(
-                f"Task '{task_name}' failed with exit code {e.returncode}"
-            )
-    def _run_multiline_command(
-        self, cmd: str, working_dir: Path, task_name: str, shell: str, preamble: str,
-        exported_env_vars: dict[str, str] | None = None
-    ) -> None:
-        """
-        Execute a multi-line command via temporary script file.
+        This method handles both single-line and multi-line commands by writing
+        them to a temporary script file and executing the script. This provides
+        consistent behavior and allows preamble to work with all commands.
         Args:
-        cmd: Multi-line command string
+        cmd: Command string (single-line or multi-line)
         working_dir: Working directory
         task_name: Task name (for error messages)
         shell: Shell to use for script execution
@@ -649,7 +653,8 @@ class Executor:
         Raises:
         ExecutionError: If command execution fails
-        @athena: 825892b6db05
+        @athena: TBD
+        @athena: 96e85dc15b5c
         """
         # Prepare environment with exported args
         env = self._prepare_env_with_exports(exported_env_vars)
@@ -707,7 +712,9 @@ class Executor:
             except OSError:
                 pass  # Ignore cleanup errors
-    def _substitute_builtin_in_environment(self, env: Environment, builtin_vars: dict[str, str]) -> Environment:
+    def _substitute_builtin_in_environment(
+        self, env: Environment, builtin_vars: dict[str, str]
+    ) -> Environment:
         """
         Substitute builtin and environment variables in environment fields.
@@ -725,29 +732,51 @@ class Executor:
         from dataclasses import replace
         # Substitute in volumes (builtin vars first, then env vars)
-        substituted_volumes = [
-            self._substitute_env(self._substitute_builtin(vol, builtin_vars)) for vol in env.volumes
-        ] if env.volumes else []
+        substituted_volumes = (
+            [
+                self._substitute_env(self._substitute_builtin(vol, builtin_vars))
+                for vol in env.volumes
+            ]
+            if env.volumes
+            else []
+        )
         # Substitute in env_vars values (builtin vars first, then env vars)
-        substituted_env_vars = {
-            key: self._substitute_env(self._substitute_builtin(value, builtin_vars))
-            for key, value in env.env_vars.items()
-        } if env.env_vars else {}
+        substituted_env_vars = (
+            {
+                key: self._substitute_env(self._substitute_builtin(value, builtin_vars))
+                for key, value in env.env_vars.items()
+            }
+            if env.env_vars
+            else {}
+        )
         # Substitute in ports (builtin vars first, then env vars)
-        substituted_ports = [
-            self._substitute_env(self._substitute_builtin(port, builtin_vars)) for port in env.ports
-        ] if env.ports else []
+        substituted_ports = (
+            [
+                self._substitute_env(self._substitute_builtin(port, builtin_vars))
+                for port in env.ports
+            ]
+            if env.ports
+            else []
+        )
         # Substitute in working_dir (builtin vars first, then env vars)
-        substituted_working_dir = self._substitute_env(self._substitute_builtin(env.working_dir, builtin_vars)) if env.working_dir else ""
+        substituted_working_dir = (
+            self._substitute_env(
+                self._substitute_builtin(env.working_dir, builtin_vars)
+            )
+            if env.working_dir
+            else ""
+        )
         # Substitute in build args (for Docker environments, args is a dict)
         # Apply builtin vars first, then env vars
         if isinstance(env.args, dict):
             substituted_args = {
-                key: self._substitute_env(self._substitute_builtin(str(value), builtin_vars))
+                key: self._substitute_env(
+                    self._substitute_builtin(str(value), builtin_vars)
+                )
                 for key, value in env.args.items()
             }
         else:
@@ -760,12 +789,16 @@ class Executor:
             env_vars=substituted_env_vars,
             ports=substituted_ports,
             working_dir=substituted_working_dir,
-            args=substituted_args
+            args=substituted_args,
         )
     def _run_task_in_docker(
-        self, task: Task, env: Any, cmd: str, working_dir: Path,
-        exported_env_vars: dict[str, str] | None = None
+        self,
+        task: Task,
+        env: Any,
+        cmd: str,
+        working_dir: Path,
+        exported_env_vars: dict[str, str] | None = None,
     ) -> None:
         """
         Execute task inside Docker container.
@@ -783,7 +816,9 @@ class Executor:
         """
         # Get builtin variables for substitution in environment fields
         task_start_time = datetime.now(timezone.utc)
-        builtin_vars = self._collect_builtin_variables(task, working_dir, task_start_time)
+        builtin_vars = self._collect_builtin_variables(
+            task, working_dir, task_start_time
+        )
         # Substitute builtin variables in environment fields (volumes, env_vars, etc.)
         env = self._substitute_builtin_in_environment(env, builtin_vars)
@@ -807,6 +842,7 @@ class Executor:
         # Create modified environment with merged env vars using dataclass replace
         from dataclasses import replace
         modified_env = replace(env, env_vars=docker_env_vars)
         # Execute in container
@@ -820,7 +856,8 @@ class Executor:
         except docker_module.DockerError as e:
             raise ExecutionError(str(e)) from e
-    def _validate_no_working_dir_circular_ref(self, text: str) -> None:
+    @staticmethod
+    def _validate_no_working_dir_circular_ref(text: str) -> None:
         """
         Validate that working_dir field does not contain {{ tt.working_dir }}.
@@ -831,20 +868,22 @@ class Executor:
         Raises:
         ExecutionError: If {{ tt.working_dir }} placeholder is found
-        @athena: 5dc6ee41d403
+        @athena: 617a0c609f4d
         """
         import re
         # Pattern to match {{ tt.working_dir }} specifically
-        pattern = re.compile(r'\{\{\s*tt\s*\.\s*working_dir\s*\}\}')
+        pattern = re.compile(r"\{\{\s*tt\s*\.\s*working_dir\s*}}")
         if pattern.search(text):
             raise ExecutionError(
-                f"Cannot use {{{{ tt.working_dir }}}} in the 'working_dir' field.\n\n"
-                f"This creates a circular dependency (working_dir cannot reference itself).\n"
-                f"Other built-in variables like {{{{ tt.task_name }}}} or {{{{ tt.timestamp }}}} are allowed."
+                "Cannot use {{ tt.working_dir }} in the 'working_dir' field.\n\n"
+                "This creates a circular dependency (working_dir cannot reference itself).\n"
+                "Other built-in variables like {{ tt.task_name }} or {{ tt.timestamp }} are allowed."
             )
-    def _substitute_builtin(self, text: str, builtin_vars: dict[str, str]) -> str:
+    @staticmethod
+    def _substitute_builtin(text: str, builtin_vars: dict[str, str]) -> str:
         """
         Substitute {{ tt.name }} placeholders in text.
@@ -859,12 +898,16 @@ class Executor:
         Raises:
         ValueError: If built-in variable is not defined
-        @athena: 463600a203f4
+        @athena: fe47afe87b52
         """
         from tasktree.substitution import substitute_builtin_variables
         return substitute_builtin_variables(text, builtin_vars)
-    def _substitute_args(self, cmd: str, args_dict: dict[str, Any], exported_args: set[str] | None = None) -> str:
+    @staticmethod
+    def _substitute_args(
+        cmd: str, args_dict: dict[str, Any], exported_args: set[str] | None = None
+    ) -> str:
         """
         Substitute {{ arg.name }} placeholders in command string.
@@ -881,12 +924,14 @@ class Executor:
         Raises:
         ValueError: If an exported argument is used in template substitution
-        @athena: 4261a91c6a98
+        @athena: 9a931179f270
         """
         from tasktree.substitution import substitute_arguments
         return substitute_arguments(cmd, args_dict, exported_args)
-    def _substitute_env(self, text: str) -> str:
+    @staticmethod
+    def _substitute_env(text: str) -> str:
         """
         Substitute {{ env.NAME }} placeholders in text.
@@ -900,9 +945,10 @@ class Executor:
         Raises:
         ValueError: If environment variable is not set
-        @athena: 63becab531cd
+        @athena: 1bbe24759451
         """
         from tasktree.substitution import substitute_environment
         return substitute_environment(text)
     def _get_all_inputs(self, task: Task) -> list[str]:
@@ -929,6 +975,7 @@ class Executor:
         all_inputs.extend(implicit_inputs)
         return all_inputs
+    # TODO: Understand why task isn't used
     def _check_environment_changed(
         self, task: Task, cached_state: TaskState, env_name: str
     ) -> bool:
@@ -997,12 +1044,12 @@ class Executor:
         Returns:
         True if image ID changed, False otherwise
-        @athena: 8af77cb1be44
+        @athena: 0443710cf356
         """
         # Build/ensure image is built and get its ID
         try:
             image_tag, current_image_id = self.docker_manager.ensure_image_built(env)
-        except Exception as e:
+        except Exception:
             # If we can't build, treat as changed (will fail later with better error)
             return True
@@ -1095,7 +1142,9 @@ class Executor:
                         # Check if digests changed
                         if current_digests != cached_digests:
-                            changed_files.append(f"Docker base image digests in {dockerfile_name}")
+                            changed_files.append(
+                                f"Docker base image digests in {dockerfile_name}"
+                            )
                     except (OSError, IOError):
                         # Can't read Dockerfile - consider changed
                         changed_files.append(f"Dockerfile: {dockerfile_name}")
@@ -1115,7 +1164,8 @@ class Executor:
         return changed_files
-    def _expand_output_paths(self, task: Task) -> list[str]:
+    @staticmethod
+    def _expand_output_paths(task: Task) -> list[str]:
         """
         Extract all output paths from task outputs (both named and anonymous).
@@ -1124,7 +1174,7 @@ class Executor:
         Returns:
         List of output path patterns (glob patterns as strings)
-        @athena: 848a28564b14
+        @athena: 21da23ad5dcf
         """
         paths = []
         for output in task.outputs:
@@ -1193,25 +1243,42 @@ class Executor:
     def _update_state(self, task: Task, args_dict: dict[str, Any]) -> None:
         """
         Update state after task execution.
-        Args:
-        task: Task that was executed
-        args_dict: Arguments used for execution
         @athena: 1fcfdfcb9be9
         """
-        # Compute hashes (include effective environment and dependencies)
+        cache_key = self._cache_key(task, args_dict)
+        input_state = self._input_files_to_modified_times(task)
+        env_name = self._get_effective_env_name(task)
+        if env_name:
+            env = self.recipe.get_environment(env_name)
+            if env:
+                input_state[f"_env_hash_{env_name}"] = hash_environment_definition(env)
+                if env.dockerfile:
+                    input_state |= self._docker_inputs_to_modified_times(env_name, env)
+        new_state = TaskState(last_run=time.time(), input_state=input_state)
+        self.state.set(cache_key, new_state)
+        self.state.save()
+    def _cache_key(self, task: Task, args_dict: dict[str, Any]) -> str:
         effective_env = self._get_effective_env_name(task)
-        task_hash = hash_task(task.cmd, task.outputs, task.working_dir, task.args, effective_env, task.deps)
+        task_hash = hash_task(
+            task.cmd,
+            task.outputs,
+            task.working_dir,
+            task.args,
+            effective_env,
+            task.deps,
+        )
         args_hash = hash_args(args_dict) if args_dict else None
-        cache_key = make_cache_key(task_hash, args_hash)
+        return make_cache_key(task_hash, args_hash)
-        # Get all inputs and their current mtimes
-        all_inputs = self._get_all_inputs(task)
-        input_files = self._expand_globs(all_inputs, task.working_dir)
+    def _input_files_to_modified_times(self, task: Task) -> dict[str, float]:
+        input_files = self._expand_globs(self._get_all_inputs(task), task.working_dir)
         input_state = {}
         for file_path in input_files:
-            # Skip Docker special markers (handled separately below)
+            # Skip Docker special markers (handled separately)
             if file_path.startswith("_docker_"):
                 continue
@@ -1219,59 +1286,44 @@ class Executor:
             if file_path_obj.exists():
                 input_state[file_path] = file_path_obj.stat().st_mtime
-        # Record Docker-specific inputs if task uses Docker environment
-        env_name = self._get_effective_env_name(task)
-        if env_name:
-            env = self.recipe.get_environment(env_name)
-            if env and env.dockerfile:
-                # Record Dockerfile mtime
-                dockerfile_path = self.recipe.project_root / env.dockerfile
-                if dockerfile_path.exists():
-                    input_state[env.dockerfile] = dockerfile_path.stat().st_mtime
-                # Record .dockerignore mtime if exists
-                context_path = self.recipe.project_root / env.context
-                dockerignore_path = context_path / ".dockerignore"
-                if dockerignore_path.exists():
-                    relative_dockerignore = str(
-                        dockerignore_path.relative_to(self.recipe.project_root)
-                    )
-                    input_state[relative_dockerignore] = dockerignore_path.stat().st_mtime
-                # Record context check timestamp
-                input_state[f"_context_{env.context}"] = time.time()
-                # Parse and record base image digests from Dockerfile
-                try:
-                    dockerfile_content = dockerfile_path.read_text()
-                    digests = docker_module.parse_base_image_digests(dockerfile_content)
-                    for digest in digests:
-                        # Store digest with Dockerfile's mtime
-                        input_state[f"_digest_{digest}"] = dockerfile_path.stat().st_mtime
-                except (OSError, IOError):
-                    # If we can't read Dockerfile, skip digest tracking
-                    pass
-            # Record environment definition hash for all environments (shell and Docker)
-            if env:
-                from tasktree.hasher import hash_environment_definition
-                env_hash = hash_environment_definition(env)
-                input_state[f"_env_hash_{env_name}"] = env_hash
+        return input_state
+    def _docker_inputs_to_modified_times(
+        self, env_name: str, env: Environment
+    ) -> dict[str, float]:
+        input_state = dict()
+        # Record Dockerfile mtime
+        dockerfile_path = self.recipe.project_root / env.dockerfile
+        if dockerfile_path.exists():
+            input_state[env.dockerfile] = dockerfile_path.stat().st_mtime
+        # Record .dockerignore mtime if exists
+        context_path = self.recipe.project_root / env.context
+        dockerignore_path = context_path / ".dockerignore"
+        if dockerignore_path.exists():
+            relative_dockerignore = str(
+                dockerignore_path.relative_to(self.recipe.project_root)
+            )
+            input_state[relative_dockerignore] = dockerignore_path.stat().st_mtime
-                # For Docker environments, also store the image ID
-                if env.dockerfile:
-                    # Image was already built during check phase or task execution
-                    if env_name in self.docker_manager._built_images:
-                        image_tag, image_id = self.docker_manager._built_images[env_name]
-                        input_state[f"_docker_image_id_{env_name}"] = image_id
-        # Create new state
-        state = TaskState(
-            last_run=time.time(),
-            input_state=input_state,
-        )
+        # Record context check timestamp
+        input_state[f"_context_{env.context}"] = time.time()
-        # Save state
-        self.state.set(cache_key, state)
-        self.state.save()
+        # Parse and record base image digests from Dockerfile
+        try:
+            dockerfile_content = dockerfile_path.read_text()
+            digests = docker_module.parse_base_image_digests(dockerfile_content)
+            for digest in digests:
+                # Store digest with Dockerfile's mtime
+                input_state[f"_digest_{digest}"] = dockerfile_path.stat().st_mtime
+        except (OSError, IOError):
+            # If we can't read Dockerfile, skip digest tracking
+            pass
+        # For Docker environments, also store the image ID
+        # Image was already built during check phase or task execution
+        if env_name in self.docker_manager._built_images:
+            image_tag, image_id = self.docker_manager._built_images[env_name]
+            input_state[f"_docker_image_id_{env_name}"] = image_id
+        return input_state

tasktree 0.0.21__py3-none-any.whl → 0.0.22__py3-none-any.whl

tasktree 0.0.21__py3-none-any.whl → 0.0.22__py3-none-any.whl