PyPI - flowyml - Versions diffs - 1.7.2__py3-none-any.whl → 1.8.0__py3-none-any.whl - Mend

flowyml 1.7.2__py3-none-any.whl → 1.8.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (126) hide show

flowyml/assets/base.py +15 -0
flowyml/assets/metrics.py +5 -0
flowyml/cli/main.py +709 -0
flowyml/cli/stack_cli.py +138 -25
flowyml/core/__init__.py +17 -0
flowyml/core/executor.py +161 -26
flowyml/core/image_builder.py +129 -0
flowyml/core/log_streamer.py +227 -0
flowyml/core/orchestrator.py +22 -2
flowyml/core/pipeline.py +34 -10
flowyml/core/routing.py +558 -0
flowyml/core/step.py +9 -1
flowyml/core/step_grouping.py +49 -35
flowyml/core/types.py +407 -0
flowyml/monitoring/alerts.py +10 -0
flowyml/monitoring/notifications.py +104 -25
flowyml/monitoring/slack_blocks.py +323 -0
flowyml/plugins/__init__.py +251 -0
flowyml/plugins/alerters/__init__.py +1 -0
flowyml/plugins/alerters/slack.py +168 -0
flowyml/plugins/base.py +752 -0
flowyml/plugins/config.py +478 -0
flowyml/plugins/deployers/__init__.py +22 -0
flowyml/plugins/deployers/gcp_cloud_run.py +200 -0
flowyml/plugins/deployers/sagemaker.py +306 -0
flowyml/plugins/deployers/vertex.py +290 -0
flowyml/plugins/integration.py +369 -0
flowyml/plugins/manager.py +510 -0
flowyml/plugins/model_registries/__init__.py +22 -0
flowyml/plugins/model_registries/mlflow.py +159 -0
flowyml/plugins/model_registries/sagemaker.py +489 -0
flowyml/plugins/model_registries/vertex.py +386 -0
flowyml/plugins/orchestrators/__init__.py +13 -0
flowyml/plugins/orchestrators/sagemaker.py +443 -0
flowyml/plugins/orchestrators/vertex_ai.py +461 -0
flowyml/plugins/registries/__init__.py +13 -0
flowyml/plugins/registries/ecr.py +321 -0
flowyml/plugins/registries/gcr.py +313 -0
flowyml/plugins/registry.py +454 -0
flowyml/plugins/stack.py +494 -0
flowyml/plugins/stack_config.py +537 -0
flowyml/plugins/stores/__init__.py +13 -0
flowyml/plugins/stores/gcs.py +460 -0
flowyml/plugins/stores/s3.py +453 -0
flowyml/plugins/trackers/__init__.py +11 -0
flowyml/plugins/trackers/mlflow.py +316 -0
flowyml/plugins/validators/__init__.py +3 -0
flowyml/plugins/validators/deepchecks.py +119 -0
flowyml/registry/__init__.py +2 -1
flowyml/registry/model_environment.py +109 -0
flowyml/registry/model_registry.py +241 -96
flowyml/serving/__init__.py +17 -0
flowyml/serving/model_server.py +628 -0
flowyml/stacks/__init__.py +60 -0
flowyml/stacks/aws.py +93 -0
flowyml/stacks/base.py +62 -0
flowyml/stacks/components.py +12 -0
flowyml/stacks/gcp.py +44 -9
flowyml/stacks/plugins.py +115 -0
flowyml/stacks/registry.py +2 -1
flowyml/storage/sql.py +401 -12
flowyml/tracking/experiment.py +8 -5
flowyml/ui/backend/Dockerfile +87 -16
flowyml/ui/backend/auth.py +12 -2
flowyml/ui/backend/main.py +149 -5
flowyml/ui/backend/routers/ai_context.py +226 -0
flowyml/ui/backend/routers/assets.py +23 -4
flowyml/ui/backend/routers/auth.py +96 -0
flowyml/ui/backend/routers/deployments.py +660 -0
flowyml/ui/backend/routers/model_explorer.py +597 -0
flowyml/ui/backend/routers/plugins.py +103 -51
flowyml/ui/backend/routers/projects.py +91 -8
flowyml/ui/backend/routers/runs.py +20 -1
flowyml/ui/backend/routers/schedules.py +22 -17
flowyml/ui/backend/routers/templates.py +319 -0
flowyml/ui/backend/routers/websocket.py +2 -2
flowyml/ui/frontend/Dockerfile +55 -6
flowyml/ui/frontend/dist/assets/index-B5AsPTSz.css +1 -0
flowyml/ui/frontend/dist/assets/index-dFbZ8wD8.js +753 -0
flowyml/ui/frontend/dist/index.html +2 -2
flowyml/ui/frontend/dist/logo.png +0 -0
flowyml/ui/frontend/nginx.conf +65 -4
flowyml/ui/frontend/package-lock.json +1404 -74
flowyml/ui/frontend/package.json +3 -0
flowyml/ui/frontend/public/logo.png +0 -0
flowyml/ui/frontend/src/App.jsx +10 -7
flowyml/ui/frontend/src/app/auth/Login.jsx +90 -0
flowyml/ui/frontend/src/app/dashboard/page.jsx +8 -8
flowyml/ui/frontend/src/app/deployments/page.jsx +786 -0
flowyml/ui/frontend/src/app/model-explorer/page.jsx +1031 -0
flowyml/ui/frontend/src/app/pipelines/page.jsx +12 -2
flowyml/ui/frontend/src/app/projects/[projectId]/_components/ProjectExperimentsList.jsx +19 -6
flowyml/ui/frontend/src/app/runs/[runId]/page.jsx +36 -24
flowyml/ui/frontend/src/app/runs/page.jsx +8 -2
flowyml/ui/frontend/src/app/settings/page.jsx +267 -253
flowyml/ui/frontend/src/components/AssetDetailsPanel.jsx +29 -7
flowyml/ui/frontend/src/components/Layout.jsx +6 -0
flowyml/ui/frontend/src/components/PipelineGraph.jsx +79 -29
flowyml/ui/frontend/src/components/RunDetailsPanel.jsx +36 -6
flowyml/ui/frontend/src/components/RunMetaPanel.jsx +113 -0
flowyml/ui/frontend/src/components/ai/AIAssistantButton.jsx +71 -0
flowyml/ui/frontend/src/components/ai/AIAssistantPanel.jsx +420 -0
flowyml/ui/frontend/src/components/header/Header.jsx +22 -0
flowyml/ui/frontend/src/components/plugins/PluginManager.jsx +4 -4
flowyml/ui/frontend/src/components/plugins/{ZenMLIntegration.jsx → StackImport.jsx} +38 -12
flowyml/ui/frontend/src/components/sidebar/Sidebar.jsx +36 -13
flowyml/ui/frontend/src/contexts/AIAssistantContext.jsx +245 -0
flowyml/ui/frontend/src/contexts/AuthContext.jsx +108 -0
flowyml/ui/frontend/src/hooks/useAIContext.js +156 -0
flowyml/ui/frontend/src/hooks/useWebGPU.js +54 -0
flowyml/ui/frontend/src/layouts/MainLayout.jsx +6 -0
flowyml/ui/frontend/src/router/index.jsx +47 -20
flowyml/ui/frontend/src/services/pluginService.js +3 -1
flowyml/ui/server_manager.py +5 -5
flowyml/ui/utils.py +157 -39
flowyml/utils/config.py +37 -15
flowyml/utils/model_introspection.py +123 -0
flowyml/utils/observability.py +30 -0
flowyml-1.8.0.dist-info/METADATA +174 -0
{flowyml-1.7.2.dist-info → flowyml-1.8.0.dist-info}/RECORD +123 -65
{flowyml-1.7.2.dist-info → flowyml-1.8.0.dist-info}/WHEEL +1 -1
flowyml/ui/frontend/dist/assets/index-B40RsQDq.css +0 -1
flowyml/ui/frontend/dist/assets/index-CjI0zKCn.js +0 -685
flowyml-1.7.2.dist-info/METADATA +0 -477
{flowyml-1.7.2.dist-info → flowyml-1.8.0.dist-info}/entry_points.txt +0 -0
{flowyml-1.7.2.dist-info → flowyml-1.8.0.dist-info}/licenses/LICENSE +0 -0

flowyml/core/routing.py ADDED Viewed

@@ -0,0 +1,558 @@
+"""FlowyML Artifact Routing - Automatic Type-Based Artifact Routing.
+This module provides automatic routing of step outputs to appropriate
+infrastructure based on their Python types. When a step returns a
+`Model`, `Dataset`, `Metrics`, or other artifact type, the runtime
+automatically routes it to the configured stores and registries.
+Usage:
+    from flowyml.core.routing import route_artifact
+    # After step execution
+    result = step.func(**inputs)
+    # Route based on type and stack config
+    artifact_info = route_artifact(
+        output=result,
+        step_name="train_model",
+        run_id="run-123",
+    )
+The routing is configured via flowyml.yaml:
+    stacks:
+      gcp-prod:
+        artifact_routing:
+          Model: { store: gcs, register: true }
+          Dataset: { store: gcs }
+          Metrics: { log_to_tracker: true }
+"""
+import logging
+from typing import Any, get_type_hints
+from dataclasses import dataclass, field
+logger = logging.getLogger(__name__)
+@dataclass
+class RoutingResult:
+    """Result of artifact routing.
+    Every field has a default, so ``RoutingResult()`` describes an output
+    for which no routing action was taken.
+    Attributes:
+        artifact_type: Name of the artifact type (Model, Dataset, etc.)
+        store_uri: URI where the artifact was stored
+        registered: Whether the artifact was registered (e.g., in model registry)
+        deployed: Whether the artifact was deployed (e.g., to endpoint)
+        endpoint_uri: URI of the deployment endpoint
+        logged: Whether the artifact was logged (e.g., metrics to tracker)
+        metadata: Additional metadata from routing
+    """
+    artifact_type: str | None = None
+    store_uri: str | None = None
+    registered: bool = False
+    deployed: bool = False
+    endpoint_uri: str | None = None
+    logged: bool = False
+    # default_factory gives each instance its own dict instead of a shared one.
+    metadata: dict[str, Any] = field(default_factory=dict)
+def get_step_return_type(step_func: callable) -> type | None:
+    """Look up the declared return annotation of a step function.
+    Resolved hints from ``typing.get_type_hints`` are preferred. If that
+    resolution raises, the raw ``__annotations__`` mapping is consulted
+    instead, so the value may then be an unresolved annotation.
+    Args:
+        step_func: The step function to inspect.
+    Returns:
+        The ``return`` annotation, or None when it is absent or cannot be
+        retrieved.
+    """
+    # First choice: fully resolved type hints.
+    try:
+        return get_type_hints(step_func).get("return")
+    except Exception:
+        pass
+    # Second choice: the unresolved annotation mapping on the object itself.
+    try:
+        raw_annotations = step_func.__annotations__
+        return raw_annotations.get("return")
+    except Exception:
+        return None
+def detect_artifact_type(output: Any) -> str | None:
+    """Map a step output to the name of its FlowyML artifact type.
+    The value is tested against the known artifact classes in a fixed
+    order (Model, Dataset, Metrics, Parameters). Any other ``Artifact``
+    instance is reported under its own class name.
+    Args:
+        output: The step output value.
+    Returns:
+        Type name string, or None when the value is not an artifact.
+    """
+    # Imported lazily to avoid circular imports
+    from flowyml.core.types import Artifact, Model, Dataset, Metrics, Parameters
+    # Order matters: the first matching class wins.
+    known_types = (
+        (Model, "Model"),
+        (Dataset, "Dataset"),
+        (Metrics, "Metrics"),
+        (Parameters, "Parameters"),
+    )
+    for artifact_cls, label in known_types:
+        if isinstance(output, artifact_cls):
+            return label
+    if isinstance(output, Artifact):
+        return type(output).__name__
+    return None
+def route_artifact(
+    output: Any,
+    step_name: str,
+    run_id: str,
+    return_type: type | None = None,
+    project_name: str = "default",
+) -> RoutingResult:
+    """Route a step output to appropriate infrastructure based on type.
+    This is the main entry point for type-based artifact routing. The
+    artifact type is detected from the output value first and, failing
+    that, from the name of ``return_type``. The routing rule for that type
+    then drives storing, model registration, conditional deployment and
+    tracker logging.
+    Routing is best-effort: an ImportError raised while loading the stack
+    configuration is logged at debug level, any other exception is logged
+    as a warning, and the result filled in so far is returned.
+    Args:
+        output: The step output to route.
+        step_name: Name of the step that produced this output.
+        run_id: Current run identifier.
+        return_type: Optional return type annotation (if known).
+        project_name: Project name for namespacing (not used by this
+            function at present).
+    Returns:
+        RoutingResult with routing information. All fields keep their
+        defaults when the output is None or not a routable type.
+    """
+    result = RoutingResult()
+    # Skip None outputs
+    if output is None:
+        return result
+    # Detect artifact type
+    artifact_type = detect_artifact_type(output)
+    # If not detected from value, try from type annotation
+    if artifact_type is None and return_type is not None:
+        try:
+            type_name = return_type.__name__ if hasattr(return_type, "__name__") else str(return_type)
+            if type_name in ("Model", "Dataset", "Metrics", "Parameters"):
+                artifact_type = type_name
+        except Exception:
+            pass
+    if artifact_type is None:
+        # Not a routable artifact type
+        return result
+    result.artifact_type = artifact_type
+    logger.debug(f"Routing {artifact_type} artifact from step '{step_name}'")
+    # Get routing configuration from active stack
+    try:
+        from flowyml.plugins.stack_config import get_routing_for_type, get_active_stack
+        routing_rule = get_routing_for_type(artifact_type)
+        stack = get_active_stack()
+        if routing_rule is None:
+            logger.debug(f"No routing rule for {artifact_type}, using defaults")
+            return result
+        # Route to artifact store
+        if routing_rule.store:
+            result.store_uri = _save_to_store(
+                output=output,
+                artifact_type=artifact_type,
+                store_name=routing_rule.store,
+                path=routing_rule.format_path(
+                    run_id=run_id,
+                    step_name=step_name,
+                    artifact_name=artifact_type.lower(),
+                ),
+                stack=stack,
+            )
+        # Register model if configured
+        if routing_rule.register and artifact_type == "Model":
+            result.registered = _register_model(
+                output=output,
+                step_name=step_name,
+                run_id=run_id,
+                stack=stack,
+            )
+        # Deploy model if configured and conditions are met
+        # Note: deploy=True just enables deployment - actual deployment depends on deploy_condition
+        if routing_rule.deploy and artifact_type == "Model":
+            # Get metrics from model metadata for conditional deployment
+            model_metrics = None
+            if hasattr(output, "metadata") and output.metadata:
+                model_metrics = output.metadata.get("metrics", {})
+            # Check if auto-deployment should proceed
+            if routing_rule.should_auto_deploy(model_metrics):
+                endpoint_name = routing_rule.endpoint_name or f"{step_name}-endpoint"
+                result.deployed, result.endpoint_uri = _deploy_model(
+                    output=output,
+                    step_name=step_name,
+                    run_id=run_id,
+                    endpoint_name=endpoint_name,
+                    stack=stack,
+                )
+            else:
+                # Log that deployment is pending approval/manual action
+                condition = routing_rule.deploy_condition
+                if condition == "manual":
+                    # The type may have been inferred from the annotation
+                    # alone, so the output is not guaranteed to expose a
+                    # ``name``. Fall back to the step name instead of
+                    # raising, which would abort the remaining routing.
+                    model_label = getattr(output, "name", None) or step_name
+                    logger.info(
+                        f"Model registered but not deployed (deploy_condition='manual'). "
+                        f"Use 'flowyml model deploy {model_label}' to deploy.",
+                    )
+                elif condition == "on_approval":
+                    logger.info("Model registered, awaiting approval for deployment.")
+                elif condition == "auto" and routing_rule.deploy_min_metrics:
+                    logger.info(
+                        f"Model not deployed - metrics did not meet thresholds: " f"{routing_rule.deploy_min_metrics}",
+                    )
+        # Log metrics if configured
+        if routing_rule.log_to_tracker and artifact_type == "Metrics":
+            result.logged = _log_metrics(
+                output=output,
+                step_name=step_name,
+                run_id=run_id,
+                stack=stack,
+            )
+        # Log parameters if configured
+        if routing_rule.log_to_tracker and artifact_type == "Parameters":
+            result.logged = _log_parameters(
+                output=output,
+                step_name=step_name,
+                run_id=run_id,
+                stack=stack,
+            )
+        # Add routing metadata
+        result.metadata = {
+            "store": routing_rule.store,
+            "path": routing_rule.path,
+            "registered": result.registered,
+            "deployed": result.deployed,
+            "logged": result.logged,
+        }
+    except ImportError:
+        logger.debug("Stack config not available, skipping routing")
+    except Exception as e:
+        logger.warning(f"Error during artifact routing: {e}")
+    return result
+def _save_to_store(
+    output: Any,
+    artifact_type: str,
+    store_name: str,
+    path: str,
+    stack: Any,
+) -> str | None:
+    """Persist an artifact's payload and return where it was written.
+    An ``Artifact`` wrapper is unwrapped to its ``data`` before saving; any
+    other value is saved as-is. Failures are logged as warnings and
+    reported as None.
+    Args:
+        output: The artifact to save.
+        artifact_type: Type of the artifact (not used by this function).
+        store_name: Name of the store (gcs, s3, local).
+        path: Path within the store.
+        stack: Stack configuration.
+    Returns:
+        URI of the saved artifact or None.
+    """
+    def _save_via_configured_store() -> tuple[bool, Any]:
+        # Returns (store_available, value returned by store.save).
+        from flowyml.plugins.config import get_artifact_store
+        backend = get_artifact_store()
+        if not backend:
+            return False, None
+        # Extract data if it's an Artifact wrapper
+        from flowyml.core.types import Artifact
+        payload = output.data if isinstance(output, Artifact) else output
+        return True, backend.save(payload, path)
+    try:
+        # NOTE(review): store_name only gates this first attempt; the store
+        # instance itself always comes from get_artifact_store() - confirm
+        # whether a per-name lookup was intended.
+        named_store_known = bool(
+            store_name and stack and stack.artifact_stores and stack.artifact_stores.get(store_name),
+        )
+        if named_store_known:
+            available, uri = _save_via_configured_store()
+            if available:
+                return uri
+        # Fallback to default artifact store
+        available, uri = _save_via_configured_store()
+        if available:
+            return uri
+    except Exception as e:
+        logger.warning(f"Failed to save artifact to store: {e}")
+    return None
+def _register_model(
+    output: Any,
+    step_name: str,
+    run_id: str,
+    stack: Any,
+) -> bool:
+    """Register a model in the model registry.
+    Only ``Model`` instances are registered. The registry is obtained from
+    the plugin configuration; ``stack`` is accepted for signature parity
+    with the other routing helpers but is not used here. Any failure is
+    logged as a warning and reported as False.
+    Args:
+        output: The Model artifact.
+        step_name: Step that produced the model.
+        run_id: Current run ID.
+        stack: Stack configuration.
+    Returns:
+        True if registration was successful.
+    """
+    try:
+        from flowyml.core.types import Model
+        if not isinstance(output, Model):
+            return False
+        # Get model registry from plugins
+        from flowyml.plugins.config import get_config
+        config = get_config()
+        registry = config._get_plugin("model_registry")
+        if registry:
+            model_name = output.name or f"{step_name}_model"
+            model_uri = output.uri or f"runs/{run_id}/models/{step_name}"
+            # Spreading None raises TypeError, which would turn an otherwise
+            # valid registration into a logged failure; treat missing
+            # metadata as empty.
+            extra_metadata = output.metadata or {}
+            registry.register_model(
+                name=model_name,
+                model_uri=model_uri,
+                version=output.version,
+                metadata={
+                    "framework": output.framework,
+                    "step_name": step_name,
+                    "run_id": run_id,
+                    # Spread last, so user-supplied keys take precedence.
+                    **extra_metadata,
+                },
+            )
+            logger.info(f"Registered model '{model_name}' to registry")
+            return True
+    except Exception as e:
+        logger.warning(f"Failed to register model: {e}")
+    return False
+def _deploy_model(
+    output: Any,
+    step_name: str,
+    run_id: str,
+    endpoint_name: str,
+    stack: Any,
+) -> tuple[bool, str | None]:
+    """Deploy a Model artifact through the deployer configured on the stack.
+    The deployer class is chosen by substring match on the configured
+    ``type`` ("vertex" or "sagemaker"). Anything that goes wrong is logged
+    as a warning and reported as a failed deployment.
+    Args:
+        output: The Model artifact.
+        step_name: Step that produced the model.
+        run_id: Current run ID.
+        endpoint_name: Name for the endpoint.
+        stack: Stack configuration.
+    Returns:
+        Tuple of (success, endpoint_uri).
+    """
+    try:
+        from flowyml.core.types import Model
+        if not isinstance(output, Model):
+            return False, None
+        # Without a deployer section on the stack there is nothing to do
+        if not (stack and stack.model_deployer):
+            logger.debug("No model deployer configured in stack")
+            return False, None
+        settings = stack.model_deployer
+        kind = settings.get("type", "")
+        backend = None
+        # Instantiate the appropriate deployer
+        if "vertex" in kind:
+            from flowyml.plugins.deployers.vertex import VertexEndpointDeployer
+            backend = VertexEndpointDeployer(
+                project=settings.get("project"),
+                location=settings.get("location", "us-central1"),
+            )
+        elif "sagemaker" in kind:
+            from flowyml.plugins.deployers.sagemaker import SageMakerEndpointDeployer
+            backend = SageMakerEndpointDeployer(
+                region=settings.get("region"),
+                role_arn=settings.get("role_arn"),
+            )
+        if not backend:
+            # Unrecognised deployer type is reported the same way
+            logger.debug("No model deployer configured in stack")
+            return False, None
+        backend.initialize()
+        # Prefer the model's own URI, else the conventional run path
+        source_uri = output.uri or f"runs/{run_id}/models/{step_name}"
+        endpoint_uri = backend.deploy(
+            model_uri=source_uri,
+            endpoint_name=endpoint_name,
+        )
+        logger.info(f"Deployed model to endpoint: {endpoint_uri}")
+        return True, endpoint_uri
+    except Exception as e:
+        logger.warning(f"Failed to deploy model: {e}")
+    return False, None
+def _log_metrics(
+    output: Any,
+    step_name: str,
+    run_id: str,
+    stack: Any,
+) -> bool:
+    """Send a step's metrics to the experiment tracker.
+    The output is converted with ``dict(...)``. A ``Metrics`` instance
+    additionally supplies its ``_step`` value as the tracker step; any
+    other mapping is logged without a step. Errors are logged as warnings.
+    Args:
+        output: The Metrics artifact (dict-like).
+        step_name: Step that produced the metrics.
+        run_id: Current run ID.
+        stack: Stack configuration.
+    Returns:
+        True if logging was successful.
+    """
+    try:
+        from flowyml.core.types import Metrics
+        from flowyml.plugins.config import get_tracker
+        tracker = get_tracker()
+        if not tracker:
+            return False
+        # Only real Metrics objects carry a step counter
+        carries_step = isinstance(output, Metrics)
+        values = dict(output)
+        step_index = output._step if carries_step else None
+        tracker.log_metrics(values, step=step_index)
+        logger.debug(f"Logged metrics from step '{step_name}': {list(values.keys())}")
+        return True
+    except Exception as e:
+        logger.warning(f"Failed to log metrics: {e}")
+    return False
+def _log_parameters(
+    output: Any,
+    step_name: str,
+    run_id: str,
+    stack: Any,
+) -> bool:
+    """Log parameters to the experiment tracker.
+    The output is converted with ``dict(...)`` and each key is prefixed
+    with ``"<step_name>/"`` before being passed to the tracker. Errors are
+    logged as warnings and reported as False.
+    Args:
+        output: The Parameters artifact (dict-like).
+        step_name: Step that uses the parameters.
+        run_id: Current run ID.
+        stack: Stack configuration.
+    Returns:
+        True if logging was successful.
+    """
+    try:
+        from flowyml.plugins.config import get_tracker
+        tracker = get_tracker()
+        if tracker:
+            # Parameters and plain mappings are converted the same way, so
+            # no type check is needed here.
+            params_dict = dict(output)
+            # Log parameters (with step prefix for clarity)
+            prefixed_params = {f"{step_name}/{k}": v for k, v in params_dict.items()}
+            tracker.log_params(prefixed_params)
+            logger.debug(f"Logged parameters from step '{step_name}': {list(params_dict.keys())}")
+            return True
+    except Exception as e:
+        logger.warning(f"Failed to log parameters: {e}")
+    return False
+def should_route(output: Any) -> bool:
+    """Tell whether a step output is eligible for artifact routing.
+    None is never routed; every other value is delegated to
+    ``flowyml.core.types.is_artifact_type``.
+    Args:
+        output: The step output.
+    Returns:
+        True if the output should be routed.
+    """
+    if output is not None:
+        from flowyml.core.types import is_artifact_type
+        return is_artifact_type(output)
+    return False
+def auto_route_metrics_and_params(
+    output: Any,
+    step_name: str,
+    run_id: str,
+) -> bool:
+    """Log Metrics or Parameters outputs without consulting routing rules.
+    ``Metrics`` instances go to the metrics logger, ``Parameters``
+    instances to the parameter logger, both with no stack. Every other
+    value is ignored.
+    Args:
+        output: The step output.
+        step_name: Step name.
+        run_id: Run ID.
+    Returns:
+        True if logging was successful.
+    """
+    from flowyml.core.types import Metrics, Parameters
+    # Pick the logger first, then make a single call
+    if isinstance(output, Metrics):
+        log_fn = _log_metrics
+    elif isinstance(output, Parameters):
+        log_fn = _log_parameters
+    else:
+        return False
+    return log_fn(output, step_name, run_id, None)

flowyml/core/step.py CHANGED Viewed

@@ -31,6 +31,8 @@ class StepConfig:
     tags: dict[str, str] = field(default_factory=dict)
     condition: Callable | None = None
     execution_group: str | None = None
+    source_file: str | None = None
+    source_line: int | None = None
     def __hash__(self):
         """Make StepConfig hashable."""
@@ -84,11 +86,15 @@ class Step:
         self.condition = condition
         self.execution_group = execution_group
-        # Capture source code for UI display
+        # Capture source code and location for UI display
         try:
             self.source_code = inspect.getsource(func)
+            self.source_file = inspect.getsourcefile(func)
+            _, self.source_line = inspect.getsourcelines(func)
         except (OSError, TypeError):
             self.source_code = "# Source code not available"
+            self.source_file = None
+            self.source_line = None
         self.config = StepConfig(
             name=self.name,
@@ -102,6 +108,8 @@ class Step:
             tags=self.tags,
             condition=self.condition,
             execution_group=self.execution_group,
+            source_file=self.source_file,
+            source_line=self.source_line,
         )
     def __call__(self, *args, **kwargs):

flowyml/core/step_grouping.py CHANGED Viewed

@@ -172,26 +172,23 @@ class StepGroupAnalyzer:
         Returns:
             True if steps can execute consecutively
         """
-        # Get all dependencies of step2
-        step2_deps = dag.get_all_dependencies(step2.name)
+        # Get ALL transitively producing and consuming nodes between step1 and step2
+        # Steps are consecutive if there are no intermediate steps NOT in this group
+        # that must execute between step1 and step2.
+        all_deps_of_s2 = dag.get_all_dependencies(step2.name)
-        # If step2 doesn't depend on anything in the group, they can be consecutive
-        # (parallel steps in same group are OK if no dependencies)
-        group_deps = step2_deps & group_step_names
-        if not group_deps:
-            # No dependencies from this group, consecutive is OK
-            return True
+        # If step1 is not even a dependency of step2, they are independent.
+        # They can be grouped as long as there is no path from step1 to step2
+        # through an external step.
-        # If step2 depends on step1, check for intermediate group steps
-        if step1.name in step2_deps:
-            # Get all group steps that step2 depends on (excluding step1)
-            intermediate = group_deps - {step1.name}
+        # All nodes on any path from step1 to step2:
+        all_successors_of_s1 = dag.get_all_dependents(step1.name)
+        intermediate_nodes = all_successors_of_s1 & all_deps_of_s2
-            # If there are NO intermediate group steps, they're consecutive
-            return len(intermediate) == 0
+        # If any node on a path from s1 to s2 is NOT in the group, they are not consecutive
+        external_intermediates = intermediate_nodes - group_step_names
-        # step2 doesn't depend on step1, not consecutive
-        return False
+        return len(external_intermediates) == 0
     def _get_execution_order(self, steps: list[Step], dag: DAG) -> list[str]:
         """Get topological execution order for steps in a group.
@@ -264,29 +261,46 @@ def get_execution_units(dag: DAG, steps: list[Step]) -> list[Step | StepGroup]:
         for step in group.steps:
             step_to_group[step.name] = group
-    # Get topological order of all nodes
-    all_nodes = dag.topological_sort()
+    # To correctly determine execution order of units (which may have changed due to grouping),
+    # we build a new DAG where each node is an execution unit (Step or StepGroup).
+    from flowyml.core.graph import Node as DAGNode
-    # Build execution units, avoiding duplicates for grouped steps
-    execution_units: list[Step | StepGroup] = []
-    processed_groups: set[str] = set()
+    units_dag = DAG()
+    unit_map: dict[str, Step | StepGroup] = {}
-    for node in all_nodes:
-        # Find the step object
-        step = next((s for s in steps if s.name == node.name), None)
-        if not step:
+    # Add units as nodes
+    processed_steps = set()
+    for step in steps:
+        if step.name in processed_steps:
             continue
-        # Check if this step belongs to a group
+        unit: Step | StepGroup
         if step.name in step_to_group:
-            group = step_to_group[step.name]
-            # Only add the group once (when we encounter its first step)
-            if group.group_name not in processed_groups:
-                execution_units.append(group)
-                processed_groups.add(group.group_name)
+            unit = step_to_group[step.name]
+            unit_name = f"group:{unit.group_name}"
+            # Extract names for inputs/outputs
+            u_inputs_set = set()
+            u_outputs_set = set()
+            for s in unit.steps:
+                u_inputs_set.update(s.inputs)
+                u_outputs_set.update(s.outputs)
+                processed_steps.add(s.name)
+            # External inputs are those not produced within the group
+            u_inputs = list(u_inputs_set - u_outputs_set)
+            u_outputs = list(u_outputs_set)
         else:
-            # Ungrouped step, add as-is
-            execution_units.append(step)
+            unit = step
+            unit_name = step.name
+            u_inputs = step.inputs
+            u_outputs = step.outputs
+            processed_steps.add(step.name)
+        unit_map[unit_name] = unit
+        units_dag.add_node(DAGNode(name=unit_name, step=unit, inputs=u_inputs, outputs=u_outputs))
+    # Build edges and sort
+    units_dag.build_edges()
+    sorted_unit_nodes = units_dag.topological_sort()
-    return execution_units
+    return [unit_map[node.name] for node in sorted_unit_nodes]

flowyml 1.7.2__py3-none-any.whl → 1.8.0__py3-none-any.whl

flowyml 1.7.2__py3-none-any.whl → 1.8.0__py3-none-any.whl