flowk 0.1.0__tar.gz

flowk-0.1.0/PKG-INFO ADDED
@@ -0,0 +1,177 @@
1
+ Metadata-Version: 2.4
2
+ Name: flowk
3
+ Version: 0.1.0
4
+ Summary: A lightweight, modular, and developer-first workflow orchestration engine for AI/LLM pipelines.
5
+ Author-email: Folk Nallathambi <folkadonis7@gmail.com>
6
+ Project-URL: Homepage, https://github.com/folkadonis/flowk
7
+ Project-URL: Bug Tracker, https://github.com/folkadonis/flowk/issues
8
+ Classifier: Programming Language :: Python :: 3
9
+ Classifier: License :: OSI Approved :: MIT License
10
+ Classifier: Operating System :: OS Independent
11
+ Classifier: Intended Audience :: Developers
12
+ Classifier: Topic :: Software Development :: Libraries :: Python Modules
13
+ Requires-Python: >=3.8
14
+ Description-Content-Type: text/markdown
15
+ Requires-Dist: pydantic>=2.0.0
16
+
17
+ # Flowk 🌊
18
+
19
+ **Flowk** is a lightweight, high-performance workflow orchestration engine designed specifically for AI and LLM pipelines. It offers a simpler, developer-first alternative to heavyweight frameworks while providing first-class support for conditional routing, shared state, observability, and debugging.
20
+
21
+ ---
22
+
23
+ ## 🚀 Key Features
24
+ - **Extremely Simple API:** Turn standard Python functions into executable graph nodes seamlessly.
25
+ - **Node Retries & Fallbacks:** Built-in resilience out-of-the-box.
26
+ - **Dynamic Routing:** Direct execution paths at runtime based on node outputs.
27
+ - **Stepping & Time Travel:** Pause execution step by step and replay complete traces.
28
+ - **Telemetry & Visualization:** Live terminal tracking, mock cost metrics, and readable CLI flow rendering.
29
+ - **Pluggable Architecture:** Tap into lifecycle hooks using Plugins effortlessly.
30
+
31
+ ---
32
+
33
+ ## 🛠️ Core Concepts
34
+
35
+ ### 1. The Graph
36
+ The `Graph` is the brain of Flowk. It wires nodes together sequentially or through condition-based router branches:
37
+ ```python
38
+ from flowk import Graph
39
+ g = Graph()
40
+ ```
41
+
42
+ ### 2. Nodes & State
43
+ Nodes are plain Python functions decorated with `@g.node()`. A mutable `GraphState` dictionary is implicitly shared across your pipeline.
44
+
45
+ ```python
46
+ # Pass `state` as an argument to read/write shared data across the lifecycle map
47
+ @g.node(retries=3)
48
+ def prepare_prompt(input_text: str, state: dict):
49
+     state["original_query"] = input_text
50
+     return input_text.upper()
51
+ ```
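The `retries` option can be pictured as a wrapper loop around the node function. Here is a minimal stand-alone sketch of retry-plus-fallback behavior; it is illustrative only, and `with_retries` and its `fallback` parameter are hypothetical names, not Flowk's internals:

```python
import functools

def with_retries(retries=3, fallback=None):
    """Retry a function up to `retries` times; use `fallback` if all attempts fail."""
    def decorator(fn):
        @functools.wraps(fn)
        def wrapper(*args, **kwargs):
            last_exc = None
            for _ in range(retries):
                try:
                    return fn(*args, **kwargs)
                except Exception as exc:  # a real engine would narrow this
                    last_exc = exc
            if fallback is not None:
                return fallback(*args, **kwargs)
            raise last_exc
        return wrapper
    return decorator

attempts = []

@with_retries(retries=3, fallback=lambda text: "FALLBACK")
def flaky(text):
    attempts.append(text)
    raise RuntimeError("boom")

result = flaky("hi")  # three failed attempts, then the fallback answers
```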
52
+
53
+ ### 3. Connections
54
+ Connect nodes in sequence. The `Graph` treats the first registered node as the entrypoint, and the return value of node A is automatically piped into node B as its input argument.
55
+
56
+ ```python
57
+ g.connect(prepare_prompt, call_llm)
58
+ ```
59
+
60
+ ### 4. Routing (Conditional Branching)
61
+ When the execution path depends on context (e.g., a standard request vs. a priority request), use `g.route()`.
62
+ ```python
63
+ def check_priority(result_from_previous_node: str):
64
+     return "fast" if "URGENT" in result_from_previous_node else "standard"
65
+
66
+ # Map condition strings to actual handling Nodes
67
+ router_node = g.route(check_priority, {
68
+     "fast": priority_handler_node,
69
+     "standard": normal_handler_node
70
+ })
70
+ })
71
+
72
+ g.connect(prepare_prompt, router_node)
73
+ ```
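Conceptually, a router is just a condition function plus a dispatch table. The sketch below shows the idea in plain Python; the `route` helper is a hypothetical stand-in for `g.route()`, not its real implementation:

```python
def check_priority(text: str) -> str:
    return "fast" if "URGENT" in text else "standard"

def priority_handler(text: str) -> str:
    return f"expedited: {text}"

def normal_handler(text: str) -> str:
    return f"queued: {text}"

def route(condition, table):
    """Build a node that dispatches its input via `condition`'s returned key."""
    def router(value):
        return table[condition(value)](value)
    return router

router = route(check_priority, {"fast": priority_handler, "standard": normal_handler})
```

Calling `router("URGENT: outage")` picks the fast branch; anything else goes to the standard one.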
74
+
75
+ ---
76
+
77
+ ## 🔍 Tooling & Observability
78
+
79
+ Flowk ships with tooling built for both fast prototyping and production monitoring.
80
+
81
+ ### Visualizing Graphs
82
+ See exactly how your graph is wired using `g.show()`.
83
+ ```text
84
+ ==================================================
85
+ 📊 FLOWK EXECUTION FLOW
86
+ ==================================================
87
+
88
+ [ prepare_prompt ]
89
+         │
90
+         ▼
91
+ ⟪ priority_check ⟫ (Router)
92
+         │
93
+         ├─[fast]──────► [ priority_handler ]
94
+         │                      │
95
+         │                      ▼
96
+         │                [ cleanup ]
97
+         │
98
+         └─[standard]──► [ standard_handler ]
99
+                                │
100
+                                ▼
101
+                          [ cleanup ] 🔄 (already visited)
102
+
103
+ ==================================================
104
+ ```
105
+
106
+ ### Metrics Tracking
107
+ Built-in per-node timing alongside mock LLM usage tracking:
108
+ ```python
109
+ g.run("Hello!")
110
+
111
+ from flowk import MetricsRegistry
112
+ print(MetricsRegistry.get_summary())
113
+ ```
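The per-node timing that `MetricsRegistry` summarizes can be sketched with a small decorator-based registry. This is illustrative only; `SimpleMetrics` is not part of Flowk:

```python
import time
from collections import defaultdict

class SimpleMetrics:
    """Record wall-clock duration per function name and summarize it."""
    def __init__(self):
        self.timings = defaultdict(list)

    def timed(self, fn):
        def wrapper(*args, **kwargs):
            start = time.perf_counter()
            try:
                return fn(*args, **kwargs)
            finally:
                self.timings[fn.__name__].append(time.perf_counter() - start)
        return wrapper

    def get_summary(self):
        return {name: {"calls": len(d), "total_s": round(sum(d), 4)}
                for name, d in self.timings.items()}

metrics = SimpleMetrics()

@metrics.timed
def prepare_prompt(text):
    return text.upper()

prepare_prompt("hello")
prepare_prompt("world")
summary = metrics.get_summary()
```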
114
+
115
+ ### 🧠 Session Memory Management
116
+ Flowk persists execution memory across multiple `.run()` calls via the `session_id` parameter. This is especially useful for multi-turn chat workflows, where each turn should append messages to the `GraphState` instead of wiping the slate clean.
117
+
118
+ ```python
119
+ # Turns persist data appended into state automatically
120
+ r1 = g.run("Hello", session_id="user_john")
121
+ r2 = g.run("Are you there?", session_id="user_john")
122
+
123
+ r3_anon = g.run("Who am I?") # Anonymous runs use empty states
124
+ ```
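The session behavior above can be pictured as a dictionary of per-`session_id` state objects, with anonymous runs getting a throwaway dict. `SessionStore` and the `run` helper below are hypothetical illustrations, not Flowk's API:

```python
class SessionStore:
    """One persistent mutable state dict per session_id."""
    def __init__(self):
        self._sessions = {}

    def state_for(self, session_id=None):
        if session_id is None:
            return {}  # anonymous run: fresh, unpersisted state
        return self._sessions.setdefault(session_id, {})

store = SessionStore()

def run(text, session_id=None):
    state = store.state_for(session_id)
    state.setdefault("messages", []).append(text)
    return list(state["messages"])

r1 = run("Hello", session_id="user_john")
r2 = run("Are you there?", session_id="user_john")
r3 = run("Who am I?")  # anonymous: nothing carries over
```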
125
+
126
+ ### ⚡ Async, Streaming, and Parallel Execution (v2)
127
+ Flowk is built on high-performance asyncio primitives:
128
+ - Define any node as `async def` and Flowk awaits it natively without blocking.
129
+ - Use `g.arun()` for standard async resolution.
130
+ - Stream node outputs in real time using `async for event in g.astream(...)`. This is ideal for piping LLM outputs to WebSocket frontends.
131
+ - **Fan-Out Parallelism:** If a node splits into multiple downstream nodes, Flowk executes all branches concurrently using `asyncio.gather`.
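The fan-out bullet above maps directly onto `asyncio.gather`; the branch functions here are illustrative:

```python
import asyncio

async def branch_a(text):
    await asyncio.sleep(0.01)  # stand-in for an async LLM call
    return f"a:{text}"

async def branch_b(text):
    await asyncio.sleep(0.01)
    return f"b:{text}"

async def fan_out(text):
    # Both branches start immediately and run concurrently.
    return await asyncio.gather(branch_a(text), branch_b(text))

results = asyncio.run(fan_out("x"))
```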
132
+
133
+ ### 🛑 Human-in-the-Loop (Breakpoints)
134
+ Need a human to review an action before it commits to a database? Interrupt the graph!
135
+ ```python
136
+ # 1. Compile the graph with a breakpoint
137
+ g.compile(interrupt_before=["commit_to_database"])
138
+
139
+ # 2. Execution will stop and exit when reaching the node
140
+ async for event in g.astream(input_data, session_id="user_1"):
141
+     if event["type"] == "interrupt":
142
+         print("Waiting for human...")
143
+
144
+ # 3. Later, resume using the exact same session_id!
145
+ await g.arun(None, session_id="user_1")
146
+ ```
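The `interrupt_before` semantics can be sketched as a generator that walks a node list, emits an interrupt event, and stops before any flagged node. The `stream` helper is a hypothetical illustration of the event flow, not Flowk's executor:

```python
def stream(nodes, input_data, interrupt_before=()):
    """Yield per-node events; pause (return) before any node named in interrupt_before."""
    value = input_data
    for name, fn in nodes:
        if name in interrupt_before:
            yield {"type": "interrupt", "before": name, "value": value}
            return  # a resume call would continue from this node
        value = fn(value)
        yield {"type": "node_end", "node": name, "output": value}

nodes = [
    ("prepare", lambda t: t.upper()),
    ("commit_to_database", lambda t: f"saved:{t}"),
]

events = list(stream(nodes, "hello", interrupt_before=["commit_to_database"]))
```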
147
+
148
+ ### 🛡️ Pydantic Safe-State Validation
149
+ Never let a silent property typo crash a 20-minute LLM pipeline again. Wrap your shared state in a Pydantic schema:
150
+ ```python
151
+ from pydantic import BaseModel
152
+ class AgentState(BaseModel):
153
+     messages: list
154
+     cost: float
155
+
156
+ g = Graph(state_schema=AgentState)
157
+ # Flowk will validate `AgentState(**state)` between EVERY node execution.
158
+ ```
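For intuition, the same fail-fast guard can be sketched without Pydantic as a plain schema check over the state dict (illustrative only; Flowk itself validates via `AgentState(**state)` as noted above):

```python
SCHEMA = {"messages": list, "cost": float}

def validate_state(state, schema=SCHEMA):
    """Raise on missing keys, unknown keys (typos), or wrong value types."""
    for key, expected in schema.items():
        if key not in state:
            raise KeyError(f"state missing required key: {key!r}")
        if not isinstance(state[key], expected):
            raise TypeError(f"{key!r} should be {expected.__name__}")
    unknown = set(state) - set(schema)
    if unknown:
        raise KeyError(f"unexpected state keys (typo?): {sorted(unknown)}")

validate_state({"messages": ["hi"], "cost": 0.5})  # passes silently

try:
    validate_state({"messages": ["hi"], "cots": 0.5})  # 'cost' misspelled
    caught = False
except KeyError:
    caught = True
```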
159
+
160
+ ### Debug & Time Travel
161
+ Encountering bugs in a complex run? Flowk saves runs by default!
162
+ - To run with verbose step-by-step logging, replace `g.run()` with `g.debug()`.
163
+ - To visually replay a historic trace in the terminal, grab the `run_id` returned from any run:
164
+ `g.replay("run-123-abc")`
165
+
166
+ ---
167
+
168
+ ## 🧩 Plugins (Extensions)
169
+
170
+ Under the hood, runs fire lifecycle hooks (`on_run_start`, `on_node_start`, `on_node_end`, `on_run_end`). Subclass `flowk.plugins.base.Plugin` to extend the system yourself, for example intercepting runs to store trace files via `FileStoragePlugin`.
171
+
172
+ ```python
173
+ from flowk.plugins.base import PluginManager
174
+ from flowk.plugins.storage import FileStoragePlugin
175
+
176
+ PluginManager.register(FileStoragePlugin("server_logs.jsonl"))
177
+ ```
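The four hooks can be sketched as a base class plus a tiny run loop that fires them in order. Hook signatures here are simplified guesses for illustration, not the exact ones in `flowk.plugins.base.Plugin`:

```python
class Plugin:
    """Lifecycle hook interface mirroring the hook names listed above."""
    def on_run_start(self, run_id, input_data): pass
    def on_node_start(self, run_id, node, input_data): pass
    def on_node_end(self, run_id, node, output): pass
    def on_run_end(self, run_id, output): pass

class RecordingPlugin(Plugin):
    def __init__(self):
        self.events = []
    def on_run_start(self, run_id, input_data):
        self.events.append(("run_start", run_id))
    def on_node_end(self, run_id, node, output):
        self.events.append(("node_end", node, output))
    def on_run_end(self, run_id, output):
        self.events.append(("run_end", output))

def run_with_plugins(nodes, input_data, plugins, run_id="run-1"):
    """Drive a linear node list, invoking every plugin hook at each stage."""
    for p in plugins:
        p.on_run_start(run_id, input_data)
    value = input_data
    for name, fn in nodes:
        for p in plugins:
            p.on_node_start(run_id, name, value)
        value = fn(value)
        for p in plugins:
            p.on_node_end(run_id, name, value)
    for p in plugins:
        p.on_run_end(run_id, value)
    return value

rec = RecordingPlugin()
out = run_with_plugins([("upper", str.upper)], "hi", [rec])
```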
flowk-0.1.0/README.md ADDED
@@ -0,0 +1,161 @@
1
+ # Flowk 🌊
2
+
3
+ **Flowk** is a lightweight, high-performance workflow orchestration engine designed specifically for AI and LLM pipelines. It offers a simpler, developer-first alternative to heavyweight frameworks while providing first-class support for conditional routing, shared state, observability, and debugging.
4
+
5
+ ---
6
+
7
+ ## 🚀 Key Features
8
+ - **Extremely Simple API:** Turn standard Python functions into executable graph nodes seamlessly.
9
+ - **Node Retries & Fallbacks:** Built-in resilience out-of-the-box.
10
+ - **Dynamic Routing:** Direct execution paths at runtime based on node outputs.
11
+ - **Stepping & Time Travel:** Pause execution step by step and replay complete traces.
12
+ - **Telemetry & Visualization:** Live terminal tracking, mock cost metrics, and readable CLI flow rendering.
13
+ - **Pluggable Architecture:** Tap into lifecycle hooks using Plugins effortlessly.
14
+
15
+ ---
16
+
17
+ ## 🛠️ Core Concepts
18
+
19
+ ### 1. The Graph
20
+ The `Graph` is the brain of Flowk. It wires nodes together sequentially or through condition-based router branches:
21
+ ```python
22
+ from flowk import Graph
23
+ g = Graph()
24
+ ```
25
+
26
+ ### 2. Nodes & State
27
+ Nodes are plain Python functions decorated with `@g.node()`. A mutable `GraphState` dictionary is implicitly shared across your pipeline.
28
+
29
+ ```python
30
+ # Pass `state` as an argument to read/write shared data across the lifecycle map
31
+ @g.node(retries=3)
32
+ def prepare_prompt(input_text: str, state: dict):
33
+     state["original_query"] = input_text
34
+     return input_text.upper()
35
+ ```
36
+
37
+ ### 3. Connections
38
+ Connect nodes in sequence. The `Graph` treats the first registered node as the entrypoint, and the return value of node A is automatically piped into node B as its input argument.
39
+
40
+ ```python
41
+ g.connect(prepare_prompt, call_llm)
42
+ ```
43
+
44
+ ### 4. Routing (Conditional Branching)
45
+ When the execution path depends on context (e.g., a standard request vs. a priority request), use `g.route()`.
46
+ ```python
47
+ def check_priority(result_from_previous_node: str):
48
+     return "fast" if "URGENT" in result_from_previous_node else "standard"
49
+
50
+ # Map condition strings to actual handling Nodes
51
+ router_node = g.route(check_priority, {
52
+     "fast": priority_handler_node,
53
+     "standard": normal_handler_node
54
+ })
55
+
56
+ g.connect(prepare_prompt, router_node)
57
+ ```
58
+
59
+ ---
60
+
61
+ ## 🔍 Tooling & Observability
62
+
63
+ Flowk ships with tooling built for both fast prototyping and production monitoring.
64
+
65
+ ### Visualizing Graphs
66
+ See exactly how your graph is wired using `g.show()`.
67
+ ```text
68
+ ==================================================
69
+ 📊 FLOWK EXECUTION FLOW
70
+ ==================================================
71
+
72
+ [ prepare_prompt ]
73
+         │
74
+         ▼
75
+ ⟪ priority_check ⟫ (Router)
76
+         │
77
+         ├─[fast]──────► [ priority_handler ]
78
+         │                      │
79
+         │                      ▼
80
+         │                [ cleanup ]
81
+         │
82
+         └─[standard]──► [ standard_handler ]
83
+                                │
84
+                                ▼
85
+                          [ cleanup ] 🔄 (already visited)
86
+
87
+ ==================================================
88
+ ```
89
+
90
+ ### Metrics Tracking
91
+ Built-in per-node timing alongside mock LLM usage tracking:
92
+ ```python
93
+ g.run("Hello!")
94
+
95
+ from flowk import MetricsRegistry
96
+ print(MetricsRegistry.get_summary())
97
+ ```
98
+
99
+ ### 🧠 Session Memory Management
100
+ Flowk persists execution memory across multiple `.run()` calls via the `session_id` parameter. This is especially useful for multi-turn chat workflows, where each turn should append messages to the `GraphState` instead of wiping the slate clean.
101
+
102
+ ```python
103
+ # Turns persist data appended into state automatically
104
+ r1 = g.run("Hello", session_id="user_john")
105
+ r2 = g.run("Are you there?", session_id="user_john")
106
+
107
+ r3_anon = g.run("Who am I?") # Anonymous runs use empty states
108
+ ```
109
+
110
+ ### ⚡ Async, Streaming, and Parallel Execution (v2)
111
+ Flowk is built on high-performance asyncio primitives:
112
+ - Define any node as `async def` and Flowk awaits it natively without blocking.
113
+ - Use `g.arun()` for standard async resolution.
114
+ - Stream node outputs in real time using `async for event in g.astream(...)`. This is ideal for piping LLM outputs to WebSocket frontends.
115
+ - **Fan-Out Parallelism:** If a node splits into multiple downstream nodes, Flowk executes all branches concurrently using `asyncio.gather`.
116
+
117
+ ### 🛑 Human-in-the-Loop (Breakpoints)
118
+ Need a human to review an action before it commits to a database? Interrupt the graph!
119
+ ```python
120
+ # 1. Compile the graph with a breakpoint
121
+ g.compile(interrupt_before=["commit_to_database"])
122
+
123
+ # 2. Execution will stop and exit when reaching the node
124
+ async for event in g.astream(input_data, session_id="user_1"):
125
+     if event["type"] == "interrupt":
126
+         print("Waiting for human...")
127
+
128
+ # 3. Later, resume using the exact same session_id!
129
+ await g.arun(None, session_id="user_1")
130
+ ```
131
+
132
+ ### 🛡️ Pydantic Safe-State Validation
133
+ Never let a silent property typo crash a 20-minute LLM pipeline again. Wrap your shared state in a Pydantic schema:
134
+ ```python
135
+ from pydantic import BaseModel
136
+ class AgentState(BaseModel):
137
+     messages: list
138
+     cost: float
139
+
140
+ g = Graph(state_schema=AgentState)
141
+ # Flowk will validate `AgentState(**state)` between EVERY node execution.
142
+ ```
143
+
144
+ ### Debug & Time Travel
145
+ Encountering bugs in a complex run? Flowk saves runs by default!
146
+ - To run with verbose step-by-step logging, replace `g.run()` with `g.debug()`.
147
+ - To visually replay a historic trace in the terminal, grab the `run_id` returned from any run:
148
+ `g.replay("run-123-abc")`
149
+
150
+ ---
151
+
152
+ ## 🧩 Plugins (Extensions)
153
+
154
+ Under the hood, runs fire lifecycle hooks (`on_run_start`, `on_node_start`, `on_node_end`, `on_run_end`). Subclass `flowk.plugins.base.Plugin` to extend the system yourself, for example intercepting runs to store trace files via `FileStoragePlugin`.
155
+
156
+ ```python
157
+ from flowk.plugins.base import PluginManager
158
+ from flowk.plugins.storage import FileStoragePlugin
159
+
160
+ PluginManager.register(FileStoragePlugin("server_logs.jsonl"))
161
+ ```
@@ -0,0 +1,20 @@
1
+ """
2
+ Flowk: A lightweight, modular, and extensible workflow orchestration engine for AI/LLM pipelines.
3
+ """
4
+
5
+ from flowk.graph import Graph
6
+ from flowk.exceptions import GraphError, NodeExecutionError, InvalidGraphError, ReplayError
7
+ from flowk.state import GraphState
8
+ from flowk.metrics import MetricsRegistry
9
+
10
+ __all__ = [
11
+     "Graph",
12
+     "GraphState",
13
+     "MetricsRegistry",
14
+     "GraphError",
15
+     "NodeExecutionError",
16
+     "InvalidGraphError",
17
+     "ReplayError"
18
+ ]
19
+
20
+ __version__ = "0.1.0"
@@ -0,0 +1,68 @@
1
+ import time
2
+ import uuid
3
+ from typing import Any
4
+
5
+ from flowk.graph import Graph
6
+ from flowk.storage import StorageRegistry
7
+ from flowk.plugins.base import PluginManager, DebugPlugin
8
+ from flowk.executor import SequentialExecutor
9
+
10
+ class Debugger:
11
+     def __init__(self, graph: Graph):
12
+         self.graph = graph
13
+
14
+     def run(self, input_data: Any, session_id: str = None) -> Any:
15
+         run_id = f"debug_{uuid.uuid4().hex[:8]}"
16
+         debug_plugin = DebugPlugin()
17
+
18
+         # Attach strictly for this run
19
+         PluginManager.register(debug_plugin)
20
+         try:
21
+             executor = SequentialExecutor(self.graph)
22
+             return executor.execute(input_data, run_id=run_id, session_id=session_id)
23
+         finally:
24
+             # Cleanup plugin so subsequent graph.run() goes silent
25
+             PluginManager.plugins.remove(debug_plugin)
26
+
27
+     def replay(self, run_id: str):
28
+         print(f"\n⏪ REPLAYING RUN: {run_id}")
29
+         print("="*50)
30
+         trace = StorageRegistry.get_trace(run_id)
31
+
32
+         for step in trace:
33
+             print(f"\nStep {step['step']}: Node '{step['node']}'")
34
+             print(f" Input: {step['input']}")
35
+             print(f" State: {step['state_snapshot']}")
36
+             print(f" Status: {step['status']}")
37
+
38
+             if step['status'] == 'error':
39
+                 print(f" Error: {step['error']}")
40
+             else:
41
+                 print(f" Output: {step['output']}")
42
+             print(f" Duration: {step['duration']:.4f}s")
43
+             time.sleep(0.5)
44
+
45
+         print("\n" + "="*50)
46
+         print("⏹️ REPLAY COMPLETE\n")
47
+
48
+     def step(self, input_data: Any):
49
+         """Interactive stepping generator (v1 simple console input)."""
50
+         run_id = f"step_{uuid.uuid4().hex[:8]}"
51
+         executor = SequentialExecutor(self.graph)
52
+
53
+         print("\n" + "="*50)
54
+         print("👞 STEP DEBUGGER STARTED")
55
+         print("="*50)
56
+
57
+         # We hook into nodes via a custom plugin
58
+         class SteppingPlugin(DebugPlugin):
59
+             def on_node_start(self, run_id, node, input_data, state):
60
+                 super().on_node_start(run_id, node, input_data, state)
61
+                 input("\n[Press Enter to execute this node...]")
62
+
63
+         step_plugin = SteppingPlugin()
64
+         PluginManager.register(step_plugin)
65
+         try:
66
+             return executor.execute(input_data, run_id=run_id)
67
+         finally:
68
+             PluginManager.plugins.remove(step_plugin)
@@ -0,0 +1,15 @@
1
+ class GraphError(Exception):
2
+     """Base exception for all graph-related errors."""
3
+     pass
4
+
5
+ class NodeExecutionError(GraphError):
6
+     """Raised when a node fails to execute after all retries."""
7
+     pass
8
+
9
+ class InvalidGraphError(GraphError):
10
+     """Raised when the graph structure is invalid."""
11
+     pass
12
+
13
+ class ReplayError(GraphError):
14
+     """Raised when an execution trace cannot be replayed."""
15
+     pass