PyPI - soe-ai - Versions diffs - 0.2.0b1__py3-none-any.whl - Mend

soe-ai 0.2.0b1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (145) hide show

soe/__init__.py +50 -0
soe/broker.py +168 -0
soe/builtin_tools/__init__.py +51 -0
soe/builtin_tools/soe_add_signal.py +82 -0
soe/builtin_tools/soe_call_tool.py +111 -0
soe/builtin_tools/soe_copy_context.py +80 -0
soe/builtin_tools/soe_explore_docs.py +290 -0
soe/builtin_tools/soe_get_available_tools.py +42 -0
soe/builtin_tools/soe_get_context.py +50 -0
soe/builtin_tools/soe_get_context_schema.py +56 -0
soe/builtin_tools/soe_get_identities.py +63 -0
soe/builtin_tools/soe_get_workflows.py +63 -0
soe/builtin_tools/soe_inject_context_schema_field.py +80 -0
soe/builtin_tools/soe_inject_identity.py +64 -0
soe/builtin_tools/soe_inject_node.py +86 -0
soe/builtin_tools/soe_inject_workflow.py +105 -0
soe/builtin_tools/soe_list_contexts.py +73 -0
soe/builtin_tools/soe_remove_context_schema_field.py +61 -0
soe/builtin_tools/soe_remove_identity.py +61 -0
soe/builtin_tools/soe_remove_node.py +72 -0
soe/builtin_tools/soe_remove_workflow.py +62 -0
soe/builtin_tools/soe_update_context.py +54 -0
soe/docs/_config.yml +10 -0
soe/docs/advanced_patterns/guide_fanout_and_aggregations.md +318 -0
soe/docs/advanced_patterns/guide_inheritance.md +435 -0
soe/docs/advanced_patterns/hybrid_intelligence.md +237 -0
soe/docs/advanced_patterns/index.md +49 -0
soe/docs/advanced_patterns/operational.md +781 -0
soe/docs/advanced_patterns/self_evolving_workflows.md +385 -0
soe/docs/advanced_patterns/swarm_intelligence.md +211 -0
soe/docs/builtins/context.md +164 -0
soe/docs/builtins/context_schema.md +158 -0
soe/docs/builtins/identity.md +139 -0
soe/docs/builtins/soe_explore_docs.md +135 -0
soe/docs/builtins/tools.md +164 -0
soe/docs/builtins/workflows.md +199 -0
soe/docs/guide_00_getting_started.md +341 -0
soe/docs/guide_01_tool.md +206 -0
soe/docs/guide_02_llm.md +143 -0
soe/docs/guide_03_router.md +146 -0
soe/docs/guide_04_patterns.md +475 -0
soe/docs/guide_05_agent.md +159 -0
soe/docs/guide_06_schema.md +397 -0
soe/docs/guide_07_identity.md +540 -0
soe/docs/guide_08_child.md +612 -0
soe/docs/guide_09_ecosystem.md +690 -0
soe/docs/guide_10_infrastructure.md +427 -0
soe/docs/guide_11_builtins.md +126 -0
soe/docs/index.md +104 -0
soe/docs/primitives/backends.md +281 -0
soe/docs/primitives/context.md +256 -0
soe/docs/primitives/node_reference.md +259 -0
soe/docs/primitives/primitives.md +331 -0
soe/docs/primitives/signals.md +865 -0
soe/docs_index.py +2 -0
soe/init.py +165 -0
soe/lib/__init__.py +0 -0
soe/lib/child_context.py +46 -0
soe/lib/context_fields.py +51 -0
soe/lib/inheritance.py +172 -0
soe/lib/jinja_render.py +113 -0
soe/lib/operational.py +51 -0
soe/lib/parent_sync.py +71 -0
soe/lib/register_event.py +75 -0
soe/lib/schema_validation.py +134 -0
soe/lib/yaml_parser.py +14 -0
soe/local_backends/__init__.py +18 -0
soe/local_backends/factory.py +124 -0
soe/local_backends/in_memory/context.py +38 -0
soe/local_backends/in_memory/conversation_history.py +60 -0
soe/local_backends/in_memory/identity.py +52 -0
soe/local_backends/in_memory/schema.py +40 -0
soe/local_backends/in_memory/telemetry.py +38 -0
soe/local_backends/in_memory/workflow.py +33 -0
soe/local_backends/storage/context.py +57 -0
soe/local_backends/storage/conversation_history.py +82 -0
soe/local_backends/storage/identity.py +118 -0
soe/local_backends/storage/schema.py +96 -0
soe/local_backends/storage/telemetry.py +72 -0
soe/local_backends/storage/workflow.py +56 -0
soe/nodes/__init__.py +13 -0
soe/nodes/agent/__init__.py +10 -0
soe/nodes/agent/factory.py +134 -0
soe/nodes/agent/lib/loop_handlers.py +150 -0
soe/nodes/agent/lib/loop_state.py +157 -0
soe/nodes/agent/lib/prompts.py +65 -0
soe/nodes/agent/lib/tools.py +35 -0
soe/nodes/agent/stages/__init__.py +12 -0
soe/nodes/agent/stages/parameter.py +37 -0
soe/nodes/agent/stages/response.py +54 -0
soe/nodes/agent/stages/router.py +37 -0
soe/nodes/agent/state.py +111 -0
soe/nodes/agent/types.py +66 -0
soe/nodes/agent/validation/__init__.py +11 -0
soe/nodes/agent/validation/config.py +95 -0
soe/nodes/agent/validation/operational.py +24 -0
soe/nodes/child/__init__.py +3 -0
soe/nodes/child/factory.py +61 -0
soe/nodes/child/state.py +59 -0
soe/nodes/child/validation/__init__.py +11 -0
soe/nodes/child/validation/config.py +126 -0
soe/nodes/child/validation/operational.py +28 -0
soe/nodes/lib/conditions.py +71 -0
soe/nodes/lib/context.py +24 -0
soe/nodes/lib/conversation_history.py +77 -0
soe/nodes/lib/identity.py +64 -0
soe/nodes/lib/llm_resolver.py +142 -0
soe/nodes/lib/output.py +68 -0
soe/nodes/lib/response_builder.py +91 -0
soe/nodes/lib/signal_emission.py +79 -0
soe/nodes/lib/signals.py +54 -0
soe/nodes/lib/tools.py +100 -0
soe/nodes/llm/__init__.py +7 -0
soe/nodes/llm/factory.py +103 -0
soe/nodes/llm/state.py +76 -0
soe/nodes/llm/types.py +12 -0
soe/nodes/llm/validation/__init__.py +11 -0
soe/nodes/llm/validation/config.py +89 -0
soe/nodes/llm/validation/operational.py +23 -0
soe/nodes/router/__init__.py +3 -0
soe/nodes/router/factory.py +37 -0
soe/nodes/router/state.py +32 -0
soe/nodes/router/validation/__init__.py +11 -0
soe/nodes/router/validation/config.py +58 -0
soe/nodes/router/validation/operational.py +16 -0
soe/nodes/tool/factory.py +66 -0
soe/nodes/tool/lib/__init__.py +11 -0
soe/nodes/tool/lib/conditions.py +35 -0
soe/nodes/tool/lib/failure.py +28 -0
soe/nodes/tool/lib/parameters.py +67 -0
soe/nodes/tool/state.py +66 -0
soe/nodes/tool/types.py +27 -0
soe/nodes/tool/validation/__init__.py +15 -0
soe/nodes/tool/validation/config.py +132 -0
soe/nodes/tool/validation/operational.py +16 -0
soe/types.py +209 -0
soe/validation/__init__.py +18 -0
soe/validation/config.py +195 -0
soe/validation/jinja.py +54 -0
soe/validation/operational.py +110 -0
soe_ai-0.2.0b1.dist-info/METADATA +262 -0
soe_ai-0.2.0b1.dist-info/RECORD +145 -0
soe_ai-0.2.0b1.dist-info/WHEEL +5 -0
soe_ai-0.2.0b1.dist-info/licenses/LICENSE +21 -0
soe_ai-0.2.0b1.dist-info/top_level.txt +1 -0

soe/docs/guide_06_schema.md ADDED Viewed

@@ -0,0 +1,397 @@
+# SOE Guide: Chapter 6 - Context Schema
+## Introduction to Context Schema
+**Context Schema** provides optional type validation for context fields. When an LLM node writes to a context field, the schema ensures the output matches the expected type (string, integer, object, etc.).
+> **Note**: This was previously called just "Schema". We renamed it to "Context Schema" to distinguish it from the Identity Schema (see [Chapter 7](guide_07_identity.md)).
+### Why Use Context Schema?
+- **Type Safety**: Catch malformed LLM output before it breaks downstream nodes.
+- **Tool Integration**: Ensure LLM output has the correct structure for tools.
+- **Documentation**: Schema definitions serve as documentation for your workflow's data model.
+- **Removes Prompt Boilerplate**: You don't need to specify output format in every prompt—the schema handles it.
+## Defining a Schema
+Schemas are defined per-workflow, mapping field names to their types:
+```python
+schemas = {
+    "example_workflow": {
+        "summary": {
+            "type": "string",
+            "description": "A one-sentence summary of the input text"
+        }
+    }
+}
+```
+### Available Types
+| Type | Python Type | Description |
+|------|-------------|-------------|
+| `string` | `str` | Text values |
+| `integer` | `int` | Whole numbers |
+| `number` | `float` | Decimal numbers |
+| `boolean` | `bool` | True/False |
+| `object` | `dict` | JSON objects |
+| `list` | `list` | Arrays |
+| `dict` | `dict` | Alias for object |
+## Your First Schema (Full Config)
+Let's validate that an LLM returns a proper string summary using the **combined config** format (workflows + context_schema in one YAML).
+### Full Workflow + Schema (Config)
+```yaml
+workflows:
+  example_workflow:
+    SummarizeLLM:
+      node_type: llm
+      event_triggers: [START]
+      prompt: "Summarize the following text in one sentence: {{ context.input_text }}"
+      output_field: summary
+      event_emissions:
+        - signal_name: SUMMARY_COMPLETE
+context_schema:
+  summary:
+    type: string
+    description: A one-sentence summary of the input text
+```
+### How It Works
+1.  The LLM node is configured with `output_field: summary`.
+2.  The schema backend finds the schema for `summary`.
+3.  The LLM returns the **schema value directly** (no wrapper key).
+4.  If the output is valid, it is saved to context under `summary` and `SUMMARY_COMPLETE` is emitted.
+## Integer Schema (Full Config)
+For numeric outputs like counts or scores:
+### Full Workflow + Schema (Config)
+```yaml
+workflows:
+  example_workflow:
+    CounterLLM:
+      node_type: llm
+      event_triggers: [START]
+      prompt: "Count the number of words in this text: {{ context.input_text }}. Return only the count."
+      output_field: word_count
+      event_emissions:
+        - signal_name: COUNT_COMPLETE
+context_schema:
+  word_count:
+    type: integer
+    description: The number of words in the input text
+```
+The LLM must return `42` (an integer), not `"forty-two"`.
+## Object Schema (Full Config)
+For structured data extraction:
+### Full Workflow + Schema (Config)
+```yaml
+workflows:
+  example_workflow:
+    ExtractorLLM:
+      node_type: llm
+      event_triggers: [START]
+      prompt: "Extract the person's name and age from: {{ context.input_text }}. Return as JSON with 'name' and 'age' fields."
+      output_field: person_data
+      event_emissions:
+        - signal_name: EXTRACTION_COMPLETE
+context_schema:
+  person_data:
+    type: object
+    description: Extracted person data with name and age
+    properties:
+      name:
+        type: string
+      age:
+        type: integer
+```
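+Object schemas accept JSON objects. As shown above, `properties` declares the expected fields; a property can itself be an object with its own `properties`, which lets you describe nested data.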
+### Nested Object Schema (with `properties`)
+```yaml
+context_schema:
+    person_data:
+        type: object
+        description: Person data
+        properties:
+            name:
+                type: string
+            age:
+                type: integer
+            address:
+                type: object
+                properties:
+                    city:
+                        type: string
+                    zip:
+                        type: string
+```
+**Valid LLM output (no wrapper):**
+```json
+{"name": "Bob", "age": 25, "address": {"city": "NYC", "zip": "10001"}}
+```
+## Schema with Tool Integration (Full Config)
+Schema shines when LLM output feeds into tool parameters. This ensures the LLM returns data in the exact format your tool expects.
+### Full Workflow + Schema (Config)
+```yaml
+workflows:
+  example_workflow:
+    ParameterExtractor:
+      node_type: llm
+      event_triggers: [START]
+      prompt: "Extract the operation and numbers from: {{ context.user_request }}. Return JSON with 'operation' (add/multiply) and 'numbers' (list of integers)."
+      output_field: params
+      event_emissions:
+        - signal_name: PARAMS_EXTRACTED
+    Calculator:
+      node_type: tool
+      event_triggers: [PARAMS_EXTRACTED]
+      tool_name: calculate
+      context_parameter_field: params
+      output_field: result
+      event_emissions:
+        - signal_name: CALCULATED
+context_schema:
+  params:
+    type: object
+    description: Extracted parameters with operation and numbers
+    properties:
+      operation:
+        type: string
+      numbers:
+        type: list
+        items:
+          type: integer
+  result:
+    type: object
+    description: Calculation result
+```
+### Data Flow
+1.  `ParameterExtractor` LLM extracts `{ "operation": "add", "numbers": [10, 20, 30] }`.
+2.  Schema validates this is an object (dict).
+3.  `Calculator` tool receives the validated params.
+4.  Tool returns result, also validated against schema.
+## Multiple Fields (Full Config)
+A single workflow can have schemas for multiple fields:
+### Full Workflow + Schema (Config)
+```yaml
+workflows:
+  example_workflow:
+    AnalyzerLLM:
+      node_type: llm
+      event_triggers: [START]
+      prompt: "Analyze this text: {{ context.input_text }}. Extract the topic and key points."
+      output_field: topic
+      event_emissions:
+        - signal_name: TOPIC_EXTRACTED
+    SummarizerLLM:
+      node_type: llm
+      event_triggers: [TOPIC_EXTRACTED]
+      prompt: "Given the topic '{{ context.topic }}', provide a brief summary of: {{ context.input_text }}"
+      output_field: summary
+      event_emissions:
+        - signal_name: ANALYSIS_COMPLETE
+context_schema:
+  topic:
+    type: string
+    description: The main topic of the text
+  summary:
+    type: string
+    description: A brief summary based on the topic
+```
+Each field is validated independently when its LLM node completes.
+## Agent Node + Schema (Full Config)
+```yaml
+workflows:
+  example_workflow:
+    DataAgent:
+      node_type: agent
+      event_triggers: [START]
+      prompt: "Process this request: {{ context.user_request }}"
+      tools: [fetch_data]
+      output_field: response
+      event_emissions:
+        - signal_name: AGENT_COMPLETE
+context_schema:
+  response:
+    type: string
+    description: The agent's final response to the user
+```
+The agent response is validated against the schema for `response`.
+## Schema is Optional (Workflow Only)
+Schemas are completely optional. Workflows work fine without them:
+### The Workflow (No context_schema)
+```yaml
+example_workflow:
+  FreeLLM:
+    node_type: llm
+    event_triggers: [START]
+    prompt: "Do whatever you want with: {{ context.input_text }}"
+    output_field: output
+    event_emissions:
+      - signal_name: DONE
+```
+Without schema, LLM output is saved as-is without validation. This is fine for:
+- Prototyping
+- Free-form text generation
+- When you trust the LLM output format
+## Output Shape (Important)
+When `context_schema` is present, the LLM should return the **schema value directly**:
+- For `string`: `"short summary"`
+- For `integer`: `42`
+- For `object`: `{ "domain": "ECOSYSTEM", "instruction": "..." }`
+- For `list`: `["a", "b", "c"]`
+SOE stores that value under `context[output_field]`.
+## Defining Schemas in Config (Recommended)
+The simplest approach is including `context_schema` directly in your config YAML:
+```yaml
+# Complete config with workflows and context_schema
+workflows:
+  example_workflow:
+    Summarizer:
+      node_type: llm
+      event_triggers: [START]
+      prompt: "Summarize: {{ context.input }}"
+      output_field: summary
+      event_emissions:
+        - signal_name: DONE
+context_schema:
+  summary:
+    type: string
+    description: A one-sentence summary
+  result:
+    type: object
+    description: The workflow result
+```
+Then pass the entire config to orchestrate:
+```python
+from soe import orchestrate
+execution_id = orchestrate(
+    config=CONFIG_YAML,  # The YAML string above
+    initial_workflow_name="example_workflow",
+    initial_signals=["START"],
+    initial_context={"input": "test"},
+    backends=backends,
+    broadcast_signals_caller=broadcast_signals_caller,
+)
+```
+When `context_schema` is included in config:
+1. It's automatically extracted and saved to the `ContextSchemaBackend`
+2. It's keyed by `execution_id` (specifically `main_execution_id`)
+3. Child workflows can access parent's schema through the same `main_execution_id`
+### Backend Requirement
+For context schema to work, you need a `ContextSchemaBackend`. The local backends include one:
+```python
+from soe.local_backends import create_local_backends
+backends = create_local_backends(
+    context_storage_dir="./data/contexts",
+    workflow_storage_dir="./data/workflows",
+    schema_storage_dir="./data/schemas",  # Context schema storage
+)
+```
+**Recommendation**: Use the same database for workflows, context, identities, and context_schema. The backend methods create separate tables, not separate databases. This simplifies infrastructure management.
+## Saving Schemas Programmatically
+You can also work with schemas through the backend directly; the example below reads back the schema stored for a run. Note that schemas are keyed by `execution_id`, not workflow name:
+```python
+from soe import orchestrate
+from soe.local_backends import create_local_backends
+backends = create_local_backends(...)
+# Run orchestrate first to get the execution_id
+execution_id = orchestrate(
+    config=MY_WORKFLOW,
+    initial_workflow_name="my_workflow",
+    initial_signals=["START"],
+    initial_context={"input": "test"},
+    backends=backends,
+    broadcast_signals_caller=broadcast_signals_caller,
+)
+# Retrieve schema (keyed by execution_id)
+schema = backends.context_schema.get_context_schema(execution_id)
+# Get schema for specific field
+field_schema = backends.context_schema.get_field_schema(execution_id, "result")
+```
+**Important**: The preferred approach is defining `context_schema` in your config, which automatically saves it before orchestration begins.
+## Key Points
+- **Optional but powerful**: Use schemas when type safety matters.
+- **Define in config**: Use `context_schema` section in your config for automatic setup.
+- **Keyed by execution_id**: Schemas are stored by `main_execution_id`, enabling child workflow access.
+- **Per-field types**: Each context field can have its own type.
+- **LLM validation**: Ensures LLM output matches expected structure.
+- **Tool integration**: Critical when LLM output feeds tool parameters.
+## Next Steps
+Now that you understand how to validate LLM output structure, let's explore [Identity](guide_07_identity.md) for persisting conversation history across LLM calls →