PyPI - qtype - Versions diffs - 0.0.12__py3-none-any.whl → 0.1.3__py3-none-any.whl - Mend

qtype 0.0.12 (py3-none-any.whl) → 0.1.3 (py3-none-any.whl)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (137)

qtype/application/commons/tools.py +1 -1
qtype/application/converters/tools_from_api.py +476 -11
qtype/application/converters/tools_from_module.py +38 -14
qtype/application/converters/types.py +15 -30
qtype/application/documentation.py +1 -1
qtype/application/facade.py +102 -85
qtype/base/types.py +227 -7
qtype/cli.py +5 -1
qtype/commands/convert.py +52 -6
qtype/commands/generate.py +44 -4
qtype/commands/run.py +78 -36
qtype/commands/serve.py +74 -44
qtype/commands/validate.py +37 -14
qtype/commands/visualize.py +46 -25
qtype/dsl/__init__.py +6 -5
qtype/dsl/custom_types.py +1 -1
qtype/dsl/domain_types.py +86 -5
qtype/dsl/linker.py +384 -0
qtype/dsl/loader.py +315 -0
qtype/dsl/model.py +751 -263
qtype/dsl/parser.py +200 -0
qtype/dsl/types.py +50 -0
qtype/interpreter/api.py +63 -136
qtype/interpreter/auth/aws.py +19 -9
qtype/interpreter/auth/generic.py +93 -16
qtype/interpreter/base/base_step_executor.py +436 -0
qtype/interpreter/base/batch_step_executor.py +171 -0
qtype/interpreter/base/exceptions.py +50 -0
qtype/interpreter/base/executor_context.py +91 -0
qtype/interpreter/base/factory.py +84 -0
qtype/interpreter/base/progress_tracker.py +110 -0
qtype/interpreter/base/secrets.py +339 -0
qtype/interpreter/base/step_cache.py +74 -0
qtype/interpreter/base/stream_emitter.py +469 -0
qtype/interpreter/conversions.py +471 -22
qtype/interpreter/converters.py +79 -0
qtype/interpreter/endpoints.py +355 -0
qtype/interpreter/executors/agent_executor.py +242 -0
qtype/interpreter/executors/aggregate_executor.py +93 -0
qtype/interpreter/executors/bedrock_reranker_executor.py +195 -0
qtype/interpreter/executors/decoder_executor.py +163 -0
qtype/interpreter/executors/doc_to_text_executor.py +112 -0
qtype/interpreter/executors/document_embedder_executor.py +107 -0
qtype/interpreter/executors/document_search_executor.py +113 -0
qtype/interpreter/executors/document_source_executor.py +118 -0
qtype/interpreter/executors/document_splitter_executor.py +105 -0
qtype/interpreter/executors/echo_executor.py +63 -0
qtype/interpreter/executors/field_extractor_executor.py +165 -0
qtype/interpreter/executors/file_source_executor.py +101 -0
qtype/interpreter/executors/file_writer_executor.py +110 -0
qtype/interpreter/executors/index_upsert_executor.py +232 -0
qtype/interpreter/executors/invoke_embedding_executor.py +92 -0
qtype/interpreter/executors/invoke_flow_executor.py +51 -0
qtype/interpreter/executors/invoke_tool_executor.py +358 -0
qtype/interpreter/executors/llm_inference_executor.py +272 -0
qtype/interpreter/executors/prompt_template_executor.py +78 -0
qtype/interpreter/executors/sql_source_executor.py +106 -0
qtype/interpreter/executors/vector_search_executor.py +91 -0
qtype/interpreter/flow.py +173 -22
qtype/interpreter/logging_progress.py +61 -0
qtype/interpreter/metadata_api.py +115 -0
qtype/interpreter/resource_cache.py +5 -4
qtype/interpreter/rich_progress.py +225 -0
qtype/interpreter/stream/chat/__init__.py +15 -0
qtype/interpreter/stream/chat/converter.py +391 -0
qtype/interpreter/{chat → stream/chat}/file_conversions.py +2 -2
qtype/interpreter/stream/chat/ui_request_to_domain_type.py +140 -0
qtype/interpreter/stream/chat/vercel.py +609 -0
qtype/interpreter/stream/utils/__init__.py +15 -0
qtype/interpreter/stream/utils/build_vercel_ai_formatter.py +74 -0
qtype/interpreter/stream/utils/callback_to_stream.py +66 -0
qtype/interpreter/stream/utils/create_streaming_response.py +18 -0
qtype/interpreter/stream/utils/default_chat_extract_text.py +20 -0
qtype/interpreter/stream/utils/error_streaming_response.py +20 -0
qtype/interpreter/telemetry.py +135 -8
qtype/interpreter/tools/__init__.py +5 -0
qtype/interpreter/tools/function_tool_helper.py +265 -0
qtype/interpreter/types.py +330 -0
qtype/interpreter/typing.py +83 -89
qtype/interpreter/ui/404/index.html +1 -1
qtype/interpreter/ui/404.html +1 -1
qtype/interpreter/ui/_next/static/{OT8QJQW3J70VbDWWfrEMT → 20HoJN6otZ_LyHLHpCPE6}/_buildManifest.js +1 -1
qtype/interpreter/ui/_next/static/chunks/434-b2112d19f25c44ff.js +36 -0
qtype/interpreter/ui/_next/static/chunks/{964-ed4ab073db645007.js → 964-2b041321a01cbf56.js} +1 -1
qtype/interpreter/ui/_next/static/chunks/app/{layout-5ccbc44fd528d089.js → layout-a05273ead5de2c41.js} +1 -1
qtype/interpreter/ui/_next/static/chunks/app/page-8c67d16ac90d23cb.js +1 -0
qtype/interpreter/ui/_next/static/chunks/ba12c10f-546f2714ff8abc66.js +1 -0
qtype/interpreter/ui/_next/static/chunks/{main-6d261b6c5d6fb6c2.js → main-e26b9cb206da2cac.js} +1 -1
qtype/interpreter/ui/_next/static/chunks/webpack-08642e441b39b6c2.js +1 -0
qtype/interpreter/ui/_next/static/css/8a8d1269e362fef7.css +3 -0
qtype/interpreter/ui/_next/static/media/4cf2300e9c8272f7-s.p.woff2 +0 -0
qtype/interpreter/ui/icon.png +0 -0
qtype/interpreter/ui/index.html +1 -1
qtype/interpreter/ui/index.txt +5 -5
qtype/semantic/checker.py +643 -0
qtype/semantic/generate.py +268 -85
qtype/semantic/loader.py +95 -0
qtype/semantic/model.py +535 -163
qtype/semantic/resolver.py +63 -19
qtype/semantic/visualize.py +50 -35
{qtype-0.0.12.dist-info → qtype-0.1.3.dist-info}/METADATA +21 -4
qtype-0.1.3.dist-info/RECORD +137 -0
qtype/dsl/base_types.py +0 -38
qtype/dsl/validator.py +0 -464
qtype/interpreter/batch/__init__.py +0 -0
qtype/interpreter/batch/flow.py +0 -95
qtype/interpreter/batch/sql_source.py +0 -95
qtype/interpreter/batch/step.py +0 -63
qtype/interpreter/batch/types.py +0 -41
qtype/interpreter/batch/utils.py +0 -179
qtype/interpreter/chat/chat_api.py +0 -237
qtype/interpreter/chat/vercel.py +0 -314
qtype/interpreter/exceptions.py +0 -10
qtype/interpreter/step.py +0 -67
qtype/interpreter/steps/__init__.py +0 -0
qtype/interpreter/steps/agent.py +0 -114
qtype/interpreter/steps/condition.py +0 -36
qtype/interpreter/steps/decoder.py +0 -88
qtype/interpreter/steps/llm_inference.py +0 -150
qtype/interpreter/steps/prompt_template.py +0 -54
qtype/interpreter/steps/search.py +0 -24
qtype/interpreter/steps/tool.py +0 -53
qtype/interpreter/streaming_helpers.py +0 -123
qtype/interpreter/ui/_next/static/chunks/736-7fc606e244fedcb1.js +0 -36
qtype/interpreter/ui/_next/static/chunks/app/page-c72e847e888e549d.js +0 -1
qtype/interpreter/ui/_next/static/chunks/ba12c10f-22556063851a6df2.js +0 -1
qtype/interpreter/ui/_next/static/chunks/webpack-8289c17c67827f22.js +0 -1
qtype/interpreter/ui/_next/static/css/a262c53826df929b.css +0 -3
qtype/interpreter/ui/_next/static/media/569ce4b8f30dc480-s.p.woff2 +0 -0
qtype/interpreter/ui/favicon.ico +0 -0
qtype/loader.py +0 -389
qtype-0.0.12.dist-info/RECORD +0 -105
qtype/interpreter/ui/_next/static/{OT8QJQW3J70VbDWWfrEMT → 20HoJN6otZ_LyHLHpCPE6}/_ssgManifest.js +0 -0
{qtype-0.0.12.dist-info → qtype-0.1.3.dist-info}/WHEEL +0 -0
{qtype-0.0.12.dist-info → qtype-0.1.3.dist-info}/entry_points.txt +0 -0
{qtype-0.0.12.dist-info → qtype-0.1.3.dist-info}/licenses/LICENSE +0 -0
{qtype-0.0.12.dist-info → qtype-0.1.3.dist-info}/top_level.txt +0 -0

qtype/semantic/model.py CHANGED

@@ -13,18 +13,27 @@ Types are ignored since they should reflect dsl directly, which is type checked.
 from __future__ import annotations
-from typing import Any, Literal
-from pydantic import BaseModel, Field, model_validator
-# Import enums and type aliases from DSL
+from functools import partial
+from typing import Any, Literal, Union
+from pydantic import BaseModel, Field
+# Import enums, mixins, and type aliases
+from qtype.base.types import (  # noqa: F401
+    BatchableStepMixin,
+    BatchConfig,
+    CachedStepMixin,
+    ConcurrencyConfig,
+    ConcurrentStepMixin,
+)
 from qtype.dsl.model import VariableType  # noqa: F401
 from qtype.dsl.model import (  # noqa: F401
     CustomType,
     DecoderFormat,
+    ListType,
     PrimitiveTypeEnum,
     StepCardinality,
-    StructuralTypeEnum,
+    ToolParameter,
 )
 from qtype.dsl.model import Variable as DSLVariable  # noqa: F401
 from qtype.semantic.base_types import ImmutableModel
@@ -48,6 +57,58 @@ class AuthorizationProvider(ImmutableModel):
     type: str = Field(..., description="Authorization method type.")
+class Tool(ImmutableModel):
+    """
+    Base class for callable functions or external operations available to the model or as a step in a flow.
+    """
+    id: str = Field(..., description="Unique ID of this component.")
+    name: str = Field(..., description="Name of the tool function.")
+    description: str = Field(
+        ..., description="Description of what the tool does."
+    )
+    inputs: dict[str, ToolParameter] = Field(
+        default_factory=dict,
+        description="Input parameters required by this tool.",
+    )
+    outputs: dict[str, ToolParameter] = Field(
+        default_factory=dict,
+        description="Output parameters produced by this tool.",
+    )
+class SecretManager(BaseModel):
+    """Base class for secret manager configurations."""
+    id: str = Field(
+        ..., description="Unique ID for this secret manager configuration."
+    )
+    type: str = Field(..., description="The type of secret manager.")
+    auth: AuthorizationProvider = Field(
+        ...,
+        description="AuthorizationProvider used to access this secret manager.",
+    )
+class Step(CachedStepMixin, BaseModel):
+    """Base class for components that take inputs and produce outputs."""
+    id: str = Field(..., description="Unique ID of this component.")
+    type: str = Field(..., description="Type of the step component.")
+    cardinality: StepCardinality = Field(
+        StepCardinality.one,
+        description="Does this step emit 1 (one) or 0...N (many) instances of the outputs?",
+    )
+    inputs: list[Variable] = Field(
+        default_factory=list,
+        description="References to the variables required by this step.",
+    )
+    outputs: list[Variable] = Field(
+        default_factory=list,
+        description="References to the variables where output is stored.",
+    )
 class Application(BaseModel):
     """Defines a complete QType application specification.
@@ -64,51 +125,52 @@ class Application(BaseModel):
         None, description="Optional description of the application."
     )
     memories: list[Memory] = Field(
-        [], description="List of memory definitions used in this application."
+        default_factory=list,
+        description="List of memory definitions used in this application.",
     )
     models: list[Model] = Field(
-        [], description="List of models used in this application."
+        default_factory=list,
+        description="List of models used in this application.",
     )
     types: list[CustomType] = Field(
-        [], description="List of custom types defined in this application."
-    )
-    variables: list[Variable] = Field(
-        [], description="List of variables used in this application."
+        default_factory=list,
+        description="List of custom types defined in this application.",
     )
     flows: list[Flow] = Field(
-        [], description="List of flows defined in this application."
+        default_factory=list,
+        description="List of flows defined in this application.",
     )
-    auths: list[APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider] = (
-        Field(
-            [],
-            description="List of authorization providers used for API access.",
-        )
+    auths: list[AuthorizationProvider] = Field(
+        default_factory=list,
+        description="List of authorization providers used for API access.",
     )
     tools: list[Tool] = Field(
-        [], description="List of tools available in this application."
+        default_factory=list,
+        description="List of tools available in this application.",
     )
     indexes: list[Index] = Field(
-        [], description="List of indexes available for search operations."
+        default_factory=list,
+        description="List of indexes available for search operations.",
+    )
+    secret_manager: AWSSecretManager | None = Field(
+        None,
+        description="Optional secret manager configuration for the application.",
     )
     telemetry: TelemetrySink | None = Field(
         None, description="Optional telemetry sink for observability."
     )
-class Step(BaseModel):
-    """Base class for components that take inputs and produce outputs."""
+class AuthorizationProviderList(BaseModel):
+    """Schema for a standalone list of authorization providers."""
-    id: str = Field(..., description="Unique ID of this component.")
-    cardinality: StepCardinality = Field(
-        StepCardinality.one,
-        description="Does this step emit 1 (one) or 0...N (many) instances of the outputs?",
-    )
-    inputs: list[Variable] = Field(
-        [], description="Input variables required by this step."
-    )
-    outputs: list[Variable] = Field(
-        [], description="Variable where output is stored."
-    )
+    root: list[AuthorizationProvider] = Field(...)
+class ConstantPath(BaseModel):
+    """Semantic version of ConstantPath."""
+    uri: str = Field(..., description="A constant Fsspec URI.")
 class Index(ImmutableModel):
@@ -116,13 +178,11 @@ class Index(ImmutableModel):
     id: str = Field(..., description="Unique ID of the index.")
     args: dict[str, Any] = Field(
-        {},
+        default_factory=dict,
         description="Index-specific configuration and connection parameters.",
     )
-    auth: APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider | None = (
-        Field(
-            None, description="AuthorizationProvider for accessing the index."
-        )
+    auth: AuthorizationProvider | None = Field(
+        None, description="AuthorizationProvider for accessing the index."
     )
     name: str = Field(..., description="Name of the index/collection/table.")
@@ -130,20 +190,64 @@ class Index(ImmutableModel):
 class Model(ImmutableModel):
     """Describes a generative model configuration, including provider and model ID."""
+    type: Literal["Model"] = Field("Model")
     id: str = Field(..., description="Unique ID for the model.")
-    auth: APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider | None = (
-        Field(None, description="AuthorizationProvider used for model access.")
+    auth: AuthorizationProvider | None = Field(
+        None, description="AuthorizationProvider used for model access."
     )
     inference_params: dict[str, Any] = Field(
-        {},
+        default_factory=dict,
         description="Optional inference parameters like temperature or max_tokens.",
     )
     model_id: str | None = Field(
         None,
         description="The specific model name or ID for the provider. If None, id is used",
     )
-    provider: str = Field(
-        ..., description="Name of the provider, e.g., openai or anthropic."
+    provider: Literal["openai", "anthropic", "aws-bedrock", "gcp-vertex"] = (
+        Field(
+            ..., description="Name of the provider, e.g., openai or anthropic."
+        )
+    )
+class Flow(BaseModel):
+    """Defines a flow of steps that can be executed in sequence or parallel.
+    If input or output variables are not specified, they are inferred from
+    the first and last step, respectively."""
+    id: str = Field(..., description="Unique ID of the flow.")
+    type: Literal["Flow"] = Field("Flow")
+    description: str | None = Field(
+        None, description="Optional description of the flow."
+    )
+    steps: list[Step | Step] = Field(
+        default_factory=list,
+        description="List of steps or references to steps",
+    )
+    interface: FlowInterface | None = Field(None)
+    variables: list[Variable] = Field(
+        default_factory=list,
+        description="List of variables available at the application scope.",
+    )
+    inputs: list[Variable] = Field(
+        default_factory=list,
+        description="Input variables required by this step.",
+    )
+    outputs: list[Variable] = Field(
+        default_factory=list, description="Resulting variables"
+    )
+class FlowInterface(BaseModel):
+    """
+    Defines the public-facing contract for a Flow, guiding the UI
+    and session management.
+    """
+    type: Literal["Complete", "Conversational"] = Field("Complete")
+    session_inputs: list[Variable] = Field(
+        default_factory=list,
+        description="A list of input variable IDs that are set once and then persisted across a session.",
     )
@@ -163,28 +267,73 @@ class Memory(ImmutableModel):
     )
+class ModelList(BaseModel):
+    """Schema for a standalone list of models."""
+    root: list[Model] = Field(...)
+class SecretReference(BaseModel):
+    """
+    A reference to a secret in the application's configured SecretManager.
+    This value is resolved at runtime by the interpreter.
+    """
+    secret_name: str = Field(
+        ...,
+        description="The name, ID, or ARN of the secret to fetch (e.g., 'my-project/db-password').",
+    )
+    key: str | None = Field(
+        None,
+        description="Optional key if the secret is a JSON blob or map (e.g., a specific key in a K8s secret).",
+    )
 class TelemetrySink(BaseModel):
     """Defines an observability endpoint for collecting telemetry data from the QType runtime."""
     id: str = Field(
         ..., description="Unique ID of the telemetry sink configuration."
     )
-    auth: APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider | None = (
-        Field(
-            None,
-            description="AuthorizationProvider used to authenticate telemetry data transmission.",
-        )
+    provider: Literal["Phoenix", "Langfuse"] = Field("Phoenix")
+    auth: AuthorizationProvider | None = Field(
+        None,
+        description="AuthorizationProvider used to authenticate telemetry data transmission.",
     )
-    endpoint: str = Field(
+    endpoint: str | SecretReference = Field(
         ..., description="URL endpoint where telemetry data will be sent."
     )
+    args: dict[str, Any] = Field(
+        default_factory=dict,
+        description="Additional configuration arguments specific to the telemetry sink type.",
+    )
+class ToolList(BaseModel):
+    """Schema for a standalone list of tools."""
+    root: list[Tool] = Field(...)
+class TypeList(BaseModel):
+    """Schema for a standalone list of type definitions."""
+    root: list[CustomType] = Field(...)
+class VariableList(BaseModel):
+    """Schema for a standalone list of variables."""
+    root: list[Variable] = Field(...)
 class APIKeyAuthProvider(AuthorizationProvider):
     """API key-based authentication provider."""
     type: Literal["api_key"] = Field("api_key")
-    api_key: str = Field(..., description="API key for authentication.")
+    api_key: str | SecretReference = Field(
+        ..., description="API key for authentication."
+    )
     host: str | None = Field(
         None, description="Base URL or domain of the provider."
     )
@@ -194,11 +343,13 @@ class AWSAuthProvider(AuthorizationProvider):
     """AWS authentication provider supporting multiple credential methods."""
     type: Literal["aws"] = Field("aws")
-    access_key_id: str | None = Field(None, description="AWS access key ID.")
-    secret_access_key: str | None = Field(
+    access_key_id: str | SecretReference | None = Field(
+        None, description="AWS access key ID."
+    )
+    secret_access_key: str | SecretReference | None = Field(
         None, description="AWS secret access key."
     )
-    session_token: str | None = Field(
+    session_token: str | SecretReference | None = Field(
         None, description="AWS session token for temporary credentials."
     )
     profile_name: str | None = Field(
@@ -216,50 +367,251 @@ class AWSAuthProvider(AuthorizationProvider):
     region: str | None = Field(None, description="AWS region.")
+class BearerTokenAuthProvider(AuthorizationProvider):
+    """Bearer token authentication provider."""
+    type: Literal["bearer_token"] = Field("bearer_token")
+    token: str | SecretReference = Field(
+        ..., description="Bearer token for authentication."
+    )
 class OAuth2AuthProvider(AuthorizationProvider):
     """OAuth2 authentication provider."""
     type: Literal["oauth2"] = Field("oauth2")
     client_id: str = Field(..., description="OAuth2 client ID.")
-    client_secret: str = Field(..., description="OAuth2 client secret.")
+    client_secret: str | SecretReference = Field(
+        ..., description="OAuth2 client secret."
+    )
     token_url: str = Field(..., description="Token endpoint URL.")
-    scopes: list[str] = Field([], description="OAuth2 scopes required.")
+    scopes: list[str] = Field(
+        default_factory=list, description="OAuth2 scopes required."
+    )
+class VertexAuthProvider(AuthorizationProvider):
+    """Google Vertex authentication provider supporting gcloud profile or service account."""
+    type: Literal["vertex"] = Field("vertex")
+    profile_name: str | None = Field(
+        None,
+        description="Local gcloud profile name (if using existing CLI credentials).",
+    )
+    project_id: str | None = Field(
+        None,
+        description="Explicit GCP project ID override (if different from profile).",
+    )
+    service_account_file: str | None = Field(
+        None, description="Path to a service account JSON key file."
+    )
+    region: str | None = Field(
+        None, description="Vertex region (e.g., us-central1)."
+    )
-class Condition(Step):
-    """Conditional logic gate within a flow. Supports branching logic for execution based on variable values."""
+class APITool(Tool):
+    """Tool that invokes an API endpoint."""
-    else_: Step | None = Field(
+    type: Literal["APITool"] = Field("APITool")
+    endpoint: str = Field(..., description="API endpoint URL to call.")
+    method: str = Field(
+        "GET", description="HTTP method to use (GET, POST, PUT, DELETE, etc.)."
+    )
+    auth: AuthorizationProvider | None = Field(
         None,
-        description="Optional step to run if condition fails.",
-        alias="else",
+        description="Optional AuthorizationProvider for API authentication.",
+    )
+    headers: dict[str, str] = Field(
+        default_factory=dict,
+        description="Optional HTTP headers to include in the request.",
+    )
+    parameters: dict[str, ToolParameter] = Field(
+        default_factory=dict,
+        description="Output parameters produced by this tool.",
+    )
+class PythonFunctionTool(Tool):
+    """Tool that calls a Python function."""
+    type: Literal["PythonFunctionTool"] = Field("PythonFunctionTool")
+    function_name: str = Field(
+        ..., description="Name of the Python function to call."
     )
-    equals: Variable | None = Field(
-        None, description="Match condition for equality check."
+    module_path: str = Field(
+        ..., description="Optional module path where the function is defined."
+    )
+class AWSSecretManager(SecretManager):
+    """Configuration for AWS Secrets Manager."""
+    type: Literal["aws_secret_manager"] = Field("aws_secret_manager")
+class Aggregate(Step):
+    """
+    A terminal step that consumes an entire input stream and produces a single
+    summary message with success/error counts.
+    """
+    type: Literal["Aggregate"] = Field("Aggregate")
+    cardinality: Literal[StepCardinality.one] = Field(StepCardinality.one)
+    outputs: list[Variable] = Field(
+        default_factory=list,
+        description="References to the variables for the output. There should be one and only one output with type AggregateStats",
     )
-    then: Step = Field(..., description="Step to run if condition matches.")
 class Decoder(Step):
     """Defines a step that decodes string data into structured outputs.
     If parsing fails, the step will raise an error and halt execution.
-    Use conditional logic in your flow to handle potential parsing errors.
-    """
+    Use conditional logic in your flow to handle potential parsing errors."""
+    type: Literal["Decoder"] = Field("Decoder")
     format: DecoderFormat = Field(
         DecoderFormat.json,
         description="Format in which the decoder processes data. Defaults to JSON.",
     )
-class LLMInference(Step):
+class DocToTextConverter(Step, ConcurrentStepMixin):
+    """Defines a step to convert raw documents (e.g., PDF, DOCX) loaded by a DocumentSource into plain text
+    using an external tool like Docling or LlamaParse for pre-processing before chunking.
+    The input and output are both RAGDocument, but the output after processing with have content of type markdown.
+    """
+    type: Literal["DocToTextConverter"] = Field("DocToTextConverter")
+class DocumentEmbedder(Step, ConcurrentStepMixin):
+    """Embeds document chunks using a specified embedding model."""
+    type: Literal["DocumentEmbedder"] = Field("DocumentEmbedder")
+    cardinality: Literal[StepCardinality.many] = Field(
+        StepCardinality.many,
+        description="Consumes one chunk and emits one embedded chunk.",
+    )
+    model: EmbeddingModel = Field(
+        ..., description="Embedding model to use for vectorization."
+    )
+class DocumentSplitter(Step, ConcurrentStepMixin):
+    """Configuration for chunking/splitting documents into embeddable nodes/chunks."""
+    type: Literal["DocumentSplitter"] = Field("DocumentSplitter")
+    cardinality: Literal[StepCardinality.many] = Field(
+        StepCardinality.many,
+        description="Consumes one document and emits 0...N nodes/chunks.",
+    )
+    splitter_name: str = Field(
+        "SentenceSplitter",
+        description="Name of the LlamaIndex TextSplitter class.",
+    )
+    chunk_size: int = Field(1024, description="Size of each chunk.")
+    chunk_overlap: int = Field(
+        20, description="Overlap between consecutive chunks."
+    )
+    args: dict[str, Any] = Field(
+        default_factory=dict,
+        description="Additional arguments specific to the chosen splitter class.",
+    )
+class Echo(Step):
+    """Defines a step that echoes its inputs as outputs.
+    Useful for debugging flows by inspecting variable values at a specific
+    point in the execution pipeline. The step simply passes through all input
+    variables as outputs without modification.
+    """
+    type: Literal["Echo"] = Field("Echo")
+class FieldExtractor(Step):
+    """Extracts specific fields from input data using JSONPath expressions.
+    This step uses JSONPath syntax to extract data from structured inputs
+    (Pydantic models, dicts, lists). The input is first converted to a dict
+    using model_dump() if it's a Pydantic model, then the JSONPath expression
+    is evaluated.
+    If the JSONPath matches multiple values, the step yields multiple output
+    messages (1-to-many cardinality). If it matches a single value, it yields
+    one output message. If it matches nothing, it raises an error.
+    The extracted data is used to construct the output variable by passing it
+    as keyword arguments to the output type's constructor.
+    Example JSONPath expressions:
+    - `$.field_name` - Extract a single field
+    - `$.items[*]` - Extract all items from a list
+    - `$.items[?(@.price > 10)]` - Filter items by condition
+    """
+    type: Literal["FieldExtractor"] = Field("FieldExtractor")
+    json_path: str = Field(
+        ...,
+        description="JSONPath expression to extract data from the input. Uses jsonpath-ng syntax.",
+    )
+    fail_on_missing: bool = Field(
+        True,
+        description="Whether to raise an error if the JSONPath matches no data. If False, returns None.",
+    )
+class InvokeEmbedding(Step, ConcurrentStepMixin):
+    """Defines a step that generates embeddings using an embedding model.
+    It takes input variables and produces output variables containing the embeddings."""
+    type: Literal["InvokeEmbedding"] = Field("InvokeEmbedding")
+    model: EmbeddingModel = Field(
+        ..., description="The embedding model to use."
+    )
+class InvokeFlow(Step):
+    """Invokes a flow with input and output bindings."""
+    type: Literal["InvokeFlow"] = Field("InvokeFlow")
+    flow: Flow = Field(..., description="Flow to invoke.")
+    input_bindings: dict[Variable, str] = Field(
+        ...,
+        description="Mapping from variable references to flow input variable IDs.",
+    )
+    output_bindings: dict[Variable, str] = Field(
+        ...,
+        description="Mapping from variable references to flow output variable IDs.",
+    )
+class InvokeTool(Step, ConcurrentStepMixin):
+    """Invokes a tool with input and output bindings."""
+    type: Literal["InvokeTool"] = Field("InvokeTool")
+    tool: Tool = Field(..., description="Tool to invoke.")
+    input_bindings: dict[str, str] = Field(
+        ...,
+        description="Mapping from variable references to tool input parameter names.",
+    )
+    output_bindings: dict[str, str] = Field(
+        ...,
+        description="Mapping from variable references to tool output parameter names.",
+    )
+class LLMInference(Step, ConcurrentStepMixin):
     """Defines a step that performs inference using a language model.
     It can take input variables and produce output variables based on the model's response."""
+    type: Literal["LLMInference"] = Field("LLMInference")
     memory: Memory | None = Field(
         None,
-        description="Memory object to retain context across interactions.",
+        description="A reference to a Memory object to retain context across interactions.",
     )
     model: Model = Field(..., description="The model to use for inference.")
     system_message: str | None = Field(
@@ -272,30 +624,32 @@ class PromptTemplate(Step):
     """Defines a prompt template with a string format and variable bindings.
     This is used to generate prompts dynamically based on input variables."""
+    type: Literal["PromptTemplate"] = Field("PromptTemplate")
     template: str = Field(
         ...,
         description="String template for the prompt with variable placeholders.",
     )
+class Reranker(Step):
+    """Reranks a list of documents based on relevance to a query using an LLM."""
+    type: Literal["Reranker"] = Field("Reranker")
 class Search(Step):
     """Base class for search operations against indexes."""
     filters: dict[str, Any] = Field(
-        {}, description="Optional filters to apply during search."
+        default_factory=dict,
+        description="Optional filters to apply during search.",
     )
     index: Index = Field(
         ..., description="Index to search against (object or ID reference)."
     )
-class Sink(Step):
-    """Base class for data sinks"""
-    id: str = Field(..., description="Unique ID of the data sink.")
-    cardinality: Literal["one"] = Field(
-        StepCardinality.one,
-        description="Flows always emit exactly one instance of the outputs.",
+    default_top_k: int | None = Field(
+        10,
+        description="Number of top results to retrieve if not provided in the inputs.",
     )
@@ -303,32 +657,40 @@ class Source(Step):
     """Base class for data sources"""
     id: str = Field(..., description="Unique ID of the data source.")
-    cardinality: Literal["many"] = Field(
+    cardinality: Literal[StepCardinality.many] = Field(
         StepCardinality.many,
         description="Sources always emit 0...N instances of the outputs.",
     )
-class Tool(Step, ImmutableModel):
-    """
-    Base class for callable functions or external operations available to the model or as a step in a flow.
-    """
+class Writer(Step, BatchableStepMixin):
+    """Base class for things that write data in batches."""
-    name: str = Field(..., description="Name of the tool function.")
-    description: str = Field(
-        ..., description="Description of what the tool does."
-    )
+    id: str = Field(..., description="Unique ID of the data writer.")
 class DocumentIndex(Index):
     """Document search index for text-based search (e.g., Elasticsearch, OpenSearch)."""
-    pass
+    type: Literal["DocumentIndex"] = Field("DocumentIndex")
+    endpoint: str = Field(
+        ...,
+        description="URL endpoint for the search cluster (e.g., https://my-cluster.es.amazonaws.com).",
+    )
+    id_field: str | None = Field(
+        None,
+        description="Field name to use as document ID. If not specified, auto-detects from: _id, id, doc_id, document_id, or uuid. If all are missing, a UUID is generated.",
+    )
 class VectorIndex(Index):
     """Vector database index for similarity search using embeddings."""
+    type: Literal["VectorIndex"] = Field("VectorIndex")
+    module: str = Field(
+        ...,
+        description="Python module path for the vector store implementation (e.g., 'llama_index.vector_stores.qdrant.QdrantVectorStore').",
+    )
     embedding_model: EmbeddingModel = Field(
         ...,
         description="Embedding model used to vectorize queries and documents.",
@@ -338,6 +700,7 @@ class VectorIndex(Index):
 class EmbeddingModel(Model):
     """Describes an embedding model configuration, extending the base Model class."""
+    type: Literal["EmbeddingModel"] = Field("EmbeddingModel")
     dimensions: int = Field(
         ...,
         description="Dimensionality of the embedding vectors produced by this model.",
@@ -347,121 +710,130 @@ class EmbeddingModel(Model):
 class Agent(LLMInference):
     """Defines an agent that can perform tasks and make decisions based on user input and context."""
+    type: Literal["Agent"] = Field("Agent")
     tools: list[Tool] = Field(
-        ..., description="List of tools available to the agent."
+        default_factory=list,
+        description="List of tools available to the agent.",
     )
-class DocumentSearch(Search):
+class BedrockReranker(Reranker, ConcurrentStepMixin):
+    """Reranks documents using an AWS Bedrock model."""
+    type: Literal["BedrockReranker"] = Field("BedrockReranker")
+    auth: AWSAuthProvider | None = Field(
+        None, description="AWS authorization provider for Bedrock access."
+    )
+    model_id: str = Field(
+        ...,
+        description="Bedrock model ID to use for reranking. See https://docs.aws.amazon.com/bedrock/latest/userguide/rerank-supported.html",
+    )
+    num_results: int | None = Field(
+        None, description="Return this many results."
+    )
+class DocumentSearch(Search, ConcurrentStepMixin):
     """Performs document search against a document index."""
-    pass
+    type: Literal["DocumentSearch"] = Field("DocumentSearch")
+    index: DocumentIndex = Field(
+        ..., description="Index to search against (object or ID reference)."
+    )
+    query_args: dict[str, Any] = Field(
+        {"type": "best_fields", "fields": ["*"]},
+        description="The arguments (other than 'query') to specify to the query shape (see https://docs.opensearch.org/latest/query-dsl/full-text/multi-match/).",
+    )
-class VectorSearch(Search):
+class VectorSearch(Search, BatchableStepMixin):
     """Performs vector similarity search against a vector index."""
-    default_top_k: int | None = Field(
-        50,
-        description="Number of top results to retrieve if not provided in the inputs.",
+    type: Literal["VectorSearch"] = Field("VectorSearch")
+    index: VectorIndex = Field(
+        ..., description="Index to search against (object or ID reference)."
     )
-class IndexUpsert(Sink):
-    """Semantic version of IndexUpsert."""
+class DocumentSource(Source):
+    """A source of documents that will be used in retrieval augmented generation.
+    It uses LlamaIndex readers to load one or more raw Documents
+    from a specified path or system (e.g., Google Drive, web page).
+    See https://github.com/run-llama/llama_index/tree/main/llama-index-integrations/readers
+    """
-    index: Index = Field(
-        ..., description="Index to upsert into (object or ID reference)."
+    type: Literal["DocumentSource"] = Field("DocumentSource")
+    reader_module: str = Field(
+        ..., description="Module path of the LlamaIndex Reader)."
+    )
+    args: dict[str, Any] = Field(
+        default_factory=dict,
+        description="Reader-specific arguments to pass to the Reader constructor.",
+    )
+    loader_args: dict[str, Any] = Field(
+        default_factory=dict,
+        description="Loader-specific arguments to pass to the load_data method.",
+    )
+    auth: AuthorizationProvider | None = Field(
+        None, description="AuthorizationProvider for accessing the source."
     )
-class SQLSource(Source):
-    """SQL database source that executes queries and emits rows."""
+class FileSource(Source):
+    """File source that reads data from a file using fsspec-compatible URIs."""
-    query: str = Field(
-        ..., description="SQL query to execute. Inputs are injected as params."
-    )
-    connection: str = Field(
+    type: Literal["FileSource"] = Field("FileSource")
+    path: ConstantPath | Variable = Field(
         ...,
-        description="Database connection string or reference to auth provider. Typically in SQLAlchemy format.",
-    )
-    auth: APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider | None = (
-        Field(
-            None,
-            description="Optional AuthorizationProvider for database authentication.",
-        )
+        description="Reference to a variable with an fsspec-compatible URI to read from, or the uri itself.",
     )
-class SourceType(Source):
+class SQLSource(Source):
     """SQL database source that executes queries and emits rows."""
+    type: Literal["SQLSource"] = Field("SQLSource")
     query: str = Field(
         ..., description="SQL query to execute. Inputs are injected as params."
     )
-    connection: str = Field(
+    connection: str | SecretReference = Field(
         ...,
         description="Database connection string or reference to auth provider. Typically in SQLAlchemy format.",
     )
-    auth: APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider | None = (
-        Field(
-            None,
-            description="Optional AuthorizationProvider for database authentication.",
-        )
+    auth: AuthorizationProvider | None = Field(
+        None,
+        description="Optional AuthorizationProvider for database authentication.",
     )
-class APITool(Tool):
-    """Tool that invokes an API endpoint."""
+class FileWriter(Writer, BatchableStepMixin):
+    """File writer that writes data to a file using fsspec-compatible URIs."""
-    endpoint: str = Field(..., description="API endpoint URL to call.")
-    method: str = Field(
-        "GET", description="HTTP method to use (GET, POST, PUT, DELETE, etc.)."
-    )
-    auth: APIKeyAuthProvider | AWSAuthProvider | OAuth2AuthProvider | None = (
-        Field(
-            None,
-            description="Optional AuthorizationProvider for API authentication.",
-        )
+    type: Literal["FileWriter"] = Field("FileWriter")
+    path: ConstantPath | Variable = Field(
+        ...,
+        description="Reference to a variable with an fsspec-compatible URI to read from, or the uri itself.",
     )
-    headers: dict[str, str] = Field(
-        {}, description="Optional HTTP headers to include in the request."
+    batch_config: BatchConfig = Field(
+        default_factory=partial(BatchConfig, batch_size=9223372036854775807),
+        description="Configuration for processing the input stream in batches. If omitted, the step processes items one by one.",
     )
-class PythonFunctionTool(Tool):
-    """Tool that calls a Python function."""
+class IndexUpsert(Writer):
+    """Semantic version of IndexUpsert."""
-    function_name: str = Field(
-        ..., description="Name of the Python function to call."
-    )
-    module_path: str = Field(
-        ..., description="Optional module path where the function is defined."
+    type: Literal["IndexUpsert"] = Field("IndexUpsert")
+    index: Index = Field(
+        ..., description="Index to upsert into (object or ID reference)."
     )
-class Flow(Step):
-    """Defines a flow of steps that can be executed in sequence or parallel.
-    If input or output variables are not specified, they are inferred from
-    the first and last step, respectively.
-    """
-    description: str | None = Field(
-        None, description="Optional description of the flow."
-    )
-    cardinality: StepCardinality = Field(
-        StepCardinality.auto,
-        description="The cardinality of the flow, inferred from its steps when set to 'auto'.",
-    )
-    mode: Literal["Complete", "Chat"] = Field("Complete")
-    steps: list[Step] = Field(..., description="List of steps or step IDs.")
-    @model_validator(mode="after")
-    def infer_cardinality(self) -> "Flow":
-        if self.cardinality == StepCardinality.auto:
-            self.cardinality = StepCardinality.one
-            for step in self.steps:
-                if step.cardinality == StepCardinality.many:
-                    self.cardinality = StepCardinality.many
-                    break
-        return self
+DocumentType = Union[
+    Application,
+    AuthorizationProviderList,
+    ModelList,
+    ToolList,
+    TypeList,
+    VariableList,
+]

qtype 0.0.12__py3-none-any.whl → 0.1.3__py3-none-any.whl

qtype 0.0.12py3-none-any.whl → 0.1.3py3-none-any.whl