PyPI - ostruct-cli - Versions diffs - 0.6.0__py3-none-any.whl → 0.6.2__py3-none-any.whl - Mend

ostruct-cli 0.6.0py3-none-any.whl → 0.6.2py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (15) hide show

ostruct/cli/cli.py +195 -412
ostruct/cli/errors.py +61 -54
ostruct/cli/model_creation.py +480 -0
ostruct/cli/security/errors.py +1 -1
ostruct/cli/security/normalization.py +1 -1
ostruct/cli/security/security_manager.py +48 -7
ostruct/cli/template_extensions.py +32 -1
ostruct/cli/template_utils.py +175 -16
ostruct/cli/utils.py +3 -1
ostruct/cli/validators.py +6 -2
{ostruct_cli-0.6.0.dist-info → ostruct_cli-0.6.2.dist-info}/METADATA +39 -177
{ostruct_cli-0.6.0.dist-info → ostruct_cli-0.6.2.dist-info}/RECORD +15 -14
{ostruct_cli-0.6.0.dist-info → ostruct_cli-0.6.2.dist-info}/LICENSE +0 -0
{ostruct_cli-0.6.0.dist-info → ostruct_cli-0.6.2.dist-info}/WHEEL +0 -0
{ostruct_cli-0.6.0.dist-info → ostruct_cli-0.6.2.dist-info}/entry_points.txt +0 -0

ostruct/cli/errors.py CHANGED Viewed

@@ -323,60 +323,6 @@ class SchemaFileError(CLIError):
         return self.context.get("schema_path")
-class SchemaValidationError(CLIError):
-    """Error raised when a schema fails validation."""
-    def __init__(
-        self,
-        message: str,
-        context: Optional[Dict[str, Any]] = None,
-    ):
-        context = context or {}
-        # Format error message with tips
-        formatted_message = [message]
-        if "path" in context:
-            formatted_message.append(f"\nLocation: {context['path']}")
-        if "found" in context:
-            formatted_message.append(f"Found: {context['found']}")
-        if "count" in context:
-            formatted_message.append(f"Count: {context['count']}")
-        if "missing_required" in context:
-            formatted_message.append(
-                f"Missing required: {context['missing_required']}"
-            )
-        if "extra_required" in context:
-            formatted_message.append(
-                f"Extra required: {context['extra_required']}"
-            )
-        if "prohibited_used" in context:
-            formatted_message.append(
-                f"Prohibited keywords used: {context['prohibited_used']}"
-            )
-        if "tips" in context:
-            formatted_message.append("\nHow to fix:")
-            for tip in context["tips"]:
-                if isinstance(tip, dict):
-                    # Format JSON example
-                    formatted_message.append("Example schema:")
-                    formatted_message.append(json.dumps(tip, indent=2))
-                else:
-                    formatted_message.append(f"- {tip}")
-        super().__init__(
-            "\n".join(formatted_message),
-            context=context,
-            exit_code=ExitCode.SCHEMA_ERROR,
-        )
 class ModelCreationError(CLIError):
     """Base class for model creation errors."""
@@ -496,6 +442,67 @@ class OpenAIClientError(CLIError):
         super().__init__(message, exit_code=exit_code, context=context)
+class SchemaValidationError(ModelCreationError):
+    """Raised when schema validation fails."""
+    def __init__(
+        self,
+        message: str,
+        context: Optional[Dict[str, Any]] = None,
+        exit_code: ExitCode = ExitCode.SCHEMA_ERROR,
+    ):
+        context = context or {}
+        # Preserve validation type for error handling
+        context.setdefault("validation_type", "schema")
+        # Format error message with tips
+        formatted_message = []
+        if "path" in context:
+            formatted_message.append(f"\nLocation: {context['path']}")
+        if "found" in context:
+            formatted_message.append(f"Found: {context['found']}")
+        if "reference" in context:
+            formatted_message.append(f"Reference: {context['reference']}")
+        if "count" in context:
+            formatted_message.append(f"Count: {context['count']}")
+        if "missing_required" in context:
+            formatted_message.append(
+                f"Missing required: {context['missing_required']}"
+            )
+        if "extra_required" in context:
+            formatted_message.append(
+                f"Extra required: {context['extra_required']}"
+            )
+        if "prohibited_used" in context:
+            formatted_message.append(
+                f"Prohibited keywords used: {context['prohibited_used']}"
+            )
+        if "tips" in context:
+            formatted_message.append("\nHow to fix:")
+            for tip in context["tips"]:
+                if isinstance(tip, dict):
+                    # Format JSON example
+                    formatted_message.append("Example schema:")
+                    formatted_message.append(json.dumps(tip, indent=2))
+                else:
+                    formatted_message.append(f"- {tip}")
+        # Combine message with details
+        final_message = message
+        if formatted_message:
+            final_message += "\n" + "\n".join(formatted_message)
+        super().__init__(final_message, context=context, exit_code=exit_code)
 # Export public API
 __all__ = [
     "VariableError",

ostruct/cli/model_creation.py ADDED Viewed

@@ -0,0 +1,480 @@
+"""Model creation utilities for the CLI."""
+import json
+import logging
+import sys
+from datetime import date, datetime, time
+from enum import Enum, IntEnum
+from typing import (
+    Any,
+    Dict,
+    List,
+    Optional,
+    Tuple,
+    Type,
+    Union,
+    cast,
+    get_origin,
+)
+if sys.version_info >= (3, 11):
+    from enum import StrEnum
+from pydantic import (
+    AnyUrl,
+    BaseModel,
+    ConfigDict,
+    EmailStr,
+    Field,
+    ValidationError,
+    create_model,
+)
+from pydantic.fields import FieldInfo
+from pydantic.functional_validators import BeforeValidator
+from pydantic.types import constr
+from .errors import (
+    FieldDefinitionError,
+    ModelCreationError,
+    ModelValidationError,
+    NestedModelError,
+    SchemaValidationError,
+)
+from .exit_codes import ExitCode
+logger = logging.getLogger(__name__)
+# Type aliases
+FieldType = Type[
+    Any
+]  # Changed from Type[Any] to allow both concrete types and generics
+FieldDefinition = Tuple[Any, FieldInfo]  # Changed to Any to handle generics
+def _create_enum_type(values: List[Any], field_name: str) -> Type[Enum]:
+    """Create an enum type from a list of values.
+    Args:
+        values: List of enum values
+        field_name: Name of the field for enum type name
+    Returns:
+        Created enum type
+    """
+    # Determine the value type
+    value_types = {type(v) for v in values}
+    if len(value_types) > 1:
+        # Mixed types, use string representation
+        enum_dict = {f"VALUE_{i}": str(v) for i, v in enumerate(values)}
+        return type(f"{field_name.title()}Enum", (str, Enum), enum_dict)
+    elif value_types == {int}:
+        # All integer values
+        enum_dict = {f"VALUE_{v}": v for v in values}
+        return type(f"{field_name.title()}Enum", (IntEnum,), enum_dict)
+    elif value_types == {str}:
+        # All string values
+        enum_dict = {v.upper().replace(" ", "_"): v for v in values}
+        if sys.version_info >= (3, 11):
+            return type(f"{field_name.title()}Enum", (StrEnum,), enum_dict)
+        else:
+            # Other types, use string representation
+            return type(f"{field_name.title()}Enum", (str, Enum), enum_dict)
+    # Default case: treat as string enum
+    enum_dict = {f"VALUE_{i}": str(v) for i, v in enumerate(values)}
+    return type(f"{field_name.title()}Enum", (str, Enum), enum_dict)
+def is_container_type(tp: Type[Any]) -> bool:
+    """Check if a type is a container type (List, Dict, etc).
+    Args:
+        tp: Type to check
+    Returns:
+        bool: True if type is a container type
+    """
+    origin = get_origin(tp)
+    return origin is not None and origin in (list, dict, List, Dict)
+# Validation functions
+def pattern(regex: str) -> Any:
+    return constr(pattern=regex)
+def min_length(length: int) -> Any:
+    return BeforeValidator(lambda v: v if len(str(v)) >= length else None)
+def max_length(length: int) -> Any:
+    return BeforeValidator(lambda v: v if len(str(v)) <= length else None)
+def ge(value: Union[int, float]) -> Any:
+    return BeforeValidator(lambda v: v if float(v) >= value else None)
+def le(value: Union[int, float]) -> Any:
+    return BeforeValidator(lambda v: v if float(v) <= value else None)
+def gt(value: Union[int, float]) -> Any:
+    return BeforeValidator(lambda v: v if float(v) > value else None)
+def lt(value: Union[int, float]) -> Any:
+    return BeforeValidator(lambda v: v if float(v) < value else None)
+def multiple_of(value: Union[int, float]) -> Any:
+    return BeforeValidator(lambda v: v if float(v) % value == 0 else None)
+def _get_type_with_constraints(
+    field_schema: Dict[str, Any], field_name: str, base_name: str
+) -> FieldDefinition:
+    """Get type with constraints from field schema.
+    Args:
+        field_schema: Field schema dict
+        field_name: Name of the field
+        base_name: Base name for nested models
+    Returns:
+        Tuple of (type, field)
+    """
+    field_kwargs: Dict[str, Any] = {}
+    # Add common field metadata
+    if "title" in field_schema:
+        field_kwargs["title"] = field_schema["title"]
+    if "description" in field_schema:
+        field_kwargs["description"] = field_schema["description"]
+    if "default" in field_schema:
+        field_kwargs["default"] = field_schema["default"]
+    if "readOnly" in field_schema:
+        field_kwargs["frozen"] = field_schema["readOnly"]
+    field_type = field_schema.get("type")
+    # Handle array type
+    if field_type == "array":
+        items_schema = field_schema.get("items", {})
+        if not items_schema:
+            return (List[Any], Field(**field_kwargs))  # Direct generic type
+        # Create nested model for object items
+        if (
+            isinstance(items_schema, dict)
+            and items_schema.get("type") == "object"
+        ):
+            array_item_model = create_dynamic_model(
+                items_schema,
+                base_name=f"{base_name}_{field_name}_Item",
+                show_schema=False,
+                debug_validation=False,
+            )
+            return (List[array_item_model], Field(**field_kwargs))  # type: ignore[valid-type]
+        # For non-object items, use the type directly
+        item_type = items_schema.get("type", "string")
+        if item_type == "string":
+            return (List[str], Field(**field_kwargs))
+        elif item_type == "integer":
+            return (List[int], Field(**field_kwargs))
+        elif item_type == "number":
+            return (List[float], Field(**field_kwargs))
+        elif item_type == "boolean":
+            return (List[bool], Field(**field_kwargs))
+        else:
+            return (List[Any], Field(**field_kwargs))
+    # Handle object type
+    if field_type == "object":
+        # Create nested model with explicit type annotation
+        object_model = create_dynamic_model(
+            field_schema,
+            base_name=f"{base_name}_{field_name}",
+            show_schema=False,
+            debug_validation=False,
+        )
+        return (object_model, Field(**field_kwargs))
+    # Handle additionalProperties
+    if "additionalProperties" in field_schema and isinstance(
+        field_schema["additionalProperties"], dict
+    ):
+        # Create nested model with explicit type annotation
+        dict_value_model = create_dynamic_model(
+            field_schema["additionalProperties"],
+            base_name=f"{base_name}_{field_name}_Value",
+            show_schema=False,
+            debug_validation=False,
+        )
+        dict_type: Type[Dict[str, Any]] = Dict[str, dict_value_model]  # type: ignore[valid-type]
+        return (dict_type, Field(**field_kwargs))
+    # Handle other types
+    if field_type == "string":
+        field_type_cls: Type[Any] = str
+        # Add string-specific constraints to field_kwargs
+        if "pattern" in field_schema:
+            field_kwargs["pattern"] = field_schema["pattern"]
+        if "minLength" in field_schema:
+            field_kwargs["min_length"] = field_schema["minLength"]
+        if "maxLength" in field_schema:
+            field_kwargs["max_length"] = field_schema["maxLength"]
+        # Handle special string formats
+        if "format" in field_schema:
+            if field_schema["format"] == "date-time":
+                field_type_cls = datetime
+            elif field_schema["format"] == "date":
+                field_type_cls = date
+            elif field_schema["format"] == "time":
+                field_type_cls = time
+            elif field_schema["format"] == "email":
+                field_type_cls = EmailStr
+            elif field_schema["format"] == "uri":
+                field_type_cls = AnyUrl
+        return (field_type_cls, Field(**field_kwargs))
+    if field_type == "number":
+        field_type_cls = float
+        # Add number-specific constraints to field_kwargs
+        if "minimum" in field_schema:
+            field_kwargs["ge"] = field_schema["minimum"]
+        if "maximum" in field_schema:
+            field_kwargs["le"] = field_schema["maximum"]
+        if "exclusiveMinimum" in field_schema:
+            field_kwargs["gt"] = field_schema["exclusiveMinimum"]
+        if "exclusiveMaximum" in field_schema:
+            field_kwargs["lt"] = field_schema["exclusiveMaximum"]
+        if "multipleOf" in field_schema:
+            field_kwargs["multiple_of"] = field_schema["multipleOf"]
+        return (field_type_cls, Field(**field_kwargs))
+    if field_type == "integer":
+        field_type_cls = int
+        # Add integer-specific constraints to field_kwargs
+        if "minimum" in field_schema:
+            field_kwargs["ge"] = field_schema["minimum"]
+        if "maximum" in field_schema:
+            field_kwargs["le"] = field_schema["maximum"]
+        if "exclusiveMinimum" in field_schema:
+            field_kwargs["gt"] = field_schema["exclusiveMinimum"]
+        if "exclusiveMaximum" in field_schema:
+            field_kwargs["lt"] = field_schema["exclusiveMaximum"]
+        if "multipleOf" in field_schema:
+            field_kwargs["multiple_of"] = field_schema["multipleOf"]
+        return (field_type_cls, Field(**field_kwargs))
+    if field_type == "boolean":
+        return (bool, Field(**field_kwargs))
+    if field_type == "null":
+        return (type(None), Field(**field_kwargs))
+    # Handle enum
+    if "enum" in field_schema:
+        enum_type = _create_enum_type(field_schema["enum"], field_name)
+        return (cast(Type[Any], enum_type), Field(**field_kwargs))
+    # Default to Any for unknown types
+    return (Any, Field(**field_kwargs))
+def create_dynamic_model(
+    schema: Dict[str, Any],
+    base_name: str = "DynamicModel",
+    show_schema: bool = False,
+    debug_validation: bool = False,
+) -> Type[BaseModel]:
+    """Create a Pydantic model from a JSON Schema.
+    Args:
+        schema: JSON Schema to create model from
+        base_name: Base name for the model class
+        show_schema: Whether to show the generated schema
+        debug_validation: Whether to show debug validation info
+    Returns:
+        Generated Pydantic model class
+    Raises:
+        SchemaValidationError: If schema validation fails
+        ModelCreationError: If model creation fails
+    """
+    try:
+        # Validate schema structure before model creation
+        from .template_utils import validate_json_schema
+        validate_json_schema(schema)
+        # Process schema properties into fields
+        properties = schema.get("properties", {})
+        required = schema.get("required", [])
+        field_definitions: Dict[str, Tuple[Type[Any], FieldInfo]] = {}
+        for field_name, field_schema in properties.items():
+            if debug_validation:
+                logger.info("Processing field %s:", field_name)
+                logger.info("  Schema: %s", json.dumps(field_schema, indent=2))
+            try:
+                python_type, field = _get_type_with_constraints(
+                    field_schema, field_name, base_name
+                )
+                # Handle optional fields
+                if field_name not in required:
+                    if debug_validation:
+                        logger.info(
+                            "Field %s is optional, wrapping in Optional",
+                            field_name,
+                        )
+                    field_type = cast(Type[Any], Optional[python_type])
+                else:
+                    field_type = python_type
+                    if debug_validation:
+                        logger.info("Field %s is required", field_name)
+                # Create field definition
+                field_definitions[field_name] = (field_type, field)
+                if debug_validation:
+                    logger.info("Successfully created field definition:")
+                    logger.info("  Name: %s", field_name)
+                    logger.info("  Type: %s", str(field_type))
+                    logger.info("  Required: %s", field_name in required)
+            except (FieldDefinitionError, NestedModelError) as e:
+                if debug_validation:
+                    logger.error("Error creating field %s:", field_name)
+                    logger.error("  Error type: %s", type(e).__name__)
+                    logger.error("  Error message: %s", str(e))
+                raise ModelValidationError(base_name, [str(e)])
+        # Create the model with the fields
+        field_defs: Dict[str, Any] = {
+            name: (
+                (
+                    cast(Type[Any], field_type)
+                    if is_container_type(field_type)
+                    else field_type
+                ),
+                field,
+            )
+            for name, (field_type, field) in field_definitions.items()
+        }
+        # Create model class
+        model = create_model(base_name, __base__=BaseModel, **field_defs)
+        # Set model config
+        model.model_config = ConfigDict(
+            title=schema.get("title", base_name),
+            extra="forbid",
+        )
+        if show_schema:
+            logger.info(
+                "Generated schema for %s:\n%s",
+                base_name,
+                json.dumps(model.model_json_schema(), indent=2),
+            )
+        try:
+            # Validate model schema
+            model.model_json_schema()
+        except ValidationError as e:
+            validation_errors = (
+                [str(err) for err in e.errors()]
+                if hasattr(e, "errors")
+                else [str(e)]
+            )
+            if debug_validation:
+                logger.error("Schema validation failed:")
+                logger.error("  Error type: %s", type(e).__name__)
+                logger.error("  Error message: %s", str(e))
+            raise ModelValidationError(base_name, validation_errors)
+        except KeyError as e:
+            # Handle Pydantic schema generation errors, particularly for recursive references
+            error_msg = str(e).strip(
+                "'\""
+            )  # Strip quotes from KeyError message
+            if error_msg.startswith("#/definitions/"):
+                context = {
+                    "schema_path": schema.get("$id", "unknown"),
+                    "reference": error_msg,
+                    "found": "circular reference or missing definition",
+                    "tips": [
+                        "Add explicit $ref definitions for recursive structures",
+                        "Use Pydantic's deferred annotations with typing.Self",
+                        "Limit recursion depth with max_depth validator",
+                        "Flatten nested structures using reference IDs",
+                    ],
+                }
+                error_msg = (
+                    f"Invalid schema reference: {error_msg}\n"
+                    "Detected circular reference or missing definition.\n"
+                    "Solutions:\n"
+                    "1. Add missing $ref definitions to your schema\n"
+                    "2. Use explicit ID references instead of nested objects\n"
+                    "3. Implement depth limits for recursive structures"
+                )
+                if debug_validation:
+                    logger.error("Schema reference error:")
+                    logger.error("  Error type: %s", type(e).__name__)
+                    logger.error("  Error message: %s", error_msg)
+                raise SchemaValidationError(
+                    error_msg, context=context, exit_code=ExitCode.SCHEMA_ERROR
+                ) from e
+            # For other KeyErrors, preserve the original error
+            raise ModelCreationError(
+                f"Failed to create model {base_name}",
+                context={"error": str(e)},
+            ) from e
+        return model
+    except SchemaValidationError:
+        # Re-raise schema validation errors without wrapping
+        raise
+    except Exception as e:
+        # Always log basic error info
+        logger.error("Model creation error: %s", str(e))
+        # Log additional debug info if requested
+        if debug_validation:
+            logger.error("  Error type: %s", type(e).__name__)
+            logger.error("  Error details: %s", str(e))
+            if hasattr(e, "__cause__"):
+                logger.error("  Caused by: %s", str(e.__cause__))
+            if hasattr(e, "__context__"):
+                logger.error("  Context: %s", str(e.__context__))
+            if hasattr(e, "__traceback__"):
+                import traceback
+                logger.error(
+                    "  Traceback:\n%s",
+                    "".join(traceback.format_tb(e.__traceback__)),
+                )
+        # Always wrap other errors as ModelCreationError
+        raise ModelCreationError(
+            f"Failed to create model {base_name}",
+            context={"error": str(e)},
+        ) from e

ostruct/cli/security/errors.py CHANGED Viewed

@@ -63,7 +63,7 @@ class PathSecurityError(SecurityErrorBase):
     @property
     def details(self) -> str:
         """Get the detailed explanation of the error."""
-        return self.details
+        return str(self.context.get("details", ""))
     @classmethod
     def from_expanded_paths(

ostruct/cli/security/normalization.py CHANGED Viewed

@@ -61,7 +61,7 @@ from .errors import PathSecurityError, SecurityErrorReasons
 # Patterns for path normalization and validation
 _UNICODE_SAFETY_PATTERN = re.compile(
     r"[\u0000-\u001F\u007F-\u009F\u2028-\u2029\u0085]"  # Control chars and line separators
-    r"|\.{2,}"  # Directory traversal attempts
+    r"|(?:^|/)\.\.(?:/|$)"  # Directory traversal attempts (only ".." as a path component)
     r"|[\u2024\u2025\uFE52\u2024\u2025\u2026\uFE19\uFE30\uFE52\uFF0E\uFF61]"  # Alternative dots and separators
 )
 _BACKSLASH_PATTERN = re.compile(r"\\")

ostruct-cli 0.6.0__py3-none-any.whl → 0.6.2__py3-none-any.whl

ostruct-cli 0.6.0py3-none-any.whl → 0.6.2py3-none-any.whl