PyPI - tellaro-query-language - Versions diffs - 0.1.0__py3-none-any.whl - Mend

tellaro-query-language 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (56) hide show

tellaro_query_language-0.1.0.dist-info/LICENSE +21 -0
tellaro_query_language-0.1.0.dist-info/METADATA +401 -0
tellaro_query_language-0.1.0.dist-info/RECORD +56 -0
tellaro_query_language-0.1.0.dist-info/WHEEL +4 -0
tellaro_query_language-0.1.0.dist-info/entry_points.txt +7 -0
tql/__init__.py +47 -0
tql/analyzer.py +385 -0
tql/cache/__init__.py +7 -0
tql/cache/base.py +25 -0
tql/cache/memory.py +63 -0
tql/cache/redis.py +68 -0
tql/core.py +929 -0
tql/core_components/README.md +92 -0
tql/core_components/__init__.py +20 -0
tql/core_components/file_operations.py +113 -0
tql/core_components/opensearch_operations.py +869 -0
tql/core_components/stats_operations.py +200 -0
tql/core_components/validation_operations.py +599 -0
tql/evaluator.py +379 -0
tql/evaluator_components/README.md +131 -0
tql/evaluator_components/__init__.py +17 -0
tql/evaluator_components/field_access.py +176 -0
tql/evaluator_components/special_expressions.py +296 -0
tql/evaluator_components/value_comparison.py +315 -0
tql/exceptions.py +160 -0
tql/geoip_normalizer.py +233 -0
tql/mutator_analyzer.py +830 -0
tql/mutators/__init__.py +222 -0
tql/mutators/base.py +78 -0
tql/mutators/dns.py +316 -0
tql/mutators/encoding.py +218 -0
tql/mutators/geo.py +363 -0
tql/mutators/list.py +212 -0
tql/mutators/network.py +163 -0
tql/mutators/security.py +225 -0
tql/mutators/string.py +165 -0
tql/opensearch.py +78 -0
tql/opensearch_components/README.md +130 -0
tql/opensearch_components/__init__.py +17 -0
tql/opensearch_components/field_mapping.py +399 -0
tql/opensearch_components/lucene_converter.py +305 -0
tql/opensearch_components/query_converter.py +775 -0
tql/opensearch_mappings.py +309 -0
tql/opensearch_stats.py +451 -0
tql/parser.py +1363 -0
tql/parser_components/README.md +72 -0
tql/parser_components/__init__.py +20 -0
tql/parser_components/ast_builder.py +162 -0
tql/parser_components/error_analyzer.py +101 -0
tql/parser_components/field_extractor.py +112 -0
tql/parser_components/grammar.py +473 -0
tql/post_processor.py +737 -0
tql/scripts.py +124 -0
tql/stats_evaluator.py +444 -0
tql/stats_transformer.py +184 -0
tql/validators.py +110 -0

tql/evaluator_components/value_comparison.py ADDED Viewed

@@ -0,0 +1,315 @@
+"""Value comparison operations for TQL evaluator.
+This module handles all value comparison operations including type conversions,
+operator implementations, and special cases like CIDR matching.
+"""
+import ipaddress
+import re
+from typing import Any
+class ValueComparator:
+    """Evaluate a single TQL comparison between a record value and a query value.
+    Numeric and boolean strings are coerced before comparing, and operand type
+    mismatches evaluate to False instead of raising. ``not_contains`` and
+    ``not_in`` are evaluated as the exact negation of ``contains`` and ``in``,
+    so a base operator and its negation can never both hold for the same input.
+    """
+    # Sentinel value to distinguish missing fields from None values
+    _MISSING_FIELD = object()
+    # Operators that hold when the field is absent from the record: an absent
+    # field "does not exist" and cannot contain / start with / end with / match
+    # anything. Every other operator (including not_cidr, ne, not_in and is_not)
+    # evaluates to False for a missing field.
+    _TRUE_WHEN_MISSING = ("not_exists", "not_contains", "not_startswith", "not_endswith", "not_regexp")
+    def compare_values(self, field_value: Any, operator: str, expected_value: Any) -> bool:
+        """Compare a field value against an expected value using the given operator.
+        Args:
+            field_value: Value from the record, ``_MISSING_FIELD`` when the field is
+                absent, or None when the field is present but null
+            operator: Comparison operator name (e.g. "eq", "contains", "not_in")
+            expected_value: Expected value from the query
+        Returns:
+            Boolean result of comparison. Operand type mismatches and unknown
+            operators evaluate to False.
+        """
+        # Missing field: only the vacuously-true negations match
+        if field_value is self._MISSING_FIELD:
+            return operator in self._TRUE_WHEN_MISSING
+        # Field exists but is None: it "exists" and can only match a null test
+        if field_value is None:
+            if operator == "exists":
+                return True
+            if operator == "is":
+                # expected_value can be None or the literal string "null"
+                return expected_value is None or (isinstance(expected_value, str) and expected_value.lower() == "null")
+            return False
+        # Coerce numeric / boolean strings so "10" compares as 10 and "true" as True
+        field_value = self._convert_numeric(field_value)
+        expected_value = self._convert_numeric(expected_value)
+        try:
+            return self._apply_operator(field_value, operator, expected_value)
+        except (TypeError, ValueError):
+            # Type mismatch or conversion error. This also swallows the ValueError
+            # raised for an unknown operator, so unknown operators evaluate to False.
+            return False
+    def _apply_operator(self, field_value: Any, operator: str, expected_value: Any) -> bool:  # noqa: C901
+        """Dispatch ``operator`` for a field value that is present and not None.
+        Args:
+            field_value: Coerced value from the record
+            operator: Comparison operator name
+            expected_value: Coerced expected value from the query
+        Returns:
+            Result of the comparison
+        Raises:
+            TypeError: If the operands do not support the comparison
+            ValueError: If the operator is not recognised
+        """
+        # Equality and ordering
+        if operator in ("eq", "="):
+            return field_value == expected_value
+        if operator in ("ne", "!="):
+            return field_value != expected_value
+        if operator in ("gt", ">"):
+            return field_value > expected_value
+        if operator in ("gte", ">="):
+            return field_value >= expected_value
+        if operator in ("lt", "<"):
+            return field_value < expected_value
+        if operator in ("lte", "<="):
+            return field_value <= expected_value
+        # Existence: reaching this point means the field is present and non-null
+        if operator == "exists":
+            return True
+        if operator == "not_exists":
+            return False
+        # Literal comparison (null / booleans)
+        if operator == "is":
+            return self._is_literal(field_value, expected_value)
+        if operator == "is_not":
+            return not self._is_literal(field_value, expected_value)
+        # Membership
+        if operator == "in":
+            return self._is_member(field_value, expected_value)
+        if operator == "not_in":
+            return not self._is_member(field_value, expected_value)
+        # Range checks: malformed bounds make both between and not_between False
+        if operator in ("between", "not_between"):
+            inside = self._is_within(field_value, expected_value)
+            if inside is None:
+                return False
+            return inside if operator == "between" else not inside
+        # All remaining operators take a single value, possibly wrapped in a one-element list
+        expected_value = self._unwrap_single(expected_value)
+        if operator == "contains":
+            return self._contains(field_value, expected_value)
+        if operator == "not_contains":
+            return not self._contains(field_value, expected_value)
+        if operator == "startswith":
+            return str(field_value).startswith(str(expected_value))
+        if operator == "not_startswith":
+            return not str(field_value).startswith(str(expected_value))
+        if operator == "endswith":
+            return str(field_value).endswith(str(expected_value))
+        if operator == "not_endswith":
+            return not str(field_value).endswith(str(expected_value))
+        if operator == "regexp":
+            return bool(re.search(str(expected_value), str(field_value)))
+        if operator == "not_regexp":
+            return not re.search(str(expected_value), str(field_value))
+        if operator == "cidr":
+            return self._check_cidr(field_value, expected_value)
+        if operator == "not_cidr":
+            # An unparsable IP or CIDR is "not in" the network, so this is True for invalid input
+            return not self._check_cidr(field_value, expected_value)
+        if operator == "any":
+            return self._matches_any(field_value, expected_value)
+        if operator == "not_any":
+            return not self._matches_any(field_value, expected_value)
+        if operator == "all":
+            return self._matches_all(field_value, expected_value)
+        if operator == "not_all":
+            return not self._matches_all(field_value, expected_value)
+        raise ValueError(f"Unknown operator: {operator}")
+    @staticmethod
+    def _unwrap_single(value: Any) -> Any:
+        """Return the sole element of a one-element list, otherwise the value unchanged."""
+        if isinstance(value, list) and len(value) == 1:
+            return value[0]
+        return value
+    @staticmethod
+    def _is_literal(field_value: Any, expected_value: Any) -> bool:
+        """Implement ``is``: a null test for "null", otherwise an identity comparison.
+        NOTE(review): identity is reliable for the True/False singletons but not for
+        arbitrary numbers or strings - confirm ``is`` is only used with null/boolean literals.
+        """
+        if isinstance(expected_value, str) and expected_value.lower() == "null":
+            return field_value is None
+        return field_value is expected_value
+    def _is_member(self, field_value: Any, expected_value: Any) -> bool:
+        """Implement ``in``: membership of the field value in the expected list.
+        A one-element expected list against a list field is treated as the reversed
+        form (``'value' in field_list``). A non-list expected value degrades to equality.
+        """
+        if not isinstance(expected_value, list):
+            return field_value == expected_value
+        if len(expected_value) == 1 and isinstance(field_value, list):
+            return self._convert_numeric(expected_value[0]) in field_value
+        # Coerce list elements so "1" in the query matches 1 in the record
+        return field_value in [self._convert_numeric(item) for item in expected_value]
+    def _is_within(self, field_value: Any, bounds: Any) -> Any:
+        """Return whether the field lies in the inclusive range, or None for malformed bounds.
+        The two bounds may be given in either order.
+        """
+        if not (isinstance(bounds, list) and len(bounds) == 2):
+            return None
+        first, second = (self._convert_numeric(bound) for bound in bounds)
+        return min(first, second) <= field_value <= max(first, second)
+    @staticmethod
+    def _contains(field_value: Any, expected_value: Any) -> bool:
+        """Implement ``contains``: element membership for list fields, substring test otherwise."""
+        if isinstance(field_value, list):
+            return expected_value in field_value
+        return str(expected_value) in str(field_value)
+    @staticmethod
+    def _matches_any(field_value: Any, expected_value: Any) -> bool:
+        """Implement ``any``: the value equals some element of a collection, or the scalar itself."""
+        if isinstance(field_value, (list, tuple, set)):
+            return expected_value in field_value
+        return field_value == expected_value
+    @staticmethod
+    def _matches_all(field_value: Any, expected_value: Any) -> bool:
+        """Implement ``all``: every element of a non-empty collection equals the value.
+        An empty collection does not match; a scalar is compared by equality.
+        """
+        if isinstance(field_value, (list, tuple, set)):
+            return all(elem == expected_value for elem in field_value) if field_value else False
+        return field_value == expected_value
+    def _convert_numeric(self, value: Any) -> Any:
+        """Convert string numbers and booleans to appropriate types.
+        Args:
+            value: Value to convert
+        Returns:
+            Converted value (int, float, bool, or original). Non-string values and
+            strings that are neither numeric nor "true"/"false" are returned unchanged.
+        """
+        if not isinstance(value, str):
+            return value
+        # Only strings without a decimal point or exponent are integer candidates
+        if "." not in value and "e" not in value.lower():
+            try:
+                return int(value)
+            except ValueError:
+                pass
+        try:
+            number = float(value)
+        except ValueError:
+            pass
+        else:
+            # float() also accepts the words "nan", "inf" and "infinity". Those are
+            # ordinary text in a record, so only digit-bearing strings are numeric.
+            if any(ch.isdigit() for ch in value):
+                return number
+        lowered = value.lower()
+        if lowered == "true":
+            return True
+        if lowered == "false":
+            return False
+        return value
+    def _check_cidr(self, ip_value: Any, cidr: str) -> bool:
+        """Check if an IP address matches a CIDR pattern.
+        Args:
+            ip_value: IP address to check (converted with ``str()`` before parsing)
+            cidr: CIDR pattern; host bits may be set because parsing is non-strict
+        Returns:
+            True if IP is in CIDR range, False if not or if either input is invalid
+        """
+        try:
+            network = ipaddress.ip_network(cidr, strict=False)
+            address = ipaddress.ip_address(str(ip_value))
+            return address in network
+        except (ValueError, TypeError):
+            # Invalid IP or CIDR
+            return False

tql/exceptions.py ADDED Viewed

@@ -0,0 +1,160 @@
+"""TQL exception classes.
+This module defines custom exceptions used throughout the TQL library.
+"""
+from typing import Any, Dict, List, Optional
+class TQLError(Exception):
+    """Root of the TQL exception hierarchy.
+    Carries optional location, query text, suggestions and free-form context,
+    and renders them into a multi-line message via ``str()``.
+    """
+    def __init__(
+        self,
+        message: str,
+        position: Optional[int] = None,
+        query: Optional[str] = None,
+        suggestions: Optional[List[str]] = None,
+        context: Optional[Dict[str, Any]] = None,
+    ):
+        """Store the message together with its diagnostic context.
+        Args:
+            message: Primary error message
+            position: Character position where error occurred
+            query: Original query string
+            suggestions: List of suggestions or examples (defaults to an empty list)
+            context: Additional context information (defaults to an empty dict)
+        """
+        super().__init__(message)
+        self.position = position
+        self.query = query
+        # Falsy inputs are normalised so callers can always iterate / index these
+        self.suggestions = suggestions or []
+        self.context = context or {}
+    def __str__(self) -> str:
+        """Render the class name, message, optional query pointer and suggestions."""
+        kind = self.__class__.__name__
+        detail = super().__str__()
+        if self.position is None:
+            rendered = [f"{kind}: {detail}"]
+        else:
+            rendered = [f"{kind} at position {self.position}: {detail}"]
+            if self.query:
+                prefix = "Query: "
+                rendered.append(f"{prefix}{self.query}")
+                # Draw a caret under the offending character, offset by the prefix width
+                if 0 <= self.position <= len(self.query):
+                    rendered.append(" " * (len(prefix) + self.position) + "^")
+        if self.suggestions:
+            if len(self.suggestions) == 1:
+                rendered.append(f"Did you mean: {self.suggestions[0]}?")
+            else:
+                rendered.append("Suggestions:")
+                rendered.extend(f"  - {hint}" for hint in self.suggestions)
+        return "\n".join(rendered)
+class TQLSyntaxError(TQLError):
+    """Raised when TQL query has syntax errors.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLParseError(TQLError):
+    """Raised when there's an error parsing a TQL query.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLTypeError(TQLError):
+    """Raised when an operator is incompatible with a field's data type."""
+    def __init__(
+        self, field: str, field_type: str, operator: str, valid_operators: Optional[List[str]] = None, **kwargs
+    ):
+        """Build the explanatory message and record the offending field/operator.
+        Args:
+            field: Name of the field the operator was applied to
+            field_type: Type of that field
+            operator: Operator that cannot be applied
+            valid_operators: Operators to recommend instead, if known
+            **kwargs: Forwarded to ``TQLError`` (position, query, suggestions, context)
+        """
+        parts = [f"Cannot apply operator '{operator}' to field '{field}' of type '{field_type}'. "]
+        # Ordering operators on keyword/text fields get a dedicated explanation
+        ordering_on_text = operator in (">", ">=", "<", "<=") and field_type in ("keyword", "text")
+        if ordering_on_text:
+            parts.append(
+                "Numeric comparison operators (>, >=, <, <=) require numeric field types "
+                "(integer, long, float, double). "
+            )
+            if valid_operators:
+                parts.append(f"Consider using: {', '.join(valid_operators)} for {field_type} fields.")
+        elif valid_operators:
+            parts.append(f"Valid operators for {field_type} fields: {', '.join(valid_operators)}")
+        super().__init__("".join(parts), **kwargs)
+        self.field = field
+        self.field_type = field_type
+        self.operator = operator
+        self.valid_operators = valid_operators
+class TQLFieldError(TQLError):
+    """Raised when referencing invalid or non-existent fields."""
+    def __init__(self, field: str, available_fields: Optional[List[str]] = None, **kwargs):
+        """Build the message and, when possible, suggest similarly named fields.
+        Args:
+            field: Name of the unknown field
+            available_fields: Known field names; listed (sorted) in the message when given
+            **kwargs: Forwarded to ``TQLError``. An explicit ``suggestions`` entry is
+                never overwritten by the automatically derived ones.
+        """
+        message = f"Unknown field '{field}'."
+        if available_fields:
+            message += f"\nAvailable fields: {', '.join(sorted(available_fields))}"
+            # Simple similarity: case-insensitive substring match in either direction
+            needle = field.lower()
+            similar = [
+                f"{candidate}"
+                for candidate in available_fields
+                if needle in candidate.lower() or candidate.lower() in needle
+            ]
+            if similar and "suggestions" not in kwargs:
+                kwargs["suggestions"] = similar[:3]  # Limit to top 3 suggestions
+        super().__init__(message, **kwargs)
+        self.field = field
+        self.available_fields = available_fields
+class TQLValueError(TQLError):
+    """Raised when provided values don't match expected formats.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLOperatorError(TQLError):
+    """Raised when operators are used incorrectly.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLExecutionError(TQLError):
+    """Raised when there's an error executing a TQL query.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLValidationError(TQLError):
+    """Raised when a TQL query fails validation.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLUnsupportedOperationError(TQLError):
+    """Raised when attempting to use unsupported operations with a backend.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLConfigError(TQLError):
+    """Raised when there's a configuration error.
+    Defines no behaviour of its own; construction and message formatting are
+    inherited from ``TQLError``.
+    """
+class TQLMutatorError(TQLError):
+    """Raised when there's an error applying a mutator."""
+    def __init__(self, mutator_name: str, field_name: str, value_type: str, message: Optional[str] = None, **kwargs):
+        """Record the mutator context, generating a default message when none is given.
+        Args:
+            mutator_name: Name of the mutator that failed
+            field_name: Field the mutator was applied to
+            value_type: Type name of the value the mutator received
+            message: Custom message; an empty or missing message is replaced by a default
+            **kwargs: Forwarded to ``TQLError`` (position, query, suggestions, context)
+        """
+        # ``or`` short-circuits, so the default text is only built when it is needed
+        message = message or (
+            f"Cannot apply mutator '{mutator_name}' to field '{field_name}' with value of type '{value_type}'."
+        )
+        super().__init__(message, **kwargs)
+        self.mutator_name = mutator_name
+        self.field_name = field_name
+        self.value_type = value_type