aws-python-helper 0.23.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- aws_python_helper/__init__.py +45 -0
- aws_python_helper/api/__init__.py +11 -0
- aws_python_helper/api/auth_middleware.py +108 -0
- aws_python_helper/api/auth_validators.py +143 -0
- aws_python_helper/api/base.py +272 -0
- aws_python_helper/api/dispatcher.py +213 -0
- aws_python_helper/api/exceptions.py +43 -0
- aws_python_helper/api/fetcher.py +210 -0
- aws_python_helper/api/handler.py +106 -0
- aws_python_helper/database/__init__.py +11 -0
- aws_python_helper/database/database_proxy.py +50 -0
- aws_python_helper/database/external_database_proxy.py +66 -0
- aws_python_helper/database/external_mongo_manager.py +212 -0
- aws_python_helper/database/mongo_manager.py +214 -0
- aws_python_helper/fargate/__init__.py +9 -0
- aws_python_helper/fargate/executor.py +226 -0
- aws_python_helper/fargate/fetcher.py +108 -0
- aws_python_helper/fargate/handler.py +101 -0
- aws_python_helper/fargate/task_base.py +165 -0
- aws_python_helper/lambda_standalone/__init__.py +8 -0
- aws_python_helper/lambda_standalone/base.py +171 -0
- aws_python_helper/lambda_standalone/fetcher.py +122 -0
- aws_python_helper/lambda_standalone/handler.py +117 -0
- aws_python_helper/sns/__init__.py +6 -0
- aws_python_helper/sns/publisher.py +245 -0
- aws_python_helper/sqs/__init__.py +10 -0
- aws_python_helper/sqs/consumer_base.py +416 -0
- aws_python_helper/sqs/fetcher.py +111 -0
- aws_python_helper/sqs/handler.py +138 -0
- aws_python_helper/utils/__init__.py +9 -0
- aws_python_helper/utils/json_encoder.py +108 -0
- aws_python_helper/utils/response.py +145 -0
- aws_python_helper/utils/serializer.py +103 -0
- aws_python_helper-0.23.0.dist-info/METADATA +712 -0
- aws_python_helper-0.23.0.dist-info/RECORD +37 -0
- aws_python_helper-0.23.0.dist-info/WHEEL +5 -0
- aws_python_helper-0.23.0.dist-info/top_level.txt +1 -0
aws_python_helper/sqs/consumer_base.py
@@ -0,0 +1,416 @@
"""
SQS Consumer Base - Base class for all SQS consumers
"""

from abc import ABC, abstractmethod
from typing import Dict, Any, List
import logging
import json

from ..database.mongo_manager import MongoManager
from ..database.database_proxy import DatabaseProxy
from ..database.external_mongo_manager import ExternalMongoManager
from ..database.external_database_proxy import ExternalDatabaseProxy


class SQSConsumer(ABC):
    """
    Base class for all SQS consumers

    Provides structure to process SQS messages in batch or individually.

    Processing modes:
    - "single": Process messages one by one using process_record()
    - "batch": Process all messages together using process_batch()

    Error Handling & Retries:
    Both modes support controlled retry via AWS SQS reportBatchItemFailures:
    - "single" mode: If process_record() raises an exception, that message
      is automatically reported for retry. Other messages continue processing.
    - "batch" mode: Use add_message_failed() to mark failed messages.
      The handler will automatically create reportBatchItemFailures so AWS SQS
      retries only those specific messages. Your process_batch() is automatically
      wrapped with error handling.

    This ensures that if 1 message fails out of 5, only that 1 message is retried,
    not the entire batch.

    Usage:
        # Single mode (default):
        class MyConsumer(SQSConsumer):
            @property
            def processing_mode(self):
                return "single"  # or omit, "single" is the default

            async def process_record(self, record):
                # Process an individual record.
                # If you raise an exception here, AWS SQS will retry only this
                # message; other messages in the batch continue processing normally.
                body = self.extract_content_message(record)
                # Your processing logic here. If something fails, just raise:
                # if error_condition:
                #     raise ValueError("This message failed, will be retried")
                pass

        # Batch mode:
        class MyBatchConsumer(SQSConsumer):
            @property
            def processing_mode(self):
                return "batch"

            async def process_batch(self, records):
                # Process all records together (bulk operations, transactions, etc.)
                # Use add_message_failed() to mark failed messages - the base class
                # wraps this method with error handling automatically.
                for record in records:
                    message_id = record.get('messageId')
                    try:
                        await self.process_message(record)  # your own logic
                    except Exception as e:
                        # Mark as failed - automatically handled by base class
                        self.add_message_failed(message_id, str(e))
                # Do not return results; the base class builds them from the
                # messages marked via add_message_failed().
    """

    def __init__(self):
        """Initialize the consumer with a logger"""
        self.logger = logging.getLogger(self.__class__.__name__)
        self._db = None
        self._external_db = None
        self._failed_messages = []  # Track failed messages for batch mode

    @property
    def processing_mode(self) -> str:
        """
        Processing mode: "single" or "batch"

        - "single": Process messages individually using process_record()
        - "batch": Process all messages together using process_batch()

        Returns:
            "single" or "batch" (default: "single")
        """
        return "single"

    @property
    def db(self):
        """
        Access to MongoDB databases (main cluster)

        Usage:
            result = await self.db.users_db.users.find_one({'_id': user_id})
        """
        if self._db is None:
            self._db = DatabaseProxy(MongoManager)
        return self._db

    @property
    def external_db(self):
        """
        Access to external MongoDB clusters

        Returns None if the EXTERNAL_MONGODB_CONNECTIONS environment variable is not set.

        Usage:
            if self.external_db:
                result = await self.external_db.ClusterDockets.smart_data.addresses.find_one({...})
                await self.external_db.ClusterDockets.core.users.insert_one({...})

        Returns:
            ExternalDatabaseProxy instance for accessing external clusters, or None if not configured
        """
        if self._external_db is None:
            # Initialize external connections if not already done
            if not ExternalMongoManager.is_initialized():
                has_connections = ExternalMongoManager.initialize()
                if not has_connections:
                    # No external connections available
                    return None
            else:
                # Check if there are any connections available
                if len(ExternalMongoManager.get_available_clusters()) == 0:
                    return None

            self._external_db = ExternalDatabaseProxy()
        return self._external_db

    async def process_record(self, record: Dict[str, Any]):
        """
        Process an individual SQS record

        This method is required when processing_mode is "single".
        When processing_mode is "batch", this method is optional.

        If this method raises an exception, AWS SQS will automatically retry
        only that specific message. Other messages in the batch will continue
        processing normally.

        Args:
            record: SQS record with 'body', 'messageId', etc.

        Raises:
            Exception: Any error in the processing. The exception will be caught
                and the message will be reported for retry by AWS SQS.
        """
        # Only raise NotImplementedError in single mode
        if self.processing_mode == "single":
            raise NotImplementedError(
                "You must implement process_record() when processing_mode is 'single'"
            )
        # In batch mode, this method is optional

    def extract_content_message(self, record: Dict[str, Any]) -> Dict[str, Any]:
        """
        Parse the body of the SQS message

        When SNS sends messages to SQS, the body has this structure:
        {
            "Type": "Notification",
            "Message": "{...the actual message serialized as JSON string...}",
            "MessageAttributes": {...}
        }

        This method automatically detects SNS messages and extracts the actual content
        from the "Message" field. If it's not an SNS message, it parses the body directly.

        Args:
            record: SQS record with 'body' field

        Returns:
            Parsed body as dict. For SNS messages, returns the parsed content from the
            "Message" field. For regular SQS messages, returns the parsed body directly.
        """
        body = record.get('body', '{}')

        # Parse the body string to JSON if needed
        if isinstance(body, str):
            try:
                body_json = json.loads(body)
            except json.JSONDecodeError:
                self.logger.warning(f"Could not parse body as JSON: {body}")
                return {'raw': body}
        else:
            body_json = body

        # Check if this is an SNS notification message
        if isinstance(body_json, dict) and body_json.get('Type') == 'Notification':
            # Extract the actual message from the "Message" field
            message_str = body_json.get('Message', '{}')

            if isinstance(message_str, str):
                try:
                    # Parse the JSON string in the Message field
                    message_content = json.loads(message_str)
                    self.logger.debug(f"Extracted SNS message content: {message_content}")
                    return message_content
                except json.JSONDecodeError:
                    self.logger.warning(f"Could not parse SNS Message field as JSON: {message_str}")
                    return {'raw': message_str, 'sns_notification': True}
            else:
                # Message field is already a dict
                return message_str

        # Not an SNS message, return the body as-is
        return body_json

    def add_message_failed(self, message_id: str, error: str = None):
        """
        Mark a message as failed (for batch mode)

        Use this method in your process_batch() implementation to mark messages
        that failed during batch processing. The handler will automatically
        create reportBatchItemFailures for these messages.

        Args:
            message_id: The messageId of the failed message
            error: Optional error message describing the failure

        Usage:
            async def process_batch(self, records):
                for record in records:
                    message_id = record.get('messageId')
                    try:
                        # Your processing logic
                        process_message(record)
                    except Exception as e:
                        # Mark as failed - no need to manually add to results
                        self.add_message_failed(message_id, str(e))
        """
        self._failed_messages.append({
            'messageId': message_id,
            'itemIdentifier': message_id,
            'error': error
        })
        if error:
            self.logger.error(f"Message {message_id} marked as failed: {error}")
        else:
            self.logger.error(f"Message {message_id} marked as failed")

    async def _process_batch_internal(self, records: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """
        Internal method called by the handler to process a batch of SQS records

        This method routes to the appropriate processing based on processing_mode:
        - "single": Processes records one by one using process_record()
        - "batch": Wraps the user's process_batch() implementation with error handling

        Args:
            records: List of SQS records

        Returns:
            List of results with success/error for each record
        """
        mode = self.processing_mode

        if mode == "batch":
            # Reset failed messages list for this batch
            self._failed_messages = []
            # Wrap batch processing with error handling
            return await self._process_batch_wrapper(records)
        else:
            # Single mode: process records one by one using process_record()
            return await self._process_batch_single(records)

    async def process_batch(self, records: List[Dict[str, Any]]) -> None:
        """
        Process a batch of SQS records (to be overridden by user in batch mode)

        When processing_mode is "batch", override this method to implement
        your batch processing logic. Use add_message_failed() to mark failed messages.
        The base class will wrap your implementation with error handling automatically.

        This method should not return any value. Simply process the records and use
        add_message_failed() to mark any messages that fail. All other messages will
        be automatically marked as successful.

        Args:
            records: List of SQS records

        Example:
            async def process_batch(self, records):
                for record in records:
                    message_id = record.get('messageId')
                    try:
                        # Your processing logic
                        await self.process_message(record)
                    except Exception as e:
                        # Mark as failed - automatically handled
                        self.add_message_failed(message_id, str(e))
        """
        # Base implementation - must be overridden when processing_mode is "batch".
        # If it is not overridden, the wrapper catches this exception and all
        # messages in the batch are reported as failed.
        if self.processing_mode == "batch":
            raise NotImplementedError(
                "You must implement process_batch() when processing_mode is 'batch'"
            )

    async def _process_batch_wrapper(self, records: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """
        Wrapper for batch mode processing with automatic error handling

        This method wraps the user's process_batch() implementation with try-except
        to catch any unhandled exceptions. It also merges failed messages marked
        with add_message_failed() into the results.

        Internal method used when processing_mode is "batch"
        """
        # Get all message IDs upfront
        message_ids = [record.get('messageId', f'record-{i}') for i, record in enumerate(records)]
        results = []

        try:
            # Call the user's process_batch implementation (no return value expected)
            await self.process_batch(records)

            # Build results based on _failed_messages:
            # all messages are successful by default, except those marked as failed
            for message_id in message_ids:
                # Check if this message was marked as failed
                failed_msg = next((fm for fm in self._failed_messages if fm['messageId'] == message_id), None)
                if failed_msg:
                    # Message was marked as failed
                    results.append({
                        'messageId': message_id,
                        'success': False,
                        'error': failed_msg.get('error'),
                        'itemIdentifier': failed_msg['itemIdentifier']
                    })
                else:
                    # Message was successful
                    results.append({
                        'messageId': message_id,
                        'success': True
                    })

        except Exception as e:
            # If the entire batch processing fails, mark all messages as failed
            self.logger.exception(f"Unhandled exception in process_batch: {e}")
            for message_id in message_ids:
                results.append({
                    'messageId': message_id,
                    'success': False,
                    'error': str(e),
                    'itemIdentifier': message_id
                })

        # Log summary
        success_count = sum(1 for r in results if r.get('success', False))
        failed_count = len(results) - success_count
        self.logger.info(
            f"Batch processing complete: {success_count} successful, {failed_count} failed"
        )

        return results

    async def _process_batch_single(self, records: List[Dict[str, Any]]) -> List[Dict[str, Any]]:
        """
        Process records one by one (single mode)

        If a message fails (raises an exception), it will be reported as failed
        and AWS SQS will retry only that message. Other messages continue processing.

        Internal method used when processing_mode is "single"
        """
        results = []

        for i, record in enumerate(records):
            message_id = record.get('messageId', f'record-{i}')

            try:
                self.logger.info(f"Processing message: {message_id}")
                await self.process_record(record)
                results.append({
                    'messageId': message_id,
                    'success': True
                })
                self.logger.info(f"Successfully processed message: {message_id}")

            except Exception as e:
                # Log the error but continue with other messages
                self.logger.error(
                    f"Error processing message {message_id}: {e}",
                    exc_info=True
                )
                results.append({
                    'messageId': message_id,
                    'success': False,
                    'error': str(e),
                    'itemIdentifier': message_id  # For reportBatchItemFailures (AWS SQS messageId)
                })

        # Log summary
        success_count = sum(1 for r in results if r['success'])
        failed_count = len(results) - success_count
        self.logger.info(
            f"Batch processing complete: {success_count} successful, {failed_count} failed"
        )

        return results
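For reference, a minimal single-mode consumer built on this base class could look like the sketch below. The file name, class name, and payload field are illustrative (they follow the conventions documented above, not anything shipped in the package); only SQSConsumer and its methods come from the wheel.

# consumer/order_created_consumer.py  (hypothetical consumer file)
from aws_python_helper.sqs.consumer_base import SQSConsumer


class OrderCreatedConsumer(SQSConsumer):
    async def process_record(self, record):
        # extract_content_message() transparently unwraps SNS envelopes
        body = self.extract_content_message(record)
        order_id = body.get('order_id')  # assumed payload field
        if order_id is None:
            # Raising reports only this message for retry via reportBatchItemFailures
            raise ValueError("message body is missing 'order_id'")
        self.logger.info(f"Processing order {order_id}")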
aws_python_helper/sqs/fetcher.py
@@ -0,0 +1,111 @@
"""
SQS Fetcher - Dynamically load consumers based on name
"""

import os
import importlib.util
from pathlib import Path

class SQSFetcher:
    """
    Dynamically load SQS consumers

    Searches for consumers as direct files in the 'consumer/' folder
    (relative to the working directory).

    Convention:
        consumer-name -> consumer/consumer_name_consumer.py -> ConsumerNameConsumer

    Examples:
        'user-created' -> consumer/user_created_consumer.py -> UserCreatedConsumer
        'title-indexed' -> consumer/title_indexed_consumer.py -> TitleIndexedConsumer
    """

    CONSUMERS_FOLDER = "consumer"
    _cache = {}

    def __init__(self, consumer_name: str):
        """
        Initialize the fetcher

        Args:
            consumer_name: Name of the consumer in kebab-case (e.g.: 'user-created')
        """
        self.consumer_name = consumer_name

    @property
    def file_path(self) -> str:
        """
        Calculate the path of the consumer file

        Converts 'user-created' to 'user_created_consumer.py'

        Returns:
            Absolute path to the consumer file
        """
        # Convert dashes to underscores for the Python file name
        file_name = self.consumer_name.replace('-', '_') + '_consumer.py'

        base_path = Path(os.getcwd()) / self.CONSUMERS_FOLDER
        file_path = base_path / file_name

        return str(file_path)

    def get_consumer(self):
        """
        Load and return an instance of the consumer

        Returns:
            Instance of the consumer

        Raises:
            FileNotFoundError: If the file does not exist
            ImportError: If the module spec cannot be loaded
            ValueError: If the consumer class is not valid
        """
        file_path = self.file_path

        # Check the cache first
        if file_path in self._cache:
            return self._cache[file_path]()

        # Verify that the file exists
        if not os.path.exists(file_path):
            raise FileNotFoundError(
                f"Consumer not found: {file_path}\n"
                f"Expected file for consumer '{self.consumer_name}' at {file_path}"
            )

        # Load the module dynamically
        spec = importlib.util.spec_from_file_location("consumer_module", file_path)
        if not spec or not spec.loader:
            raise ImportError(f"Could not load module spec from: {file_path}")

        module = importlib.util.module_from_spec(spec)
        spec.loader.exec_module(module)

        # Search for a class that inherits from SQSConsumer
        # Expected class name: 'user-created' -> 'UserCreatedConsumer'
        class_name = ''.join(
            word.capitalize() for word in self.consumer_name.split('-')
        ) + 'Consumer'

        consumer_class = None
        for item_name in dir(module):
            item = getattr(module, item_name)
            if (isinstance(item, type) and
                    hasattr(item, 'process_record') and
                    item.__name__ not in ['SQSConsumer', 'ABC']):
                consumer_class = item
                break

        if not consumer_class:
            raise ValueError(
                f"No SQSConsumer class found in {file_path}\n"
                f"Make sure your file exports a class that inherits from SQSConsumer\n"
                f"Expected class name: {class_name}"
            )

        # Cache the class
        self._cache[file_path] = consumer_class

        # Return a new instance
        return consumer_class()
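To illustrate the loading convention, a hypothetical name would resolve as follows (a sketch assuming the process working directory is the project root, since file_path builds from os.getcwd(); the consumer name reuses the example above):

from aws_python_helper.sqs.fetcher import SQSFetcher

fetcher = SQSFetcher('order-created')
print(fetcher.file_path)            # <cwd>/consumer/order_created_consumer.py
consumer = fetcher.get_consumer()   # imports the file, caches the class,
                                    # and returns OrderCreatedConsumer()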
aws_python_helper/sqs/handler.py
@@ -0,0 +1,138 @@
"""
SQS Handler - Generic reusable handler for SQS consumers
"""

import asyncio
import logging
import sys
from typing import Dict, Any, Callable

from .fetcher import SQSFetcher
from ..utils.serializer import serialize_mongo_types
from ..database.mongo_manager import MongoManager

def setup_logging():
    root_logger = logging.getLogger()
    root_logger.setLevel(logging.INFO)

    # Only configure if there are no handlers yet
    if not root_logger.handlers:
        handler = logging.StreamHandler(sys.stderr)
        handler.setFormatter(
            logging.Formatter('%(asctime)s - %(name)s - %(levelname)s - %(message)s')
        )
        root_logger.addHandler(handler)
    else:
        # If handlers already exist, just update their level
        for handler in root_logger.handlers:
            handler.setLevel(logging.INFO)

# Called once at module import
setup_logging()

logger = logging.getLogger(__name__)

def sqs_handler(consumer_name: str) -> Callable:
    """
    Factory that returns a handler for a specific consumer

    This pattern allows creating specific handlers for each consumer
    while keeping the code DRY.

    Args:
        consumer_name: Name of the consumer (must exist in consumer/)

    Returns:
        Configured handler function for that consumer
    """

    def handler(event: Dict[str, Any], context: Any) -> Dict[str, Any]:
        """
        Generic handler for AWS Lambda SQS

        Args:
            event: SQS event with Records
            context: Lambda context

        Returns:
            Summary of the processing
        """

        # Initialize MongoDB connection (only once, reused in subsequent invocations)
        try:
            if not MongoManager.is_initialized():
                MongoManager.initialize()
        except Exception as e:
            logger.warning(f"MongoDB initialization skipped: {e}")

        try:
            # Load the consumer
            fetcher = SQSFetcher(consumer_name)
            consumer = fetcher.get_consumer()

            # Get the records
            records = event.get('Records', [])

            # Process the batch.
            # Use get_event_loop() instead of asyncio.run() to avoid closing the loop;
            # this is important for AWS Lambda container reuse with Motor/MongoDB.
            try:
                loop = asyncio.get_event_loop()
                if loop.is_closed():
                    loop = asyncio.new_event_loop()
                    asyncio.set_event_loop(loop)
            except RuntimeError:
                loop = asyncio.new_event_loop()
                asyncio.set_event_loop(loop)

            results = loop.run_until_complete(consumer._process_batch_internal(records))

            # Count successes and failures
            success_count = sum(1 for r in results if r['success'])
            error_count = len(results) - success_count

            # Get failed message IDs for reportBatchItemFailures.
            # This allows AWS SQS to retry only failed messages, not the entire batch.
            failed_message_ids = [
                r.get('itemIdentifier') or r.get('messageId')
                for r in results
                if not r.get('success', True)
            ]

            response = {
                'processed': len(results),
                'successful': success_count,
                'failed': error_count,
                'results': results  # Include detailed results
            }

            # If there are failures, add batchItemFailures for partial batch failure
            # reporting. This tells AWS SQS to only retry the failed messages.
            if failed_message_ids:
                response['batchItemFailures'] = [
                    {'itemIdentifier': msg_id} for msg_id in failed_message_ids
                ]
                logger.warning(
                    f"Processing complete with {error_count} failures. "
                    f"Failed messages will be retried: {failed_message_ids}"
                )

            # Serialize MongoDB types to JSON-serializable types.
            # AWS Lambda will serialize the return value to JSON, so we need to ensure
            # all MongoDB types (ObjectId, datetime, etc.) are converted first.
            response = serialize_mongo_types(response)

            return response

        except Exception as e:
            logger.exception(f"Unhandled exception in SQS handler: {e}")

            return {
                'processed': 0,
                'successful': 0,
                'failed': len(event.get('Records', [])),
                'error': str(e)
            }

    return handler
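With this factory, a Lambda entrypoint reduces to one line per consumer, as in this sketch (module and consumer names are illustrative). Note that the queue's event source mapping must enable the ReportBatchItemFailures function response type for the returned batchItemFailures to be honored by AWS.

# handlers.py - one Lambda entrypoint per consumer (hypothetical module)
from aws_python_helper.sqs.handler import sqs_handler

# Point the Lambda function's handler setting at handlers.order_created
order_created = sqs_handler('order-created')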
aws_python_helper/utils/__init__.py
@@ -0,0 +1,9 @@
"""
Utils Module - Utilities for the framework
"""

from .response import ApiResponse
from .json_encoder import MongoJSONEncoder, mongo_json_dumps
from .serializer import serialize_mongo_types

__all__ = ['MongoJSONEncoder', 'ApiResponse', 'mongo_json_dumps', 'serialize_mongo_types']
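A quick usage sketch for these exports, assuming serialize_mongo_types performs the ObjectId/datetime conversion described in the handler's comments (bson ships with pymongo):

from datetime import datetime, timezone
from bson import ObjectId
from aws_python_helper.utils import serialize_mongo_types

doc = {'_id': ObjectId(), 'created_at': datetime.now(timezone.utc)}
print(serialize_mongo_types(doc))  # both values rendered JSON-safe (assumed behavior)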