documente_shared 0.1.145__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- documente_shared/__init__.py +0 -0
- documente_shared/application/__init__.py +0 -0
- documente_shared/application/dates.py +7 -0
- documente_shared/application/digest.py +7 -0
- documente_shared/application/exceptions.py +23 -0
- documente_shared/application/files.py +27 -0
- documente_shared/application/json.py +45 -0
- documente_shared/application/numbers.py +7 -0
- documente_shared/application/payloads.py +29 -0
- documente_shared/application/query_params.py +133 -0
- documente_shared/application/retry_utils.py +69 -0
- documente_shared/application/time_utils.py +13 -0
- documente_shared/application/timezone.py +7 -0
- documente_shared/domain/__init__.py +0 -0
- documente_shared/domain/base_enum.py +54 -0
- documente_shared/domain/constants.py +8 -0
- documente_shared/domain/entities/__init__.py +0 -0
- documente_shared/domain/entities/document.py +410 -0
- documente_shared/domain/entities/document_metadata.py +64 -0
- documente_shared/domain/entities/in_memory_document.py +75 -0
- documente_shared/domain/entities/processing_case.py +215 -0
- documente_shared/domain/entities/processing_case_filters.py +51 -0
- documente_shared/domain/entities/processing_case_item.py +300 -0
- documente_shared/domain/entities/processing_case_item_filters.py +54 -0
- documente_shared/domain/entities/processing_documents.py +11 -0
- documente_shared/domain/entities/processing_event.py +71 -0
- documente_shared/domain/entities/scaling.py +31 -0
- documente_shared/domain/enums/__init__.py +0 -0
- documente_shared/domain/enums/circular_oficio.py +29 -0
- documente_shared/domain/enums/common.py +133 -0
- documente_shared/domain/enums/document.py +124 -0
- documente_shared/domain/enums/document_type_record.py +13 -0
- documente_shared/domain/enums/processing_case.py +66 -0
- documente_shared/domain/exceptions.py +5 -0
- documente_shared/domain/interfaces/__init__.py +0 -0
- documente_shared/domain/interfaces/scaling.py +10 -0
- documente_shared/domain/repositories/__init__.py +0 -0
- documente_shared/domain/repositories/document.py +24 -0
- documente_shared/domain/repositories/processing_case.py +36 -0
- documente_shared/domain/repositories/processing_case_item.py +49 -0
- documente_shared/infrastructure/__init__.py +0 -0
- documente_shared/infrastructure/documente_client.py +27 -0
- documente_shared/infrastructure/dynamo_table.py +75 -0
- documente_shared/infrastructure/lambdas.py +14 -0
- documente_shared/infrastructure/repositories/__init__.py +0 -0
- documente_shared/infrastructure/repositories/dynamo_document.py +43 -0
- documente_shared/infrastructure/repositories/dynamo_processing_case.py +55 -0
- documente_shared/infrastructure/repositories/dynamo_processing_case_item.py +70 -0
- documente_shared/infrastructure/repositories/http_document.py +66 -0
- documente_shared/infrastructure/repositories/http_processing_case.py +82 -0
- documente_shared/infrastructure/repositories/http_processing_case_item.py +118 -0
- documente_shared/infrastructure/repositories/mem_document.py +46 -0
- documente_shared/infrastructure/repositories/mem_processing_case.py +44 -0
- documente_shared/infrastructure/repositories/mem_processing_case_item.py +52 -0
- documente_shared/infrastructure/s3_bucket.py +58 -0
- documente_shared/infrastructure/services/__init__.py +0 -0
- documente_shared/infrastructure/services/http_scaling.py +25 -0
- documente_shared/infrastructure/sqs_queue.py +48 -0
- documente_shared/presentation/__init__.py +0 -0
- documente_shared/presentation/presenters.py +16 -0
- documente_shared-0.1.145.dist-info/METADATA +39 -0
- documente_shared-0.1.145.dist-info/RECORD +63 -0
- documente_shared-0.1.145.dist-info/WHEEL +4 -0
|
@@ -0,0 +1,215 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from datetime import datetime, tzinfo
|
|
3
|
+
from typing import Optional, List
|
|
4
|
+
|
|
5
|
+
from documente_shared.application.time_utils import get_datetime_from_data
|
|
6
|
+
from documente_shared.domain.constants import la_paz_tz
|
|
7
|
+
from documente_shared.domain.entities.processing_case_item import ProcessingCaseItem
|
|
8
|
+
from documente_shared.domain.enums.common import ProcessingStatus
|
|
9
|
+
from documente_shared.domain.enums.processing_case import ProcessingCaseType
|
|
10
|
+
|
|
11
|
+
|
|
12
|
+
@dataclass
class ProcessingCase(object):
    """Aggregate root for a document-processing case.

    Tracks the case lifecycle (pending -> enqueued -> processing ->
    completed / failed / incomplete / ...) together with the
    ``ProcessingCaseItem`` instances that belong to it, and serializes
    itself for the API (``to_dict``), the queue (``to_queue_dict``) and
    the persistence layer (``to_persist_dict``).
    """

    uuid: str
    name: str
    tenant_slug: str
    status: ProcessingStatus
    case_type: ProcessingCaseType
    enqueued_at: Optional[datetime] = None
    started_at: Optional[datetime] = None
    failed_at: Optional[datetime] = None
    feedback: Optional[list | dict] = None
    completed_at: Optional[datetime] = None
    metadata: Optional[dict] = None
    items: Optional[List[ProcessingCaseItem]] = None

    def __post_init__(self):
        # Normalize so every method can assume ``items`` is a list.
        self.items = self.items or []

    def __eq__(self, other: 'ProcessingCase') -> bool:
        # Compares identity and lifecycle fields only; ``tenant_slug``
        # and ``items`` are not part of the comparison.
        if not other:
            return False

        return (
            self.uuid == other.uuid
            and self.name == other.name
            and self.status == other.status
            and self.case_type == other.case_type
            and self.enqueued_at == other.enqueued_at
            and self.started_at == other.started_at
            and self.failed_at == other.failed_at
            and self.feedback == other.feedback
            and self.completed_at == other.completed_at
            and self.metadata == other.metadata
        )

    @property
    def strategy_id(self) -> str:
        """Identifier used to select the processing strategy for this case."""
        return str(self.case_type)

    @property
    def is_procesable(self) -> bool:
        """True when the case has at least one item.

        Coerced with ``bool`` so an empty case yields ``False`` — the
        original returned the (falsy) empty list itself despite the
        ``bool`` annotation.
        """
        return bool(self.items)

    @property
    def is_queue_procesable(self) -> bool:
        """True when at least one item is still PENDING."""
        return len(self.pending_items) > 0

    @property
    def pending_items(self) -> List[ProcessingCaseItem]:
        """Items whose status is PENDING."""
        return [
            item for item in self.items
            if item.status == ProcessingStatus.PENDING
        ]

    @property
    def is_bcp_microcredito(self) -> bool:
        # bool(...) so a missing case_type yields False, not None.
        return bool(self.case_type and self.case_type.is_bcp_microcredito)

    @property
    def is_univida_soat(self) -> bool:
        # bool(...) so a missing case_type yields False, not None.
        return bool(self.case_type and self.case_type.is_univida_soat)

    @property
    def to_dict(self) -> dict:
        """API-facing representation; enums stringified, datetimes ISO-8601."""
        return {
            'uuid': self.uuid,
            'tenant_slug': self.tenant_slug,
            'name': self.name,
            'status': str(self.status),
            'case_type': (
                str(self.case_type)
                if self.case_type else None
            ),
            'enqueued_at': self.enqueued_at.isoformat() if self.enqueued_at else None,
            'started_at': self.started_at.isoformat() if self.started_at else None,
            'failed_at': self.failed_at.isoformat() if self.failed_at else None,
            'feedback': self.feedback,
            'completed_at': self.completed_at.isoformat() if self.completed_at else None,
            'metadata': self.metadata,
            'items': [item.to_dict for item in self.items],
        }

    @property
    def to_queue_dict(self) -> dict:
        """Queue payload: like ``to_dict`` but items use their queue form."""
        data = self.to_dict
        data["items"] = [
            item.to_queue_dict for item in self.items
        ]
        return data

    @property
    def to_persist_dict(self) -> dict:
        """Persistence payload: like ``to_dict`` with full item dicts."""
        persist_data = self.to_dict
        persist_data["items"] = [
            item.to_dict for item in self.items
        ]
        return persist_data

    @property
    def procesable_items(self) -> List[ProcessingCaseItem]:
        """Items that can still be processed (PENDING or ENQUEUED)."""
        return [
            item for item in self.items
            if item.status in [
                ProcessingStatus.PENDING,
                ProcessingStatus.ENQUEUED,
            ]
        ]

    @property
    def has_procesable_items(self) -> bool:
        return len(self.procesable_items) > 0

    def pending(self, timezone: tzinfo = la_paz_tz):
        """Reset the case to PENDING and clear the start timestamp."""
        # NOTE(review): ``timezone`` is accepted but unused here (kept for
        # signature symmetry with the other transitions) — confirm intended.
        self.status = ProcessingStatus.PENDING
        self.started_at = None

    def enqueue(self, timezone: tzinfo = la_paz_tz):
        """Mark the case ENQUEUED and stamp ``enqueued_at``."""
        self.status = ProcessingStatus.ENQUEUED
        self.enqueued_at = datetime.now(tz=timezone)

    def processing(self, timezone: tzinfo = la_paz_tz):
        """Mark the case PROCESSING and stamp ``started_at``."""
        self.status = ProcessingStatus.PROCESSING
        self.started_at = datetime.now(tz=timezone)

    def failed(
        self,
        error_message: Optional[str] = None,
        timezone: tzinfo = la_paz_tz,
    ):
        """Mark the case FAILED and stamp ``failed_at``.

        NOTE(review): ``error_message`` is accepted but currently not
        stored anywhere — confirm whether it should be appended to
        ``feedback`` or ``metadata``.
        """
        self.status = ProcessingStatus.FAILED
        self.failed_at = datetime.now(tz=timezone)

    def incomplete(self, timezone: tzinfo = la_paz_tz):
        """Mark the case INCOMPLETE."""
        self.status = ProcessingStatus.INCOMPLETE
        # NOTE(review): ``updated_at`` is not a declared dataclass field and
        # is not serialized by ``to_dict`` — confirm this is intentional.
        self.updated_at = datetime.now(tz=timezone)

    def in_reviewed(self, timezone: tzinfo = la_paz_tz):
        """Mark the case IN_REVIEW."""
        self.status = ProcessingStatus.IN_REVIEW
        self.updated_at = datetime.now(tz=timezone)

    def cancelled(self, timezone: tzinfo = la_paz_tz):
        """Mark the case CANCELLED."""
        self.status = ProcessingStatus.CANCELLED
        self.updated_at = datetime.now(tz=timezone)

    def completed(self, timezone: tzinfo = la_paz_tz):
        """Mark the case COMPLETED and stamp ``completed_at``."""
        self.status = ProcessingStatus.COMPLETED
        self.completed_at = datetime.now(tz=timezone)

    def deleted(self):
        """Soft-delete the case."""
        self.status = ProcessingStatus.DELETED

    def refresh_status(self):
        """Recompute the case status from its items' statuses.

        Priority order: any FAILED -> INCOMPLETE; any PROCESSING ->
        PROCESSING; any INCOMPLETE -> INCOMPLETE; all COMPLETED ->
        COMPLETED; anything else (including all PENDING) -> PENDING.
        No-op when the case has no items.
        """
        if not self.items:
            return

        item_statuses = [item.status for item in self.items]

        if any(status == ProcessingStatus.FAILED for status in item_statuses):
            self.status = ProcessingStatus.INCOMPLETE
        elif any(status == ProcessingStatus.PROCESSING for status in item_statuses):
            self.status = ProcessingStatus.PROCESSING
        elif any(status == ProcessingStatus.INCOMPLETE for status in item_statuses):
            self.status = ProcessingStatus.INCOMPLETE
        elif all(status == ProcessingStatus.COMPLETED for status in item_statuses):
            self.status = ProcessingStatus.COMPLETED
        else:
            # Covers the all-PENDING case and any other mix; the original
            # had a separate all-PENDING branch with this same outcome.
            self.status = ProcessingStatus.PENDING

    @classmethod
    def from_dict(cls, data: dict) -> 'ProcessingCase':
        """Build a case from an API-style dict (inverse of ``to_dict``)."""
        return cls(
            uuid=data.get('uuid'),
            name=data.get('name'),
            tenant_slug=data.get('tenant_slug'),
            status=ProcessingStatus.from_value(data.get('status')),
            case_type=(
                ProcessingCaseType.from_value(data.get('case_type'))
                if data.get('case_type') else None
            ),
            enqueued_at=get_datetime_from_data(input_datetime=data.get('enqueued_at')),
            started_at=get_datetime_from_data(input_datetime=data.get('started_at')),
            failed_at=get_datetime_from_data(input_datetime=data.get('failed_at')),
            feedback=data.get('feedback'),
            metadata=data.get('metadata', {}),
            completed_at=get_datetime_from_data(input_datetime=data.get('completed_at')),
            items=[
                ProcessingCaseItem.from_dict(item_dict)
                for item_dict in data.get('items', [])
            ],
        )

    @classmethod
    def from_persist_dict(cls, data: dict) -> 'ProcessingCase':
        """Build a case from a persistence dict; items use their persist form."""
        instance = cls.from_dict(data)
        instance.items = [
            ProcessingCaseItem.from_persist_dict(item_dict)
            for item_dict in data.get('items', [])
        ]
        return instance
|
|
215
|
+
|
|
@@ -0,0 +1,51 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from datetime import datetime
|
|
3
|
+
from typing import List, Optional
|
|
4
|
+
|
|
5
|
+
from documente_shared.domain.enums.common import ProcessingStatus
|
|
6
|
+
from documente_shared.domain.enums.processing_case import ProcessingCaseType
|
|
7
|
+
from documente_shared.application.query_params import QueryParams
|
|
8
|
+
|
|
9
|
+
|
|
10
|
+
@dataclass
class ProcessingCaseFilters(object):
    """Query filters for listing ``ProcessingCase`` records.

    All fields are optional; ``__post_init__`` normalizes the list
    fields to empty lists and defaults ``sort_order`` to ``"desc"``.
    """

    case_ids: Optional[List[str]] = None
    sort_order: Optional[str] = None
    search: Optional[str] = None
    init_date: Optional[datetime] = None
    end_date: Optional[datetime] = None
    statuses: Optional[List[ProcessingStatus]] = None
    case_types: Optional[List[ProcessingCaseType]] = None
    include_archived: bool = False
    tenant_slug: Optional[str] = None

    def __post_init__(self):
        # Normalize optional collections / defaults so consumers never
        # have to handle None.
        self.case_ids = self.case_ids or []
        self.statuses = self.statuses or []
        self.case_types = self.case_types or []
        self.sort_order = self.sort_order or "desc"

    @classmethod
    def from_params(cls, params: QueryParams) -> "ProcessingCaseFilters":
        """Build filters from HTTP query params.

        Note: ``tenant_slug`` is not read from ``params``; callers set it
        separately.
        """
        search_term = params.get_str(key="search", default=None)
        # Use cls(...) instead of the hard-coded class name so subclasses
        # build instances of themselves (consistent with
        # ProcessingCaseItemFilters.from_params).
        return cls(
            case_ids=params.get_uuid_list(key="case_ids", default=None),
            sort_order=params.get(key="sort", default="desc"),
            search=search_term.strip() if search_term else None,
            init_date=params.get_datetime(key="init_date", default=None),
            end_date=params.get_datetime(key="end_date", default=None),
            statuses=params.get_enum_list(
                key="statuses",
                enum_class=ProcessingStatus,
                default=None,
            ),
            case_types=params.get_enum_list(
                key="case_types",
                enum_class=ProcessingCaseType,
                default=None,
            ),
            include_archived=params.get_bool(
                key="include_archived",
                default=False,
            ),
        )
|
|
@@ -0,0 +1,300 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from datetime import datetime, tzinfo
|
|
3
|
+
from decimal import Decimal
|
|
4
|
+
from typing import Optional, List
|
|
5
|
+
|
|
6
|
+
from documente_shared.application.numbers import normalize_number
|
|
7
|
+
from documente_shared.application.time_utils import get_datetime_from_data
|
|
8
|
+
from documente_shared.domain.constants import la_paz_tz
|
|
9
|
+
from documente_shared.domain.entities.in_memory_document import InMemoryDocument
|
|
10
|
+
from documente_shared.domain.enums.common import ProcessingStatus, ProcessingSource
|
|
11
|
+
from documente_shared.domain.enums.processing_case import ProcessingDocumentType
|
|
12
|
+
|
|
13
|
+
|
|
14
|
+
@dataclass
class ProcessingCaseItem(object):
    """A single document inside a ``ProcessingCase``.

    Holds the source document, the processed artifacts (csv / xlsx /
    json), processing metrics and lifecycle timestamps, plus
    serialization helpers for API (``to_dict``), queue
    (``to_queue_dict``) and persistence (``to_persist_dict``) payloads.
    """

    uuid: str
    case_id: str
    digest: str
    status: ProcessingStatus
    name: Optional[str] = None
    document: Optional[InMemoryDocument] = None
    document_type: Optional[ProcessingDocumentType] = None
    uploaded_from: Optional[ProcessingSource] = None
    processed_csv: Optional[InMemoryDocument] = None
    processed_xlsx: Optional[InMemoryDocument] = None
    processed_json: Optional[InMemoryDocument] = None
    processing_time: Optional[Decimal] = None
    processing_confidence: Optional[Decimal] = None
    uploaded_at: Optional[datetime] = None
    started_at: Optional[datetime] = None
    failed_at: Optional[datetime] = None
    completed_at: Optional[datetime] = None
    feedback: Optional[list | dict] = None
    metadata: Optional[dict] = None

    def __post_init__(self):
        # Normalize optional containers so callers can use them directly.
        self.feedback = self.feedback or []
        self.metadata = self.metadata or {}

    def __eq__(self, other: 'ProcessingCaseItem') -> bool:
        # Compares identity, status and timestamps; processed artifacts,
        # feedback and metadata are not part of the comparison.
        if not other:
            return False

        return (
            self.uuid == other.uuid
            and self.digest == other.digest
            and self.status == other.status
            and self.document_type == other.document_type
            and self.document == other.document
            and self.processing_time == other.processing_time
            and self.processing_confidence == other.processing_confidence
            and self.uploaded_at == other.uploaded_at
            and self.started_at == other.started_at
            and self.failed_at == other.failed_at
            and self.completed_at == other.completed_at
        )

    def pending(self, timezone: tzinfo = la_paz_tz):
        """Reset the item to PENDING and clear the start timestamp."""
        # NOTE(review): ``timezone`` is accepted but unused here (kept for
        # signature symmetry with the other transitions) — confirm intended.
        self.status = ProcessingStatus.PENDING
        self.started_at = None

    def processing(self, timezone: tzinfo = la_paz_tz):
        """Mark the item PROCESSING and stamp ``started_at``."""
        self.status = ProcessingStatus.PROCESSING
        self.started_at = datetime.now(tz=timezone)

    def failed(
        self,
        error_message: Optional[str] = None,
        timezone: tzinfo = la_paz_tz,
    ):
        """Mark the item FAILED and stamp ``failed_at``.

        NOTE(review): ``error_message`` is accepted but currently not
        stored anywhere — confirm whether it should be recorded in
        ``feedback`` or ``metadata``.
        """
        self.status = ProcessingStatus.FAILED
        self.failed_at = datetime.now(tz=timezone)

    def completed(self, timezone: tzinfo = la_paz_tz):
        """Mark the item COMPLETED and stamp ``completed_at``."""
        self.status = ProcessingStatus.COMPLETED
        self.completed_at = datetime.now(tz=timezone)

    def incomplete(self, timezone: tzinfo = la_paz_tz):
        """Mark the item INCOMPLETE; also stamps ``completed_at``."""
        self.status = ProcessingStatus.INCOMPLETE
        self.completed_at = datetime.now(tz=timezone)

    def deleted(self):
        """Soft-delete the item."""
        self.status = ProcessingStatus.DELETED

    def in_review(self):
        """Mark the item IN_REVIEW."""
        self.status = ProcessingStatus.IN_REVIEW

    def overload(
        self,
        new_instance: 'ProcessingCaseItem',
        properties: List[str] = None,
    ):
        """Copy the given properties from ``new_instance`` onto self.

        Defaults to every mutable property except the identity fields
        (``uuid``, ``case_id``, ``digest``). Returns self for chaining.
        """
        instance_properties = properties or [
            'status',
            'name',
            'document',
            'document_type',
            'uploaded_from',
            'processed_csv',
            'processed_xlsx',
            'processed_json',
            'processing_time',
            'processing_confidence',
            'uploaded_at',
            'started_at',
            'failed_at',
            'completed_at',
            'feedback',
            'metadata',
        ]
        for _property in instance_properties:
            # Guard before reading: skip names this instance doesn't have
            # (the original read from new_instance before the check).
            if not hasattr(self, _property):
                continue
            setattr(self, _property, getattr(new_instance, _property))
        return self

    @property
    def combined_id(self) -> str:
        """Composite key: ``<case_id>__<uuid>``."""
        return f"{self.case_id}__{self.uuid}"

    @property
    def has_processed_csv(self) -> bool:
        # bool(...) so a missing artifact yields False, not None.
        return bool(self.processed_csv and self.processed_csv.is_valid)

    @property
    def has_processed_xlsx(self) -> bool:
        # bool(...) so a missing artifact yields False, not None.
        return bool(self.processed_xlsx and self.processed_xlsx.is_valid)

    @property
    def has_processed_json(self) -> bool:
        # bool(...) so a missing artifact yields False, not None.
        return bool(self.processed_json and self.processed_json.is_valid)

    @property
    def is_procesable(self) -> bool:
        """True when the item is PENDING/ENQUEUED and has a usable document.

        Coerced with ``bool`` — the original could return a falsy non-bool
        operand (e.g. ``None`` or ``''``) despite the ``bool`` annotation.
        """
        return bool(
            (self.status.is_pending or self.status.is_enqueued)
            and self.digest
            and self.document
            and self.document.is_procesable
        )

    @property
    def is_finished(self) -> bool:
        """True once the item reached a terminal status."""
        return self.status in [
            ProcessingStatus.COMPLETED,
            ProcessingStatus.FAILED,
        ]

    @property
    def to_dict(self) -> dict:
        """API-facing representation; enums stringified, datetimes ISO-8601,
        nested documents via their ``to_dict``."""
        return {
            'uuid': self.uuid,
            'case_id': self.case_id,
            'digest': self.digest,
            'status': str(self.status),
            'name': self.name,
            'document': (
                self.document.to_dict
                if self.document else None
            ),
            'document_type': (
                str(self.document_type)
                if self.document_type else None
            ),
            'uploaded_from': (
                str(self.uploaded_from)
                if self.uploaded_from else None
            ),
            'processed_csv': (
                self.processed_csv.to_dict
                if self.processed_csv else None
            ),
            'processed_xlsx': (
                self.processed_xlsx.to_dict
                if self.processed_xlsx else None
            ),
            'processed_json': (
                self.processed_json.to_dict
                if self.processed_json else None
            ),
            'processing_time': (
                normalize_number(self.processing_time)
                if self.processing_time else None
            ),
            'processing_confidence': (
                normalize_number(self.processing_confidence)
                if self.processing_confidence else None
            ),
            'uploaded_at': (
                self.uploaded_at.isoformat()
                if self.uploaded_at else None
            ),
            'started_at': (
                self.started_at.isoformat()
                if self.started_at else None
            ),
            'failed_at': (
                self.failed_at.isoformat()
                if self.failed_at else None
            ),
            'feedback': self.feedback,
            'metadata': self.metadata,
            'completed_at': (
                self.completed_at.isoformat()
                if self.completed_at else None
            ),
        }

    @property
    def to_simple_dict(self) -> dict:
        """Currently identical to ``to_dict`` (kept as a separate hook)."""
        simple_dict = self.to_dict.copy()
        return simple_dict

    @property
    def to_queue_dict(self) -> dict:
        """Queue payload: like ``to_dict`` but documents use their queue form."""
        queue_dict = self.to_dict.copy()
        queue_dict["document"] = (
            self.document.to_queue_dict
            if self.document else None
        )
        queue_dict["processed_csv"] = (
            self.processed_csv.to_queue_dict
            if self.processed_csv else None
        )
        queue_dict["processed_xlsx"] = (
            self.processed_xlsx.to_queue_dict
            if self.processed_xlsx else None
        )
        queue_dict["processed_json"] = (
            self.processed_json.to_queue_dict
            if self.processed_json else None
        )
        return queue_dict

    @property
    def to_persist_dict(self) -> dict:
        """Persistence payload: currently the same as ``to_dict``."""
        return self.to_dict

    @classmethod
    def from_dict(cls, data: dict) -> 'ProcessingCaseItem':
        """Build an item from an API-style dict (inverse of ``to_dict``)."""
        return cls(
            uuid=data.get('uuid'),
            case_id=data.get('case_id'),
            digest=data.get('digest'),
            status=ProcessingStatus.from_value(data.get('status')),
            name=data.get('name'),
            document=(
                InMemoryDocument.from_dict(data.get('document'))
                if data.get('document') else None
            ),
            document_type=(
                ProcessingDocumentType.from_value(data.get('document_type'))
                if data.get('document_type') else None
            ),
            uploaded_from=(
                ProcessingSource.from_value(data.get('uploaded_from'))
                if data.get('uploaded_from') else None
            ),
            processed_csv=(
                InMemoryDocument.from_dict(data.get('processed_csv'))
                if data.get('processed_csv') else None
            ),
            processed_xlsx=(
                InMemoryDocument.from_dict(data.get('processed_xlsx'))
                if data.get('processed_xlsx') else None
            ),
            processed_json=(
                InMemoryDocument.from_dict(data.get('processed_json'))
                if data.get('processed_json') else None
            ),
            processing_time=(
                Decimal(data.get('processing_time'))
                if data.get('processing_time') else None
            ),
            processing_confidence=(
                Decimal(data.get('processing_confidence'))
                if data.get('processing_confidence') else None
            ),
            uploaded_at=get_datetime_from_data(input_datetime=data.get('uploaded_at')),
            started_at=get_datetime_from_data(input_datetime=data.get('started_at')),
            failed_at=get_datetime_from_data(input_datetime=data.get('failed_at')),
            feedback=data.get('feedback'),
            metadata=data.get('metadata', {}),
            completed_at=get_datetime_from_data(input_datetime=data.get('completed_at')),
        )

    @classmethod
    def from_persist_dict(cls, data: dict) -> 'ProcessingCaseItem':
        """Build an item from a persistence dict.

        ``*_path`` keys, when present, override the corresponding document
        with a path-only ``InMemoryDocument``.
        """
        instance = cls.from_dict(data)
        if "document_path" in data:
            instance.document = InMemoryDocument(file_path=data["document_path"])
        if "processed_csv_path" in data:
            instance.processed_csv = InMemoryDocument(file_path=data["processed_csv_path"])
        if "processed_xlsx_path" in data:
            instance.processed_xlsx = InMemoryDocument(file_path=data["processed_xlsx_path"])
        if "processed_json_path" in data:
            instance.processed_json = InMemoryDocument(file_path=data["processed_json_path"])
        return instance
|
|
@@ -0,0 +1,54 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from datetime import datetime
|
|
3
|
+
from typing import List, Optional
|
|
4
|
+
|
|
5
|
+
from documente_shared.application.query_params import QueryParams
|
|
6
|
+
from documente_shared.domain.enums.common import ProcessingStatus
|
|
7
|
+
from documente_shared.domain.enums.document import (
|
|
8
|
+
DocumentProcessingStatus,
|
|
9
|
+
)
|
|
10
|
+
from documente_shared.domain.enums.processing_case import ProcessingDocumentType
|
|
11
|
+
|
|
12
|
+
|
|
13
|
+
@dataclass
class ProcessingCaseItemFilters(object):
    """Query filters for listing ``ProcessingCaseItem`` records.

    All fields are optional; ``__post_init__`` normalizes the list
    fields to empty lists and defaults ``sort_order`` to ``"desc"``.
    """

    sort_order: Optional[str] = None
    search: Optional[str] = None
    init_date: Optional[datetime] = None
    end_date: Optional[datetime] = None
    case_id: Optional[str] = None
    statuses: Optional[List[ProcessingStatus]] = None
    document_types: Optional[List[ProcessingDocumentType]] = None
    include_archived: bool = False
    tenant_slug: Optional[str] = None

    def __post_init__(self):
        # Normalize optional collections / defaults so consumers never
        # have to handle None.
        self.statuses = self.statuses or []
        self.document_types = self.document_types or []
        self.sort_order = self.sort_order or "desc"

    @classmethod
    def from_params(cls, params: QueryParams) -> "ProcessingCaseItemFilters":
        """Build filters from HTTP query params.

        Note: ``tenant_slug`` is not read from ``params``; callers set it
        separately.
        """
        search_term = params.get_str(key="search", default=None)
        return cls(
            sort_order=params.get(key="sort", default="desc"),
            search=search_term.strip() if search_term else None,
            init_date=params.get_datetime(key="init_date", default=None),
            end_date=params.get_datetime(key="end_date", default=None),
            case_id=params.get_str(key="case_id", default=None),
            statuses=params.get_enum_list(
                key="statuses",
                # Fixed: the original parsed with DocumentProcessingStatus,
                # which contradicts the declared field type
                # (List[ProcessingStatus]) and the sibling
                # ProcessingCaseFilters. Confirm against callers.
                enum_class=ProcessingStatus,
                default=None,
            ),
            document_types=params.get_enum_list(
                key="document_types",
                enum_class=ProcessingDocumentType,
                default=None,
            ),
            include_archived=params.get_bool(
                key="include_archived",
                default=False,
            ),
        )
|
|
@@ -0,0 +1,11 @@
|
|
|
1
|
+
from dataclasses import dataclass
|
|
2
|
+
from typing import Optional
|
|
3
|
+
|
|
4
|
+
from documente_shared.domain.entities.in_memory_document import InMemoryDocument
|
|
5
|
+
|
|
6
|
+
|
|
7
|
+
@dataclass
class ProcessedDocuments(object):
    """Container grouping the processed artifacts of one document.

    Pure value holder: each field is an optional ``InMemoryDocument``
    for one output format (CSV, XLSX, JSON); any of them may be None
    when that artifact was not produced.
    """
    # CSV artifact, if produced.
    processed_csv: Optional[InMemoryDocument] = None
    # XLSX artifact, if produced.
    processed_xlsx: Optional[InMemoryDocument] = None
    # JSON artifact, if produced.
    processed_json: Optional[InMemoryDocument] = None
|