jaf_py-2.5.10-py3-none-any.whl → jaf_py-2.5.11-py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- jaf/__init__.py +154 -57
- jaf/a2a/__init__.py +42 -21
- jaf/a2a/agent.py +79 -126
- jaf/a2a/agent_card.py +87 -78
- jaf/a2a/client.py +30 -66
- jaf/a2a/examples/client_example.py +12 -12
- jaf/a2a/examples/integration_example.py +38 -47
- jaf/a2a/examples/server_example.py +56 -53
- jaf/a2a/memory/__init__.py +0 -4
- jaf/a2a/memory/cleanup.py +28 -21
- jaf/a2a/memory/factory.py +155 -133
- jaf/a2a/memory/providers/composite.py +21 -26
- jaf/a2a/memory/providers/in_memory.py +89 -83
- jaf/a2a/memory/providers/postgres.py +117 -115
- jaf/a2a/memory/providers/redis.py +128 -121
- jaf/a2a/memory/serialization.py +77 -87
- jaf/a2a/memory/tests/run_comprehensive_tests.py +112 -83
- jaf/a2a/memory/tests/test_cleanup.py +211 -94
- jaf/a2a/memory/tests/test_serialization.py +73 -68
- jaf/a2a/memory/tests/test_stress_concurrency.py +186 -133
- jaf/a2a/memory/tests/test_task_lifecycle.py +138 -120
- jaf/a2a/memory/types.py +91 -53
- jaf/a2a/protocol.py +95 -125
- jaf/a2a/server.py +90 -118
- jaf/a2a/standalone_client.py +30 -43
- jaf/a2a/tests/__init__.py +16 -33
- jaf/a2a/tests/run_tests.py +17 -53
- jaf/a2a/tests/test_agent.py +40 -140
- jaf/a2a/tests/test_client.py +54 -117
- jaf/a2a/tests/test_integration.py +28 -82
- jaf/a2a/tests/test_protocol.py +54 -139
- jaf/a2a/tests/test_types.py +50 -136
- jaf/a2a/types.py +58 -34
- jaf/cli.py +21 -41
- jaf/core/__init__.py +7 -1
- jaf/core/agent_tool.py +93 -72
- jaf/core/analytics.py +257 -207
- jaf/core/checkpoint.py +223 -0
- jaf/core/composition.py +249 -235
- jaf/core/engine.py +817 -519
- jaf/core/errors.py +55 -42
- jaf/core/guardrails.py +276 -202
- jaf/core/handoff.py +47 -31
- jaf/core/parallel_agents.py +69 -75
- jaf/core/performance.py +75 -73
- jaf/core/proxy.py +43 -44
- jaf/core/proxy_helpers.py +24 -27
- jaf/core/regeneration.py +220 -129
- jaf/core/state.py +68 -66
- jaf/core/streaming.py +115 -108
- jaf/core/tool_results.py +111 -101
- jaf/core/tools.py +114 -116
- jaf/core/tracing.py +269 -210
- jaf/core/types.py +371 -151
- jaf/core/workflows.py +209 -168
- jaf/exceptions.py +46 -38
- jaf/memory/__init__.py +1 -6
- jaf/memory/approval_storage.py +54 -77
- jaf/memory/factory.py +4 -4
- jaf/memory/providers/in_memory.py +216 -180
- jaf/memory/providers/postgres.py +216 -146
- jaf/memory/providers/redis.py +173 -116
- jaf/memory/types.py +70 -51
- jaf/memory/utils.py +36 -34
- jaf/plugins/__init__.py +12 -12
- jaf/plugins/base.py +105 -96
- jaf/policies/__init__.py +0 -1
- jaf/policies/handoff.py +37 -46
- jaf/policies/validation.py +76 -52
- jaf/providers/__init__.py +6 -3
- jaf/providers/mcp.py +97 -51
- jaf/providers/model.py +360 -279
- jaf/server/__init__.py +1 -1
- jaf/server/main.py +7 -11
- jaf/server/server.py +514 -359
- jaf/server/types.py +208 -52
- jaf/utils/__init__.py +17 -18
- jaf/utils/attachments.py +111 -116
- jaf/utils/document_processor.py +175 -174
- jaf/visualization/__init__.py +1 -1
- jaf/visualization/example.py +111 -110
- jaf/visualization/functional_core.py +46 -71
- jaf/visualization/graphviz.py +154 -189
- jaf/visualization/imperative_shell.py +7 -16
- jaf/visualization/types.py +8 -4
- {jaf_py-2.5.10.dist-info → jaf_py-2.5.11.dist-info}/METADATA +2 -2
- jaf_py-2.5.11.dist-info/RECORD +97 -0
- jaf_py-2.5.10.dist-info/RECORD +0 -96
- {jaf_py-2.5.10.dist-info → jaf_py-2.5.11.dist-info}/WHEEL +0 -0
- {jaf_py-2.5.10.dist-info → jaf_py-2.5.11.dist-info}/entry_points.txt +0 -0
- {jaf_py-2.5.10.dist-info → jaf_py-2.5.11.dist-info}/licenses/LICENSE +0 -0
- {jaf_py-2.5.10.dist-info → jaf_py-2.5.11.dist-info}/top_level.txt +0 -0
jaf/utils/document_processor.py
CHANGED
@@ -15,12 +15,14 @@ from typing import Dict, Any, Optional, List
 
 try:
     import aiofiles
+
     HAS_AIOFILES = True
 except ImportError:
     HAS_AIOFILES = False
 
 try:
     import httpx
+
     HAS_HTTPX = True
 except ImportError:
     HAS_HTTPX = False
@@ -31,30 +33,35 @@ from ..core.types import Attachment
 # Optional imports with graceful fallbacks
 try:
     import PyPDF2
+
     HAS_PDF = True
 except ImportError:
     HAS_PDF = False
 
 try:
     from docx import Document
+
     HAS_DOCX = True
 except ImportError:
     HAS_DOCX = False
 
 try:
     from openpyxl import load_workbook
+
     HAS_EXCEL = True
 except ImportError:
     HAS_EXCEL = False
 
 try:
     import magic
+
     HAS_MAGIC = True
 except ImportError:
     HAS_MAGIC = False
 
 try:
     from PIL import Image
+
     HAS_PIL = True
 except ImportError:
     HAS_PIL = False
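Both hunks apply the same optional-dependency pattern: each import is attempted once at module load, and a HAS_* flag records the outcome so later code can raise an actionable install hint instead of an ImportError at call time. A minimal sketch of the pattern as it appears above; the `extract_pdf_text` helper is hypothetical, not part of jaf-py:

```python
import io

try:
    import PyPDF2

    HAS_PDF = True
except ImportError:
    HAS_PDF = False


def extract_pdf_text(data: bytes) -> str:
    """Hypothetical helper: fail with an install hint when the extra is missing."""
    if not HAS_PDF:
        raise RuntimeError(
            "PDF processing not available. Install with: pip install 'jaf-py[attachments]'"
        )
    reader = PyPDF2.PdfReader(io.BytesIO(data))
    return "\n".join(page.extract_text() for page in reader.pages)
```

The blank lines inserted after each guarded import appear to be formatter-driven (isort/ruff style) and do not change behavior.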
@@ -70,7 +77,7 @@ MAX_EXCEL_ROWS_PER_SHEET = 20
 
 class DocumentProcessingError(Exception):
     """Exception raised when document processing fails."""
-
+
     def __init__(self, message: str, cause: Optional[Exception] = None):
         super().__init__(message)
         self.cause = cause
@@ -78,7 +85,7 @@ class DocumentProcessingError(Exception):
 
 class NetworkError(Exception):
     """Exception raised when network operations fail."""
-
+
     def __init__(self, message: str, status_code: Optional[int] = None):
         super().__init__(message)
         self.status_code = status_code
@@ -86,6 +93,7 @@ class NetworkError(Exception):
 
 class ProcessedDocument(BaseModel):
     """Result of document processing."""
+
     content: str
     metadata: Optional[Dict[str, Any]] = None
 
@@ -93,13 +101,13 @@ class ProcessedDocument(BaseModel):
 async def _fetch_url_content(url: str) -> tuple[bytes, Optional[str]]:
     """
     Fetch content from URL and return as bytes with content type.
-
+
     Args:
         url: URL to fetch
-
+
     Returns:
         Tuple of (content_bytes, content_type)
-
+
     Raises:
         NetworkError: If fetch fails
         DocumentProcessingError: If file is too large
@@ -108,20 +116,20 @@ async def _fetch_url_content(url: str) -> tuple[bytes, Optional[str]]:
         raise DocumentProcessingError(
             "URL fetching not available. Install with: pip install 'jaf-py[attachments]'"
         )
-
+
     try:
         async with httpx.AsyncClient(timeout=FETCH_TIMEOUT) as client:
             # First check content length with a HEAD request if possible
            try:
                 head_response = await client.head(
                     url,
-                    headers={'User-Agent': 'JAF-DocumentProcessor/1.0'},
-                    timeout=FETCH_TIMEOUT / 2  # Shorter timeout for HEAD request
+                    headers={"User-Agent": "JAF-DocumentProcessor/1.0"},
+                    timeout=FETCH_TIMEOUT / 2,  # Shorter timeout for HEAD request
                 )
                 head_response.raise_for_status()
-
+
                 # Check Content-Length header if present
-                content_length_str = head_response.headers.get('content-length')
+                content_length_str = head_response.headers.get("content-length")
                 if content_length_str and content_length_str.isdigit():
                     content_length = int(content_length_str)
                     if content_length > MAX_DOCUMENT_SIZE:
@@ -133,18 +141,16 @@ async def _fetch_url_content(url: str) -> tuple[bytes, Optional[str]]:
             except (httpx.HTTPStatusError, httpx.RequestError):
                 # HEAD request failed, we'll check size during streaming
                 pass
-
+
             # Stream the response to validate size as we download
             content_type = None
             accumulated_bytes = bytearray()
             async with client.stream(
-                'GET',
-                url,
-                headers={'User-Agent': 'JAF-DocumentProcessor/1.0'}
+                "GET", url, headers={"User-Agent": "JAF-DocumentProcessor/1.0"}
             ) as response:
                 response.raise_for_status()
-                content_type = response.headers.get(
-                    'content-type')
+                content_type = response.headers.get("content-type")
+
                 # Process the response in chunks
                 async for chunk in response.aiter_bytes(chunk_size=8192):
                     accumulated_bytes.extend(chunk)
@@ -154,11 +160,13 @@ async def _fetch_url_content(url: str) -> tuple[bytes, Optional[str]]:
                         raise DocumentProcessingError(
                             f"File size ({size_mb}MB) exceeds maximum allowed size ({max_mb}MB)"
                         )
-
+
            return bytes(accumulated_bytes), content_type
-
+
     except httpx.HTTPStatusError as e:
-        raise NetworkError(f"HTTP {e.response.status_code}: {e.response.reason_phrase}", e.response.status_code)
+        raise NetworkError(
+            f"HTTP {e.response.status_code}: {e.response.reason_phrase}", e.response.status_code
+        )
     except httpx.RequestError as e:
         raise NetworkError(f"Failed to fetch URL content: {e}", cause=e)
     except Exception as e:
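The reformatted function enforces MAX_DOCUMENT_SIZE twice: once cheaply via the HEAD request's Content-Length, then authoritatively while streaming the body, since Content-Length can be absent or wrong. A condensed, self-contained sketch of the streaming check; the constant values here are placeholders, not jaf-py's actual settings:

```python
from typing import Optional, Tuple

import httpx

FETCH_TIMEOUT = 30.0  # placeholder value
MAX_DOCUMENT_SIZE = 10 * 1024 * 1024  # placeholder value


async def fetch_limited(url: str) -> Tuple[bytes, Optional[str]]:
    """Download a URL, aborting as soon as the body exceeds the size cap."""
    async with httpx.AsyncClient(timeout=FETCH_TIMEOUT) as client:
        buf = bytearray()
        async with client.stream("GET", url) as response:
            response.raise_for_status()
            content_type = response.headers.get("content-type")
            async for chunk in response.aiter_bytes(chunk_size=8192):
                buf.extend(chunk)
                if len(buf) > MAX_DOCUMENT_SIZE:
                    raise ValueError("download exceeds maximum allowed size")
        return bytes(buf), content_type
```

Counting received bytes in the stream loop is the only reliable guard; the HEAD probe exists purely to fail fast before any download starts.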
@@ -171,13 +179,13 @@ async def _fetch_url_content(url: str) -> tuple[bytes, Optional[str]]:
 async def extract_document_content(attachment: Attachment) -> ProcessedDocument:
     """
     Extract text content from various document formats.
-
+
     Args:
         attachment: Attachment to process
-
+
     Returns:
         ProcessedDocument with extracted content
-
+
     Raises:
         DocumentProcessingError: If processing fails
     """
@@ -189,27 +197,30 @@ async def extract_document_content(attachment: Attachment) -> ProcessedDocument:
         content_bytes = base64.b64decode(attachment.data)
         mime_type = attachment.mime_type
     else:
-        raise DocumentProcessingError(
-            'No document data or URL provided')
+        raise DocumentProcessingError("No document data or URL provided")
+
     # Normalize MIME type
     mime_type = mime_type.lower() if mime_type else None
-
+
     # Process based on MIME type
-    if mime_type == 'application/pdf':
+    if mime_type == "application/pdf":
         return await _extract_pdf_content(content_bytes)
-    elif mime_type in ['application/vnd.openxmlformats-officedocument.wordprocessingml.document']:
+    elif mime_type in ["application/vnd.openxmlformats-officedocument.wordprocessingml.document"]:
         return _extract_docx_content(content_bytes)
-    elif mime_type in ['application/vnd.openxmlformats-officedocument.spreadsheetml.sheet', 'application/vnd.ms-excel']:
+    elif mime_type in [
+        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
+        "application/vnd.ms-excel",
+    ]:
         return _extract_excel_content(content_bytes)
-    elif mime_type == 'application/json':
+    elif mime_type == "application/json":
         return _extract_json_content(content_bytes)
-    elif mime_type == 'application/zip':
+    elif mime_type == "application/zip":
         return _extract_zip_content(content_bytes)
-    elif mime_type in ['text/plain', 'text/csv']:
+    elif mime_type in ["text/plain", "text/csv"]:
         return _extract_text_content(content_bytes, mime_type)
     else:
         # Fallback: try to extract as text
-        return _extract_text_content(content_bytes, 'text/plain')
+        return _extract_text_content(content_bytes, "text/plain")
 
 
 async def _extract_pdf_content(content_bytes: bytes) -> ProcessedDocument:
@@ -218,28 +229,28 @@ async def _extract_pdf_content(content_bytes: bytes) -> ProcessedDocument:
         raise DocumentProcessingError(
             "PDF processing not available. Install with: pip install 'jaf-py[attachments]'"
         )
-
+
     try:
         # Run PDF processing in thread pool to avoid blocking
         def _process_pdf() -> ProcessedDocument:
             reader = PyPDF2.PdfReader(io.BytesIO(content_bytes))
             text_parts = []
-
+
             for page in reader.pages:
                 text_parts.append(page.extract_text())
-
-            content = '\n'.join(text_parts).strip()
-
+
+            content = "\n".join(text_parts).strip()
+
             return ProcessedDocument(
                 content=content,
                 metadata={
-                    'pages': len(reader.pages),
-                    'info': dict(reader.metadata) if reader.metadata else None
-                }
+                    "pages": len(reader.pages),
+                    "info": dict(reader.metadata) if reader.metadata else None,
+                },
             )
-
+
         return await asyncio.get_event_loop().run_in_executor(None, _process_pdf)
-
+
     except Exception as e:
         raise DocumentProcessingError(f"Failed to extract PDF content: {e}") from e
 
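PyPDF2 parsing is synchronous and CPU-bound, so the hunk wraps it in a closure and hands it to the event loop's default thread pool, keeping the loop responsive. A minimal sketch of that offload pattern; the `_parse` function here is a stand-in, not jaf-py code:

```python
import asyncio


def _parse(data: bytes) -> str:
    # Stand-in for blocking work such as PyPDF2.PdfReader(...)
    return data.decode("utf-8", errors="replace")


async def parse_off_loop(data: bytes) -> str:
    """Run blocking parsing in a worker thread instead of on the event loop."""
    loop = asyncio.get_event_loop()
    return await loop.run_in_executor(None, _parse, data)
```

On Python 3.9+ the same offload can be written more directly as `await asyncio.to_thread(_parse, data)`.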
@@ -247,39 +258,35 @@ async def _extract_pdf_content(content_bytes: bytes) -> ProcessedDocument:
 def _extract_text_content(content_bytes: bytes, mime_type: str) -> ProcessedDocument:
     """Extract content from text files."""
     try:
-        content = content_bytes.decode('utf-8').strip()
-
-        if mime_type == 'text/csv':
+        content = content_bytes.decode("utf-8").strip()
+
+        if mime_type == "text/csv":
             # Parse CSV to provide structured overview
             try:
                 csv_reader = csv.DictReader(io.StringIO(content))
                 rows = list(csv_reader)
                 columns = csv_reader.fieldnames or []
-
-                content_lines = content.split('\n')
+
+                content_lines = content.split("\n")
                 preview_lines = content_lines[:MAX_CSV_PREVIEW_ROWS]
-
+
                 formatted_content = (
                     f"CSV File Content:\n"
                     f"Rows: {len(rows)}, Columns: {len(columns)}\n"
                     f"Columns: {', '.join(columns)}\n\n"
                     f"First few rows:\n{chr(10).join(preview_lines)}"
                 )
-
+
                 return ProcessedDocument(
                     content=formatted_content,
-                    metadata={
-                        'rows': len(rows),
-                        'columns': len(columns),
-                        'fields': columns
-                    }
+                    metadata={"rows": len(rows), "columns": len(columns), "fields": columns},
                 )
             except Exception:
                 # Fallback to raw text if CSV parsing fails
                 pass
-
+
         return ProcessedDocument(content=content)
-
+
     except UnicodeDecodeError as e:
         raise DocumentProcessingError(f"Failed to decode text content: {e}") from e
 
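For CSV the function does not return the raw text: it parses with csv.DictReader so the model-facing string leads with row/column counts and a short preview. Roughly, as a standalone sketch; the helper name and preview limit are illustrative:

```python
import csv
import io


def preview_csv(text: str, max_preview_rows: int = 5) -> str:
    """Illustrative helper: summarize a CSV body the way the hunk above does."""
    reader = csv.DictReader(io.StringIO(text))
    rows = list(reader)
    columns = reader.fieldnames or []
    preview = "\n".join(text.split("\n")[:max_preview_rows])
    return (
        f"CSV File Content:\n"
        f"Rows: {len(rows)}, Columns: {len(columns)}\n"
        f"Columns: {', '.join(columns)}\n\n"
        f"First few rows:\n{preview}"
    )
```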
@@ -290,39 +297,36 @@ def _extract_excel_content(content_bytes: bytes) -> ProcessedDocument:
         raise DocumentProcessingError(
             "Excel processing not available. Install with: pip install 'jaf-py[attachments]'"
         )
-
+
     try:
         workbook = load_workbook(io.BytesIO(content_bytes), read_only=True)
         sheet_names = workbook.sheetnames
-
+
         content_parts = [f"Excel File Content:\nSheets: {', '.join(sheet_names)}\n"]
-
+
         # Extract content from each sheet (limit to avoid overwhelming output)
         for i, sheet_name in enumerate(sheet_names):
             if i >= MAX_EXCEL_SHEETS:
                 break
-
+
             worksheet = workbook[sheet_name]
             content_parts.append(f"\nSheet: {sheet_name}")
-
+
             # Extract up to MAX_EXCEL_ROWS_PER_SHEET rows
             rows_data = []
             for row_num, row in enumerate(worksheet.iter_rows(values_only=True), 1):
                 if row_num > MAX_EXCEL_ROWS_PER_SHEET:
                     break
                 # Convert row to strings, handling None values
-                row_strings = [str(cell) if cell is not None else '' for cell in row]
-                rows_data.append(','.join(row_strings))
-
-            content_parts.append('\n'.join(rows_data))
-
-        content = '\n'.join(content_parts).strip()
-
-        return ProcessedDocument(
-            content=content,
-            metadata={'sheets': sheet_names}
-        )
-
+                row_strings = [str(cell) if cell is not None else "" for cell in row]
+                rows_data.append(",".join(row_strings))
+
+            content_parts.append("\n".join(rows_data))
+
+        content = "\n".join(content_parts).strip()
+
+        return ProcessedDocument(content=content, metadata={"sheets": sheet_names})
+
     except Exception as e:
         raise DocumentProcessingError(f"Failed to extract Excel content: {e}") from e
 
@@ -333,17 +337,14 @@ def _extract_docx_content(content_bytes: bytes) -> ProcessedDocument:
         raise DocumentProcessingError(
             "Word document processing not available. Install with: pip install 'jaf-py[attachments]'"
         )
-
+
     try:
         document = Document(io.BytesIO(content_bytes))
         paragraphs = [paragraph.text for paragraph in document.paragraphs]
-        content = '\n'.join(paragraphs).strip()
-
-        return ProcessedDocument(
-            content=content,
-            metadata={'paragraphs': len(paragraphs)}
-        )
-
+        content = "\n".join(paragraphs).strip()
+
+        return ProcessedDocument(content=content, metadata={"paragraphs": len(paragraphs)})
+
     except Exception as e:
         raise DocumentProcessingError(f"Failed to extract DOCX content: {e}") from e
 
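The Excel path opens the workbook with read_only=True (streamed access, lower memory on large files) and truncates output at MAX_EXCEL_SHEETS and MAX_EXCEL_ROWS_PER_SHEET. A stripped-down sketch of the same iteration; the helper name and default limits are illustrative, not jaf-py's constants:

```python
import io

from openpyxl import load_workbook


def preview_workbook(data: bytes, max_sheets: int = 5, max_rows: int = 20) -> str:
    """Illustrative helper: dump the first rows of the first few sheets as CSV-ish text."""
    workbook = load_workbook(io.BytesIO(data), read_only=True)
    parts = []
    for sheet_name in workbook.sheetnames[:max_sheets]:
        parts.append(f"Sheet: {sheet_name}")
        for row_num, row in enumerate(workbook[sheet_name].iter_rows(values_only=True), 1):
            if row_num > max_rows:
                break
            parts.append(",".join("" if cell is None else str(cell) for cell in row))
    return "\n".join(parts)
```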
@@ -351,90 +352,94 @@ def _extract_docx_content(content_bytes: bytes) -> ProcessedDocument:
 def _extract_json_content(content_bytes: bytes) -> ProcessedDocument:
     """Extract content from JSON files."""
     try:
-        json_str = content_bytes.decode('utf-8')
+        json_str = content_bytes.decode("utf-8")
         json_obj = json.loads(json_str)
-
+
         # Pretty print JSON with some metadata
         formatted_content = f"JSON File Content:\n{json.dumps(json_obj, indent=2)}"
-
-        metadata = {
-            'type': 'array' if isinstance(json_obj, list) else type(json_obj).__name__
-        }
-
+
+        metadata = {"type": "array" if isinstance(json_obj, list) else type(json_obj).__name__}
+
         if isinstance(json_obj, dict):
-            metadata['keys'] = list(json_obj.keys())
+            metadata["keys"] = list(json_obj.keys())
         elif isinstance(json_obj, list):
-            metadata['length'] = len(json_obj)
-
-        return ProcessedDocument(
-            content=formatted_content,
-            metadata=metadata
-        )
-
+            metadata["length"] = len(json_obj)
+
+        return ProcessedDocument(content=formatted_content, metadata=metadata)
+
     except (UnicodeDecodeError, json.JSONDecodeError):
         # Fallback to raw text if JSON parsing fails
         if isinstance(content_bytes, bytes):
             # If input is bytes, decode with error handling
-            fallback_content = content_bytes.decode('utf-8', errors='replace').strip()
+            fallback_content = content_bytes.decode("utf-8", errors="replace").strip()
         else:
             # If input is already a string (from a previous decode attempt)
             fallback_content = json_str.strip() if isinstance(json_str, str) else str(content_bytes)
-
+
         return ProcessedDocument(content=fallback_content)
 
 
 def _extract_zip_content(content_bytes: bytes) -> ProcessedDocument:
     """Extract file listing from ZIP archives."""
     try:
-        with zipfile.ZipFile(io.BytesIO(content_bytes), 'r') as zip_file:
+        with zipfile.ZipFile(io.BytesIO(content_bytes), "r") as zip_file:
             files = zip_file.namelist()
-
-            content_parts = ['ZIP File Contents:\n']
+
+            content_parts = ["ZIP File Contents:\n"]
             safe_files = []
-
+
             # Create virtual root for path safety checks
             from pathlib import Path
             import os
-
-            virtual_root = Path('/safe_extract_dir')  # Virtual root never actually used for extraction
+
+            virtual_root = Path(
+                "/safe_extract_dir"
+            )  # Virtual root never actually used for extraction
+
             for file_name in files:
                 # Skip empty entries
                 if not file_name:
                     continue
-
+
                 # Basic security checks
-                if (
-                    file_name.startswith('/') or  # Absolute path
-                    file_name.startswith('\\') or  # Windows absolute path
-                    '..' in file_name.split('/') or  # Parent directory traversal
-                    '..' in file_name.split('\\') or  # Windows traversal
-                    ':' in file_name or  # Windows drive letter
-                    '\0' in file_name):  # Null byte
+                if (
+                    file_name.startswith("/")  # Absolute path
+                    or file_name.startswith("\\")  # Windows absolute path
+                    or file_name.startswith("..")  # Parent directory traversal
+                    or ".." in file_name.split("/")  # Parent directory traversal
+                    or ".." in file_name.split("\\")  # Windows traversal
+                    or ":" in file_name  # Windows drive letter
+                    or "\0" in file_name
+                ):  # Null byte
                     # Skip unsafe entries
                     content_parts.append(f"WARNING: Skipped suspicious path: {file_name[:50]}...")
                     continue
-
+
                 # Normalize path for additional safety check
                 try:
                     # Create safe path relative to virtual root
                     norm_path = os.path.normpath(file_name)
-                    if norm_path.startswith('..'):
+                    if norm_path.startswith(".."):
                         # Skip unsafe entries that normalize to traversal
-                        content_parts.append(f"WARNING: Skipped path traversal attempt: {file_name[:50]}...")
+                        content_parts.append(
+                            f"WARNING: Skipped path traversal attempt: {file_name[:50]}..."
+                        )
                         continue
-
+
                     # Check if path would escape the virtual root
                     test_path = virtual_root.joinpath(norm_path).resolve()
                     if not str(test_path).startswith(str(virtual_root)):
                         # Skip unsafe entries that would escape extraction root
-                        content_parts.append(f"WARNING: Skipped path traversal attempt: {file_name[:50]}...")
+                        content_parts.append(
+                            f"WARNING: Skipped path traversal attempt: {file_name[:50]}..."
+                        )
                         continue
-
+
                     # Passed all security checks, add to safe file list
                     safe_files.append(file_name)
-
+
                     # Get file info for display
-                    if file_name.endswith('/'):
+                    if file_name.endswith("/"):
                         content_parts.append(f"DIR: {file_name}")
                     else:
                         try:
@@ -447,17 +452,13 @@ def _extract_zip_content(content_bytes: bytes) -> ProcessedDocument:
                     # Skip any entry that causes normalization errors
                     content_parts.append(f"WARNING: Skipped invalid path: {file_name[:50]}...")
                     continue
-
-            content = '\n'.join(content_parts).strip()
-
+
+            content = "\n".join(content_parts).strip()
+
             return ProcessedDocument(
-                content=content,
-                metadata={
-                    'files': safe_files,
-                    'total_files': len(safe_files)
-                }
+                content=content, metadata={"files": safe_files, "total_files": len(safe_files)}
             )
-
+
     except Exception as e:
         raise DocumentProcessingError(f"Failed to process ZIP file: {e}") from e
 
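The ZIP handler never extracts anything; it only lists entries, screening each name against absolute paths, `..` traversal (in both path separators), Windows drive letters, and NUL bytes, then double-checking with normpath and a resolve() against a virtual root. The per-entry predicate, pulled out as a standalone sketch; the function name is illustrative:

```python
import os
from pathlib import Path

VIRTUAL_ROOT = Path("/safe_extract_dir")  # never used for real extraction


def is_safe_member(name: str) -> bool:
    """Illustrative: mirror the per-entry checks applied in the hunk above."""
    if not name:
        return False
    if name.startswith(("/", "\\", "..")) or ":" in name or "\0" in name:
        return False
    if ".." in name.split("/") or ".." in name.split("\\"):
        return False
    norm = os.path.normpath(name)
    if norm.startswith(".."):
        return False
    resolved = VIRTUAL_ROOT.joinpath(norm).resolve()
    return str(resolved).startswith(str(VIRTUAL_ROOT))
```

With a predicate like this, the safe listing reduces to something like `[n for n in zip_file.namelist() if is_safe_member(n)]`, which is what the loop above builds into `safe_files`.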
@@ -465,97 +466,97 @@ def _extract_zip_content(content_bytes: bytes) -> ProcessedDocument:
 def is_document_supported(mime_type: Optional[str]) -> bool:
     """
     Check if a MIME type is supported for content extraction.
-
+
     Args:
         mime_type: MIME type to check
-
+
     Returns:
         True if supported, False otherwise
     """
     if not mime_type:
         return False
-
+
     supported_types = [
-        'application/pdf',
-        'text/plain',
-        'text/csv',
-        'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
-        'application/vnd.ms-excel',
-        'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
-        'application/json',
-        'application/zip'
+        "application/pdf",
+        "text/plain",
+        "text/csv",
+        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet",
+        "application/vnd.ms-excel",
+        "application/vnd.openxmlformats-officedocument.wordprocessingml.document",
+        "application/json",
+        "application/zip",
     ]
-
+
     return mime_type.lower() in supported_types
 
 
 def get_document_description(mime_type: Optional[str]) -> str:
     """
     Get a human-readable description of what content will be extracted.
-
+
     Args:
         mime_type: MIME type to describe
-
+
     Returns:
         Human-readable description
     """
     if not mime_type:
-        return 'document content'
-
+        return "document content"
+
     descriptions = {
-        'application/pdf': 'PDF text content',
-        'text/plain': 'plain text content',
-        'text/csv': 'CSV data structure and sample rows',
-        'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet': 'Excel spreadsheet data',
-        'application/vnd.ms-excel': 'Excel spreadsheet data',
-        'application/vnd.openxmlformats-officedocument.wordprocessingml.document': 'Word document text content',
-        'application/json': 'JSON data structure',
-        'application/zip': 'ZIP file listing'
+        "application/pdf": "PDF text content",
+        "text/plain": "plain text content",
+        "text/csv": "CSV data structure and sample rows",
+        "application/vnd.openxmlformats-officedocument.spreadsheetml.sheet": "Excel spreadsheet data",
+        "application/vnd.ms-excel": "Excel spreadsheet data",
+        "application/vnd.openxmlformats-officedocument.wordprocessingml.document": "Word document text content",
+        "application/json": "JSON data structure",
+        "application/zip": "ZIP file listing",
     }
-
-    return descriptions.get(mime_type.lower(), 'document content')
+
+    return descriptions.get(mime_type.lower(), "document content")
 
 
 def get_missing_dependencies() -> List[str]:
     """
     Get list of missing optional dependencies for document processing.
-
+
     Returns:
         List of missing dependency names
     """
     missing = []
-
+
     if not HAS_PDF:
-        missing.append('PyPDF2 (for PDF processing)')
+        missing.append("PyPDF2 (for PDF processing)")
     if not HAS_DOCX:
-        missing.append('python-docx (for Word document processing)')
+        missing.append("python-docx (for Word document processing)")
     if not HAS_EXCEL:
-        missing.append('openpyxl (for Excel processing)')
+        missing.append("openpyxl (for Excel processing)")
     if not HAS_PIL:
-        missing.append('Pillow (for image processing)')
+        missing.append("Pillow (for image processing)")
     if not HAS_MAGIC:
-        missing.append('python-magic (for MIME type detection)')
+        missing.append("python-magic (for MIME type detection)")
     if not HAS_HTTPX:
-        missing.append('httpx (for URL fetching)')
+        missing.append("httpx (for URL fetching)")
     if not HAS_AIOFILES:
-        missing.append('aiofiles (for async file operations)')
-
+        missing.append("aiofiles (for async file operations)")
+
     return missing
 
 
 def check_dependencies() -> Dict[str, bool]:
     """
     Check availability of optional dependencies.
-
+
     Returns:
         Dictionary mapping dependency names to availability
     """
     return {
-        'pdf': HAS_PDF,
-        'docx': HAS_DOCX,
-        'excel': HAS_EXCEL,
-        'image': HAS_PIL,
-        'magic': HAS_MAGIC,
-        'httpx': HAS_HTTPX,
-        'aiofiles': HAS_AIOFILES
-    }
+        "pdf": HAS_PDF,
+        "docx": HAS_DOCX,
+        "excel": HAS_EXCEL,
+        "image": HAS_PIL,
+        "magic": HAS_MAGIC,
+        "httpx": HAS_HTTPX,
+        "aiofiles": HAS_AIOFILES,
+    }