PyPI - langchain-ocr-lib - Versions diffs - 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl - Mend

langchain-ocr-lib 0.1.0py3-none-any.whl → 0.3.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

langchain_ocr_lib/converter/converter.py CHANGED Viewed

@@ -3,11 +3,13 @@
 from abc import ABC, abstractmethod
 import inject
+from langchain_ocr_lib.di_binding_keys.binding_keys import LangfuseTracedChainKey
 class File2MarkdownConverter(ABC):
     """Abstract base class for the File2MarkdownConverter class."""
-    _chain = inject.attr("LangfuseTracedChain")
+    _chain = inject.attr(LangfuseTracedChainKey)
     @abstractmethod
     async def aconvert2markdown(self, file: bytes) -> str:

langchain_ocr_lib/di_binding_keys/__init__.py ADDED Viewed

File without changes

langchain_ocr_lib/di_binding_keys/binding_keys.py ADDED Viewed

@@ -0,0 +1,29 @@
+"""Define key classes for dependency bindings. More reliable than using strings."""
+class LargeLanguageModelKey:
+    pass
+class LangfuseClientKey:
+    pass
+class LangfuseManagerKey:
+    pass
+class OcrChainKey:
+    pass
+class LangfuseTracedChainKey:
+    pass
+class PdfConverterKey:
+    pass
+class ImageConverterKey:
+    pass

langchain_ocr_lib/di_config.py CHANGED Viewed

@@ -2,12 +2,22 @@
 from inject import Binder
 import inject
+from langchain_ocr_lib.di_binding_keys.binding_keys import (
+    ImageConverterKey,
+    LangfuseClientKey,
+    LangfuseManagerKey,
+    LangfuseTracedChainKey,
+    LargeLanguageModelKey,
+    OcrChainKey,
+    PdfConverterKey,
+)
 from langchain_ollama import ChatOllama
 from langchain_openai import ChatOpenAI
 from langfuse import Langfuse
 from langchain_ocr_lib.impl.chains.ocr_chain import OcrChain
 from langchain_ocr_lib.impl.settings.ollama_chat_settings import OllamaSettings
+from langchain_ocr_lib.impl.settings.vllm_chat_settings import VllmSettings
 from langchain_ocr_lib.impl.settings.openai_chat_settings import OpenAISettings
 from langchain_ocr_lib.impl.settings.llm_class_type_settings import LlmClassTypeSettings
 from langchain_ocr_lib.impl.settings.langfuse_settings import LangfuseSettings
@@ -44,14 +54,17 @@ def lib_di_config(binder: Binder):
     elif llm_class_type_settings.llm_type == "openai":
         settings = OpenAISettings()
         llm_instance = llm_provider(settings, ChatOpenAI)
+    elif llm_class_type_settings.llm_type == "vllm":
+        settings = VllmSettings()
+        llm_instance = llm_provider(settings, ChatOpenAI)
     else:
         raise NotImplementedError("Configured LLM is not implemented")
-    binder.bind("LargeLanguageModel", llm_instance)
+    binder.bind(LargeLanguageModelKey, llm_instance)
     prompt = ocr_prompt_template_builder(language=language_settings.language, model_name=settings.model)
     binder.bind(
-        "LangfuseClient",
+        LangfuseClientKey,
         Langfuse(
             public_key=langfuse_settings.public_key,
             secret_key=langfuse_settings.secret_key,
@@ -60,7 +73,7 @@ def lib_di_config(binder: Binder):
     )
     binder.bind(
-        "LangfuseManager",
+        LangfuseManagerKey,
         LangfuseManager(
             managed_prompts={
                 OcrChain.__name__: prompt,
@@ -68,17 +81,17 @@ def lib_di_config(binder: Binder):
         ),
     )
-    binder.bind("OcrChain", OcrChain())
+    binder.bind(OcrChainKey, OcrChain())
     binder.bind(
-        "LangfuseTracedChain",
+        LangfuseTracedChainKey,
         LangfuseTracedChain(
             settings=langfuse_settings,
         ),
     )
-    binder.bind("PdfConverter", Pdf2MarkdownConverter())
-    binder.bind("ImageConverter", Image2MarkdownConverter())
+    binder.bind(PdfConverterKey, Pdf2MarkdownConverter())
+    binder.bind(ImageConverterKey, Image2MarkdownConverter())
 def configure_di():

langchain_ocr_lib/impl/chains/ocr_chain.py CHANGED Viewed

@@ -7,6 +7,7 @@ from langchain_core.runnables.utils import Input
 import inject
 from langchain_ocr_lib.chains.chain import Chain
+from langchain_ocr_lib.di_binding_keys.binding_keys import LangfuseManagerKey
 RunnableInput = Input  # TODO: adjust properly
 RunnableOutput = str
@@ -15,7 +16,7 @@ RunnableOutput = str
 class OcrChain(Chain[RunnableInput, RunnableOutput]):
     """Base class for LLM answer generation chain."""
-    _langfuse_manager = inject.attr("LangfuseManager")
+    _langfuse_manager = inject.attr(LangfuseManagerKey)
     def __init__(self):
         """Initialize the AnswerGenerationChain.

langchain_ocr_lib/impl/converter/pdf_converter.py CHANGED Viewed

@@ -48,9 +48,11 @@ class Pdf2MarkdownConverter(File2MarkdownConverter):
                 with open(filename, "rb") as f:
                     file = f.read()
             except Exception as e:
-                raise ValueError("PDF corrupted or unsupported file type, %s" % e)
-        images = convert_from_bytes(file)
+                raise ValueError("PDF corrupted or unsupported file type") from e
+        try:
+            images = convert_from_bytes(file)
+        except Exception as e:
+            raise ValueError("PDF corrupted or unsupported file type") from e
         markdown = ""
         for image in images:
@@ -93,7 +95,10 @@ class Pdf2MarkdownConverter(File2MarkdownConverter):
             except Exception as e:
                 raise ValueError("PDF corrupted or unsupported file type") from e
-        images = convert_from_bytes(file)
+        try:
+            images = convert_from_bytes(file)
+        except Exception as e:
+            raise ValueError("PDF corrupted or unsupported file type") from e
         markdown = ""
         for image in images:

langchain_ocr_lib/impl/langfuse_manager/langfuse_manager.py CHANGED Viewed

@@ -10,6 +10,9 @@ from langchain_core.language_models.llms import LLM
 from langfuse.api.resources.commons.errors.not_found_error import NotFoundError
 from langfuse.model import ChatPromptClient
+from langchain_ocr_lib.di_binding_keys.binding_keys import LangfuseClientKey, LargeLanguageModelKey
 logger = logging.getLogger(__name__)
@@ -23,8 +26,8 @@ class LangfuseManager:
     """
     API_KEY_FILTER: str = "api_key"
-    _llm = inject.attr("LargeLanguageModel")
-    _langfuse = inject.attr("LangfuseClient")
+    _llm = inject.attr(LargeLanguageModelKey)
+    _langfuse = inject.attr(LangfuseClientKey)
     def __init__(
         self,
@@ -136,12 +139,16 @@ class LangfuseManager:
             fallback = self._managed_prompts[name]
             if isinstance(fallback, ChatPromptTemplate):
                 return fallback
-            if isinstance(fallback, list) and len(fallback) > 0 and isinstance(fallback[0], dict) and "content" in fallback[0]:
+            if (
+                isinstance(fallback, list)
+                and len(fallback) > 0
+                and isinstance(fallback[0], dict)
+                and "content" in fallback[0]
+            ):
                 image_payload = [{"type": "image_url", "image_url": {"url": "data:image/jpeg;base64,{image_data}"}}]
                 return ChatPromptTemplate.from_messages([("system", fallback[0]["content"]), ("user", image_payload)])
-            else:
-                logger.error("Unexpected structure for fallback prompt.")
-                raise ValueError("Unexpected structure for fallback prompt.")
+            logger.error("Unexpected structure for fallback prompt.")
+            raise ValueError("Unexpected structure for fallback prompt.")
         langchain_prompt = langfuse_prompt.get_langchain_prompt()
         langchain_prompt[-1] = ("user", json.loads(langchain_prompt[-1][1]))

langchain_ocr_lib/impl/llms/llm_type.py CHANGED Viewed

@@ -9,3 +9,4 @@ class LLMType(StrEnum):
     OLLAMA = "ollama"
     OPENAI = "openai"
+    VLLM = "vllm"

langchain_ocr_lib/impl/settings/openai_chat_settings.py CHANGED Viewed

@@ -18,8 +18,8 @@ class OpenAISettings(BaseSettings):
         Total probability mass of tokens to consider at each step.
     temperature : float
         What sampling temperature to use.
-    vision_capable : bool
-        Flag to enable a vision capable model.
+    base_url : str
+        The base URL for the OpenAI API endpoint.
     """
     class Config:
@@ -31,5 +31,8 @@ class OpenAISettings(BaseSettings):
     model: str = Field(default="gpt-4o-mini-search-preview-2025-03-11", description="The model identifier")
     api_key: str = Field(default="", description="The API key for authentication")
     top_p: float = Field(default=1.0, description="Total probability mass of tokens to consider at each step")
-    temperature: float = Field(default=0.7, description="What sampling temperature to use")
-    vision_capable: bool = Field(default=False, description="Enable a vision capable model")
+    temperature: float = Field(default=0, description="What sampling temperature to use")
+    base_url: str = Field(
+        default="https://api.openai.com/v1",
+        description="The base URL for the OpenAI API endpoint",
+    )

langchain_ocr_lib/impl/settings/vllm_chat_settings.py ADDED Viewed

@@ -0,0 +1,38 @@
+"""Module contains settings regarding the Vllm API."""
+from pydantic import Field
+from pydantic_settings import BaseSettings
+class VllmSettings(BaseSettings):
+    """
+    Contains settings regarding the Vllm API.
+    Attributes
+    ----------
+    model : str
+        The model identifier.
+    api_key : str
+        The API key for authentication.
+    top_p : float
+        Total probability mass of tokens to consider at each step.
+    temperature : float
+        What sampling temperature to use.
+    base_url : str
+        The base URL for the Vllm API endpoint.
+    """
+    class Config:
+        """Config class for reading fields from environment variables."""
+        env_prefix = "VLLM_"
+        case_sensitive = False
+    model: str = Field(default="", description="The model identifier")
+    api_key: str = Field(default="", description="The API key for authentication")
+    top_p: float = Field(default=1.0, description="Total probability mass of tokens to consider at each step")
+    temperature: float = Field(default=0, description="What sampling temperature to use")
+    base_url: str = Field(
+        default="http://localhost:8000/v1",
+        description="The base URL for the Vllm API endpoint",
+    )

langchain_ocr_lib/impl/tracers/langfuse_traced_chain.py CHANGED Viewed

@@ -8,6 +8,7 @@ from langfuse.callback import CallbackHandler
 from langchain_ocr_lib.impl.settings.langfuse_settings import LangfuseSettings
 from langchain_ocr_lib.tracers.traced_chain import TracedChain
+from langchain_ocr_lib.di_config import OcrChainKey
 class LangfuseTracedChain(TracedChain):
@@ -23,7 +24,7 @@ class LangfuseTracedChain(TracedChain):
     """
     CONFIG_CALLBACK_KEY = "callbacks"
-    _inner_chain = inject.attr("OcrChain")
+    _inner_chain = inject.attr(OcrChainKey)
     def __init__(self, settings: LangfuseSettings):
         super().__init__()

langchain_ocr_lib-0.3.0.dist-info/METADATA ADDED Viewed

@@ -0,0 +1,188 @@
+Metadata-Version: 2.1
+Name: langchain-ocr-lib
+Version: 0.3.0
+Summary:
+License: MIT
+Author: Andreas Klos
+Author-email: aklos@outlook.de
+Requires-Python: >=3.11,<4.0
+Classifier: License :: OSI Approved :: MIT License
+Classifier: Programming Language :: Python :: 3
+Classifier: Programming Language :: Python :: 3.11
+Classifier: Programming Language :: Python :: 3.12
+Classifier: Programming Language :: Python :: 3.13
+Requires-Dist: deprecated (>=1.2.14,<2.0.0)
+Requires-Dist: inject (>=5.2.1,<6.0.0)
+Requires-Dist: langchain-community (>=0.3.19,<0.4.0)
+Requires-Dist: langchain-ollama (>=0.2.0,<0.3.0)
+Requires-Dist: langchain-openai (>=0.3.8,<0.4.0)
+Requires-Dist: langfuse (>=2.59.7,<3.0.0)
+Requires-Dist: openai (>=1.42.0,<2.0.0)
+Requires-Dist: pdf2image (>=1.17.0,<2.0.0)
+Requires-Dist: pillow (>=11.0.0,<12.0.0)
+Requires-Dist: pycountry (>=24.6.1,<25.0.0)
+Requires-Dist: pytest-asyncio (>=0.25.0,<0.26.0)
+Requires-Dist: pyyaml (>=6.0.2,<7.0.0)
+Description-Content-Type: text/markdown
+# langchain_ocr_lib
+**langchain_ocr_lib** is the OCR processing engine behind LangChain-OCR. It provides a modular, vision-LLM-powered Chain to convert image and PDF documents into clean Markdown. Designed for direct CLI usage or integration into larger applications.
+## Table of Contents
+1. [Overview](#1-overview)
+2. [Features](#2-features)
+3. [Installation](#3-installation)
+   1. [Prerequisites](#31-prerequisites)
+   2. [Environment Setup](#32-environment-setup)
+4. [Usage](#4-usage)
+   1. [CLI](#41-cli)
+   2. [Python Module](#42-python-module)
+   3. [Docker](#43-docker)
+5. [Architecture](#5-architecture)
+6. [Testing](#6-testing)
+7. [License](#7-license)
+---
+## 1. Overview
+This package offers the core functionality to extract text from documents using vision LLMs and convert it into Markdown. It is highly configurable via environment variables, and its design is based on dependency injection, which allows you to easily swap out components. The package is designed to be used as a library, but it also provides a command-line interface (CLI) for easy local execution.
+---
+## 2. Features
+- **Vision-Language OCR:** Supports Ollama, vLLM and OpenAI (and other OpenAI-compatible providers). Other LLM providers can be easily integrated.
+- **CLI Interface:** Simple local execution via command line or container
+- **Highly Configurable:** Use environment variables to configure the OCR
+- **Dependency Injection:** Easily swap out components for custom implementations
+- **LangChain:** Integrates with LangChain
+- **Markdown Output:** Outputs well-formatted Markdown text
+---
+## 3. Installation
+### 3.1 Prerequisites
+- **Python:** 3.11+
+- **Poetry:** [Install Poetry](https://python-poetry.org/docs/)
+- **Docker:** For containerized CLI usage (optional)
+- **Ollama:** Follow instructions [here](https://ollama.com) (other LLM providers can be used as well, see [here](#2-features))
+- **Langfuse:** Different options for self hosting, see [here](https://langfuse.com/self-hosting) (optional, for observability)
+### 3.2 Environment Setup
+The package is published on PyPI, so you can install it directly with pip:
+```bash
+pip install langchain-ocr-lib
+```
+However, if you want to run the latest version or contribute to the project, you can clone the repository and install it locally.
+```bash
+git clone https://github.com/a-klos/langchain-ocr.git
+cd langchain-ocr/langchain_ocr_lib
+poetry install --with dev
+```
+You can configure the package by setting environment variables. Configuration options are shown in the [`.env.template`](../.env.template) file.
+---
+## 4. Usage
+Remember that you need to pull the configured LLM model first. With Ollama, you can do this with:
+```bash
+ollama pull <model_name>
+```
+For example, to pull the `gemma3:4b-it-q4_K_M` model, run:
+```bash
+ollama pull gemma3:4b-it-q4_K_M
+```
+### 4.1 CLI
+Run OCR locally from the terminal:
+```bash
+langchain-ocr <<input_file>>
+```
+Supports:
+- `.jpg`, `.jpeg`, `.png`, and `.pdf` inputs
+### 4.2 Python Module
+Use the library programmatically:
+```python
+import inject
+from langchain_ocr_lib.di_config import configure_di
+from langchain_ocr_lib.di_binding_keys.binding_keys import PdfConverterKey
+from langchain_ocr_lib.impl.converter.pdf_converter import Pdf2MarkdownConverter
+configure_di() #This sets up the dependency injection
+class Converter:
+    _converter: Pdf2MarkdownConverter = inject.attr(PdfConverterKey)
+    def convert(self, filename: str) -> str:
+        return self._converter.convert2markdown(filename=filename)
+converter = Converter()
+markdown = converter.convert("../docs/invoice.pdf") # Adjust the file path as needed
+print(markdown)
+```
+The `configure_di()` function sets up the dependency injection for the library. Dependencies can easily be swapped out, and new ones can be added. See [../api/src/langchain_ocr/di_config.py](../api/src/langchain_ocr/di_config.py) for more details on how to add new dependencies.
+Swapping out the dependencies can be done as follows:
+```python
+import inject
+from inject import Binder
+from langchain_ocr_lib.di_config import lib_di_config, PdfConverterKey
+from langchain_ocr_lib.impl.converter.pdf_converter import Pdf2MarkdownConverter
+class MyPdfConverter(Pdf2MarkdownConverter):
+    def convert(self, filename: str) -> None:
+        markdown = self.convert2markdown(filename=filename)
+        print(markdown)
+def _api_specific_config(binder: Binder):
+    binder.install(lib_di_config)  # Install all default bindings
+    binder.bind(PdfConverterKey, MyPdfConverter())  # Then override PdfConverter
+def configure():
+    """Configure the dependency injection container."""
+    inject.configure(_api_specific_config, allow_override=True, clear=True)
+configure()
+class Converter:
+    _converter: MyPdfConverter = inject.attr(PdfConverterKey)
+    def convert(self, filename: str) -> None:
+        self._converter.convert(filename=filename)
+converter = Converter()
+converter.convert("../docs/invoice.pdf") # Adjust the file path as needed
+```
+### 4.3 Docker
+Run OCR via Docker without local Python setup:
+```bash
+docker build -t ocr -f langchain_ocr_lib/Dockerfile .
+docker run --net=host -it --rm -v ./docs:/app/docs:ro ocr docs/invoice.png
+```

{langchain_ocr_lib-0.1.0.dist-info → langchain_ocr_lib-0.3.0.dist-info}/RECORD RENAMED Viewed

@@ -2,34 +2,37 @@ langchain_ocr_lib/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU
 langchain_ocr_lib/chains/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/chains/chain.py,sha256=D00wnm987YgkJsIAIwQVehX_B4kBOzrjistaPf1M0GE,1946
 langchain_ocr_lib/converter/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-langchain_ocr_lib/converter/converter.py,sha256=aJuaLX2942d8WRPNaU0cUPO1_266QE7Y6SVKpnxpGBA,1196
-langchain_ocr_lib/di_config.py,sha256=H1CxtSlzUH3QGkRFBQqgMGJZx5HGWQ0yrB2kEvFIbOk,3083
+langchain_ocr_lib/converter/converter.py,sha256=oDUNzVWD743RgqIal7T4OVv-Z1RKE9uQYzAIPpgY3o8,1280
+langchain_ocr_lib/di_binding_keys/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+langchain_ocr_lib/di_binding_keys/binding_keys.py,sha256=jE8rwNcLaI0NflIMkK0vu0LVy5o4y0pYgdjbpDNTGyk,338
+langchain_ocr_lib/di_config.py,sha256=eYzDi_LJaYY_JhRnNqW3VYGd3N1QblaGFjWlL_6Vx9c,3537
 langchain_ocr_lib/impl/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/impl/chains/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-langchain_ocr_lib/impl/chains/ocr_chain.py,sha256=eGiflXVbo1UP56rRHPY6fB4woJtyIvv4SmXNC1RHWFY,2594
+langchain_ocr_lib/impl/chains/ocr_chain.py,sha256=stE8RLE1ieRHf6XHreKCRfhNfXzw9fNLTake7xQBGL8,2673
 langchain_ocr_lib/impl/converter/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/impl/converter/image_converter.py,sha256=G1rDOCbudWNL4sDvSGJ7CeeFrWUblfWPGaZf5JsnpiM,2871
-langchain_ocr_lib/impl/converter/pdf_converter.py,sha256=ssj8DL_9wf6kMhjUhDkw0gwSwNLrvgh8nBRspwj60Vk,3510
+langchain_ocr_lib/impl/converter/pdf_converter.py,sha256=pTHPojuNLCSWJp4FzXBHshXva2sBGyOs6Y7jnKJrnNo,3760
 langchain_ocr_lib/impl/langfuse_manager/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-langchain_ocr_lib/impl/langfuse_manager/langfuse_manager.py,sha256=G_qGE_-LnPpNJYgkoDoVqoXYkwsaMkB_HN2uSng3YVA,5245
+langchain_ocr_lib/impl/langfuse_manager/langfuse_manager.py,sha256=AEF1iFYghr-62gcPcUb4Yi3DNRYfe-JsIWd3ymsIU8I,5403
 langchain_ocr_lib/impl/llms/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/impl/llms/llm_factory.py,sha256=9DsUdoYNrjeWLGA9ISDdHN2cxcQ7DquNQ5it6zSxHlg,2199
-langchain_ocr_lib/impl/llms/llm_type.py,sha256=_Ap7yStlBn0tyOyfVLH1c2j2A9-ccsTCxAm7bgoRQnM,268
+langchain_ocr_lib/impl/llms/llm_type.py,sha256=_LKtdVuTRYX6gupkxJtEtIwrbtiMvZmG8WOxfzlm42M,286
 langchain_ocr_lib/impl/settings/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/impl/settings/langfuse_settings.py,sha256=5lr3tVeiHXDUaYtWAnZPXrKxBJgM2wgaz7yyZThhCsE,812
 langchain_ocr_lib/impl/settings/language_settings.py,sha256=tdAC1t5wGu1MoH1jhjkDnxnX4Ui7giwxt7Qm8_LPkP8,627
 langchain_ocr_lib/impl/settings/llm_class_type_settings.py,sha256=4KC6zxby13wn38rB8055J8LNVTsmUfrOiyLtLuToHaM,598
 langchain_ocr_lib/impl/settings/ollama_chat_settings.py,sha256=8RWMsaK4qDrqC6Mrxekr8IEDYwcvjYwhw9xDwZemxI4,1506
-langchain_ocr_lib/impl/settings/openai_chat_settings.py,sha256=cXzxe-sea8VCK2M_u9ZIL4l8AR_YdhmA-phZa9fwf8o,1233
+langchain_ocr_lib/impl/settings/openai_chat_settings.py,sha256=gZqmFYDtF0l5lEAnuT2VzdqLWKnTPSK_lTeg7ERmJas,1276
+langchain_ocr_lib/impl/settings/vllm_chat_settings.py,sha256=y8PPNUcce1uA4kEu6p0p5vCwCOGp9uEEvHbCoS1Ohh8,1226
 langchain_ocr_lib/impl/tracers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-langchain_ocr_lib/impl/tracers/langfuse_traced_chain.py,sha256=lfYLEf9mJ2ie5wofHFG_FUicRi1281XGBC0GKXcAkHM,1546
+langchain_ocr_lib/impl/tracers/langfuse_traced_chain.py,sha256=syjwNt8HfVmaWXZ-ElFYsc-KwpnKQz2LE3K5jV7c3GE,1599
 langchain_ocr_lib/language_mapping/language_mapping.py,sha256=VY7WkkZauoHNxkvgUYbig0rDmlKqDkz24cXMd6A7txM,700
 langchain_ocr_lib/main.py,sha256=_kx6pIsIV9pii2_TSYisFT4tKDQHMHef6buWhWoj11E,3485
 langchain_ocr_lib/prompt_templates/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/prompt_templates/ocr_prompt.py,sha256=3Be1AL-HJkxPnAP0DNH1MqvAxFWTCeM5UOKP63xkHsY,3543
 langchain_ocr_lib/tracers/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 langchain_ocr_lib/tracers/traced_chain.py,sha256=uxRkdLNn_G6dAsti_gUuF7muhIj10xrOUL7HUga40oc,3056
-langchain_ocr_lib-0.1.0.dist-info/METADATA,sha256=2H3iEatfiflH4GcrFhIw2Cg8wjsgKsLoeP2irFsVTio,991
-langchain_ocr_lib-0.1.0.dist-info/WHEEL,sha256=fGIA9gx4Qxk2KDKeNJCbOEwSrmLtjWCwzBz351GyrPQ,88
-langchain_ocr_lib-0.1.0.dist-info/entry_points.txt,sha256=l4mIs0tnIgbJYuVveZySQKVBnqNMHS-8ZZtLwz8ag5k,61
-langchain_ocr_lib-0.1.0.dist-info/RECORD,,
+langchain_ocr_lib-0.3.0.dist-info/METADATA,sha256=IaqIz9OXgu5WQXwEVpLmMNLmz2w3IowWmdZ7kt5O6VM,6240
+langchain_ocr_lib-0.3.0.dist-info/WHEEL,sha256=Nq82e9rUAnEjt98J6MlVmMCZb-t9cYE2Ir1kpBmnWfs,88
+langchain_ocr_lib-0.3.0.dist-info/entry_points.txt,sha256=l4mIs0tnIgbJYuVveZySQKVBnqNMHS-8ZZtLwz8ag5k,61
+langchain_ocr_lib-0.3.0.dist-info/RECORD,,

{langchain_ocr_lib-0.1.0.dist-info → langchain_ocr_lib-0.3.0.dist-info}/WHEEL RENAMED Viewed

@@ -1,4 +1,4 @@
 Wheel-Version: 1.0
-Generator: poetry-core 2.1.2
+Generator: poetry-core 1.9.1
 Root-Is-Purelib: true
 Tag: py3-none-any

langchain_ocr_lib-0.1.0.dist-info/METADATA DELETED Viewed

@@ -1,28 +0,0 @@
-Metadata-Version: 2.3
-Name: langchain-ocr-lib
-Version: 0.1.0
-Summary:
-License: MIT
-Author: Andreas Klos
-Author-email: aklos@outlook.de
-Requires-Python: >=3.11,<4.0
-Classifier: License :: OSI Approved :: MIT License
-Classifier: Programming Language :: Python :: 3
-Classifier: Programming Language :: Python :: 3.11
-Classifier: Programming Language :: Python :: 3.12
-Classifier: Programming Language :: Python :: 3.13
-Requires-Dist: deprecated (>=1.2.14,<2.0.0)
-Requires-Dist: inject (>=5.2.1,<6.0.0)
-Requires-Dist: langchain-community (>=0.3.19,<0.4.0)
-Requires-Dist: langchain-ollama (>=0.2.0,<0.3.0)
-Requires-Dist: langchain-openai (>=0.3.8,<0.4.0)
-Requires-Dist: langfuse (>=2.59.7,<3.0.0)
-Requires-Dist: openai (>=1.42.0,<2.0.0)
-Requires-Dist: pdf2image (>=1.17.0,<2.0.0)
-Requires-Dist: pillow (>=11.0.0,<12.0.0)
-Requires-Dist: pycountry (>=24.6.1,<25.0.0)
-Requires-Dist: pytest-asyncio (>=0.25.0,<0.26.0)
-Requires-Dist: pyyaml (>=6.0.2,<7.0.0)
-Description-Content-Type: text/markdown

{langchain_ocr_lib-0.1.0.dist-info → langchain_ocr_lib-0.3.0.dist-info}/entry_points.txt RENAMED Viewed

File without changes

langchain-ocr-lib 0.1.0__py3-none-any.whl → 0.3.0__py3-none-any.whl

langchain-ocr-lib 0.1.0py3-none-any.whl → 0.3.0py3-none-any.whl