PyPI - doctra - Versions diffs - 0.5.0__tar.gz → 0.5.1__tar.gz - Mend

doctra 0.5.0 (tar.gz) → 0.5.1 (tar.gz)

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (85) hide show

{doctra-0.5.0/doctra.egg-info → doctra-0.5.1}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: doctra
-Version: 0.5.0
+Version: 0.5.1
 Summary: Parse, extract, and analyze documents with ease
 Home-page: https://github.com/AdemBoukhris457/Doctra
 Author: Adem Boukhris
@@ -362,7 +362,7 @@ parser = StructuredPDFParser()
 # Parser with VLM for structured data extraction
 parser = StructuredPDFParser(
     use_vlm=True,
-    vlm_provider="openai",  # or "gemini" or "anthropic" or "openrouter"
+    vlm_provider="openai",  # or "gemini", "anthropic", "openrouter", "qianfan", "ollama"
     vlm_api_key="your_api_key_here"
 )
@@ -917,7 +917,7 @@ parser.display_pages_with_boxes("document.pdf")
 ### 🤖 VLM Integration
 - Vision Language Model support for structured data extraction
-- Multiple provider options (OpenAI, Gemini, Anthropic, OpenRouter)
+- Multiple provider options (OpenAI, Gemini, Anthropic, OpenRouter, Qianfan, Ollama)
 - Automatic conversion of charts and tables to structured formats
 ### 📊 Multiple Output Formats

{doctra-0.5.0 → doctra-0.5.1}/README.md RENAMED Viewed

@@ -102,7 +102,7 @@ parser = StructuredPDFParser()
 # Parser with VLM for structured data extraction
 parser = StructuredPDFParser(
     use_vlm=True,
-    vlm_provider="openai",  # or "gemini" or "anthropic" or "openrouter"
+    vlm_provider="openai",  # or "gemini", "anthropic", "openrouter", "qianfan", "ollama"
     vlm_api_key="your_api_key_here"
 )
@@ -657,7 +657,7 @@ parser.display_pages_with_boxes("document.pdf")
 ### 🤖 VLM Integration
 - Vision Language Model support for structured data extraction
-- Multiple provider options (OpenAI, Gemini, Anthropic, OpenRouter)
+- Multiple provider options (OpenAI, Gemini, Anthropic, OpenRouter, Qianfan, Ollama)
 - Automatic conversion of charts and tables to structured formats
 ### 📊 Multiple Output Formats

{doctra-0.5.0 → doctra-0.5.1}/doctra/engines/vlm/provider.py RENAMED Viewed

@@ -22,10 +22,10 @@ def make_model(
     """
     Build a callable Outlines model for VLM processing.
-    Creates an Outlines model instance configured for Gemini, OpenAI, Anthropic, OpenRouter, or Ollama
+    Creates an Outlines model instance configured for Gemini, OpenAI, Anthropic, OpenRouter, Qianfan, or Ollama
     providers. Only one backend is active at a time, with Gemini as the default.
-    :param vlm_provider: VLM provider to use ("gemini", "openai", "anthropic", "openrouter", or "ollama", default: "gemini")
+    :param vlm_provider: VLM provider to use ("gemini", "openai", "anthropic", "openrouter", "qianfan", or "ollama", default: "gemini")
     :param vlm_model: Model name to use (defaults to provider-specific defaults)
     :param api_key: API key for the VLM provider (required for all providers except Ollama)
     :return: Configured Outlines model instance
@@ -43,6 +43,8 @@ def make_model(
             vlm_model = "claude-opus-4-1"
         elif vlm_provider == "openrouter":
             vlm_model = "x-ai/grok-4"
+        elif vlm_provider == "qianfan":
+            vlm_model = "ernie-4.5-turbo-vl-32k"
         elif vlm_provider == "ollama":
             vlm_model = "llava:latest"
@@ -87,11 +89,24 @@ def make_model(
             vlm_model
         )
+    if vlm_provider == "qianfan":
+        if not api_key:
+            raise ValueError("Qianfan provider requires api_key to be passed to make_model(...).")
+        # Create the Qianfan client with OpenAI-compatible interface
+        client = openai.OpenAI(
+            base_url="https://qianfan.baidubce.com/v2",
+            api_key=api_key,
+        )
+        return outlines.from_openai(
+            client,
+            vlm_model
+        )
     if vlm_provider == "ollama":
         # Ollama doesn't use Outlines, so we return a custom wrapper
         return OllamaModelWrapper(vlm_model)
-    raise ValueError(f"Unsupported provider: {vlm_provider}. Use 'gemini', 'openai', 'anthropic', 'openrouter', or 'ollama'.")
+    raise ValueError(f"Unsupported provider: {vlm_provider}. Use 'gemini', 'openai', 'anthropic', 'openrouter', 'qianfan', or 'ollama'.")
 class OllamaModelWrapper:

{doctra-0.5.0 → doctra-0.5.1}/doctra/engines/vlm/service.py RENAMED Viewed

@@ -32,7 +32,7 @@ class VLMStructuredExtractor:
         """
         Initialize the VLMStructuredExtractor with provider configuration.
-        :param vlm_provider: VLM provider to use ("gemini", "openai", "anthropic", or "openrouter", default: "gemini")
+        :param vlm_provider: VLM provider to use ("gemini", "openai", "anthropic", "openrouter", "qianfan", or "ollama", default: "gemini")
         :param vlm_model: Model name to use (defaults to provider-specific defaults)
         :param api_key: API key for the VLM provider (required for all providers)
         """

{doctra-0.5.0 → doctra-0.5.1}/doctra/version.py RENAMED Viewed

@@ -1,2 +1,2 @@
 """Version information for Doctra."""
-__version__ = '0.5.0'
+__version__ = '0.5.1'

{doctra-0.5.0 → doctra-0.5.1/doctra.egg-info}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: doctra
-Version: 0.5.0
+Version: 0.5.1
 Summary: Parse, extract, and analyze documents with ease
 Home-page: https://github.com/AdemBoukhris457/Doctra
 Author: Adem Boukhris
@@ -362,7 +362,7 @@ parser = StructuredPDFParser()
 # Parser with VLM for structured data extraction
 parser = StructuredPDFParser(
     use_vlm=True,
-    vlm_provider="openai",  # or "gemini" or "anthropic" or "openrouter"
+    vlm_provider="openai",  # or "gemini", "anthropic", "openrouter", "qianfan", "ollama"
     vlm_api_key="your_api_key_here"
 )
@@ -917,7 +917,7 @@ parser.display_pages_with_boxes("document.pdf")
 ### 🤖 VLM Integration
 - Vision Language Model support for structured data extraction
-- Multiple provider options (OpenAI, Gemini, Anthropic, OpenRouter)
+- Multiple provider options (OpenAI, Gemini, Anthropic, OpenRouter, Qianfan, Ollama)
 - Automatic conversion of charts and tables to structured formats
 ### 📊 Multiple Output Formats