PyPI - chunkr-ai - Versions diffs - 0.1.0a10__py3-none-any.whl → 0.1.0a11__py3-none-any.whl - Mend

chunkr-ai 0.1.0a10-py3-none-any.whl → 0.1.0a11-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (23)

chunkr_ai/_version.py +1 -1
chunkr_ai/resources/tasks/parse.py +9 -0
chunkr_ai/types/__init__.py +2 -0
chunkr_ai/types/file_info.py +0 -3
chunkr_ai/types/llm_processing.py +36 -0
chunkr_ai/types/llm_processing_param.py +36 -0
chunkr_ai/types/ocr_result.py +6 -6
chunkr_ai/types/parse_configuration.py +4 -0
chunkr_ai/types/parse_configuration_param.py +4 -0
chunkr_ai/types/segment.py +5 -8
chunkr_ai/types/segment_processing.py +2 -92
chunkr_ai/types/segment_processing_param.py +2 -92
chunkr_ai/types/task_response.py +2 -8
chunkr_ai/types/tasks/extract_create_response.py +1 -7
chunkr_ai/types/tasks/extract_get_response.py +1 -7
chunkr_ai/types/tasks/parse_create_params.py +4 -0
chunkr_ai/types/tasks/parse_create_response.py +0 -6
chunkr_ai/types/tasks/parse_get_response.py +0 -6
chunkr_ai/types/version_info.py +1 -1
{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/METADATA +1 -1
{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/RECORD +23 -21
{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/WHEEL +0 -0
{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/licenses/LICENSE +0 -0

chunkr_ai/_version.py CHANGED Viewed

@@ -1,4 +1,4 @@
 # File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
 __title__ = "chunkr_ai"
-__version__ = "0.1.0-alpha.10"  # x-release-please-version
+__version__ = "0.1.0-alpha.11"  # x-release-please-version

chunkr_ai/resources/tasks/parse.py CHANGED Viewed

@@ -19,6 +19,7 @@ from ..._response import (
 )
 from ...types.tasks import parse_get_params, parse_create_params
 from ..._base_client import make_request_options
+from ...types.llm_processing_param import LlmProcessingParam
 from ...types.chunk_processing_param import ChunkProcessingParam
 from ...types.segment_processing_param import SegmentProcessingParam
 from ...types.tasks.parse_get_response import ParseGetResponse
@@ -55,6 +56,7 @@ class ParseResource(SyncAPIResource):
         error_handling: Literal["Fail", "Continue"] | Omit = omit,
         expires_in: Optional[int] | Omit = omit,
         file_name: Optional[str] | Omit = omit,
+        llm_processing: LlmProcessingParam | Omit = omit,
         ocr_strategy: Literal["All", "Auto"] | Omit = omit,
         pipeline: Literal["Azure", "Chunkr"] | Omit = omit,
         segment_processing: Optional[SegmentProcessingParam] | Omit = omit,
@@ -97,6 +99,8 @@ class ParseResource(SyncAPIResource):
           file_name: The name of the file to be parsed. If not set a name will be generated.
+          llm_processing: Controls the LLM used for the task.
           ocr_strategy: Controls the Optical Character Recognition (OCR) strategy.
               - `All`: Processes all pages with OCR. (Latency penalty: ~0.5 seconds per page)
@@ -146,6 +150,7 @@ class ParseResource(SyncAPIResource):
                     "error_handling": error_handling,
                     "expires_in": expires_in,
                     "file_name": file_name,
+                    "llm_processing": llm_processing,
                     "ocr_strategy": ocr_strategy,
                     "pipeline": pipeline,
                     "segment_processing": segment_processing,
@@ -251,6 +256,7 @@ class AsyncParseResource(AsyncAPIResource):
         error_handling: Literal["Fail", "Continue"] | Omit = omit,
         expires_in: Optional[int] | Omit = omit,
         file_name: Optional[str] | Omit = omit,
+        llm_processing: LlmProcessingParam | Omit = omit,
         ocr_strategy: Literal["All", "Auto"] | Omit = omit,
         pipeline: Literal["Azure", "Chunkr"] | Omit = omit,
         segment_processing: Optional[SegmentProcessingParam] | Omit = omit,
@@ -293,6 +299,8 @@ class AsyncParseResource(AsyncAPIResource):
           file_name: The name of the file to be parsed. If not set a name will be generated.
+          llm_processing: Controls the LLM used for the task.
           ocr_strategy: Controls the Optical Character Recognition (OCR) strategy.
               - `All`: Processes all pages with OCR. (Latency penalty: ~0.5 seconds per page)
@@ -342,6 +350,7 @@ class AsyncParseResource(AsyncAPIResource):
                     "error_handling": error_handling,
                     "expires_in": expires_in,
                     "file_name": file_name,
+                    "llm_processing": llm_processing,
                     "ocr_strategy": ocr_strategy,
                     "pipeline": pipeline,
                     "segment_processing": segment_processing,

chunkr_ai/types/__init__.py CHANGED Viewed

@@ -15,6 +15,7 @@ from .ocr_result import OcrResult as OcrResult
 from .bounding_box import BoundingBox as BoundingBox
 from .version_info import VersionInfo as VersionInfo
 from .task_response import TaskResponse as TaskResponse
+from .llm_processing import LlmProcessing as LlmProcessing
 from .file_url_params import FileURLParams as FileURLParams
 from .task_get_params import TaskGetParams as TaskGetParams
 from .chunk_processing import ChunkProcessing as ChunkProcessing
@@ -25,6 +26,7 @@ from .file_create_params import FileCreateParams as FileCreateParams
 from .segment_processing import SegmentProcessing as SegmentProcessing
 from .files_list_response import FilesListResponse as FilesListResponse
 from .parse_configuration import ParseConfiguration as ParseConfiguration
+from .llm_processing_param import LlmProcessingParam as LlmProcessingParam
 from .unwrap_webhook_event import UnwrapWebhookEvent as UnwrapWebhookEvent
 from .webhook_url_response import WebhookURLResponse as WebhookURLResponse
 from .extract_configuration import ExtractConfiguration as ExtractConfiguration

chunkr_ai/types/file_info.py CHANGED Viewed

@@ -19,6 +19,3 @@ class FileInfo(BaseModel):
     page_count: Optional[int] = None
     """The number of pages in the file."""
-    ss_cell_count: Optional[int] = None
-    """The number of cells in the file. Only used for spreadsheets."""

chunkr_ai/types/llm_processing.py ADDED Viewed

@@ -0,0 +1,36 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+from typing import Union, Optional
+from typing_extensions import Literal, TypeAlias
+from pydantic import Field as FieldInfo
+from .._models import BaseModel
+__all__ = ["LlmProcessing", "FallbackStrategy", "FallbackStrategyModel"]
+class FallbackStrategyModel(BaseModel):
+    model: str = FieldInfo(alias="Model")
+    """Use a specific model as fallback"""
+FallbackStrategy: TypeAlias = Union[Literal["None", "Default"], FallbackStrategyModel]
+class LlmProcessing(BaseModel):
+    fallback_strategy: Optional[FallbackStrategy] = None
+    """The fallback strategy to use for the LLMs in the task."""
+    llm_model_id: Optional[str] = None
+    """The ID of the model to use for the task.
+    If not provided, the default model will be used. Please check the documentation
+    for the model you want to use.
+    """
+    max_completion_tokens: Optional[int] = None
+    """The maximum number of tokens to generate."""
+    temperature: Optional[float] = None
+    """The temperature to use for the LLM."""

chunkr_ai/types/llm_processing_param.py ADDED Viewed

@@ -0,0 +1,36 @@
+# File generated from our OpenAPI spec by Stainless. See CONTRIBUTING.md for details.
+from __future__ import annotations
+from typing import Union, Optional
+from typing_extensions import Literal, Required, Annotated, TypeAlias, TypedDict
+from .._utils import PropertyInfo
+__all__ = ["LlmProcessingParam", "FallbackStrategy", "FallbackStrategyModel"]
+class FallbackStrategyModel(TypedDict, total=False):
+    model: Required[Annotated[str, PropertyInfo(alias="Model")]]
+    """Use a specific model as fallback"""
+FallbackStrategy: TypeAlias = Union[Literal["None", "Default"], FallbackStrategyModel]
+class LlmProcessingParam(TypedDict, total=False):
+    fallback_strategy: FallbackStrategy
+    """The fallback strategy to use for the LLMs in the task."""
+    llm_model_id: Optional[str]
+    """The ID of the model to use for the task.
+    If not provided, the default model will be used. Please check the documentation
+    for the model you want to use.
+    """
+    max_completion_tokens: Optional[int]
+    """The maximum number of tokens to generate."""
+    temperature: float
+    """The temperature to use for the LLM."""

chunkr_ai/types/ocr_result.py CHANGED Viewed

@@ -15,14 +15,14 @@ class OcrResult(BaseModel):
     text: str
     """The recognized text of the OCR result."""
+    cell_ref: Optional[str] = None
+    """
+    Excel-style cell reference (e.g., "A1" or "A1:B2") when OCR originates from a
+    spreadsheet cell
+    """
     confidence: Optional[float] = None
     """The confidence score of the recognized text."""
     ocr_id: Optional[str] = None
     """The unique identifier for the OCR result."""
-    ss_cell_ref: Optional[str] = None
-    """
-    Excel-style cell reference (e.g., "A1" or "A1:B2") when OCR originates from a
-    spreadsheet cell
-    """

chunkr_ai/types/parse_configuration.py CHANGED Viewed

@@ -4,6 +4,7 @@ from typing import Optional
 from typing_extensions import Literal
 from .._models import BaseModel
+from .llm_processing import LlmProcessing
 from .chunk_processing import ChunkProcessing
 from .segment_processing import SegmentProcessing
@@ -22,6 +23,9 @@ class ParseConfiguration(BaseModel):
       LLM refusals etc.)
     """
+    llm_processing: Optional[LlmProcessing] = None
+    """Controls the LLM used for the task."""
     ocr_strategy: Optional[Literal["All", "Auto"]] = None
     """Controls the Optical Character Recognition (OCR) strategy.

chunkr_ai/types/parse_configuration_param.py CHANGED Viewed

@@ -5,6 +5,7 @@ from __future__ import annotations
 from typing import Optional
 from typing_extensions import Literal, TypedDict
+from .llm_processing_param import LlmProcessingParam
 from .chunk_processing_param import ChunkProcessingParam
 from .segment_processing_param import SegmentProcessingParam
@@ -23,6 +24,9 @@ class ParseConfigurationParam(TypedDict, total=False):
       LLM refusals etc.)
     """
+    llm_processing: LlmProcessingParam
+    """Controls the LLM used for the task."""
     ocr_strategy: Literal["All", "Auto"]
     """Controls the Optical Character Recognition (OCR) strategy.

chunkr_ai/types/segment.py CHANGED Viewed

@@ -31,23 +31,20 @@ class Segment(BaseModel):
         "Caption",
         "Footnote",
         "Formula",
-        "FormRegion",
-        "GraphicalItem",
-        "Legend",
-        "LineNumber",
         "ListItem",
         "Page",
         "PageFooter",
         "PageHeader",
-        "PageNumber",
         "Picture",
+        "SectionHeader",
         "Table",
         "Text",
         "Title",
-        "Unknown",
-        "SectionHeader",
     ]
-    """All the possible types for a segment."""
+    """
+    All the possible types for a segment. Note: Different configurations will
+    produce different types. Please refer to the documentation for more information.
+    """
     confidence: Optional[float] = None
     """Confidence score of the layout analysis model"""

chunkr_ai/types/segment_processing.py CHANGED Viewed

@@ -47,24 +47,6 @@ class SegmentProcessing(BaseModel):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    form_region: Optional[GenerationConfig] = FieldInfo(alias="FormRegion", default=None)
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
     formula: Optional[GenerationConfig] = FieldInfo(alias="Formula", default=None)
     """Controls the processing and generation for the segment.
@@ -83,60 +65,6 @@ class SegmentProcessing(BaseModel):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    graphical_item: Optional[GenerationConfig] = FieldInfo(alias="GraphicalItem", default=None)
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
-    legend: Optional[GenerationConfig] = FieldInfo(alias="Legend", default=None)
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
-    line_number: Optional[GenerationConfig] = FieldInfo(alias="LineNumber", default=None)
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
     list_item: Optional[GenerationConfig] = FieldInfo(alias="ListItem", default=None)
     """Controls the processing and generation for the segment.
@@ -209,7 +137,7 @@ class SegmentProcessing(BaseModel):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    page_number: Optional[GenerationConfig] = FieldInfo(alias="PageNumber", default=None)
+    picture: Optional[GenerationConfig] = FieldInfo(alias="Picture", default=None)
     """Controls the processing and generation for the segment.
     - `crop_image` controls whether to crop the file's images to the segment's
@@ -227,7 +155,7 @@ class SegmentProcessing(BaseModel):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    picture: Optional[GenerationConfig] = FieldInfo(alias="Picture", default=None)
+    section_header: Optional[GenerationConfig] = FieldInfo(alias="SectionHeader", default=None)
     """Controls the processing and generation for the segment.
     - `crop_image` controls whether to crop the file's images to the segment's
@@ -298,21 +226,3 @@ class SegmentProcessing(BaseModel):
       configuration.
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    unknown: Optional[GenerationConfig] = FieldInfo(alias="Unknown", default=None)
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """

chunkr_ai/types/segment_processing_param.py CHANGED Viewed

@@ -48,24 +48,6 @@ class SegmentProcessingParam(TypedDict, total=False):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    form_region: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="FormRegion")]
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
     formula: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="Formula")]
     """Controls the processing and generation for the segment.
@@ -84,60 +66,6 @@ class SegmentProcessingParam(TypedDict, total=False):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    graphical_item: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="GraphicalItem")]
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
-    legend: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="Legend")]
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
-    line_number: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="LineNumber")]
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """
     list_item: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="ListItem")]
     """Controls the processing and generation for the segment.
@@ -210,7 +138,7 @@ class SegmentProcessingParam(TypedDict, total=False):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    page_number: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="PageNumber")]
+    picture: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="Picture")]
     """Controls the processing and generation for the segment.
     - `crop_image` controls whether to crop the file's images to the segment's
@@ -228,7 +156,7 @@ class SegmentProcessingParam(TypedDict, total=False):
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    picture: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="Picture")]
+    section_header: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="SectionHeader")]
     """Controls the processing and generation for the segment.
     - `crop_image` controls whether to crop the file's images to the segment's
@@ -299,21 +227,3 @@ class SegmentProcessingParam(TypedDict, total=False):
       configuration.
     - `extended_context` uses the full page image as context for LLM generation.
     """
-    unknown: Annotated[Optional[GenerationConfigParam], PropertyInfo(alias="Unknown")]
-    """Controls the processing and generation for the segment.
-    - `crop_image` controls whether to crop the file's images to the segment's
-      bounding box. The cropped image will be stored in the segment's `image` field.
-      Use `All` to always crop, or `Auto` to only crop when needed for
-      post-processing.
-    - `format` specifies the output format: `Html` or `Markdown`
-    - `strategy` determines how the content is generated: `Auto`, `LLM`, or `Ignore`
-      - `Auto`: Process content automatically
-      - `LLM`: Use large language models for processing
-      - `Ignore`: Exclude segments from final output
-    - `description` enables LLM-generated descriptions for segments. **Note:** This
-      uses chunkr's own VLM models and is not configurable via LLM processing
-      configuration.
-    - `extended_context` uses the full page image as context for LLM generation.
-    """

chunkr_ai/types/task_response.py CHANGED Viewed

@@ -20,12 +20,6 @@ Output: TypeAlias = Union[ParseOutputResponse, ExtractOutputResponse, None]
 class TaskResponse(BaseModel):
-    completed: bool
-    """True when the task reaches a terminal state i.e.
-    `status` is `Succeeded` or `Failed` or `Cancelled`
-    """
     configuration: Configuration
     """
     Unified configuration type that can represent either parse or extract
@@ -64,8 +58,8 @@ class TaskResponse(BaseModel):
     output: Optional[Output] = None
     """Unified output type that can represent either parse or extract results"""
-    parse_task_id: Optional[str] = None
-    """The ID of the source `parse` task that was used for the task"""
+    source_task_id: Optional[str] = None
+    """The ID of the source task that was used for the task"""
     started_at: Optional[datetime] = None
     """The date and time when the task was started."""

chunkr_ai/types/tasks/extract_create_response.py CHANGED Viewed

@@ -14,12 +14,6 @@ __all__ = ["ExtractCreateResponse"]
 class ExtractCreateResponse(BaseModel):
-    completed: bool
-    """True when the task reaches a terminal state i.e.
-    `status` is `Succeeded` or `Failed` or `Cancelled`
-    """
     configuration: ExtractConfiguration
     created_at: datetime
@@ -63,7 +57,7 @@ class ExtractCreateResponse(BaseModel):
       for that field.
     """
-    parse_task_id: Optional[str] = None
+    source_task_id: Optional[str] = None
     """The ID of the source `parse` task that was used for extraction"""
     started_at: Optional[datetime] = None

chunkr_ai/types/tasks/extract_get_response.py CHANGED Viewed

@@ -14,12 +14,6 @@ __all__ = ["ExtractGetResponse"]
 class ExtractGetResponse(BaseModel):
-    completed: bool
-    """True when the task reaches a terminal state i.e.
-    `status` is `Succeeded` or `Failed` or `Cancelled`
-    """
     configuration: ExtractConfiguration
     created_at: datetime
@@ -63,7 +57,7 @@ class ExtractGetResponse(BaseModel):
       for that field.
     """
-    parse_task_id: Optional[str] = None
+    source_task_id: Optional[str] = None
     """The ID of the source `parse` task that was used for extraction"""
     started_at: Optional[datetime] = None

chunkr_ai/types/tasks/parse_create_params.py CHANGED Viewed

@@ -5,6 +5,7 @@ from __future__ import annotations
 from typing import Optional
 from typing_extensions import Literal, Required, TypedDict
+from ..llm_processing_param import LlmProcessingParam
 from ..chunk_processing_param import ChunkProcessingParam
 from ..segment_processing_param import SegmentProcessingParam
@@ -41,6 +42,9 @@ class ParseCreateParams(TypedDict, total=False):
     file_name: Optional[str]
     """The name of the file to be parsed. If not set a name will be generated."""
+    llm_processing: LlmProcessingParam
+    """Controls the LLM used for the task."""
     ocr_strategy: Literal["All", "Auto"]
     """Controls the Optical Character Recognition (OCR) strategy.

chunkr_ai/types/tasks/parse_create_response.py CHANGED Viewed

@@ -14,12 +14,6 @@ __all__ = ["ParseCreateResponse"]
 class ParseCreateResponse(BaseModel):
-    completed: bool
-    """True when the task reaches a terminal state i.e.
-    `status` is `Succeeded` or `Failed` or `Cancelled`
-    """
     configuration: ParseConfiguration
     created_at: datetime

chunkr_ai/types/tasks/parse_get_response.py CHANGED Viewed

@@ -14,12 +14,6 @@ __all__ = ["ParseGetResponse"]
 class ParseGetResponse(BaseModel):
-    completed: bool
-    """True when the task reaches a terminal state i.e.
-    `status` is `Succeeded` or `Failed` or `Cancelled`
-    """
     configuration: ParseConfiguration
     created_at: datetime

chunkr_ai/types/version_info.py CHANGED Viewed

@@ -20,7 +20,7 @@ class ClientVersionGeneratedSDK(BaseModel):
     """Version of the auto-generated SDK"""
-ClientVersion: TypeAlias = Union[Literal["Legacy", "Unspecified"], ClientVersionManualSDK, ClientVersionGeneratedSDK]
+ClientVersion: TypeAlias = Union[Literal["Legacy"], ClientVersionManualSDK, ClientVersionGeneratedSDK]
 class VersionInfo(BaseModel):

{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.3
 Name: chunkr-ai
-Version: 0.1.0a10
+Version: 0.1.0a11
 Summary: The official Python library for the chunkr API
 Project-URL: Homepage, https://github.com/lumina-ai-inc/chunkr-python
 Project-URL: Repository, https://github.com/lumina-ai-inc/chunkr-python

{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/RECORD RENAMED Viewed

@@ -11,7 +11,7 @@ chunkr_ai/_resource.py,sha256=f5tiwjxcKdbeMor8idoHtMFTUhqD9yc2xXtq5rqeLLk,1100
 chunkr_ai/_response.py,sha256=xXNpF53hiYARmAW7npKuxQ5UHAEjgAzm7ME_L3eIstY,28800
 chunkr_ai/_streaming.py,sha256=ZmyrVWk7-AWkLAATR55WgNxnyFzYmaqJt2LthA_PTqQ,10100
 chunkr_ai/_types.py,sha256=nzD_EEP9CVutLcSeuKLO6Mpn5cd_R0Vo0dEM7AWa7yY,7239
-chunkr_ai/_version.py,sha256=DjItTmf7c0SXbPfiF1CUJ2pzf-qJNG2loWN0G4kVsqw,170
+chunkr_ai/_version.py,sha256=O_LWqHa5Todq2XeeCDSW_cu4p1oubeyQ-SQUznjufns,170
 chunkr_ai/pagination.py,sha256=bT-ErcJ80YlKBV6tWq2s9uqg-wv7o66SKe_AgUAGrKc,3533
 chunkr_ai/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
 chunkr_ai/_utils/__init__.py,sha256=7fch0GT9zpNnErbciSpUNa-SjTxxjY6kxHxKMOM4AGs,2305
@@ -33,9 +33,9 @@ chunkr_ai/resources/health.py,sha256=sLA4PSAf-4JK1Lrqb0TApQ0Hc5Q8fZzbKQXzA3bNEdQ
 chunkr_ai/resources/webhooks.py,sha256=RhteI3ahE2rGSDEMUZH0HDBTOQqWS8sZ5D00ErKWnpE,7006
 chunkr_ai/resources/tasks/__init__.py,sha256=wDCnwtnpTfiaLg7NBxoLZYh2TtOw44_DSqtJa_TjmXU,1439
 chunkr_ai/resources/tasks/extract.py,sha256=LQJTmYItqUu60G0hYfdw_nyMLARyxqzjVO6ETIn8hDo,14980
-chunkr_ai/resources/tasks/parse.py,sha256=hbFEFu-tU6RWktA0Tv6KP0HyeLdS62kO4UoQfbSsAJc,18963
+chunkr_ai/resources/tasks/parse.py,sha256=bQcA-zOQvTN9_OiqmzILsJLQqJtONU5XbNZQMAm-0yk,19374
 chunkr_ai/resources/tasks/tasks.py,sha256=W9bXpfgE56MkM5buBYg5-dcPYGFo_CzgVkr1kOOpXtQ,23582
-chunkr_ai/types/__init__.py,sha256=gO4mkpo_tYfe1PGSc0Uzlc8rZr9PTmHshGZFzmG98mM,2365
+chunkr_ai/types/__init__.py,sha256=vBUEzAt6cblUc44h8NivvVrua_CmaIujTvjvf8B0_S0,2499
 chunkr_ai/types/bounding_box.py,sha256=JDZlhJJl4lg6RYGf8VpC46soQfQ10-K8YwHHA6XBFkM,431
 chunkr_ai/types/cell.py,sha256=D-S_XAzmOJs0Lo2RgY7T3h_ChdhSrRrI8IN4qo2sGOU,1143
 chunkr_ai/types/cell_style.py,sha256=VqSz6pZ7rjmHYrq_S63IOFPaWvXjWhNUIGc3V4UlF6U,873
@@ -47,7 +47,7 @@ chunkr_ai/types/extract_configuration.py,sha256=OCs3SnuS8qXWB926o8Gv1Y2AuNszplGm
 chunkr_ai/types/extract_output_response.py,sha256=kfkHbeEVl3x3t-7u4h4Cd4wC5KbrOjz4-joP5RV1WyA,1272
 chunkr_ai/types/file.py,sha256=kOxR0g-3A-qOxz2cjuTcq0wFMqPoph9uQuLYQ56zb-c,718
 chunkr_ai/types/file_create_params.py,sha256=_1Dr3FlO9BOv6gzhCN4g46_otCBqEdLe0mnxpdaRPaE,468
-chunkr_ai/types/file_info.py,sha256=y5kVR3mPeiwsPBMc3IBAigQbkVRpGQN09IpDPdvCe7E,611
+chunkr_ai/types/file_info.py,sha256=78r0AITTY2nlZyW9pHy7dywVXyOsCK1Ysmmc-wfQBVM,499
 chunkr_ai/types/file_list_params.py,sha256=oJGTf88aAxBhNfmQDbxGT63b95HdSbMXUubKjXM22_U,822
 chunkr_ai/types/file_url.py,sha256=L434WnOXkNmt59dJiaAgT1_3pN3BIsxm2q14zHQK6xY,365
 chunkr_ai/types/file_url_params.py,sha256=ZHfKiy_6B25StdDemulavGcsPggNNMKLWf6KN7xfPTY,413
@@ -55,32 +55,34 @@ chunkr_ai/types/files_list_response.py,sha256=ggSRWhTzZWjcDXxStyCzrYICXXB5TqnL2j
 chunkr_ai/types/generation_config.py,sha256=9gfwdd228x29jC1egxq3IreKwgkGZCjSWHCXIkzQwqE,958
 chunkr_ai/types/generation_config_param.py,sha256=9E0Mhee-NInwOzjXmq3gpd8G5drsPBpzFs0AA2ywTc0,960
 chunkr_ai/types/health_check_response.py,sha256=6Zn5YYHCQf2RgMjDlf39mtiTPqfaBfC9Vv599U_rKCI,200
-chunkr_ai/types/ocr_result.py,sha256=W3piXLotfmZ40FJrJYMuS72shaVYLsKeN6jCf26uZGI,743
+chunkr_ai/types/llm_processing.py,sha256=cTm5LBBCpnmA4u-nGQdO67JYCTizzf4lJAvUsG6BX2Q,1095
+chunkr_ai/types/llm_processing_param.py,sha256=CSnW4-5-32Pzoo-G7G3p_NUvljtCkNguj1dHVc2Y4cA,1135
+chunkr_ai/types/ocr_result.py,sha256=EdIvpuccQ_8A8ml7yVCOEOfBoewgwTBzVJZ_les9udM,740
 chunkr_ai/types/page.py,sha256=ADdGJisS-GxBD_wdu3q1pmikgJ7twFsP0choDEXw9ro,690
-chunkr_ai/types/parse_configuration.py,sha256=WcUUk7ai0sHTeWUQYHyDn1ZjYqT7dzLqRWjGx5zFfsg,2427
-chunkr_ai/types/parse_configuration_param.py,sha256=dl884XkCnloSS9YMk8UnUm7Z963HiAzNy5qgtCSIPH8,2405
+chunkr_ai/types/parse_configuration.py,sha256=MOTypSv3kiwoLEcjAgsyc674CMG4xw6SxXEXweFU6V4,2567
+chunkr_ai/types/parse_configuration_param.py,sha256=hJWngWEtT3RYgHqkAvmS4RG7cODla6i-Cp8ubtZfmz0,2544
 chunkr_ai/types/parse_output_response.py,sha256=KfRFY5PnchJfEWr4jy3Dd-3AWeImGE5BP_NMFC5I6_c,947
-chunkr_ai/types/segment.py,sha256=KsGNynGQq7s55EHuPLY7glmvXunv2Wszhx5FhkhkN5U,3093
-chunkr_ai/types/segment_processing.py,sha256=uyNbxp7DsgTgBHoS9ELoyW8j-aTBbOshxYrb-TQ990E,17049
-chunkr_ai/types/segment_processing_param.py,sha256=a1Zk8NiaeFNSbHw5P8Usq-17mqENuZdCOQCn8nNN0o0,17199
+chunkr_ai/types/segment.py,sha256=_QNYmAMSZOCNv67CwsmIOq7X0ZeYsj6jzQbKhbnoTrA,3096
+chunkr_ai/types/segment_processing.py,sha256=0-b4nSoLeGsMKSVw5LPQFXnn-PoVvIJ0wFfSFEOTpsw,12115
+chunkr_ai/types/segment_processing_param.py,sha256=fVbvFSzmxLPiQoPniFwqqXlbo6fRaZwzZ_TbnwYVOss,12245
 chunkr_ai/types/task_extract_updated_webhook_event.py,sha256=YYHDQEs4wg2bDgGXgHUgX_CwSLFxePJZrT5OV4J6Mhk,640
 chunkr_ai/types/task_get_params.py,sha256=Nx2luhebcoaiuRln4KP4FarWvBPd1OYi__efi56zHPM,460
 chunkr_ai/types/task_list_params.py,sha256=NySdOH1mIhZAJvcHr9xm2PeODsCO05lJMsrAiGGBKNE,1275
 chunkr_ai/types/task_parse_updated_webhook_event.py,sha256=3NsfEpJr_bfFB3Y66elraSxk0FS76c60BLUmhqmU9Vc,636
-chunkr_ai/types/task_response.py,sha256=RgyRaZK8TKjVfMSvsI10LYAv61QY2-195Tg3op8yCGo,2339
+chunkr_ai/types/task_response.py,sha256=I53d8JdZxbg3p-AUnigISmwFFt5DILnm0gyOc2wRu28,2191
 chunkr_ai/types/unwrap_webhook_event.py,sha256=G23CLp0__AMlfM2xE11ugnDxN82uiG0Xru0p-pI9VHQ,442
-chunkr_ai/types/version_info.py,sha256=MVSU2Z9ATehyc1IgVExczvcP_yH7wYc1UV_BwXeF0UA,917
+chunkr_ai/types/version_info.py,sha256=1qYIitGOB7aeOI7gWFfX6cAp2yw5pMzARiTtNl5NNDc,902
 chunkr_ai/types/webhook_url_response.py,sha256=q7VsWGOLqVfA_ctdcrbynQJVbfCGh1rHlXZsDc-9Sus,205
 chunkr_ai/types/tasks/__init__.py,sha256=AEF_lM5YdEvz8_7fcX0HHnVvsXdC8Hcsb2Cs-LzRBK4,711
 chunkr_ai/types/tasks/extract_create_params.py,sha256=IV5TrFqJAGFf4w_uH3hqWlbEySlAOC_2QzwKZ-3oM6o,1376
-chunkr_ai/types/tasks/extract_create_response.py,sha256=goc8x-L3W0hJowb4PvXigc2o_p15JL0a2ESo9Geg9xc,2287
+chunkr_ai/types/tasks/extract_create_response.py,sha256=Umbm40i0Q6Oz3vX9WwTeOXwKU2g8ddZmFhRwl-5Rm5U,2147
 chunkr_ai/types/tasks/extract_get_params.py,sha256=AsJvXHvdDnIcVOvTK9gCeiMFk4wckuv19IXIJcqpqso,466
-chunkr_ai/types/tasks/extract_get_response.py,sha256=sQgDLTwpE2w-xVcuXO7NAF_kjhLXv_0swdBJQRGQNSI,2281
-chunkr_ai/types/tasks/parse_create_params.py,sha256=8ctOPP2QT-q_8zN8Fl8ene74ZGOUnR6EAA9XcvA_0p4,2957
-chunkr_ai/types/tasks/parse_create_response.py,sha256=l9hj6qKs76-qKzjBtVeo9lRe9wRuYltsh2GFNPyfEDM,1820
+chunkr_ai/types/tasks/extract_get_response.py,sha256=FWXfS3Qobg3k6seWbbXJZ5y4N_mtJbHsN_FeZV5_ieM,2141
+chunkr_ai/types/tasks/parse_create_params.py,sha256=xzWA5UX183-Lk-JDtWoV37-4pXpFGmQmS4DwSa7K8Ug,3097
+chunkr_ai/types/tasks/parse_create_response.py,sha256=asqeI2l6QbdtPhaQkxkbpSwVLe2HEFfeTPG5OX_xfus,1679
 chunkr_ai/types/tasks/parse_get_params.py,sha256=Ca0C91k6ajNTMhtUkFMulgC6g8_wI7YLVGxsWiupiVA,462
-chunkr_ai/types/tasks/parse_get_response.py,sha256=2IoZeN8BAxQEtxRq6CCA_d9nWPvCQbp71zMzaaKPlug,1814
-chunkr_ai-0.1.0a10.dist-info/METADATA,sha256=xTpeNw9Gsz28LK7DnbTqP7cw_VcaVifr2tHH2DepHho,16493
-chunkr_ai-0.1.0a10.dist-info/WHEEL,sha256=C2FUgwZgiLbznR-k0b_5k3Ai_1aASOXDss3lzCUsUug,87
-chunkr_ai-0.1.0a10.dist-info/licenses/LICENSE,sha256=3FDRL-L-DFkrFy8yJpb1Nxhuztm0PB2kawcCgK5utFg,11336
-chunkr_ai-0.1.0a10.dist-info/RECORD,,
+chunkr_ai/types/tasks/parse_get_response.py,sha256=-0_j1_5skabmAtmcK882jZGroVsBRxC_o5d6pg31bJY,1673
+chunkr_ai-0.1.0a11.dist-info/METADATA,sha256=-aO85KHXxUtKZc2UZdKBe_pIWnljQ8wOj02ug2oVGCE,16493
+chunkr_ai-0.1.0a11.dist-info/WHEEL,sha256=C2FUgwZgiLbznR-k0b_5k3Ai_1aASOXDss3lzCUsUug,87
+chunkr_ai-0.1.0a11.dist-info/licenses/LICENSE,sha256=3FDRL-L-DFkrFy8yJpb1Nxhuztm0PB2kawcCgK5utFg,11336
+chunkr_ai-0.1.0a11.dist-info/RECORD,,

{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/WHEEL RENAMED Viewed

File without changes

{chunkr_ai-0.1.0a10.dist-info → chunkr_ai-0.1.0a11.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

chunkr-ai 0.1.0a10__py3-none-any.whl → 0.1.0a11__py3-none-any.whl

chunkr-ai 0.1.0a10py3-none-any.whl → 0.1.0a11py3-none-any.whl