kodexa 6.1.1a1__tar.gz → 6.1.1a2.post4573624930__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/PKG-INFO +1 -1
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/platform/client.py +26 -1
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/pyproject.toml +1 -1
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/setup.py +1 -1
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/LICENSE +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/README.md +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/assistant/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/assistant/assistant.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/connectors/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/connectors/connectors.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/base.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/model.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/objects.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/persistence.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/pipeline/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/pipeline/pipeline.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/platform/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/platform/kodexa.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/ast.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/core.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/lexrules.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/lextab.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/lextab.pyi +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parserules.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parserules.pyi +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parsetab.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parsetab.pyi +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/azure_models.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/bbox_common.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/table_form_common.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/steps/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/steps/common.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/testing/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/testing/test_components.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/testing/test_utils.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/training/__init__.py +0 -0
- {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/training/train_utils.py +0 -0
@@ -1937,6 +1937,31 @@ class DataStoreEndpoint(StoreEndpoint):
|
|
1937
1937
|
data_object_page.content]
|
1938
1938
|
return data_object_page
|
1939
1939
|
|
1940
|
+
def get_stream_data_objects_request(self, path: str, query="*", document_family: Optional[DocumentFamily] = None,
|
1941
|
+
parent_id: Optional[str] = None):
|
1942
|
+
"""
|
1943
|
+
Stream page request
|
1944
|
+
:param path (str): The parent taxon (/ is root)
|
1945
|
+
:param query (str): The query to limit results (Default *)
|
1946
|
+
:param document_family (Optional[DocumentFamily]): Optionally the document family to limit results to
|
1947
|
+
:param parent_id (Optional[str]): Optionally the parent ID to limit results to
|
1948
|
+
:return:
|
1949
|
+
"""
|
1950
|
+
page_size = 20
|
1951
|
+
page = 1
|
1952
|
+
|
1953
|
+
while True:
|
1954
|
+
data_object_response = self.get_data_objects_page_request(self, path, page, page_size, query,
|
1955
|
+
document_family, parent_id)
|
1956
|
+
if not data_object_response.content:
|
1957
|
+
break
|
1958
|
+
|
1959
|
+
yield data_object_response.content
|
1960
|
+
for data_object in data_object_response.content:
|
1961
|
+
yield data_object
|
1962
|
+
|
1963
|
+
page += 1
|
1964
|
+
|
1940
1965
|
def create_data_objects(self, data_objects: List[DataObject]) -> List[DataObjectEndpoint]:
|
1941
1966
|
"""
|
1942
1967
|
Create data objects in the store
|
@@ -2079,7 +2104,7 @@ class DocumentStoreEndpoint(StoreEndpoint):
|
|
2079
2104
|
def download_document_families(self, output_dir: str):
|
2080
2105
|
"""Download all the document families in the store to the given directory"""
|
2081
2106
|
|
2082
|
-
for document_family in self.
|
2107
|
+
for document_family in self.stream_query():
|
2083
2108
|
export_bytes = document_family.export()
|
2084
2109
|
with open(os.path.join(output_dir, document_family.id + ".dfm"), 'wb') as f:
|
2085
2110
|
f.write(export_bytes)
|
@@ -1,6 +1,6 @@
|
|
1
1
|
[tool.poetry]
|
2
2
|
name = "kodexa"
|
3
|
-
version = "6.1.1a1"
|
3
|
+
version = "6.1.1a2-4573624930"
|
4
4
|
description = "Python SDK for the Kodexa Platform"
|
5
5
|
authors = ["Austin Redenbaugh <austin@kodexa.com>", "Philip Dodds <philip@kodexa.com>", "Romar Cablao <rcablao@kodexa.com>", "Amadea Paula Dodds <amadeapaula@kodexa.com>"]
|
6
6
|
readme = "README.md"
|
@@ -37,7 +37,7 @@ install_requires = \
|
|
37
37
|
|
38
38
|
setup_kwargs = {
|
39
39
|
'name': 'kodexa',
|
40
|
-
'version': '6.1.1a1',
|
40
|
+
'version': '6.1.1a2.post4573624930',
|
41
41
|
'description': 'Python SDK for the Kodexa Platform',
|
42
42
|
'long_description': '# Kodexa\n\n[](https://github.com/kodexa-ai/kodexa/actions/workflows/main.yml)\n\n\n\nKodexa is a platform for building intelligent document processing pipelines. It is a set of tools and services that\nallow you to build a pipeline that can take a document, extract the content, and then process it to extract the\ninformation you need.\n\nIt is built on a set of core principles:\n\n* **Document Centric** - Kodexa is built around the idea of a document. A document is a collection of content\n nodes that are connected together. This is a powerful model that allows you to build pipelines that can\n extract content from a wide range of sources.\n\n* **Pipeline Oriented** - Kodexa is built around the idea of a pipeline. A pipeline is a series of steps that\n can be executed on a document. This allows you to build a pipeline that can extract content from a wide range\n of sources.\n\n* **Extensible** - Kodexa is built around the idea of a pipeline. A pipeline is a series of steps that can be executed\n on a document. This allows you to build a pipeline that can extract content from a wide range of sources.\n\n* **Label Driven** - Kodexa focuses on the idea of labels. Labels are a way to identify content within a document\n and then use that content to drive the processing of the document.\n\n# Python SDK\n\nThis repository contains the Python SDK for Kodexa. The SDK is the primary way to interact with Kodexa. It allows you to\ndefine actions, models, and pipelines that can be executed on Kodexa. 
It also includes a complete SDK client for\nworking with a Kodexa platform instance.\n\n## Documentation & Examples\n\nDocumentation is available at the [Kodexa Documentation Portal](https://docs.kodexa.com)\n\n## Current Development\n\nThe main branch is 6.0 which is a production release.\n\n## Set-up\n\nWe use poetry to manage our dependencies, so you can install them with:\n\n poetry install\n\nYou can then run the tests with:\n\n poetry run pytest\n\n# Contributing\n\nWe welcome contributions to the Kodexa platform. Please see our [contributing guide](CONTRIBUTING.md) for more details.\n\n# License\n\nApache 2.0\n',
|
43
43
|
'author': 'Austin Redenbaugh',
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|
File without changes
|