kodexa 6.1.1a1__tar.gz → 6.1.1a2.post4573624930__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (41) hide show
  1. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/PKG-INFO +1 -1
  2. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/platform/client.py +26 -1
  3. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/pyproject.toml +1 -1
  4. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/setup.py +1 -1
  5. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/LICENSE +0 -0
  6. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/README.md +0 -0
  7. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/__init__.py +0 -0
  8. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/assistant/__init__.py +0 -0
  9. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/assistant/assistant.py +0 -0
  10. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/connectors/__init__.py +0 -0
  11. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/connectors/connectors.py +0 -0
  12. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/__init__.py +0 -0
  13. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/base.py +0 -0
  14. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/model.py +0 -0
  15. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/objects.py +0 -0
  16. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/model/persistence.py +0 -0
  17. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/pipeline/__init__.py +0 -0
  18. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/pipeline/pipeline.py +0 -0
  19. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/platform/__init__.py +0 -0
  20. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/platform/kodexa.py +0 -0
  21. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/__init__.py +0 -0
  22. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/ast.py +0 -0
  23. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/core.py +0 -0
  24. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/lexrules.py +0 -0
  25. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/lextab.py +0 -0
  26. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/lextab.pyi +0 -0
  27. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parserules.py +0 -0
  28. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parserules.pyi +0 -0
  29. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parsetab.py +0 -0
  30. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/selectors/parsetab.pyi +0 -0
  31. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/__init__.py +0 -0
  32. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/azure_models.py +0 -0
  33. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/bbox_common.py +0 -0
  34. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/spatial/table_form_common.py +0 -0
  35. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/steps/__init__.py +0 -0
  36. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/steps/common.py +0 -0
  37. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/testing/__init__.py +0 -0
  38. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/testing/test_components.py +0 -0
  39. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/testing/test_utils.py +0 -0
  40. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/training/__init__.py +0 -0
  41. {kodexa-6.1.1a1 → kodexa-6.1.1a2.post4573624930}/kodexa/training/train_utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: kodexa
3
- Version: 6.1.1a1
3
+ Version: 6.1.1a2.post4573624930
4
4
  Summary: Python SDK for the Kodexa Platform
5
5
  Author: Austin Redenbaugh
6
6
  Author-email: austin@kodexa.com
@@ -1937,6 +1937,31 @@ class DataStoreEndpoint(StoreEndpoint):
1937
1937
  data_object_page.content]
1938
1938
  return data_object_page
1939
1939
 
1940
+ def get_stream_data_objects_request(self, path: str, query="*", document_family: Optional[DocumentFamily] = None,
1941
+ parent_id: Optional[str] = None):
1942
+ """
1943
+ Stream page request
1944
+ :param path (str): The parent taxon (/ is root)
1945
+ :param query (str): The query to limit results (Default *)
1946
+ :param document_family (Optional[DocumentFamily]): Optionally the document family to limit results to
1947
+ :param parent_id (Optional[str]): Optionally the parent ID to limit results to
1948
+ :return:
1949
+ """
1950
+ page_size = 20
1951
+ page = 1
1952
+
1953
+ while True:
1954
+ data_object_response = self.get_data_objects_page_request(self, path, page, page_size, query,
1955
+ document_family, parent_id)
1956
+ if not data_object_response.content:
1957
+ break
1958
+
1959
+ yield data_object_response.content
1960
+ for data_object in data_object_response.content:
1961
+ yield data_object
1962
+
1963
+ page += 1
1964
+
1940
1965
  def create_data_objects(self, data_objects: List[DataObject]) -> List[DataObjectEndpoint]:
1941
1966
  """
1942
1967
  Create data objects in the store
@@ -2079,7 +2104,7 @@ class DocumentStoreEndpoint(StoreEndpoint):
2079
2104
  def download_document_families(self, output_dir: str):
2080
2105
  """Download all the document families in the store to the given directory"""
2081
2106
 
2082
- for document_family in self.query(page_size=9999).content:
2107
+ for document_family in self.stream_query():
2083
2108
  export_bytes = document_family.export()
2084
2109
  with open(os.path.join(output_dir, document_family.id + ".dfm"), 'wb') as f:
2085
2110
  f.write(export_bytes)
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "kodexa"
3
- version = "6.1.1a1"
3
+ version = "6.1.1a2-4573624930"
4
4
  description = "Python SDK for the Kodexa Platform"
5
5
  authors = ["Austin Redenbaugh <austin@kodexa.com>", "Philip Dodds <philip@kodexa.com>", "Romar Cablao <rcablao@kodexa.com>", "Amadea Paula Dodds <amadeapaula@kodexa.com>"]
6
6
  readme = "README.md"
@@ -37,7 +37,7 @@ install_requires = \
37
37
 
38
38
  setup_kwargs = {
39
39
  'name': 'kodexa',
40
- 'version': '6.1.1a1',
40
+ 'version': '6.1.1a2.post4573624930',
41
41
  'description': 'Python SDK for the Kodexa Platform',
42
42
  'long_description': '# Kodexa\n\n[![Build and Package with Poetry](https://github.com/kodexa-ai/kodexa/actions/workflows/main.yml/badge.svg?branch=main)](https://github.com/kodexa-ai/kodexa/actions/workflows/main.yml)\n\n![img.png](https://docs.kodexa.com/img.png)\n\nKodexa is a platform for building intelligent document processing pipelines. It is a set of tools and services that\nallow you to build a pipeline that can take a document, extract the content, and then process it to extract the\ninformation you need.\n\nIt is built on a set of core principles:\n\n* **Document Centric** - Kodexa is built around the idea of a document. A document is a collection of content\n nodes that are connected together. This is a powerful model that allows you to build pipelines that can\n extract content from a wide range of sources.\n\n* **Pipeline Oriented** - Kodexa is built around the idea of a pipeline. A pipeline is a series of steps that\n can be executed on a document. This allows you to build a pipeline that can extract content from a wide range\n of sources.\n\n* **Extensible** - Kodexa is built around the idea of a pipeline. A pipeline is a series of steps that can be executed\n on a document. This allows you to build a pipeline that can extract content from a wide range of sources.\n\n* **Label Driven** - Kodexa focuses on the idea of labels. Labels are a way to identify content within a document\n and then use that content to drive the processing of the document.\n\n# Python SDK\n\nThis repository contains the Python SDK for Kodexa. The SDK is the primary way to interact with Kodexa. It allows you to\ndefine actions, models, and pipelines that can be executed on Kodexa. 
It also includes a complete SDK client for\nworking with a Kodexa platform instance.\n\n## Documentation & Examples\n\nDocumentation is available at the [Kodexa Documentation Portal](https://docs.kodexa.com)\n\n## Current Development\n\nThe main branch is 6.0 which is a production release.\n\n## Set-up\n\nWe use poetry to manage our dependencies, so you can install them with:\n\n poetry install\n\nYou can then run the tests with:\n\n poetry run pytest\n\n# Contributing\n\nWe welcome contributions to the Kodexa platform. Please see our [contributing guide](CONTRIBUTING.md) for more details.\n\n# License\n\nApache 2.0\n',
43
43
  'author': 'Austin Redenbaugh',