kodexa 6.1.15059972675__tar.gz → 6.1.15059982168__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (41) hide show
  1. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/PKG-INFO +1 -1
  2. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/model/model.py +43 -1
  3. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/pyproject.toml +1 -1
  4. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/setup.py +1 -1
  5. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/LICENSE +0 -0
  6. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/README.md +0 -0
  7. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/__init__.py +0 -0
  8. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/assistant/__init__.py +0 -0
  9. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/assistant/assistant.py +0 -0
  10. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/connectors/__init__.py +0 -0
  11. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/connectors/connectors.py +0 -0
  12. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/model/__init__.py +0 -0
  13. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/model/base.py +0 -0
  14. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/model/objects.py +0 -0
  15. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/model/persistence.py +0 -0
  16. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/pipeline/__init__.py +0 -0
  17. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/pipeline/pipeline.py +0 -0
  18. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/platform/__init__.py +0 -0
  19. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/platform/client.py +0 -0
  20. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/platform/kodexa.py +0 -0
  21. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/__init__.py +0 -0
  22. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/ast.py +0 -0
  23. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/core.py +0 -0
  24. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/lexrules.py +0 -0
  25. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/lextab.py +0 -0
  26. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/lextab.pyi +0 -0
  27. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/parserules.py +0 -0
  28. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/parserules.pyi +0 -0
  29. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/parsetab.py +0 -0
  30. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/selectors/parsetab.pyi +0 -0
  31. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/spatial/__init__.py +0 -0
  32. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/spatial/azure_models.py +0 -0
  33. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/spatial/bbox_common.py +0 -0
  34. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/spatial/table_form_common.py +0 -0
  35. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/steps/__init__.py +0 -0
  36. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/steps/common.py +0 -0
  37. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/testing/__init__.py +0 -0
  38. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/testing/test_components.py +0 -0
  39. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/testing/test_utils.py +0 -0
  40. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/training/__init__.py +0 -0
  41. {kodexa-6.1.15059972675 → kodexa-6.1.15059982168}/kodexa/training/train_utils.py +0 -0
@@ -1,6 +1,6 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: kodexa
3
- Version: 6.1.15059972675
3
+ Version: 6.1.15059982168
4
4
  Summary: Python SDK for the Kodexa Platform
5
5
  Author: Austin Redenbaugh
6
6
  Author-email: austin@kodexa.com
@@ -82,7 +82,7 @@ class Tag(Dict):
82
82
  """A string representing the value that was labelled in the node"""
83
83
  self.data: Optional[Any] = data
84
84
  """Any data object (JSON serializable) that you wish to associate with the label"""
85
- self.uuid: Optional[str] = uuid
85
+ self.uuid: Optional[str] = uuid or str(uuid.uuid4())
86
86
  """The UUID for this tag instance, this allows tags that are on different content nodes to be related through the same UUID"""
87
87
  self.confidence: Optional[float] = confidence
88
88
  """The confidence of the tag in a range of 0-1"""
@@ -1893,6 +1893,9 @@ class Document(object):
1893
1893
  self.classes: List[ContentClassification] = []
1894
1894
  """A list of the content classifications associated at the document level"""
1895
1895
 
1896
+ self.tag_instances: List[TagInstance] = []
1897
+ """A list of tag instances that contains a set of tag that has a set of nodes"""
1898
+
1896
1899
  # Start persistence layer
1897
1900
  from kodexa.model import PersistenceManager
1898
1901
 
@@ -1901,6 +1904,36 @@ class Document(object):
1901
1904
  delete_on_close=delete_on_close)
1902
1905
  self._persistence_layer.initialize()
1903
1906
 
1907
+ def add_tag_instance(self, tag_to_apply, node_list: List[ContentNode]):
1908
+ """
1909
+ This will create a group of a tag with indexes
1910
+ :param tag: name of the tag
1911
+ :param node_indices: contains the list of index of a node
1912
+ :return:
1913
+ """
1914
+ # For each node in the list create/update a feature
1915
+ tag = Tag()
1916
+ for node in node_list:
1917
+ node.add_feature('tag', tag_to_apply, Tag)
1918
+ # Tag Object
1919
+ tag_instance = TagInstance(tag, node_list)
1920
+ self.tag_instances.append(tag_instance)
1921
+
1922
+ def update_tag_instance(self, tag_uuid):
1923
+ for tag_instance in self.tag_instances:
1924
+ if tag_instance.tag.uuid == tag_uuid:
1925
+ # Update attributes of a Tag
1926
+ for node in tag_instance.nodes:
1927
+ node.get_tag(tag_instance.tag.value, tag_uuid=tag_instance.tag.uuid)
1928
+
1929
+ def get_tag_instance(self, tag):
1930
+ """
1931
+ Get the tag instance based on the tag itself
1932
+ :param tag: name of the tag
1933
+ :return: a list of tag instance
1934
+ """
1935
+ return [tag_instance for tag_instance in self.tag_instances if tag_instance.tag == tag]
1936
+
1904
1937
  def get_persistence(self):
1905
1938
  return self._persistence_layer
1906
1939
 
@@ -2444,6 +2477,15 @@ class Document(object):
2444
2477
  return self._persistence_layer.get_all_tagged_nodes()
2445
2478
 
2446
2479
 
2480
+ class TagInstance:
2481
+ def __init__(self, tag: Tag, nodes):
2482
+ self.tag = tag
2483
+ self.nodes = nodes
2484
+
2485
+ def add_node(self, nodes: List[ContentNode]):
2486
+ self.nodes.extend(nodes)
2487
+
2488
+
2447
2489
  class ContentObjectReference:
2448
2490
  """ """
2449
2491
 
@@ -1,6 +1,6 @@
1
1
  [tool.poetry]
2
2
  name = "kodexa"
3
- version = "6.1.15059972675"
3
+ version = "6.1.15059982168"
4
4
  description = "Python SDK for the Kodexa Platform"
5
5
  authors = ["Austin Redenbaugh <austin@kodexa.com>", "Philip Dodds <philip@kodexa.com>", "Romar Cablao <rcablao@kodexa.com>", "Amadea Paula Dodds <amadeapaula@kodexa.com>"]
6
6
  readme = "README.md"
@@ -37,7 +37,7 @@ install_requires = \
37
37
 
38
38
  setup_kwargs = {
39
39
  'name': 'kodexa',
40
- 'version': '6.1.15059972675',
40
+ 'version': '6.1.15059982168',
41
41
  'description': 'Python SDK for the Kodexa Platform',
42
42
  'long_description': '# Kodexa\n\n[![Build and Package with Poetry](https://github.com/kodexa-ai/kodexa/actions/workflows/main.yml/badge.svg?branch=main)](https://github.com/kodexa-ai/kodexa/actions/workflows/main.yml)\n\n![img.png](https://docs.kodexa.com/img.png)\n\nKodexa is a platform for building intelligent document processing pipelines. It is a set of tools and services that\nallow you to build a pipeline that can take a document, extract the content, and then process it to extract the\ninformation you need.\n\nIt is built on a set of core principles:\n\n* **Document Centric** - Kodexa is built around the idea of a document. A document is a collection of content\n nodes that are connected together. This is a powerful model that allows you to build pipelines that can\n extract content from a wide range of sources.\n\n* **Pipeline Oriented** - Kodexa is built around the idea of a pipeline. A pipeline is a series of steps that\n can be executed on a document. This allows you to build a pipeline that can extract content from a wide range\n of sources.\n\n* **Extensible** - Kodexa is built around the idea of a pipeline. A pipeline is a series of steps that can be executed\n on a document. This allows you to build a pipeline that can extract content from a wide range of sources.\n\n* **Label Driven** - Kodexa focuses on the idea of labels. Labels are a way to identify content within a document\n and then use that content to drive the processing of the document.\n\n# Python SDK\n\nThis repository contains the Python SDK for Kodexa. The SDK is the primary way to interact with Kodexa. It allows you to\ndefine actions, models, and pipelines that can be executed on Kodexa. It also includes a complete SDK client for\nworking with a Kodexa platform instance.\n\n## Documentation & Examples\n\nDocumentation is available at the [Kodexa Documentation Portal](https://docs.kodexa.com)\n\n## Current Development\n\n[//]: # (Replace it with the diagrams and descriptions for build releases)\n**BUILD VERSION FLOW**\n![build-version-flow.png](docs%2Fbuild-version-flow.png)\nBuild version will differ based on the branches that are published to pypi.\n\n**GITHUB PROCESS**\n![github-process.png](docs%2Fgithub-process.png)\nChanges that contain bugs, features, and fixes should first be pushed to the test branch. \nOnce these changes are thoroughly tested, they can be submitted as a pull request to the main branch. The pull request should be reviewed and approved by an appropriate person before the changes can be merged.\n\n## Set-up\n\nWe use poetry to manage our dependencies, so you can install them with:\n\n poetry install\n\nYou can then run the tests with:\n\n poetry run pytest\n\n# Contributing\n\nWe welcome contributions to the Kodexa platform. Please see our [contributing guide](CONTRIBUTING.md) for more details.\n\n# License\n\nApache 2.0\n\n',
43
43
  'author': 'Austin Redenbaugh',