PyPI - onnxtr - Versions diffs - 0.1.0__py3-none-any.whl - Mend

onnxtr 0.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (70) hide show

onnxtr/__init__.py +2 -0
onnxtr/contrib/__init__.py +0 -0
onnxtr/contrib/artefacts.py +131 -0
onnxtr/contrib/base.py +105 -0
onnxtr/file_utils.py +33 -0
onnxtr/io/__init__.py +5 -0
onnxtr/io/elements.py +455 -0
onnxtr/io/html.py +28 -0
onnxtr/io/image.py +56 -0
onnxtr/io/pdf.py +42 -0
onnxtr/io/reader.py +85 -0
onnxtr/models/__init__.py +4 -0
onnxtr/models/_utils.py +141 -0
onnxtr/models/builder.py +355 -0
onnxtr/models/classification/__init__.py +2 -0
onnxtr/models/classification/models/__init__.py +1 -0
onnxtr/models/classification/models/mobilenet.py +120 -0
onnxtr/models/classification/predictor/__init__.py +1 -0
onnxtr/models/classification/predictor/base.py +57 -0
onnxtr/models/classification/zoo.py +76 -0
onnxtr/models/detection/__init__.py +2 -0
onnxtr/models/detection/core.py +101 -0
onnxtr/models/detection/models/__init__.py +3 -0
onnxtr/models/detection/models/differentiable_binarization.py +159 -0
onnxtr/models/detection/models/fast.py +160 -0
onnxtr/models/detection/models/linknet.py +160 -0
onnxtr/models/detection/postprocessor/__init__.py +0 -0
onnxtr/models/detection/postprocessor/base.py +144 -0
onnxtr/models/detection/predictor/__init__.py +1 -0
onnxtr/models/detection/predictor/base.py +54 -0
onnxtr/models/detection/zoo.py +73 -0
onnxtr/models/engine.py +50 -0
onnxtr/models/predictor/__init__.py +1 -0
onnxtr/models/predictor/base.py +175 -0
onnxtr/models/predictor/predictor.py +145 -0
onnxtr/models/preprocessor/__init__.py +1 -0
onnxtr/models/preprocessor/base.py +118 -0
onnxtr/models/recognition/__init__.py +2 -0
onnxtr/models/recognition/core.py +28 -0
onnxtr/models/recognition/models/__init__.py +5 -0
onnxtr/models/recognition/models/crnn.py +226 -0
onnxtr/models/recognition/models/master.py +145 -0
onnxtr/models/recognition/models/parseq.py +134 -0
onnxtr/models/recognition/models/sar.py +134 -0
onnxtr/models/recognition/models/vitstr.py +166 -0
onnxtr/models/recognition/predictor/__init__.py +1 -0
onnxtr/models/recognition/predictor/_utils.py +86 -0
onnxtr/models/recognition/predictor/base.py +79 -0
onnxtr/models/recognition/utils.py +89 -0
onnxtr/models/recognition/zoo.py +69 -0
onnxtr/models/zoo.py +114 -0
onnxtr/transforms/__init__.py +1 -0
onnxtr/transforms/base.py +112 -0
onnxtr/utils/__init__.py +4 -0
onnxtr/utils/common_types.py +18 -0
onnxtr/utils/data.py +126 -0
onnxtr/utils/fonts.py +41 -0
onnxtr/utils/geometry.py +498 -0
onnxtr/utils/multithreading.py +50 -0
onnxtr/utils/reconstitution.py +70 -0
onnxtr/utils/repr.py +64 -0
onnxtr/utils/visualization.py +291 -0
onnxtr/utils/vocabs.py +71 -0
onnxtr/version.py +1 -0
onnxtr-0.1.0.dist-info/LICENSE +201 -0
onnxtr-0.1.0.dist-info/METADATA +481 -0
onnxtr-0.1.0.dist-info/RECORD +70 -0
onnxtr-0.1.0.dist-info/WHEEL +5 -0
onnxtr-0.1.0.dist-info/top_level.txt +2 -0
onnxtr-0.1.0.dist-info/zip-safe +1 -0

onnxtr/__init__.py ADDED Viewed

	@@ -0,0 +1,2 @@
1	+ from . import io, models, contrib, transforms, utils
2	+ from .version import __version__ # noqa: F401

onnxtr/contrib/__init__.py ADDED Viewed

File without changes

onnxtr/contrib/artefacts.py ADDED Viewed

@@ -0,0 +1,131 @@
+# Copyright (C) 2021-2024, Mindee | Felix Dittrich.
+# This program is licensed under the Apache License 2.0.
+# See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.
+from typing import Any, Dict, List, Optional, Tuple
+import cv2
+import numpy as np
+from onnxtr.file_utils import requires_package
+from .base import _BasePredictor
# Names exported by a star-import of this module.
__all__ = ["ArtefactDetector"]

# Defaults looked up by architecture name in `ArtefactDetector.__init__`:
#   input_shape: model input size; index 1 is used as height and index 2 as width
#   labels:      class names, indexed by the class id predicted by the model
#   url:         location the ONNX weights are downloaded from
default_cfgs: Dict[str, Dict[str, Any]] = {
    "yolov8_artefact": dict(
        input_shape=(3, 1024, 1024),
        labels=["bar_code", "qr_code", "logo", "photo"],
        url="https://github.com/felixdittrich92/OnnxTR/releases/download/v0.0.1/yolo_artefact-f9d66f14.onnx",
    ),
}
class ArtefactDetector(_BasePredictor):
    """
    A class to detect artefacts in images

    >>> from onnxtr.io import DocumentFile
    >>> from onnxtr.contrib.artefacts import ArtefactDetector
    >>> doc = DocumentFile.from_images(["path/to/image.jpg"])
    >>> detector = ArtefactDetector()
    >>> results = detector(doc)

    Args:
    ----
        arch: the architecture to use (a key of `default_cfgs`)
        batch_size: the batch size to use
        model_path: the path to the model to use
        labels: the labels to use (defaults to the labels of `arch`)
        input_shape: the input shape to use (defaults to the input shape of `arch`)
        conf_threshold: the confidence threshold to use
        iou_threshold: the intersection over union threshold to use
        **kwargs: additional arguments to be passed to `download_from_url`
    """

    def __init__(
        self,
        arch: str = "yolov8_artefact",
        batch_size: int = 2,
        model_path: Optional[str] = None,
        labels: Optional[List[str]] = None,
        input_shape: Optional[Tuple[int, int, int]] = None,
        conf_threshold: float = 0.5,
        iou_threshold: float = 0.5,
        **kwargs: Any,
    ) -> None:
        super().__init__(batch_size=batch_size, url=default_cfgs[arch]["url"], model_path=model_path, **kwargs)
        self.labels = labels or default_cfgs[arch]["labels"]
        self.input_shape = input_shape or default_cfgs[arch]["input_shape"]
        self.conf_threshold = conf_threshold
        self.iou_threshold = iou_threshold

    def preprocess(self, img: np.ndarray) -> np.ndarray:
        """
        Resize an image to the model input size, move channels first and scale values by 1/255

        Args:
        ----
            img: the input image, channels last

        Returns:
        -------
            np.ndarray: the channels-first image divided by 255
        """
        # cv2.resize takes (width, height); input_shape is indexed as (_, height, width)
        resized = cv2.resize(img, (self.input_shape[2], self.input_shape[1]))
        return np.transpose(resized, (2, 0, 1)) / np.array(255.0)

    def postprocess(self, output: List[np.ndarray], input_images: List[List[np.ndarray]]) -> List[List[Dict[str, Any]]]:
        """
        Turn raw model outputs into per-image lists of detections

        Args:
        ----
            output: one entry per batch, each being the list of arrays returned by the session
            input_images: the original images, grouped in the same batches as `output`

        Returns:
        -------
            List[List[Dict[str, Any]]]: for every input image, the detections kept after thresholding
            and non-maximum suppression, each with keys "label", "confidence" and
            "box" ([xmin, ymin, xmax, ymax] in pixels of the original image)
        """
        results: List[List[Dict[str, Any]]] = []
        model_height, model_width = self.input_shape[1], self.input_shape[2]

        for batch_outputs, batch_images in zip(output, input_images):
            # NOTE(review): assumes the detections live in the first model output with the samples
            # along axis 0, so that each sample is paired with ITS OWN image (and its own scale).
            for sample_pred, img in zip(batch_outputs[0], batch_images):
                org_height, org_width = img.shape[:2]
                width_scale, height_scale = org_width / model_width, org_height / model_height

                sample_results: List[Dict[str, Any]] = []
                # After the transpose every row is one candidate: centre x, centre y, w, h, then class scores
                for row in np.transpose(np.squeeze(sample_pred)):
                    classes_scores = row[4:]
                    max_score = np.amax(classes_scores)
                    if max_score < self.conf_threshold:
                        continue
                    class_id = int(np.argmax(classes_scores))
                    x, y, w, h = row[0], row[1], row[2], row[3]
                    # to rescaled xmin, ymin, xmax, ymax
                    sample_results.append({
                        "label": self.labels[class_id],
                        "confidence": float(max_score),
                        "box": [
                            int((x - w / 2) * width_scale),
                            int((y - h / 2) * height_scale),
                            int((x + w / 2) * width_scale),
                            int((y + h / 2) * height_scale),
                        ],
                    })

                # Filter out overlapping boxes (nothing to do when no candidate passed the threshold)
                if sample_results:
                    # cv2.dnn.NMSBoxes works on [x, y, width, height] rectangles, not on corner coordinates
                    nms_boxes = [
                        [xmin, ymin, xmax - xmin, ymax - ymin]
                        for xmin, ymin, xmax, ymax in (det["box"] for det in sample_results)
                    ]
                    scores = [det["confidence"] for det in sample_results]
                    keep_indices = cv2.dnn.NMSBoxes(nms_boxes, scores, self.conf_threshold, self.iou_threshold)  # type: ignore[arg-type]
                    # Flatten: depending on the OpenCV version the indices come back flat or nested
                    sample_results = [sample_results[int(i)] for i in np.asarray(keep_indices).reshape(-1)]
                results.append(sample_results)

        self._results = results
        return results

    def show(self, **kwargs: Any) -> None:
        """
        Display the results

        Args:
        ----
            **kwargs: additional keyword arguments to be passed to `plt.show`
        """
        requires_package("matplotlib", "`.show()` requires matplotlib installed")
        import matplotlib.pyplot as plt
        from matplotlib.patches import Rectangle

        # nothing to draw before the detector has been called
        if not (self._results and self._inputs):
            return

        # visualize the results with matplotlib, one figure per input image
        for img, res in zip(self._inputs, self._results):
            plt.figure(figsize=(10, 10))
            plt.imshow(img)
            for obj in res:
                xmin, ymin, xmax, ymax = obj["box"]
                label = obj["label"]
                plt.text(xmin, ymin, f"{label} {obj['confidence']:.2f}", color="red")
                plt.gca().add_patch(
                    Rectangle((xmin, ymin), xmax - xmin, ymax - ymin, fill=False, edgecolor="red", linewidth=2)
                )
            plt.show(**kwargs)

onnxtr/contrib/base.py ADDED Viewed

@@ -0,0 +1,105 @@
+# Copyright (C) 2021-2024, Mindee | Felix Dittrich.
+# This program is licensed under the Apache License 2.0.
+# See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.
+from typing import Any, List, Optional
+import numpy as np
+from onnxtr.file_utils import requires_package
+from onnxtr.utils.data import download_from_url
+class _BasePredictor:
+    """
+    Base class for all predictors
+    Args:
+    ----
+        batch_size: the batch size to use
+        url: the url to use to download a model if needed
+        model_path: the path to the model to use
+        **kwargs: additional arguments to be passed to `download_from_url`
+    """
+    def __init__(self, batch_size: int, url: Optional[str] = None, model_path: Optional[str] = None, **kwargs) -> None:
+        self.batch_size = batch_size
+        self.session = self._init_model(url, model_path, **kwargs)
+        self._inputs: List[np.ndarray] = []
+        self._results: List[Any] = []
+    def _init_model(self, url: Optional[str] = None, model_path: Optional[str] = None, **kwargs: Any) -> Any:
+        """
+        Download the model from the given url if needed
+        Args:
+        ----
+            url: the url to use
+            model_path: the path to the model to use
+            **kwargs: additional arguments to be passed to `download_from_url`
+        Returns:
+        -------
+            Any: the ONNX loaded model
+        """
+        requires_package("onnxruntime", "`.contrib` module requires `onnxruntime` to be installed.")
+        import onnxruntime as ort
+        if not url and not model_path:
+            raise ValueError("You must provide either a url or a model_path")
+        onnx_model_path = model_path if model_path else str(download_from_url(url, cache_subdir="models", **kwargs))  # type: ignore[arg-type]
+        return ort.InferenceSession(onnx_model_path, providers=["CUDAExecutionProvider", "CPUExecutionProvider"])
+    def preprocess(self, img: np.ndarray) -> np.ndarray:
+        """
+        Preprocess the input image
+        Args:
+        ----
+            img: the input image to preprocess
+        Returns:
+        -------
+            np.ndarray: the preprocessed image
+        """
+        raise NotImplementedError
+    def postprocess(self, output: List[np.ndarray], input_images: List[List[np.ndarray]]) -> Any:
+        """
+        Postprocess the model output
+        Args:
+        ----
+            output: the model output to postprocess
+            input_images: the input images used to generate the output
+        Returns:
+        -------
+            Any: the postprocessed output
+        """
+        raise NotImplementedError
+    def __call__(self, inputs: List[np.ndarray]) -> Any:
+        """
+        Call the model on the given inputs
+        Args:
+        ----
+            inputs: the inputs to use
+        Returns:
+        -------
+            Any: the postprocessed output
+        """
+        self._inputs = inputs
+        model_inputs = self.session.get_inputs()
+        batched_inputs = [inputs[i : i + self.batch_size] for i in range(0, len(inputs), self.batch_size)]
+        processed_batches = [
+            np.array([self.preprocess(img) for img in batch], dtype=np.float32) for batch in batched_inputs
+        ]
+        outputs = [self.session.run(None, {model_inputs[0].name: batch}) for batch in processed_batches]
+        return self.postprocess(outputs, batched_inputs)

onnxtr/file_utils.py ADDED Viewed

@@ -0,0 +1,33 @@
+# Copyright (C) 2021-2024, Mindee | Felix Dittrich.
+# This program is licensed under the Apache License 2.0.
+# See LICENSE or go to <https://opensource.org/licenses/Apache-2.0> for full license details.
+import importlib.metadata
+import importlib.util
+import logging
+from typing import Optional
# Names exported by a star-import of this module.
__all__ = ["requires_package"]

# NOTE(review): presumably the upper-cased spellings accepted as "enabled" for
# environment flags; nothing in the visible code reads them, so confirm at the call sites.
ENV_VARS_TRUE_VALUES = {"1", "ON", "YES", "TRUE"}
# Same spellings, plus "AUTO".
ENV_VARS_TRUE_AND_AUTO_VALUES = ENV_VARS_TRUE_VALUES | {"AUTO"}
def requires_package(name: str, extra_message: Optional[str] = None) -> None:  # pragma: no cover
    """
    package requirement helper

    The package counts as available when either a distribution called `name` is installed or a
    module called `name` can be imported. The second check matters for modules shipped by a
    distribution with a different name (e.g. `onnxruntime` provided by `onnxruntime-gpu`).

    Args:
    ----
        name: name of the package
        extra_message: additional message to display if the package is not found

    Raises:
    ------
        ImportError: if neither a distribution nor an importable module named `name` is found
    """
    try:
        _pkg_version: Optional[str] = importlib.metadata.version(name)
    except importlib.metadata.PackageNotFoundError:
        _pkg_version = None

    if _pkg_version is not None:
        logging.info(f"{name} version {_pkg_version} available.")
        return

    # No distribution with that exact name: fall back to looking for an importable module.
    try:
        _spec = importlib.util.find_spec(name)
    except (ImportError, ValueError, AttributeError):
        # e.g. dotted name whose parent package is missing, or a module without a valid `__spec__`
        _spec = None

    if _spec is not None:
        logging.info(f"{name} available.")
        return

    # Raised outside of the `except` blocks on purpose: the lookup failures above add nothing
    # useful to the traceback shown to the user.
    raise ImportError(
        f"\n\n{extra_message if extra_message is not None else ''} "
        f"\nPlease install it with the following command: pip install {name}\n"
    )

onnxtr/io/__init__.py ADDED Viewed

@@ -0,0 +1,5 @@
+from .elements import *
+from .html import *
+from .image import *
+from .pdf import *
+from .reader import *