ocr-stringdist 1.0.0__cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl → 1.0.1__cp310-cp310-manylinux_2_17_aarch64.manylinux2014_aarch64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- ocr_stringdist/__init__.py +2 -0
- ocr_stringdist/_rust_stringdist.cpython-310-aarch64-linux-gnu.so +0 -0
- ocr_stringdist/edit_operation.py +5 -2
- ocr_stringdist/levenshtein.py +2 -1
- {ocr_stringdist-1.0.0.dist-info → ocr_stringdist-1.0.1.dist-info}/METADATA +1 -1
- ocr_stringdist-1.0.1.dist-info/RECORD +13 -0
- ocr_stringdist-1.0.0.dist-info/RECORD +0 -13
- {ocr_stringdist-1.0.0.dist-info → ocr_stringdist-1.0.1.dist-info}/WHEEL +0 -0
- {ocr_stringdist-1.0.0.dist-info → ocr_stringdist-1.0.1.dist-info}/licenses/LICENSE +0 -0
    
        ocr_stringdist/__init__.py
    CHANGED
    
    | @@ -1,10 +1,12 @@ | |
| 1 1 | 
             
            from .default_ocr_distances import ocr_distance_map
         | 
| 2 | 
            +
            from .edit_operation import EditOperation
         | 
| 2 3 | 
             
            from .learner import CostLearner
         | 
| 3 4 | 
             
            from .levenshtein import WeightedLevenshtein
         | 
| 4 5 | 
             
            from .matching import find_best_candidate
         | 
| 5 6 |  | 
| 6 7 | 
             
            __all__ = [
         | 
| 7 8 | 
             
                "ocr_distance_map",
         | 
| 9 | 
            +
                "EditOperation",
         | 
| 8 10 | 
             
                "CostLearner",
         | 
| 9 11 | 
             
                "WeightedLevenshtein",
         | 
| 10 12 | 
             
                "find_best_candidate",
         | 
| Binary file | 
    
        ocr_stringdist/edit_operation.py
    CHANGED
    
    | @@ -1,5 +1,5 @@ | |
| 1 | 
            -
            from dataclasses import dataclass
         | 
| 2 | 
            -
            from typing import Literal, Optional
         | 
| 1 | 
            +
            from dataclasses import asdict, dataclass
         | 
| 2 | 
            +
            from typing import Any, Literal, Optional
         | 
| 3 3 |  | 
| 4 4 | 
             
            OperationType = Literal["substitute", "insert", "delete", "match"]
         | 
| 5 5 |  | 
| @@ -14,3 +14,6 @@ class EditOperation: | |
| 14 14 | 
             
                source_token: Optional[str]
         | 
| 15 15 | 
             
                target_token: Optional[str]
         | 
| 16 16 | 
             
                cost: float
         | 
| 17 | 
            +
             | 
| 18 | 
            +
                def to_dict(self) -> dict[str, Any]:
         | 
| 19 | 
            +
                    return asdict(self)
         | 
    
        ocr_stringdist/levenshtein.py
    CHANGED
    
    | @@ -191,6 +191,7 @@ class WeightedLevenshtein: | |
| 191 191 | 
             
                    For the counterpart, see :meth:`WeightedLevenshtein.to_dict`.
         | 
| 192 192 |  | 
| 193 193 | 
             
                    :param data: A dictionary with (not necessarily all of) the following keys:
         | 
| 194 | 
            +
             | 
| 194 195 | 
             
                                 - "substitution_costs": {"from": str, "to": str, "cost": float}
         | 
| 195 196 | 
             
                                 - "substitution_costs": dict[str, float]
         | 
| 196 197 | 
             
                                 - "deletion_costs": dict[str, float]
         | 
| @@ -206,7 +207,7 @@ class WeightedLevenshtein: | |
| 206 207 |  | 
| 207 208 | 
             
                    return cls(
         | 
| 208 209 | 
             
                        substitution_costs=sub_costs,
         | 
| 209 | 
            -
                        insertion_costs=data.get(" | 
| 210 | 
            +
                        insertion_costs=data.get("insertion_costs"),
         | 
| 210 211 | 
             
                        deletion_costs=data.get("deletion_costs"),
         | 
| 211 212 | 
             
                        symmetric_substitution=data.get("symmetric_substitution", True),
         | 
| 212 213 | 
             
                        default_substitution_cost=data.get("default_substitution_cost", 1.0),
         | 
| @@ -0,0 +1,13 @@ | |
| 1 | 
            +
            ocr_stringdist-1.0.1.dist-info/METADATA,sha256=86GHCkU8E3oyRoN14UPF_PJM55eD7_1NIVppBRr62Ro,3963
         | 
| 2 | 
            +
            ocr_stringdist-1.0.1.dist-info/WHEEL,sha256=Xci0wQUn185O40gd7BpQOd6FhkCRTTECoTx1iWoeZos,131
         | 
| 3 | 
            +
            ocr_stringdist-1.0.1.dist-info/licenses/LICENSE,sha256=5BPRcjlnbl2t4TidSgpfGrtC_birSf8JlZfA-qmVoQE,1072
         | 
| 4 | 
            +
            ocr_stringdist/__init__.py,sha256=tU-70gwq3CAJ9nZdDSM-C59ShuDE4ClNYEPAkbntYeQ,347
         | 
| 5 | 
            +
            ocr_stringdist/_rust_stringdist.cpython-310-aarch64-linux-gnu.so,sha256=h4Lep-yVduvJY4p3dAHgfV0n0BDbU9wlF98NQMnG5Sk,846672
         | 
| 6 | 
            +
            ocr_stringdist/default_ocr_distances.py,sha256=oSu-TpHjPA4jxKpLAfmap8z0ZsC99jsOjnRVHW7Hj_Y,1033
         | 
| 7 | 
            +
            ocr_stringdist/edit_operation.py,sha256=JjCZulSwZpXLnLL3xcuz2j8EUzNQM9_hNxxVdCHMkvQ,478
         | 
| 8 | 
            +
            ocr_stringdist/learner.py,sha256=3qWvqHrAWm4seuwmBmFN4InRL20u8HnPATHjCTnU3I0,10491
         | 
| 9 | 
            +
            ocr_stringdist/levenshtein.py,sha256=m4WAh5iaQefDIQXzqcgC4XcCXntb7zNKhyWAx8A1yOs,9852
         | 
| 10 | 
            +
            ocr_stringdist/matching.py,sha256=28Xt-x_V_iVsohD3F64MfZ0mys4_qOZXTIAcmSOE0dA,3270
         | 
| 11 | 
            +
            ocr_stringdist/protocols.py,sha256=IyvGzzktPgmPRZyDRE0UKCYo4C0tdewU8IgwFbxZLls,265
         | 
| 12 | 
            +
            ocr_stringdist/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
         | 
| 13 | 
            +
            ocr_stringdist-1.0.1.dist-info/RECORD,,
         | 
| @@ -1,13 +0,0 @@ | |
| 1 | 
            -
            ocr_stringdist-1.0.0.dist-info/METADATA,sha256=sFZnhhX8kHoYFbMua4zHCq2tELQPXQw3vWGNRoStR-4,3963
         | 
| 2 | 
            -
            ocr_stringdist-1.0.0.dist-info/WHEEL,sha256=Xci0wQUn185O40gd7BpQOd6FhkCRTTECoTx1iWoeZos,131
         | 
| 3 | 
            -
            ocr_stringdist-1.0.0.dist-info/licenses/LICENSE,sha256=5BPRcjlnbl2t4TidSgpfGrtC_birSf8JlZfA-qmVoQE,1072
         | 
| 4 | 
            -
            ocr_stringdist/__init__.py,sha256=mL-19TkQQElK5B6iVFCV7vjKVal-6JcsBOFKwiCPQnA,284
         | 
| 5 | 
            -
            ocr_stringdist/_rust_stringdist.cpython-310-aarch64-linux-gnu.so,sha256=9DjP6imI-aliFH3tMIwa4B9HVYt2x3kFvnWPwLCSBTU,846664
         | 
| 6 | 
            -
            ocr_stringdist/default_ocr_distances.py,sha256=oSu-TpHjPA4jxKpLAfmap8z0ZsC99jsOjnRVHW7Hj_Y,1033
         | 
| 7 | 
            -
            ocr_stringdist/edit_operation.py,sha256=EgEc-2_nOwLUZDOWtogYqKLXIQJxOd9sIAbcGkn-TMY,395
         | 
| 8 | 
            -
            ocr_stringdist/learner.py,sha256=3qWvqHrAWm4seuwmBmFN4InRL20u8HnPATHjCTnU3I0,10491
         | 
| 9 | 
            -
            ocr_stringdist/levenshtein.py,sha256=t05FicwL5WTTsRSzDa92v79D2LpDiEUOYG_6te8oT28,9854
         | 
| 10 | 
            -
            ocr_stringdist/matching.py,sha256=28Xt-x_V_iVsohD3F64MfZ0mys4_qOZXTIAcmSOE0dA,3270
         | 
| 11 | 
            -
            ocr_stringdist/protocols.py,sha256=IyvGzzktPgmPRZyDRE0UKCYo4C0tdewU8IgwFbxZLls,265
         | 
| 12 | 
            -
            ocr_stringdist/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
         | 
| 13 | 
            -
            ocr_stringdist-1.0.0.dist-info/RECORD,,
         | 
| 
            File without changes
         | 
| 
            File without changes
         |