kreuzberg 3.20.0__py3-none-any.whl → 3.20.2__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- kreuzberg/_gmft.py +36 -4
- kreuzberg/_types.py +10 -0
- {kreuzberg-3.20.0.dist-info → kreuzberg-3.20.2.dist-info}/METADATA +30 -47
- {kreuzberg-3.20.0.dist-info → kreuzberg-3.20.2.dist-info}/RECORD +17 -18
- kreuzberg-3.20.2.dist-info/WHEEL +4 -0
- {kreuzberg-3.20.0.dist-info → kreuzberg-3.20.2.dist-info}/entry_points.txt +1 -0
- kreuzberg-3.20.0.dist-info/WHEEL +0 -4
- kreuzberg-3.20.0.dist-info/licenses/LICENSE +0 -7
kreuzberg/_gmft.py
CHANGED
@@ -193,9 +193,14 @@ async def extract_tables(
|
|
193
193
|
await run_sync(doc.close)
|
194
194
|
|
195
195
|
except ImportError as e: # pragma: no cover
|
196
|
-
|
196
|
+
error = MissingDependencyError.create_for_package(
|
197
197
|
dependency_group="gmft", functionality="table extraction", package_name="gmft"
|
198
|
-
)
|
198
|
+
)
|
199
|
+
error.context = {
|
200
|
+
"file_path": str(Path(file_path)),
|
201
|
+
"error_message": str(e),
|
202
|
+
}
|
203
|
+
raise error from e
|
199
204
|
finally:
|
200
205
|
table_cache.mark_complete(**cache_kwargs)
|
201
206
|
|
@@ -294,9 +299,14 @@ def extract_tables_sync(
|
|
294
299
|
doc.close() # type: ignore[no-untyped-call]
|
295
300
|
|
296
301
|
except ImportError as e: # pragma: no cover
|
297
|
-
|
302
|
+
error = MissingDependencyError.create_for_package(
|
298
303
|
dependency_group="gmft", functionality="table extraction", package_name="gmft"
|
299
|
-
)
|
304
|
+
)
|
305
|
+
error.context = {
|
306
|
+
"file_path": str(Path(file_path)),
|
307
|
+
"error_message": str(e),
|
308
|
+
}
|
309
|
+
raise error from e
|
300
310
|
|
301
311
|
|
302
312
|
def _extract_tables_in_process(
|
@@ -449,6 +459,17 @@ def _extract_tables_isolated(
|
|
449
459
|
return tables
|
450
460
|
|
451
461
|
error_info = result
|
462
|
+
if error_info.get("type") == "ImportError":
|
463
|
+
error = MissingDependencyError.create_for_package(
|
464
|
+
dependency_group="gmft", functionality="table extraction", package_name="gmft"
|
465
|
+
)
|
466
|
+
error.context = {
|
467
|
+
"file_path": str(Path(file_path)),
|
468
|
+
"error_message": error_info["error"],
|
469
|
+
"traceback": error_info.get("traceback"),
|
470
|
+
}
|
471
|
+
raise error from ImportError(error_info["error"])
|
472
|
+
|
452
473
|
raise ParsingError(
|
453
474
|
f"GMFT table extraction failed: {error_info['error']}",
|
454
475
|
context={
|
@@ -536,6 +557,17 @@ async def _extract_tables_isolated_async(
|
|
536
557
|
return tables
|
537
558
|
|
538
559
|
error_info = result
|
560
|
+
if error_info.get("type") == "ImportError":
|
561
|
+
error = MissingDependencyError.create_for_package(
|
562
|
+
dependency_group="gmft", functionality="table extraction", package_name="gmft"
|
563
|
+
)
|
564
|
+
error.context = {
|
565
|
+
"file_path": str(Path(file_path)),
|
566
|
+
"error_message": error_info["error"],
|
567
|
+
"traceback": error_info.get("traceback"),
|
568
|
+
}
|
569
|
+
raise error from ImportError(error_info["error"])
|
570
|
+
|
539
571
|
raise ParsingError(
|
540
572
|
f"GMFT table extraction failed: {error_info['error']}",
|
541
573
|
context={
|
kreuzberg/_types.py
CHANGED
@@ -1,6 +1,7 @@
|
|
1
1
|
from __future__ import annotations
|
2
2
|
|
3
3
|
import sys
|
4
|
+
import warnings
|
4
5
|
from collections.abc import Awaitable, Callable, Mapping
|
5
6
|
from dataclasses import asdict, dataclass, field
|
6
7
|
from enum import Enum
|
@@ -262,6 +263,15 @@ class PaddleOCRConfig(ConfigDict):
|
|
262
263
|
|
263
264
|
@dataclass(unsafe_hash=True, frozen=True, slots=True)
|
264
265
|
class GMFTConfig(ConfigDict):
|
266
|
+
def __post_init__(self) -> None:
|
267
|
+
warnings.warn(
|
268
|
+
"GMFTConfig is deprecated and will be removed in Kreuzberg v4.0. "
|
269
|
+
"Install `kreuzberg[gmft]` only if you still rely on GMFT. "
|
270
|
+
"Future versions use native TATR-based table extraction via TableExtractionConfig.",
|
271
|
+
FutureWarning,
|
272
|
+
stacklevel=2,
|
273
|
+
)
|
274
|
+
|
265
275
|
verbosity: int = 0
|
266
276
|
"""
|
267
277
|
Verbosity level for logging.
|
@@ -1,13 +1,11 @@
|
|
1
|
-
Metadata-Version: 2.
|
1
|
+
Metadata-Version: 2.3
|
2
2
|
Name: kreuzberg
|
3
|
-
Version: 3.20.0
|
3
|
+
Version: 3.20.2
|
4
4
|
Summary: Document intelligence framework for Python - Extract text, metadata, and structured data from diverse file formats
|
5
|
-
|
6
|
-
|
5
|
+
Keywords: async,document-analysis,document-classification,document-intelligence,document-processing,extensible,information-extraction,mcp,metadata-extraction,model-context-protocol,ocr,pandoc,pdf-extraction,pdfium,plugin-architecture,rag,retrieval-augmented-generation,structured-data,table-extraction,tesseract,text-extraction
|
6
|
+
Author: Na'aman Hirschfeld
|
7
7
|
Author-email: Na'aman Hirschfeld <nhirschfed@gmail.com>
|
8
8
|
License: MIT
|
9
|
-
License-File: LICENSE
|
10
|
-
Keywords: async,document-analysis,document-classification,document-intelligence,document-processing,extensible,information-extraction,mcp,metadata-extraction,model-context-protocol,ocr,pandoc,pdf-extraction,pdfium,plugin-architecture,rag,retrieval-augmented-generation,structured-data,table-extraction,tesseract,text-extraction
|
11
9
|
Classifier: Development Status :: 5 - Production/Stable
|
12
10
|
Classifier: Intended Audience :: Developers
|
13
11
|
Classifier: Intended Audience :: Information Technology
|
@@ -19,7 +17,6 @@ Classifier: Programming Language :: Python :: 3.10
|
|
19
17
|
Classifier: Programming Language :: Python :: 3.11
|
20
18
|
Classifier: Programming Language :: Python :: 3.12
|
21
19
|
Classifier: Programming Language :: Python :: 3.13
|
22
|
-
Classifier: Programming Language :: Python :: 3.14
|
23
20
|
Classifier: Topic :: Database
|
24
21
|
Classifier: Topic :: Multimedia :: Graphics :: Capture :: Scanners
|
25
22
|
Classifier: Topic :: Office/Business :: Office Suites
|
@@ -28,11 +25,10 @@ Classifier: Topic :: Scientific/Engineering :: Information Analysis
|
|
28
25
|
Classifier: Topic :: Software Development :: Libraries :: Python Modules
|
29
26
|
Classifier: Topic :: Text Processing :: General
|
30
27
|
Classifier: Typing :: Typed
|
31
|
-
Requires-Python: <3.15,>=3.10
|
32
28
|
Requires-Dist: anyio>=4.11.0
|
33
29
|
Requires-Dist: chardetng-py>=0.3.5
|
34
|
-
Requires-Dist: exceptiongroup>=1.2.2;
|
35
|
-
Requires-Dist: html-to-markdown>=2.1.
|
30
|
+
Requires-Dist: exceptiongroup>=1.2.2 ; python_full_version < '3.11'
|
31
|
+
Requires-Dist: html-to-markdown>=2.1.2
|
36
32
|
Requires-Dist: langcodes>=3.5.0
|
37
33
|
Requires-Dist: mcp>=1.17.0
|
38
34
|
Requires-Dist: msgspec>=0.18.0
|
@@ -43,55 +39,42 @@ Requires-Dist: psutil>=7.1.0
|
|
43
39
|
Requires-Dist: pypdfium2==4.30.0
|
44
40
|
Requires-Dist: python-calamine>=0.5.3
|
45
41
|
Requires-Dist: python-pptx>=1.0.2
|
46
|
-
Requires-Dist: transformers>=4.
|
47
|
-
Requires-Dist: typing-extensions>=4.15.0;
|
42
|
+
Requires-Dist: transformers>=4.55.0
|
43
|
+
Requires-Dist: typing-extensions>=4.15.0 ; python_full_version < '3.12'
|
44
|
+
Requires-Dist: mailparse>=1.0.15 ; extra == 'additional-extensions'
|
45
|
+
Requires-Dist: tomli>=2.0.0 ; python_full_version < '3.11' and extra == 'additional-extensions'
|
46
|
+
Requires-Dist: kreuzberg[additional-extensions,api,chunking,cli,crypto,document-classification,easyocr,entity-extraction,gmft,langdetect,paddleocr] ; extra == 'all'
|
47
|
+
Requires-Dist: litestar[opentelemetry,standard,structlog]>=2.18.0 ; extra == 'api'
|
48
|
+
Requires-Dist: semantic-text-splitter>=0.28.0 ; extra == 'chunking'
|
49
|
+
Requires-Dist: click>=8.3.0 ; extra == 'cli'
|
50
|
+
Requires-Dist: rich>=14.2.0 ; extra == 'cli'
|
51
|
+
Requires-Dist: tomli>=2.0.0 ; python_full_version < '3.11' and extra == 'cli'
|
52
|
+
Requires-Dist: playa-pdf[crypto]>=0.7.0 ; extra == 'crypto'
|
53
|
+
Requires-Dist: deep-translator>=1.11.4 ; extra == 'document-classification'
|
54
|
+
Requires-Dist: easyocr>=1.7.2 ; python_full_version < '3.14' and extra == 'easyocr'
|
55
|
+
Requires-Dist: keybert>=0.9.0 ; extra == 'entity-extraction'
|
56
|
+
Requires-Dist: spacy>=3.8.7 ; python_full_version < '3.14' and extra == 'entity-extraction'
|
57
|
+
Requires-Dist: gmft>=0.4.2 ; extra == 'gmft'
|
58
|
+
Requires-Dist: transformers>=4.57.0 ; extra == 'gmft'
|
59
|
+
Requires-Dist: fast-langdetect>=1.0.0 ; extra == 'langdetect'
|
60
|
+
Requires-Dist: paddleocr>=3.2.0 ; python_full_version < '3.14' and extra == 'paddleocr'
|
61
|
+
Requires-Dist: paddlepaddle>=3.2.0 ; python_full_version < '3.14' and extra == 'paddleocr'
|
62
|
+
Requires-Dist: setuptools>=80.9.0 ; extra == 'paddleocr'
|
63
|
+
Requires-Python: >=3.10
|
64
|
+
Project-URL: documentation, https://kreuzberg.dev
|
65
|
+
Project-URL: homepage, https://github.com/Goldziher/kreuzberg
|
48
66
|
Provides-Extra: additional-extensions
|
49
|
-
Requires-Dist: mailparse>=1.0.15; extra == 'additional-extensions'
|
50
|
-
Requires-Dist: tomli>=2.0.0; (python_version < '3.11') and extra == 'additional-extensions'
|
51
67
|
Provides-Extra: all
|
52
|
-
Requires-Dist: click>=8.3.0; extra == 'all'
|
53
|
-
Requires-Dist: deep-translator>=1.11.4; extra == 'all'
|
54
|
-
Requires-Dist: easyocr>=1.7.2; (python_version < '3.14') and extra == 'all'
|
55
|
-
Requires-Dist: fast-langdetect>=1.0.0; extra == 'all'
|
56
|
-
Requires-Dist: gmft>=0.4.2; extra == 'all'
|
57
|
-
Requires-Dist: keybert>=0.9.0; extra == 'all'
|
58
|
-
Requires-Dist: litestar[opentelemetry,standard,structlog]>=2.18.0; extra == 'all'
|
59
|
-
Requires-Dist: mailparse>=1.0.15; extra == 'all'
|
60
|
-
Requires-Dist: paddleocr>=3.2.0; (python_version < '3.14') and extra == 'all'
|
61
|
-
Requires-Dist: paddlepaddle>=3.2.0; (python_version < '3.14') and extra == 'all'
|
62
|
-
Requires-Dist: playa-pdf[crypto]>=0.7.0; extra == 'all'
|
63
|
-
Requires-Dist: rich>=14.2.0; extra == 'all'
|
64
|
-
Requires-Dist: semantic-text-splitter>=0.28.0; extra == 'all'
|
65
|
-
Requires-Dist: setuptools>=80.9.0; extra == 'all'
|
66
|
-
Requires-Dist: spacy>=3.8.7; (python_version < '3.14') and extra == 'all'
|
67
|
-
Requires-Dist: tomli>=2.0.0; (python_version < '3.11') and extra == 'all'
|
68
|
-
Requires-Dist: transformers>=4.57.0; extra == 'all'
|
69
68
|
Provides-Extra: api
|
70
|
-
Requires-Dist: litestar[opentelemetry,standard,structlog]>=2.18.0; extra == 'api'
|
71
69
|
Provides-Extra: chunking
|
72
|
-
Requires-Dist: semantic-text-splitter>=0.28.0; extra == 'chunking'
|
73
70
|
Provides-Extra: cli
|
74
|
-
Requires-Dist: click>=8.3.0; extra == 'cli'
|
75
|
-
Requires-Dist: rich>=14.2.0; extra == 'cli'
|
76
|
-
Requires-Dist: tomli>=2.0.0; (python_version < '3.11') and extra == 'cli'
|
77
71
|
Provides-Extra: crypto
|
78
|
-
Requires-Dist: playa-pdf[crypto]>=0.7.0; extra == 'crypto'
|
79
72
|
Provides-Extra: document-classification
|
80
|
-
Requires-Dist: deep-translator>=1.11.4; extra == 'document-classification'
|
81
73
|
Provides-Extra: easyocr
|
82
|
-
Requires-Dist: easyocr>=1.7.2; (python_version < '3.14') and extra == 'easyocr'
|
83
74
|
Provides-Extra: entity-extraction
|
84
|
-
Requires-Dist: keybert>=0.9.0; extra == 'entity-extraction'
|
85
|
-
Requires-Dist: spacy>=3.8.7; (python_version < '3.14') and extra == 'entity-extraction'
|
86
75
|
Provides-Extra: gmft
|
87
|
-
Requires-Dist: gmft>=0.4.2; extra == 'gmft'
|
88
|
-
Requires-Dist: transformers>=4.57.0; extra == 'gmft'
|
89
76
|
Provides-Extra: langdetect
|
90
|
-
Requires-Dist: fast-langdetect>=1.0.0; extra == 'langdetect'
|
91
77
|
Provides-Extra: paddleocr
|
92
|
-
Requires-Dist: paddleocr>=3.2.0; (python_version < '3.14') and extra == 'paddleocr'
|
93
|
-
Requires-Dist: paddlepaddle>=3.2.0; (python_version < '3.14') and extra == 'paddleocr'
|
94
|
-
Requires-Dist: setuptools>=80.9.0; extra == 'paddleocr'
|
95
78
|
Description-Content-Type: text/markdown
|
96
79
|
|
97
80
|
# Kreuzberg
|
@@ -1,24 +1,14 @@
|
|
1
1
|
kreuzberg/__init__.py,sha256=niF_YZ7YADL_oXZ8zB5EMov4xnyFzuxTABVlHoRnBJA,1629
|
2
2
|
kreuzberg/__main__.py,sha256=3cIDdzTggj2kj8uKx4WShWHmCWqdZazdM3BxUGbAuSI,104
|
3
|
+
kreuzberg/_api/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
4
|
+
kreuzberg/_api/_config_cache.py,sha256=gX_ezGNq6SCpTn02yFkn24zMVrQwfIk8-u5XkKJiHFg,8774
|
5
|
+
kreuzberg/_api/main.py,sha256=tmg1fICU4wshq0XXhGOk22oivfXjELtsEgOumdkZNI4,15257
|
3
6
|
kreuzberg/_chunker.py,sha256=lRXvVN60vmWaTxa1b3QzvE-jBmOqYzh5dY-3Kl6pSqI,1427
|
4
7
|
kreuzberg/_config.py,sha256=ZYIcnJAjDnbWW_2WBy7NlOk1Ol6WpoMG5FMNMmHpqSY,13086
|
5
8
|
kreuzberg/_constants.py,sha256=gY6SpCi9za59ghRuLX_z7xfSok6qqvPbvEnv4BLczqI,265
|
6
9
|
kreuzberg/_document_classification.py,sha256=55aDxDIJ65qK6yEXt-fRYTn8LgALvYsWssjWSheVpR0,5697
|
7
10
|
kreuzberg/_entity_extraction.py,sha256=Ks-1gZIYDqgg2uJerd0FH_lYhjIwS0f0bMVhR9M59jA,7518
|
8
11
|
kreuzberg/_error_handling.py,sha256=Isr9yrY4JRKOmUVaUOky_LZ7tGVZAm8jxRD3qGbkc1g,5604
|
9
|
-
kreuzberg/_gmft.py,sha256=gfRXOsv-K9R7Y0zZ2SUa5wid3FpP2eFIlg5nepWcz1Q,20827
|
10
|
-
kreuzberg/_language_detection.py,sha256=4JzQldcDIVZRWUzRFc9AOFiq6Wfl9858mip1ZnrD2Ks,1143
|
11
|
-
kreuzberg/_mime_types.py,sha256=duEMDBg_qIf9A02tXAC_2znD-wgE-2BBMW9ofyYTJjE,8622
|
12
|
-
kreuzberg/_playa.py,sha256=p4G5ymSSCbQoDeXJjH-yuVzdd4y-wKcolqDthjPtqok,11413
|
13
|
-
kreuzberg/_registry.py,sha256=8XYT-vPhNYMAbB5RBIUKz-1Zdg48OCnBcdVZzBq6YwY,3307
|
14
|
-
kreuzberg/_types.py,sha256=eh4bZFG3jIw5GhfC3u4R0aa_y9niKZDI4O93j0MCZGw,53672
|
15
|
-
kreuzberg/cli.py,sha256=P_dqOHbGh-fFYZ4WErjngTKq7wbqaUmTD1Gjw2lIsDI,15242
|
16
|
-
kreuzberg/exceptions.py,sha256=KiGAfIX3_TkGYG1h9eTZ_E_pALsAqhZ_A3XfhwxwaS0,2909
|
17
|
-
kreuzberg/extraction.py,sha256=jMsomvg7SPnuXLGZKQl0YH64D0AhczSNDM4CKORd9d0,24185
|
18
|
-
kreuzberg/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
19
|
-
kreuzberg/_api/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
20
|
-
kreuzberg/_api/_config_cache.py,sha256=gX_ezGNq6SCpTn02yFkn24zMVrQwfIk8-u5XkKJiHFg,8774
|
21
|
-
kreuzberg/_api/main.py,sha256=tmg1fICU4wshq0XXhGOk22oivfXjELtsEgOumdkZNI4,15257
|
22
12
|
kreuzberg/_extractors/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
23
13
|
kreuzberg/_extractors/_base.py,sha256=99r-CUZcAp72c0mqkj-E41lj0SyzNaTb_w2EtKgfGJ8,9934
|
24
14
|
kreuzberg/_extractors/_email.py,sha256=DzNthVbmbdlajDUfs0nNwbHNvG0CAQVqJsRfsatHtf0,8799
|
@@ -29,14 +19,19 @@ kreuzberg/_extractors/_pdf.py,sha256=_MPtO_8BCpyAXyIWusmfqOaEsPMDxucjTQKz3cTaj8o
|
|
29
19
|
kreuzberg/_extractors/_presentation.py,sha256=2g6PJnpgUpUfMjQJh-7_gHywDulE8QE8ypH__BrEUTQ,10692
|
30
20
|
kreuzberg/_extractors/_spread_sheet.py,sha256=TJOM70DLN0HzcOkAowZJogAx7QFrouohvU5V0OIliag,12738
|
31
21
|
kreuzberg/_extractors/_structured.py,sha256=thpXhsBnvaHzGQX4sy6eVHowFv0yaYxLGHwxx4DouCI,8947
|
22
|
+
kreuzberg/_gmft.py,sha256=0jmCTEs9EV78awlpCvmfLWAEiiq9n9Qx3n3FnCboTgg,22119
|
23
|
+
kreuzberg/_language_detection.py,sha256=4JzQldcDIVZRWUzRFc9AOFiq6Wfl9858mip1ZnrD2Ks,1143
|
32
24
|
kreuzberg/_mcp/__init__.py,sha256=h6DgLFO4TMUk7_wCJ2jn2Y6IkFmfzb-Z7jX-G5UCYVc,43
|
33
25
|
kreuzberg/_mcp/server.py,sha256=71MhjiFDwgFROdGejf0djgO1eG370qudWmZsN59CUeA,16743
|
26
|
+
kreuzberg/_mime_types.py,sha256=duEMDBg_qIf9A02tXAC_2znD-wgE-2BBMW9ofyYTJjE,8622
|
34
27
|
kreuzberg/_ocr/__init__.py,sha256=grshVFwVQl2rMvH1hg1JNlYXjy5-Tdb_rusLD1Cselk,706
|
35
28
|
kreuzberg/_ocr/_base.py,sha256=ZvOJvW8DtylQJZdCPk9vlVNZiBFK-dC4Oj7Kb6-mWkY,1419
|
36
29
|
kreuzberg/_ocr/_easyocr.py,sha256=bHz2S_8nNHaPHPemcJK-U0al9_qP-vUmWE4ECVlf7AA,15485
|
37
30
|
kreuzberg/_ocr/_paddleocr.py,sha256=CV9cCjkRe-3cNJ5tRu_sBXd_HNghEwfPIgWwxAZTeRY,15026
|
38
31
|
kreuzberg/_ocr/_table_extractor.py,sha256=LhBiCX8R_xR-uK1FH3ONA_vqOmqUWANZJ2HMCBLsmNY,5513
|
39
32
|
kreuzberg/_ocr/_tesseract.py,sha256=9F6V72WGi9ExruSNESjz8WGHCXuTYq1M1ctbayhQO0Y,43358
|
33
|
+
kreuzberg/_playa.py,sha256=p4G5ymSSCbQoDeXJjH-yuVzdd4y-wKcolqDthjPtqok,11413
|
34
|
+
kreuzberg/_registry.py,sha256=8XYT-vPhNYMAbB5RBIUKz-1Zdg48OCnBcdVZzBq6YwY,3307
|
40
35
|
kreuzberg/_token_reduction/__init__.py,sha256=y_2WgPxJes8_PD-VMfx7vQT0hGjFIixzS8PjaIseAGg,311
|
41
36
|
kreuzberg/_token_reduction/_reducer.py,sha256=shAfMPznP69sTSzwX_bE1LpcBmoia9cpd7r6bSc4R5Q,13609
|
42
37
|
kreuzberg/_token_reduction/_stopwords.py,sha256=mu-5CapG0RCP7LYzjhdTM6WWLtmt3cjZ08OOsyQkJVg,3608
|
@@ -104,6 +99,7 @@ kreuzberg/_token_reduction/stopwords/vi_stopwords.json,sha256=UOyAEKBwMcQV65QGpQ
|
|
104
99
|
kreuzberg/_token_reduction/stopwords/yo_stopwords.json,sha256=60liY89h7KReEvHEPxe-hCWLPuqr4U89aQDCi7iRCfo,651
|
105
100
|
kreuzberg/_token_reduction/stopwords/zh_stopwords.json,sha256=rouSTCkXun90Q1aCvLjHyt4I7pGrtlcruDpNVybpAMI,8934
|
106
101
|
kreuzberg/_token_reduction/stopwords/zu_stopwords.json,sha256=hfm4E2EDI_VWyR0GUOVjcMQA7ZDH7FsV4FUMcns1H28,324
|
102
|
+
kreuzberg/_types.py,sha256=qh4S9PhIZkvueTCgvO1d3lKmy5pWYfuhHpoGcoIEyYY,54061
|
107
103
|
kreuzberg/_utils/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
108
104
|
kreuzberg/_utils/_cache.py,sha256=AtANbs1MWR4WLB2MhatVGhlh7kM-yjSfFuDnSVSNp50,14110
|
109
105
|
kreuzberg/_utils/_device.py,sha256=o03rLiHiRX6TKhJ55LO1Vj2Map1Po5YdjuMdA63tGOE,8249
|
@@ -121,8 +117,11 @@ kreuzberg/_utils/_string.py,sha256=wVyvEHByHBeu_6evmqJGv9Ml-NAwkyz60n8l-7L5Cw0,4
|
|
121
117
|
kreuzberg/_utils/_sync.py,sha256=gb828WYfVtkB4wKslJrPMmrdeI1h3htWceq-gywHtO4,3184
|
122
118
|
kreuzberg/_utils/_table.py,sha256=OVg6T2QnerMhVNb1juLTBSIjyjFiE5-OrUWr5NSCgnQ,6493
|
123
119
|
kreuzberg/_utils/_tmp.py,sha256=mwZ0BFzhGPfYa2tt8qSjUjfcHnSYvbQT4VlPRCRc_q8,2038
|
124
|
-
kreuzberg
|
125
|
-
kreuzberg
|
126
|
-
kreuzberg
|
127
|
-
kreuzberg
|
128
|
-
kreuzberg-3.20.
|
120
|
+
kreuzberg/cli.py,sha256=P_dqOHbGh-fFYZ4WErjngTKq7wbqaUmTD1Gjw2lIsDI,15242
|
121
|
+
kreuzberg/exceptions.py,sha256=KiGAfIX3_TkGYG1h9eTZ_E_pALsAqhZ_A3XfhwxwaS0,2909
|
122
|
+
kreuzberg/extraction.py,sha256=jMsomvg7SPnuXLGZKQl0YH64D0AhczSNDM4CKORd9d0,24185
|
123
|
+
kreuzberg/py.typed,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
|
124
|
+
kreuzberg-3.20.2.dist-info/WHEEL,sha256=X16MKk8bp2DRsAuyteHJ-9qOjzmnY0x1aj0P1ftqqWA,78
|
125
|
+
kreuzberg-3.20.2.dist-info/entry_points.txt,sha256=nFqXF3_dNlhHuvtNX26GKKutjOjH2a7TUiaYSu2eOAk,92
|
126
|
+
kreuzberg-3.20.2.dist-info/METADATA,sha256=vR4TfFvm5tx66RV7dS0CXRCTmCFksHb8Jyhy-3FHNUQ,11923
|
127
|
+
kreuzberg-3.20.2.dist-info/RECORD,,
|
kreuzberg-3.20.0.dist-info/licenses/LICENSE
DELETED
@@ -1,7 +0,0 @@
|
|
1
|
-
Copyright 2025 Na'aman Hirschfeld
|
2
|
-
|
3
|
-
Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated documentation files (the “Software”), to deal in the Software without restriction, including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so, subject to the following conditions:
|
4
|
-
|
5
|
-
The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
|
6
|
-
|
7
|
-
THE SOFTWARE IS PROVIDED “AS IS”, WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|