content-core 1.0.1__tar.gz → 1.0.2__tar.gz
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of content-core might be problematic. Click here for more details.
- {content_core-1.0.1 → content_core-1.0.2}/PKG-INFO +3 -2
- {content_core-1.0.1 → content_core-1.0.2}/pyproject.toml +4 -2
- {content_core-1.0.1 → content_core-1.0.2}/uv.lock +14 -8
- {content_core-1.0.1 → content_core-1.0.2}/.github/PULL_REQUEST_TEMPLATE.md +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/.github/workflows/publish.yml +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/.gitignore +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/.python-version +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/CONTRIBUTING.md +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/LICENSE +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/Makefile +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/README.md +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/docs/processors.md +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/docs/usage.md +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/prompts/content/cleanup.jinja +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/prompts/content/summarize.jinja +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/cc_config.yaml +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/common/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/common/exceptions.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/common/state.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/common/types.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/common/utils.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/config.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/cleanup/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/cleanup/core.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/extraction/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/extraction/graph.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/identification/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/summary/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/summary/core.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/logging.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/models.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/models_config.yaml +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/notebooks/run.ipynb +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/audio.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/docling.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/office.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/pdf.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/text.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/url.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/video.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/processors/youtube.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/py.typed +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/templated_message.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/tools/__init__.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/tools/cleanup.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/tools/extract.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/src/content_core/tools/summarize.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.docx +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.epub +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.md +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.mp3 +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.mp4 +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.pdf +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.pptx +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.txt +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file.xlsx +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/input_content/file_audio.mp3 +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/integration/test_cli.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/integration/test_extraction.py +0 -0
- {content_core-1.0.1 → content_core-1.0.2}/tests/unit/test_docling.py +0 -0
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
Metadata-Version: 2.4
|
|
2
2
|
Name: content-core
|
|
3
|
-
Version: 1.0.1
|
|
3
|
+
Version: 1.0.2
|
|
4
4
|
Summary: Extract what matters from any media source
|
|
5
5
|
Author-email: LUIS NOVO <lfnovo@gmail.com>
|
|
6
6
|
License-File: LICENSE
|
|
@@ -11,7 +11,7 @@ Requires-Dist: asciidoc>=10.2.1
|
|
|
11
11
|
Requires-Dist: bs4>=0.0.2
|
|
12
12
|
Requires-Dist: dicttoxml>=1.7.16
|
|
13
13
|
Requires-Dist: docling>=2.34.0
|
|
14
|
-
Requires-Dist: esperanto
|
|
14
|
+
Requires-Dist: esperanto>=1.2.0
|
|
15
15
|
Requires-Dist: firecrawl-py>=2.7.0
|
|
16
16
|
Requires-Dist: jinja2>=3.1.6
|
|
17
17
|
Requires-Dist: langdetect>=1.0.9
|
|
@@ -24,6 +24,7 @@ Requires-Dist: pillow>=10.4.0
|
|
|
24
24
|
Requires-Dist: pymupdf>=1.25.5
|
|
25
25
|
Requires-Dist: python-docx>=1.1.2
|
|
26
26
|
Requires-Dist: python-dotenv>=1.1.0
|
|
27
|
+
Requires-Dist: python-magic-bin==0.4.14; sys_platform == 'win32'
|
|
27
28
|
Requires-Dist: python-magic>=0.4.27
|
|
28
29
|
Requires-Dist: python-pptx>=1.0.2
|
|
29
30
|
Requires-Dist: readability-lxml>=0.8.4.1
|
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
[project]
|
|
2
2
|
name = "content-core"
|
|
3
|
-
version = "1.0.1"
|
|
3
|
+
version = "1.0.2"
|
|
4
4
|
description = "Extract what matters from any media source"
|
|
5
5
|
readme = "README.md"
|
|
6
6
|
homepage = "https://github.com/lfnovo/content-core"
|
|
@@ -11,7 +11,7 @@ requires-python = ">=3.10"
|
|
|
11
11
|
dependencies = [
|
|
12
12
|
"aiohttp>=3.11",
|
|
13
13
|
"bs4>=0.0.2",
|
|
14
|
-
"esperanto
|
|
14
|
+
"esperanto>=1.2.0",
|
|
15
15
|
"jinja2>=3.1.6",
|
|
16
16
|
"langdetect>=1.0.9",
|
|
17
17
|
"loguru>=0.7.3",
|
|
@@ -33,6 +33,8 @@ dependencies = [
|
|
|
33
33
|
"docling>=2.34.0",
|
|
34
34
|
"pillow>=10.4.0",
|
|
35
35
|
"asciidoc>=10.2.1",
|
|
36
|
+
"python-magic-bin==0.4.14; sys_platform == 'win32'",
|
|
37
|
+
|
|
36
38
|
]
|
|
37
39
|
|
|
38
40
|
[project.scripts]
|
|
@@ -410,7 +410,7 @@ wheels = [
|
|
|
410
410
|
|
|
411
411
|
[[package]]
|
|
412
412
|
name = "content-core"
|
|
413
|
-
version = "1.0.1"
|
|
413
|
+
version = "1.0.2"
|
|
414
414
|
source = { editable = "." }
|
|
415
415
|
dependencies = [
|
|
416
416
|
{ name = "ai-prompter" },
|
|
@@ -419,7 +419,7 @@ dependencies = [
|
|
|
419
419
|
{ name = "bs4" },
|
|
420
420
|
{ name = "dicttoxml" },
|
|
421
421
|
{ name = "docling" },
|
|
422
|
-
{ name = "esperanto", extra = ["openai"] },
|
|
422
|
+
{ name = "esperanto" },
|
|
423
423
|
{ name = "firecrawl-py" },
|
|
424
424
|
{ name = "jinja2" },
|
|
425
425
|
{ name = "langdetect" },
|
|
@@ -433,6 +433,7 @@ dependencies = [
|
|
|
433
433
|
{ name = "python-docx" },
|
|
434
434
|
{ name = "python-dotenv" },
|
|
435
435
|
{ name = "python-magic" },
|
|
436
|
+
{ name = "python-magic-bin", marker = "(platform_machine != 'aarch64' and platform_system == 'Linux' and sys_platform == 'win32') or (platform_system != 'Darwin' and platform_system != 'Linux' and sys_platform == 'win32')" },
|
|
436
437
|
{ name = "python-pptx" },
|
|
437
438
|
{ name = "readability-lxml" },
|
|
438
439
|
{ name = "validators" },
|
|
@@ -457,7 +458,7 @@ requires-dist = [
|
|
|
457
458
|
{ name = "bs4", specifier = ">=0.0.2" },
|
|
458
459
|
{ name = "dicttoxml", specifier = ">=1.7.16" },
|
|
459
460
|
{ name = "docling", specifier = ">=2.34.0" },
|
|
460
|
-
{ name = "esperanto",
|
|
461
|
+
{ name = "esperanto", specifier = ">=1.2.0" },
|
|
461
462
|
{ name = "firecrawl-py", specifier = ">=2.7.0" },
|
|
462
463
|
{ name = "jinja2", specifier = ">=3.1.6" },
|
|
463
464
|
{ name = "langdetect", specifier = ">=1.0.9" },
|
|
@@ -471,6 +472,7 @@ requires-dist = [
|
|
|
471
472
|
{ name = "python-docx", specifier = ">=1.1.2" },
|
|
472
473
|
{ name = "python-dotenv", specifier = ">=1.1.0" },
|
|
473
474
|
{ name = "python-magic", specifier = ">=0.4.27" },
|
|
475
|
+
{ name = "python-magic-bin", marker = "sys_platform == 'win32'", specifier = "==0.4.14" },
|
|
474
476
|
{ name = "python-pptx", specifier = ">=1.0.2" },
|
|
475
477
|
{ name = "readability-lxml", specifier = ">=0.8.4.1" },
|
|
476
478
|
{ name = "validators", specifier = ">=0.34.0" },
|
|
@@ -729,11 +731,6 @@ wheels = [
|
|
|
729
731
|
{ url = "https://files.pythonhosted.org/packages/f9/79/5d74f2b8f9d73da83bfe80a39ff11505a2a285c03a869750db98cd89ddfd/esperanto-1.2.1-py3-none-any.whl", hash = "sha256:2fa41e5e35c847b1fe58395906d8877035f7e55d6429870d897781f7c9f17c42", size = 57680 },
|
|
730
732
|
]
|
|
731
733
|
|
|
732
|
-
[package.optional-dependencies]
|
|
733
|
-
openai = [
|
|
734
|
-
{ name = "openai" },
|
|
735
|
-
]
|
|
736
|
-
|
|
737
734
|
[[package]]
|
|
738
735
|
name = "et-xmlfile"
|
|
739
736
|
version = "2.0.0"
|
|
@@ -2919,6 +2916,15 @@ wheels = [
|
|
|
2919
2916
|
{ url = "https://files.pythonhosted.org/packages/6c/73/9f872cb81fc5c3bb48f7227872c28975f998f3e7c2b1c16e95e6432bbb90/python_magic-0.4.27-py2.py3-none-any.whl", hash = "sha256:c212960ad306f700aa0d01e5d7a325d20548ff97eb9920dcd29513174f0294d3", size = 13840 },
|
|
2920
2917
|
]
|
|
2921
2918
|
|
|
2919
|
+
[[package]]
|
|
2920
|
+
name = "python-magic-bin"
|
|
2921
|
+
version = "0.4.14"
|
|
2922
|
+
source = { registry = "https://pypi.org/simple" }
|
|
2923
|
+
wheels = [
|
|
2924
|
+
{ url = "https://files.pythonhosted.org/packages/5a/5d/10b9ac745d9fd2f7151a2ab901e6bb6983dbd70e87c71111f54859d1ca2e/python_magic_bin-0.4.14-py2.py3-none-win32.whl", hash = "sha256:34a788c03adde7608028203e2dbb208f1f62225ad91518787ae26d603ae68892", size = 397784 },
|
|
2925
|
+
{ url = "https://files.pythonhosted.org/packages/07/c2/094e3d62b906d952537196603a23aec4bcd7c6126bf80eb14e6f9f4be3a2/python_magic_bin-0.4.14-py2.py3-none-win_amd64.whl", hash = "sha256:90be6206ad31071a36065a2fc169c5afb5e0355cbe6030e87641c6c62edc2b69", size = 409299 },
|
|
2926
|
+
]
|
|
2927
|
+
|
|
2922
2928
|
[[package]]
|
|
2923
2929
|
name = "python-pptx"
|
|
2924
2930
|
version = "1.0.2"
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
{content_core-1.0.1 → content_core-1.0.2}/src/content_core/content/identification/__init__.py
RENAMED
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|
|
File without changes
|