content-core 0.1.0__tar.gz → 0.1.2__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of content-core might be problematic. Click here for more details.

Files changed (53)
  1. content_core-0.1.2/CONTRIBUTING.md +78 -0
  2. content_core-0.1.2/LICENSE +21 -0
  3. {content_core-0.1.0 → content_core-0.1.2}/PKG-INFO +8 -5
  4. {content_core-0.1.0 → content_core-0.1.2}/README.md +5 -3
  5. {content_core-0.1.0 → content_core-0.1.2}/pyproject.toml +2 -2
  6. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/youtube.py +1 -0
  7. {content_core-0.1.0 → content_core-0.1.2}/uv.lock +2 -2
  8. {content_core-0.1.0 → content_core-0.1.2}/.github/PULL_REQUEST_TEMPLATE.md +0 -0
  9. {content_core-0.1.0 → content_core-0.1.2}/.github/workflows/publish.yml +0 -0
  10. {content_core-0.1.0 → content_core-0.1.2}/.gitignore +0 -0
  11. {content_core-0.1.0 → content_core-0.1.2}/.python-version +0 -0
  12. {content_core-0.1.0 → content_core-0.1.2}/.windsurfrules +0 -0
  13. {content_core-0.1.0 → content_core-0.1.2}/Makefile +0 -0
  14. {content_core-0.1.0 → content_core-0.1.2}/prompts/content/cleanup.jinja +0 -0
  15. {content_core-0.1.0 → content_core-0.1.2}/prompts/content/summarize.jinja +0 -0
  16. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/__init__.py +0 -0
  17. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/common/__init__.py +0 -0
  18. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/common/exceptions.py +0 -0
  19. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/common/state.py +0 -0
  20. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/common/utils.py +0 -0
  21. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/config.py +0 -0
  22. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/__init__.py +0 -0
  23. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/cleanup/__init__.py +0 -0
  24. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/cleanup/core.py +0 -0
  25. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/extraction/__init__.py +0 -0
  26. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/extraction/graph.py +0 -0
  27. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/summary/__init__.py +0 -0
  28. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/content/summary/core.py +0 -0
  29. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/notebooks/run.ipynb +0 -0
  30. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/audio.py +0 -0
  31. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/office.py +0 -0
  32. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/pdf.py +0 -0
  33. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/text.py +0 -0
  34. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/url.py +0 -0
  35. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/processors/video.py +0 -0
  36. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/prompter.py +0 -0
  37. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/py.typed +0 -0
  38. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/templated_message.py +0 -0
  39. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/tools/__init__.py +0 -0
  40. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/tools/cleanup.py +0 -0
  41. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/tools/extract.py +0 -0
  42. {content_core-0.1.0 → content_core-0.1.2}/src/content_core/tools/summarize.py +0 -0
  43. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.docx +0 -0
  44. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.epub +0 -0
  45. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.md +0 -0
  46. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.mp3 +0 -0
  47. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.mp4 +0 -0
  48. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.pdf +0 -0
  49. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.pptx +0 -0
  50. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.txt +0 -0
  51. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file.xlsx +0 -0
  52. {content_core-0.1.0 → content_core-0.1.2}/tests/input_content/file_audio.mp3 +0 -0
  53. {content_core-0.1.0 → content_core-0.1.2}/tests/integration/test_extraction.py +0 -0
@@ -0,0 +1,78 @@
1
+ # Contributing to Content-Core
2
+
3
+ Thank you for your interest in contributing to Content-Core! This guide will help you get started with the contribution process.
4
+
5
+ ## Code of Conduct
6
+
7
+ In the interest of fostering an open and welcoming environment, we expect all contributors to be respectful and considerate of others. By participating in this project, you agree to:
8
+
9
+ - Be respectful of different viewpoints and experiences
10
+ - Gracefully accept constructive criticism
11
+ - Focus on what is best for the community
12
+ - Show empathy towards other community members
13
+
14
+ ## How Can I Contribute?
15
+
16
+ ### Reporting Bugs
17
+
18
+ - Ensure the bug was not already reported by searching on GitHub under [Issues](https://github.com/lfnovo/content-core/issues).
19
+ - If you're unable to find an open issue addressing the problem, [open a new one](https://github.com/lfnovo/content-core/issues/new).
20
+ - Include a clear title and description.
21
+ - Add as much relevant information as possible, including:
22
+   - Steps to reproduce the issue
23
+   - Expected behavior
24
+   - Actual behavior
25
+   - System details (OS, Python version, etc.)
26
+
27
+ ### Suggesting Enhancements
28
+
29
+ - Open an issue with the tag "enhancement" to suggest new features or improvements.
30
+ - Clearly describe the enhancement and its benefits.
31
+
32
+ ### Code Contributions
33
+
34
+ 1. **Fork the Repo**: Fork the project repository to your own GitHub account.
35
+ 2. **Clone the Repo**: Clone the forked repository to your local machine.
36
+ 3. **Create a Branch**: Create a branch with a descriptive name related to the feature or bug you're working on.
37
+ 4. **Make Changes**: Make your changes to the codebase. Ensure your code follows the project's coding style and conventions.
38
+ 5. **Test Your Changes**: Make sure your changes pass all tests. Add tests if you're introducing new functionality.
39
+ 6. **Commit Your Changes**: Commit your changes with a clear and descriptive commit message.
40
+ 7. **Push to Your Fork**: Push your changes to your forked repository.
41
+ 8. **Submit a Pull Request**: Create a pull request from your fork to the main project repository. Provide a clear description of your changes and why they are needed.
42
+
43
+ ### Pull Request Guidelines
44
+
45
+ - Ensure your PR addresses a single issue or feature.
46
+ - Update documentation if your changes affect it.
47
+ - Reference related issues in your PR description.
48
+ - Be prepared to make changes based on feedback from maintainers.
49
+
50
+ ## Development Setup
51
+
52
+ To set up the development environment:
53
+
54
+ 1. Install Python 3.10 or later.
55
+ 2. Install `uv` for package management:
56
+ ```bash
57
+ curl -LsSf https://astral.sh/uv/install.sh | sh
58
+ ```
59
+ 3. Clone the repository and navigate to the project directory.
60
+ 4. Create a virtual environment and install dependencies:
61
+ ```bash
62
+ uv venv
63
+ uv sync
64
+ ```
65
+ 5. Run tests to ensure everything is set up correctly:
66
+ ```bash
67
+ uv run pytest
68
+ ```
69
+
70
+ ## Coding Style
71
+
72
+ We follow PEP 8 for Python code. Please ensure your code adheres to these guidelines. Use tools like `flake8` or `pylint` to check your code style.
73
+
74
+ ## License
75
+
76
+ By contributing to Content-Core, you agree that your contributions will be licensed under the [MIT License](LICENSE).
77
+
78
+ Thank you for contributing to Content-Core and helping make it better!
@@ -0,0 +1,21 @@
1
+ MIT License
2
+
3
+ Copyright (c) 2025 Luis Novo
4
+
5
+ Permission is hereby granted, free of charge, to any person obtaining a copy
6
+ of this software and associated documentation files (the "Software"), to deal
7
+ in the Software without restriction, including without limitation the rights
8
+ to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
9
+ copies of the Software, and to permit persons to whom the Software is
10
+ furnished to do so, subject to the following conditions:
11
+
12
+ The above copyright notice and this permission notice shall be included in all
13
+ copies or substantial portions of the Software.
14
+
15
+ THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16
+ IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17
+ FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
18
+ AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19
+ LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20
+ OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21
+ SOFTWARE.
@@ -1,10 +1,11 @@
1
1
  Metadata-Version: 2.4
2
2
  Name: content-core
3
- Version: 0.1.0
3
+ Version: 0.1.2
4
4
  Summary: Extract what matters from any media source
5
5
  Author-email: LUIS NOVO <lfnovo@gmail.com>
6
+ License-File: LICENSE
6
7
  Requires-Python: >=3.10
7
- Requires-Dist: aiohttp>=3.11.16
8
+ Requires-Dist: aiohttp>=3.11
8
9
  Requires-Dist: bs4>=0.0.2
9
10
  Requires-Dist: dicttoxml>=1.7.16
10
11
  Requires-Dist: esperanto>=1.2.0
@@ -243,8 +244,10 @@ make lint
243
244
  make help
244
245
  ```
245
246
 
247
+ ## License
248
+
249
+ This project is licensed under the [MIT License](LICENSE). See the [LICENSE](LICENSE) file for details.
250
+
246
251
  ## Contributing
247
- Contributions are welcome! Please follow standard practices (fork, feature branch, pull request).
248
252
 
249
- ## License
250
- This project is licensed under the MIT License - see the LICENSE file for details.
253
+ Contributions are welcome! Please see our [Contributing Guide](CONTRIBUTING.md) for more details on how to get started.
@@ -215,8 +215,10 @@ make lint
215
215
  make help
216
216
  ```
217
217
 
218
+ ## License
219
+
220
+ This project is licensed under the [MIT License](LICENSE). See the [LICENSE](LICENSE) file for details.
221
+
218
222
  ## Contributing
219
- Contributions are welcome! Please follow standard practices (fork, feature branch, pull request).
220
223
 
221
- ## License
222
- This project is licensed under the MIT License - see the LICENSE file for details.
224
+ Contributions are welcome! Please see our [Contributing Guide](CONTRIBUTING.md) for more details on how to get started.
@@ -1,6 +1,6 @@
1
1
  [project]
2
2
  name = "content-core"
3
- version = "0.1.0"
3
+ version = "0.1.2"
4
4
  description = "Extract what matters from any media source"
5
5
  readme = "README.md"
6
6
  authors = [
@@ -8,7 +8,7 @@ authors = [
8
8
  ]
9
9
  requires-python = ">=3.10"
10
10
  dependencies = [
11
- "aiohttp>=3.11.16",
11
+ "aiohttp>=3.11",
12
12
  "bs4>=0.0.2",
13
13
  "esperanto>=1.2.0",
14
14
  "google-genai>=1.10.0",
@@ -156,4 +156,5 @@ async def extract_youtube_transcript(state: ProcessSourceState):
156
156
  return {
157
157
  "content": formatter.format_transcript(transcript),
158
158
  "title": title,
159
+ "metadata": {"video_id": video_id, "transcript": transcript.to_raw_data()},
159
160
  }
@@ -354,7 +354,7 @@ wheels = [
354
354
 
355
355
  [[package]]
356
356
  name = "content-core"
357
- version = "0.1.0"
357
+ version = "0.1.2"
358
358
  source = { editable = "." }
359
359
  dependencies = [
360
360
  { name = "aiohttp" },
@@ -390,7 +390,7 @@ dev = [
390
390
 
391
391
  [package.metadata]
392
392
  requires-dist = [
393
- { name = "aiohttp", specifier = ">=3.11.16" },
393
+ { name = "aiohttp", specifier = ">=3.11" },
394
394
  { name = "bs4", specifier = ">=0.0.2" },
395
395
  { name = "dicttoxml", specifier = ">=1.7.16" },
396
396
  { name = "esperanto", specifier = ">=1.2.0" },
File without changes
File without changes