PyPI - content-core - Versions diffs - 1.0.3__tar.gz → 1.0.4__tar.gz - Mend

content-core 1.0.3.tar.gz → 1.0.4.tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of content-core might be problematic. Click here for more details.

Files changed (62) hide show

{content_core-1.0.3 → content_core-1.0.4}/PKG-INFO RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: content-core
-Version: 1.0.3
+Version: 1.0.4
 Summary: Extract what matters from any media source
 Author-email: LUIS NOVO <lfnovo@gmail.com>
 License-File: LICENSE

{content_core-1.0.3 → content_core-1.0.4}/pyproject.toml RENAMED Viewed

@@ -1,6 +1,6 @@
 [project]
 name = "content-core"
-version = "1.0.3"
+version = "1.0.4"
 description = "Extract what matters from any media source"
 readme = "README.md"
 homepage = "https://github.com/lfnovo/content-core"

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/summary/core.py RENAMED Viewed

@@ -8,7 +8,7 @@ async def summarize(content: str, context: str) -> str:
     templated_message_fn = partial(templated_message, model=ModelFactory.get_model('summary_model'))
     response = await templated_message_fn(
         TemplatedMessageInput(
-            user_prompt_template="content/summarize",
+            user_prompt_template="prompts/content/summarize",
             data={"content": content, "context": context},
         )
     )

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/youtube.py RENAMED Viewed

@@ -3,13 +3,12 @@ import ssl
 import aiohttp
 from bs4 import BeautifulSoup
-from youtube_transcript_api import YouTubeTranscriptApi  # type: ignore
-from youtube_transcript_api.formatters import TextFormatter  # type: ignore
 from content_core.common import ProcessSourceState
 from content_core.common.exceptions import NoTranscriptFound
 from content_core.config import CONFIG
 from content_core.logging import logger
+from youtube_transcript_api import YouTubeTranscriptApi  # type: ignore
+from youtube_transcript_api.formatters import TextFormatter  # type: ignore
 ssl._create_default_https_context = ssl._create_unverified_context
@@ -137,7 +136,7 @@ def extract_transcript_pytubefix(url, languages=["en", "es", "pt"]):
     from pytubefix import YouTube
     yt = YouTube(url)
-    print(yt.captions)
+    logger.debug(f"Captions: {yt.captions}")
     # Try to get captions in the preferred languages
     if yt.captions:
@@ -149,12 +148,20 @@ def extract_transcript_pytubefix(url, languages=["en", "es", "pt"]):
                 caption = yt.captions[f"a.{lang}"]
                 break
         else:  # No preferred language found, use the first available
-            caption_key = next(iter(yt.captions))
-            caption = yt.captions[caption_key]
-        srt_captions = caption.generate_srt_captions()
-        txt_captions = caption.generate_txt_captions()
-        return txt_captions, srt_captions
+            caption_key = list(yt.captions.keys())[0]
+            caption = yt.captions[caption_key.code]
+        try:
+            srt_captions = caption.generate_srt_captions()
+            txt_captions = caption.generate_txt_captions()
+            return txt_captions, srt_captions
+        except KeyError as e:
+            logger.error(f"KeyError while generating captions for {caption}: {e}")
+            return None, None
+        except Exception as e:
+            logger.error(
+                f"Unexpected error while generating captions for {caption}: {e}"
+            )
+            return None, None
     return None, None

{content_core-1.0.3 → content_core-1.0.4}/uv.lock RENAMED Viewed

@@ -410,7 +410,7 @@ wheels = [
 [[package]]
 name = "content-core"
-version = "1.0.3"
+version = "1.0.4"
 source = { editable = "." }
 dependencies = [
     { name = "ai-prompter" },

{content_core-1.0.3 → content_core-1.0.4}/.github/PULL_REQUEST_TEMPLATE.md RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/.github/workflows/publish.yml RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/.gitignore RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/.python-version RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/CONTRIBUTING.md RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/LICENSE RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/Makefile RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/README.md RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/docs/processors.md RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/docs/usage.md RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/prompts/content/cleanup.jinja RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/prompts/content/summarize.jinja RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/cc_config.yaml RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/common/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/common/exceptions.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/common/state.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/common/types.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/common/utils.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/config.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/cleanup/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/cleanup/core.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/extraction/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/extraction/graph.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/identification/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/content/summary/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/logging.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/models.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/models_config.yaml RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/notebooks/run.ipynb RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/audio.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/docling.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/office.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/pdf.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/text.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/url.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/processors/video.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/py.typed RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/templated_message.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/tools/__init__.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/tools/cleanup.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/tools/extract.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/src/content_core/tools/summarize.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.docx RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.epub RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.md RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.mp3 RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.mp4 RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.pdf RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.pptx RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.txt RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file.xlsx RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/input_content/file_audio.mp3 RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/integration/test_cli.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/integration/test_extraction.py RENAMED Viewed

File without changes

{content_core-1.0.3 → content_core-1.0.4}/tests/unit/test_docling.py RENAMED Viewed

File without changes

content-core 1.0.3__tar.gz → 1.0.4__tar.gz

Potentially problematic release.

content-core 1.0.3.tar.gz → 1.0.4.tar.gz