PyPI - mkv-episode-matcher - Versions diffs - 0.8.0__py3-none-any.whl → 0.8.1__py3-none-any.whl - Mend

mkv-episode-matcher 0.8.0__py3-none-any.whl → 0.8.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.

This version of mkv-episode-matcher might be problematic. Click here for more details.

Files changed (6) hide show

mkv_episode_matcher/episode_identification.py CHANGED Viewed

@@ -50,6 +50,7 @@ class EpisodeMatcher:
         self.min_confidence = min_confidence
         self.show_name = show_name
         self.chunk_duration = 30
+        self.skip_initial_duration = 300
         self.device = "cuda" if torch.cuda.is_available() else "cpu"
         self.temp_dir = Path(tempfile.gettempdir()) / "whisper_chunks"
         self.temp_dir.mkdir(exist_ok=True)
@@ -121,7 +122,8 @@ class EpisodeMatcher:
             str: Combined text from the subtitle chunk
         """
         try:
-            chunk_start = chunk_idx * self.chunk_duration
+            # Apply the same offset as in _try_match_with_model
+            chunk_start = self.skip_initial_duration + (chunk_idx * self.chunk_duration)
             chunk_end = chunk_start + self.chunk_duration
             return self.subtitle_cache.get_chunk(srt_file, chunk_idx, chunk_start, chunk_end)
@@ -133,8 +135,10 @@ class EpisodeMatcher:
     def get_reference_files(self, season_number):
         """Get reference subtitle files with caching."""
         cache_key = (self.show_name, season_number)
+        logger.debug(f"Reference cache key: {cache_key}")
         if cache_key in self.reference_files_cache:
+            logger.debug("Returning cached reference files")
             return self.reference_files_cache[cache_key]
         reference_dir = self.cache_dir / "data" / self.show_name
@@ -158,7 +162,7 @@ class EpisodeMatcher:
         # Remove duplicates while preserving order
         reference_files = list(dict.fromkeys(reference_files))
+        logger.debug(f"Found {len(reference_files)} reference files for season {season_number}")
         self.reference_files_cache[cache_key] = reference_files
         return reference_files
@@ -166,7 +170,8 @@ class EpisodeMatcher:
         self, video_file, model_name, max_duration, reference_files
     ):
         """
-        Attempt to match using specified model, checking multiple 30-second chunks up to max_duration.
+        Attempt to match using specified model, checking multiple chunks starting from skip_initial_duration
+        and continuing up to max_duration.
         Args:
             video_file: Path to the video file
@@ -177,7 +182,7 @@ class EpisodeMatcher:
         # Use cached model
         model = get_whisper_model(model_name, self.device)
-        # Calculate number of chunks to check (30 seconds each)
+        # Calculate number of chunks to check
         num_chunks = min(max_duration // self.chunk_duration, 10)  # Limit to 10 chunks for initial check
         # Pre-load all reference chunks for the chunks we'll check
@@ -186,14 +191,21 @@ class EpisodeMatcher:
                 self.load_reference_chunk(ref_file, chunk_idx)
         for chunk_idx in range(num_chunks):
-            start_time = chunk_idx * self.chunk_duration
+            # Start at self.skip_initial_duration and check subsequent chunks
+            start_time = self.skip_initial_duration + (chunk_idx * self.chunk_duration)
             logger.debug(f"Trying {model_name} model at {start_time} seconds")
             audio_path = self.extract_audio_chunk(video_file, start_time)
+            logger.debug(f"Extracted audio chunk: {audio_path}")
             result = model.transcribe(audio_path, task="transcribe", language="en")
             chunk_text = result["text"]
+            logger.debug(f"Transcription result: {chunk_text} ({len(chunk_text)} characters)")
+            if len(chunk_text) < 10:
+                logger.debug(f"Transcription result too short: {chunk_text} ({len(chunk_text)} characters)")
+                continue
             best_confidence = 0
             best_match = None
@@ -245,7 +257,7 @@ class EpisodeMatcher:
             # Try with tiny model first (fastest)
             logger.info("Attempting match with tiny model...")
             match = self._try_match_with_model(
-                video_file, "tiny", min(duration, 300), reference_files  # Limit to first 5 minutes
+                video_file, "tiny.en", min(duration, 300), reference_files  # Limit to first 5 minutes
             )
             if match and match["confidence"] > 0.65:  # Slightly lower threshold for tiny
                 logger.info(
@@ -255,10 +267,10 @@ class EpisodeMatcher:
             # If no match, try base model
             logger.info(
-                "No match with tiny model, extending base model search to 10 minutes..."
+                "No match with tiny model, extending base model search to 5 minutes..."
             )
             match = self._try_match_with_model(
-                video_file, "base", min(duration, 600), reference_files  # Limit to first 10 minutes
+                video_file, "base.en", min(duration, 300), reference_files  # Limit to first 5 minutes
             )
             if match:
                 logger.info(

{mkv_episode_matcher-0.8.0.dist-info → mkv_episode_matcher-0.8.1.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: mkv-episode-matcher
-Version: 0.8.0
+Version: 0.8.1
 Summary: The MKV Episode Matcher is a tool for identifying TV series episodes from MKV files and renaming the files accordingly.
 Home-page: https://github.com/Jsakkos/mkv-episode-matcher
 Author: Jonathan Sakkos

{mkv_episode_matcher-0.8.0.dist-info → mkv_episode_matcher-0.8.1.dist-info}/RECORD RENAMED Viewed

@@ -2,13 +2,13 @@ mkv_episode_matcher/.gitattributes,sha256=Gh2-F2vCM7SZ01pX23UT8pQcmauXWfF3gwyRSb
 mkv_episode_matcher/__init__.py,sha256=u3yZcpuK0ICeUjxYKePvW-zS61E5ss5q2AvqnSHuz9E,240
 mkv_episode_matcher/__main__.py,sha256=O3GQk5R9BFuA-QNlqfBgDSS7G_W8IGSxiV8CFUbcaLc,10059
 mkv_episode_matcher/config.py,sha256=EcJJjkekQ7oWtarUkufCYON_QWbQvq55-zMqCTOqSa4,2265
-mkv_episode_matcher/episode_identification.py,sha256=IMB1m3-oY4Z31XIWCFjpdXDENwmKMgzjctl3CilthJ4,15926
+mkv_episode_matcher/episode_identification.py,sha256=xH5HIa6oC4nXhlqzdqQn1XYQFNUrnbUVlW-R9RsBHq4,16745
 mkv_episode_matcher/episode_matcher.py,sha256=SxAbnXuTJITD1o0WohE9heE3Fm9zW_w0Nq3GzqtcIpQ,6329
 mkv_episode_matcher/subtitle_utils.py,sha256=Hz9b4CKPV07YKTY4dcN3WbvdbvH-S3J4zcb9CiyvPlE,2551
 mkv_episode_matcher/tmdb_client.py,sha256=LbMCgjmp7sCbrQo_CDlpcnryKPz5S7inE24YY9Pyjk4,4172
 mkv_episode_matcher/utils.py,sha256=modXMLmt2fpny8liXwqe4ylxnwwfg_98OLOacv5izps,14501
-mkv_episode_matcher-0.8.0.dist-info/METADATA,sha256=TcH5g5UfyJop2ZV_tWShEm4O28EkVGLlcpOXbG74mjI,5384
-mkv_episode_matcher-0.8.0.dist-info/WHEEL,sha256=7ciDxtlje1X8OhobNuGgi1t-ACdFSelPnSmDPrtlobY,91
-mkv_episode_matcher-0.8.0.dist-info/entry_points.txt,sha256=IglJ43SuCZq2eQ3shMFILCkmQASJHnDCI3ogohW2Hn4,64
-mkv_episode_matcher-0.8.0.dist-info/top_level.txt,sha256=XRLbd93HUaedeWLtkyTvQjFcE5QcBRYa3V-CfHrq-OI,20
-mkv_episode_matcher-0.8.0.dist-info/RECORD,,
+mkv_episode_matcher-0.8.1.dist-info/METADATA,sha256=JpSdL1OU5UwQb6aPARqV9YzQWtoEdmoJZkmw_7FcUwM,5384
+mkv_episode_matcher-0.8.1.dist-info/WHEEL,sha256=zaaOINJESkSfm_4HQVc5ssNzHCPXhJm0kEUakpsEHaU,91
+mkv_episode_matcher-0.8.1.dist-info/entry_points.txt,sha256=IglJ43SuCZq2eQ3shMFILCkmQASJHnDCI3ogohW2Hn4,64
+mkv_episode_matcher-0.8.1.dist-info/top_level.txt,sha256=XRLbd93HUaedeWLtkyTvQjFcE5QcBRYa3V-CfHrq-OI,20
+mkv_episode_matcher-0.8.1.dist-info/RECORD,,

{mkv_episode_matcher-0.8.0.dist-info → mkv_episode_matcher-0.8.1.dist-info}/WHEEL RENAMED Viewed

@@ -1,5 +1,5 @@
 Wheel-Version: 1.0
-Generator: setuptools (80.2.0)
+Generator: setuptools (80.8.0)
 Root-Is-Purelib: true
 Tag: py3-none-any

{mkv_episode_matcher-0.8.0.dist-info → mkv_episode_matcher-0.8.1.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{mkv_episode_matcher-0.8.0.dist-info → mkv_episode_matcher-0.8.1.dist-info}/top_level.txt RENAMED Viewed

File without changes

mkv-episode-matcher 0.8.0__py3-none-any.whl → 0.8.1__py3-none-any.whl

Potentially problematic release.

mkv-episode-matcher 0.8.0__py3-none-any.whl → 0.8.1__py3-none-any.whl