PyPI - GameSentenceMiner - Versions diffs - 2.18.7__py3-none-any.whl → 2.18.9__py3-none-any.whl - Mend

GameSentenceMiner 2.18.7__py3-none-any.whl → 2.18.9__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (8) hide show

GameSentenceMiner/ui/anki_confirmation.py CHANGED Viewed

@@ -1,14 +1,18 @@
 import tkinter as tk
 from tkinter import scrolledtext
+from tkinter import messagebox
 from PIL import Image, ImageTk
 import ttkbootstrap as ttk
-from GameSentenceMiner.util.configuration import get_config, logger, gsm_state
+from GameSentenceMiner.util.configuration import get_config, logger, gsm_state, get_temporary_directory
 from GameSentenceMiner.util.audio_player import AudioPlayer
+from GameSentenceMiner.util.gsm_utils import make_unique_file_name
 import platform
 import subprocess
 import os
+import requests
+from urllib.parse import quote
 class AnkiConfirmationDialog(tk.Toplevel):
     """
@@ -18,13 +22,20 @@ class AnkiConfirmationDialog(tk.Toplevel):
         super().__init__(parent)
         self.config_app = config_app
         self.screenshot_timestamp = screenshot_timestamp
+        self.translation_text = None
+        self.sentence_text = None
+        self.sentence = sentence  # Store sentence text for TTS
         # Initialize screenshot_path here, will be updated by button if needed
-        self.screenshot_path = screenshot_path
+        self.screenshot_path = screenshot_path
+        self.audio_path = audio_path  # Store audio path so it can be updated
         # Audio player management
         self.audio_player = AudioPlayer(finished_callback=self._audio_finished)
         self.audio_button = None  # Store reference to audio button
+        self.audio_path_label = None  # Store reference to audio path label
+        self.tts_button = None  # Store reference to TTS button
+        self.tts_status_label = None  # Store reference to TTS status label
         self.title("Confirm Anki Card Details")
         self.result = None  # This will store the user's choice
@@ -121,18 +132,36 @@ class AnkiConfirmationDialog(tk.Toplevel):
         # Audio Path
         if audio_path and os.path.isfile(audio_path):
             ttk.Label(main_frame, text="Audio Path:", font=("-weight bold")).grid(row=row, column=0, sticky="ne", padx=5, pady=2)
-            ttk.Label(main_frame, text=audio_path if audio_path else "No Audio", wraplength=400, justify="left").grid(row=row, column=1, sticky="w", padx=5, pady=2)
+            self.audio_path_label = ttk.Label(main_frame, text=audio_path if audio_path else "No Audio", wraplength=400, justify="left")
+            self.audio_path_label.grid(row=row, column=1, sticky="w", padx=5, pady=2)
             if audio_path and os.path.isfile(audio_path):
                 self.audio_button = ttk.Button(
-                    main_frame,
-                    text="▶",
-                    command=lambda: self._play_audio(audio_path),
+                    main_frame,
+                    text="▶",
+                    command=lambda: self._play_audio(self.audio_path),
                     bootstyle="outline-info",
                     width=12
                 )
                 self.audio_button.grid(row=row, column=2, sticky="w", padx=5, pady=2)
             row += 1
+            # TTS Button - only show if TTS is enabled in config
+            if get_config().vad.use_tts_as_fallback and sentence:
+                self.tts_button = ttk.Button(
+                    main_frame,
+                    text="🔊 Generate TTS Audio",
+                    command=self._generate_tts_audio,
+                    bootstyle="info",
+                    width=20
+                )
+                self.tts_button.grid(row=row, column=1, sticky="w", padx=5, pady=2)
+                # TTS Status Label
+                self.tts_status_label = ttk.Label(main_frame, text="", foreground="green")
+                self.tts_status_label.grid(row=row, column=2, sticky="w", padx=5, pady=2)
+                row += 1
         # Action Buttons
         button_frame = ttk.Frame(main_frame)
@@ -213,6 +242,72 @@ class AnkiConfirmationDialog(tk.Toplevel):
             else:
                 self.audio_button.config(text="▶ Play Audio", bootstyle="outline-info")
+    def _generate_tts_audio(self):
+        """Generate TTS audio from the sentence text"""
+        try:
+            # Get the current sentence text from the widget
+            sentence_text = self.sentence_text.get("1.0", tk.END).strip()
+            if not sentence_text:
+                messagebox.showerror("TTS Error", "No sentence text available for TTS generation.")
+                return
+            # URL-encode the sentence text
+            encoded_text = quote(sentence_text)
+            # Build the TTS URL by replacing $s with the encoded text
+            tts_url = get_config().vad.tts_url.replace("$s", encoded_text)
+            logger.info(f"Fetching TTS audio from: {tts_url}")
+            # Fetch TTS audio from the URL
+            response = requests.get(tts_url, timeout=10)
+            if not response.ok:
+                error_msg = f"Failed to fetch TTS audio: HTTP {response.status_code}"
+                logger.error(error_msg)
+                messagebox.showerror("TTS Error", f"{error_msg}\n\nIs your TTS service running?")
+                return
+            # Save TTS audio to GSM temporary directory with game name
+            game_name = gsm_state.current_game if gsm_state.current_game else "tts"
+            filename = f"{game_name}_tts_audio.opus"
+            tts_audio_path = make_unique_file_name(
+                os.path.join(get_temporary_directory(), filename)
+            )
+            with open(tts_audio_path, 'wb') as f:
+                f.write(response.content)
+            logger.info(f"TTS audio saved to: {tts_audio_path}")
+            # Update the audio path
+            self.audio_path = tts_audio_path
+            # Update the audio path label
+            if self.audio_path_label:
+                self.audio_path_label.config(text=tts_audio_path)
+            # Update the audio button command to use the new path
+            if self.audio_button:
+                self.audio_button.config(command=lambda: self._play_audio(self.audio_path))
+            # Update status label to show success
+            if self.tts_status_label:
+                self.tts_status_label.config(text="✓ TTS Audio Generated", foreground="green")
+        except requests.exceptions.Timeout:
+            error_msg = "TTS request timed out. Please check if your TTS service is running."
+            logger.error(error_msg)
+            messagebox.showerror("TTS Error", error_msg)
+        except requests.exceptions.RequestException as e:
+            error_msg = f"Failed to connect to TTS service: {str(e)}"
+            logger.error(error_msg)
+            messagebox.showerror("TTS Error", f"{error_msg}\n\nPlease check your TTS URL configuration.")
+        except Exception as e:
+            error_msg = f"Unexpected error generating TTS: {str(e)}"
+            logger.error(error_msg)
+            messagebox.showerror("TTS Error", error_msg)
     def _cleanup_audio(self):
         """Clean up audio stream resources"""
         self.audio_player.cleanup()
@@ -226,13 +321,13 @@ class AnkiConfirmationDialog(tk.Toplevel):
         # Clean up audio before closing
         self._cleanup_audio()
         # The screenshot_path is now correctly updated if the user chose a new one
-        self.result = (True, self.sentence_text.get("1.0", tk.END).strip(), self.translation_text.get("1.0", tk.END).strip(), self.screenshot_path)
+        self.result = (True, self.sentence_text.get("1.0", tk.END).strip(), self.translation_text.get("1.0", tk.END).strip() if self.translation_text else None, self.screenshot_path)
         self.destroy()
     def _on_no_voice(self):
         # Clean up audio before closing
         self._cleanup_audio()
-        self.result = (False, self.sentence_text.get("1.0", tk.END).strip(), self.translation_text.get("1.0", tk.END).strip(), self.screenshot_path)
+        self.result = (False, self.sentence_text.get("1.0", tk.END).strip(), self.translation_text.get("1.0", tk.END).strip() if self.translation_text else None, self.screenshot_path)
         self.destroy()
     def _on_cancel(self):

GameSentenceMiner/util/get_overlay_coords.py CHANGED Viewed

@@ -106,10 +106,10 @@ class OverlayThread(threading.Thread):
         while True:
             if overlay_server_thread.has_clients():
                 if get_config().overlay.periodic:
-                    await self.overlay_processor.find_box_and_send_to_overlay('')
+                    await self.overlay_processor.find_box_and_send_to_overlay('', True)
                     await asyncio.sleep(get_config().overlay.periodic_interval)
                 elif self.first_time_run:
-                    await self.overlay_processor.find_box_and_send_to_overlay('')
+                    await self.overlay_processor.find_box_and_send_to_overlay('', False)
                     self.first_time_run = False
                 else:
                     await asyncio.sleep(3)
@@ -161,7 +161,7 @@ class OverlayProcessor:
             self.lens = None
             self.regex = None
-    async def find_box_and_send_to_overlay(self, sentence_to_check: str = None):
+    async def find_box_and_send_to_overlay(self, sentence_to_check: str = None, check_against_last: bool = False):
         """
         Sends the detected text boxes to the overlay via WebSocket.
         Cancels any running OCR task before starting a new one.
@@ -175,7 +175,7 @@ class OverlayProcessor:
                 logger.info("Previous OCR task was cancelled")
         # Start new task
-        self.current_task = asyncio.create_task(self.find_box_for_sentence(sentence_to_check))
+        self.current_task = asyncio.create_task(self.find_box_for_sentence(sentence_to_check, check_against_last))
         try:
             await self.current_task
         except asyncio.CancelledError:
@@ -183,7 +183,7 @@ class OverlayProcessor:
         # logger.info(f"Sending {len(boxes)} boxes to overlay.")
         # await send_word_coordinates_to_overlay(boxes)
-    async def find_box_for_sentence(self, sentence_to_check: str = None) -> List[Dict[str, Any]]:
+    async def find_box_for_sentence(self, sentence_to_check: str = None, check_against_last: bool = False) -> List[Dict[str, Any]]:
         """
         Public method to perform OCR and find text boxes for a given sentence.
@@ -191,7 +191,7 @@ class OverlayProcessor:
         error handling.
         """
         try:
-            return await self._do_work(sentence_to_check)
+            return await self._do_work(sentence_to_check, check_against_last=check_against_last)
         except Exception as e:
             logger.error(f"Error during OCR processing: {e}", exc_info=True)
             return []
@@ -304,7 +304,7 @@ class OverlayProcessor:
         return composite_img
-    async def _do_work(self, sentence_to_check: str = None) -> Tuple[List[Dict[str, Any]], int]:
+    async def _do_work(self, sentence_to_check: str = None, check_against_last: bool = False) -> Tuple[List[Dict[str, Any]], int]:
         """The main OCR workflow with cancellation support."""
         if not self.lens:
             logger.error("OCR engines are not initialized. Cannot perform OCR for Overlay.")
@@ -348,7 +348,7 @@ class OverlayProcessor:
             text_str = "".join([text for text in text if self.regex.match(text)])
             # RapidFuzz fuzzy match 90% to not send the same results repeatedly
-            if self.last_oneocr_result:
+            if self.last_oneocr_result and check_against_last:
                 score = fuzz.ratio(text_str, self.last_oneocr_result)
                 if score >= 80:
@@ -403,7 +403,7 @@ class OverlayProcessor:
         text_str = "".join([text for text in text_list if self.regex.match(text)])
         # RapidFuzz fuzzy match 90% to not send the same results repeatedly
-        if self.last_lens_result:
+        if self.last_lens_result and check_against_last:
             score = fuzz.ratio(text_str, self.last_lens_result)
             if score >= 80:
                 logger.info("Google Lens results are similar to the last results (score: %d). Skipping overlay update.", score)
@@ -596,7 +596,7 @@ async def main_run_ocr():
     """
     overlay_processor = OverlayProcessor()
     while True:
-        await overlay_processor.find_box_and_send_to_overlay('')
+        await overlay_processor.find_box_and_send_to_overlay('', False)
         await asyncio.sleep(10)

{gamesentenceminer-2.18.7.dist-info → gamesentenceminer-2.18.9.dist-info}/METADATA RENAMED Viewed

@@ -1,6 +1,6 @@
 Metadata-Version: 2.4
 Name: GameSentenceMiner
-Version: 2.18.7
+Version: 2.18.9
 Summary: A tool for mining sentences from games. Update: Overlay?
 Author-email: Beangate <bpwhelan95@gmail.com>
 License: MIT License

{gamesentenceminer-2.18.7.dist-info → gamesentenceminer-2.18.9.dist-info}/RECORD RENAMED Viewed

@@ -36,7 +36,7 @@ GameSentenceMiner/tools/furigana_filter_preview.py,sha256=BXv7FChPEJW_VeG5XYt6su
 GameSentenceMiner/tools/ss_selector.py,sha256=ob2oJdiYreDMMau7CvsglpnhZ1CDnJqop3lV54-PjRo,4782
 GameSentenceMiner/tools/window_transparency.py,sha256=GtbxbmZg0-UYPXhfHff-7IKZyY2DKe4B9GdyovfmpeM,8166
 GameSentenceMiner/ui/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/ui/anki_confirmation.py,sha256=fAPdZ_nfpSCuhLBim7jpHNXCnlODWwQs-c8qAS-brwU,10699
+GameSentenceMiner/ui/anki_confirmation.py,sha256=ohpWlPTvKn-_5_lpINdKZciR0k8RWRfnDrfuzyJgItc,15242
 GameSentenceMiner/ui/config_gui.py,sha256=4baqfL33oMshmqm903GZok32Y4JIEV-3K9gf5gxAJDU,152131
 GameSentenceMiner/ui/screenshot_selector.py,sha256=AKML87MpgYQeSuj1F10GngpNrn9qp06zLLzNRwrQWM8,8900
 GameSentenceMiner/util/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
@@ -45,7 +45,7 @@ GameSentenceMiner/util/configuration.py,sha256=lwo73S3xnIMPq8lWSWM6N0pd08A4-Jvre
 GameSentenceMiner/util/db.py,sha256=1DjGjlwWnPefmQfzvMqqFPW0a0qeO-fIXE1YqKiok18,32000
 GameSentenceMiner/util/electron_config.py,sha256=KfeJToeFFVw0IR5MKa-gBzpzaGrU-lyJbR9z-sDEHYU,8767
 GameSentenceMiner/util/ffmpeg.py,sha256=cAzztfY36Xf2WvsJDjavoiMOvA9ac2GVdCrSB4LzHk4,29007
-GameSentenceMiner/util/get_overlay_coords.py,sha256=4V04RNVSIoiGrxRbYgzec2r29L8s7kmOjI_tuwfjLhI,24592
+GameSentenceMiner/util/get_overlay_coords.py,sha256=MFl_JOjwzD0D0iZBPcq5Dgy32YPMKqRrugL0WsfMEu4,24819
 GameSentenceMiner/util/gsm_utils.py,sha256=mASECTmN10c2yPL4NEfLg0Y0YWwFso1i6r_hhJPR3MY,10974
 GameSentenceMiner/util/model.py,sha256=R-_RYTYLSDNgBoVTPuPBcIHeOznIqi_vBzQ7VQ20WYk,6727
 GameSentenceMiner/util/notification.py,sha256=YBhf_mSo_i3cjBz-pmeTPx3wchKiG9BK2VBdZSa2prQ,4597
@@ -125,9 +125,9 @@ GameSentenceMiner/web/templates/components/kanji_grid/thousand_character_classic
 GameSentenceMiner/web/templates/components/kanji_grid/wanikani_levels.json,sha256=8wjnnaYQqmho6t5tMxrIAc03512A2tYhQh5dfsQnfAM,11372
 GameSentenceMiner/web/templates/components/kanji_grid/words_hk_frequency_list.json,sha256=wRkqZNPzz6DT9OTPHpXwfqW96Qb96stCQNNgOL-ZdKk,17535
 GameSentenceMiner/wip/__init___.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-gamesentenceminer-2.18.7.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
-gamesentenceminer-2.18.7.dist-info/METADATA,sha256=tSdKTLxo7GQEm-9Zea4mSZs_2Z1unk-1jPRF3BXEM_Q,7487
-gamesentenceminer-2.18.7.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
-gamesentenceminer-2.18.7.dist-info/entry_points.txt,sha256=2APEP25DbfjSxGeHtwBstMH8mulVhLkqF_b9bqzU6vQ,65
-gamesentenceminer-2.18.7.dist-info/top_level.txt,sha256=V1hUY6xVSyUEohb0uDoN4UIE6rUZ_JYx8yMyPGX4PgQ,18
-gamesentenceminer-2.18.7.dist-info/RECORD,,
+gamesentenceminer-2.18.9.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
+gamesentenceminer-2.18.9.dist-info/METADATA,sha256=4CeXXcMgBMAwMH_61VDFQWr_xyt-5Fg4XDsQ2sfJA6s,7487
+gamesentenceminer-2.18.9.dist-info/WHEEL,sha256=_zCd3N1l69ArxyTb8rzEoP9TpbYXkqRFSNOD5OuxnTs,91
+gamesentenceminer-2.18.9.dist-info/entry_points.txt,sha256=2APEP25DbfjSxGeHtwBstMH8mulVhLkqF_b9bqzU6vQ,65
+gamesentenceminer-2.18.9.dist-info/top_level.txt,sha256=V1hUY6xVSyUEohb0uDoN4UIE6rUZ_JYx8yMyPGX4PgQ,18
+gamesentenceminer-2.18.9.dist-info/RECORD,,

{gamesentenceminer-2.18.7.dist-info → gamesentenceminer-2.18.9.dist-info}/WHEEL RENAMED Viewed

File without changes

{gamesentenceminer-2.18.7.dist-info → gamesentenceminer-2.18.9.dist-info}/entry_points.txt RENAMED Viewed

File without changes

{gamesentenceminer-2.18.7.dist-info → gamesentenceminer-2.18.9.dist-info}/licenses/LICENSE RENAMED Viewed

File without changes

{gamesentenceminer-2.18.7.dist-info → gamesentenceminer-2.18.9.dist-info}/top_level.txt RENAMED Viewed

File without changes

GameSentenceMiner 2.18.7__py3-none-any.whl → 2.18.9__py3-none-any.whl

GameSentenceMiner 2.18.7__py3-none-any.whl → 2.18.9__py3-none-any.whl