PyPI - GameSentenceMiner - Versions diffs - 2.8.54__py3-none-any.whl → 2.9.1__py3-none-any.whl - Mend

GameSentenceMiner 2.8.54__py3-none-any.whl → 2.9.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (26) hide show

GameSentenceMiner/anki.py +1 -1
GameSentenceMiner/communication/websocket.py +7 -0
GameSentenceMiner/config_gui.py +63 -20
GameSentenceMiner/configuration.py +69 -3
GameSentenceMiner/ffmpeg.py +2 -2
GameSentenceMiner/gametext.py +71 -62
GameSentenceMiner/gsm.py +108 -55
GameSentenceMiner/obs.py +2 -2
GameSentenceMiner/ocr/owocr_helper.py +17 -25
GameSentenceMiner/owocr/owocr/ocr.py +4 -3
GameSentenceMiner/text_log.py +1 -1
GameSentenceMiner/vad/groq_trim.py +82 -0
GameSentenceMiner/vad/result.py +15 -2
GameSentenceMiner/vad/silero_trim.py +14 -10
GameSentenceMiner/vad/vad_utils.py +13 -0
GameSentenceMiner/vad/vosk_helper.py +2 -2
GameSentenceMiner/vad/whisper_helper.py +8 -7
GameSentenceMiner/web/templates/index.html +49 -0
GameSentenceMiner/web/templates/utility.html +2 -2
GameSentenceMiner/web/texthooking_page.py +54 -32
{gamesentenceminer-2.8.54.dist-info → gamesentenceminer-2.9.1.dist-info}/METADATA +4 -1
{gamesentenceminer-2.8.54.dist-info → gamesentenceminer-2.9.1.dist-info}/RECORD +26 -23
{gamesentenceminer-2.8.54.dist-info → gamesentenceminer-2.9.1.dist-info}/WHEEL +1 -1
{gamesentenceminer-2.8.54.dist-info → gamesentenceminer-2.9.1.dist-info}/entry_points.txt +0 -0
{gamesentenceminer-2.8.54.dist-info → gamesentenceminer-2.9.1.dist-info}/licenses/LICENSE +0 -0
{gamesentenceminer-2.8.54.dist-info → gamesentenceminer-2.9.1.dist-info}/top_level.txt +0 -0

GameSentenceMiner/vad/whisper_helper.py CHANGED Viewed

@@ -2,6 +2,7 @@ import tempfile
 import warnings
 import stable_whisper as whisper
+import torch
 from stable_whisper import WhisperResult
 from GameSentenceMiner  import configuration, ffmpeg
@@ -16,10 +17,9 @@ whisper_model = None
 def load_whisper_model():
     global whisper_model
     if whisper_model is None:
-        logger.info(f"Loading Whisper model '{get_config().vad.whisper_model}'... This may take a while.")
         with warnings.catch_warnings(action="ignore"):
             whisper_model = whisper.load_model(get_config().vad.whisper_model)
-        logger.info("Whisper model loaded.")
+        logger.info(f"Whisper model '{get_config().vad.whisper_model}' loaded.")
 # Use Whisper to detect voice activity with timestamps in the audio
@@ -35,8 +35,7 @@ def detect_voice_with_whisper(input_audio):
     # Transcribe the audio using Whisper
     with warnings.catch_warnings(action="ignore"):
-        result: WhisperResult = whisper_model.transcribe(temp_wav, vad=True, language='ja')
+        result: WhisperResult = whisper_model.transcribe(temp_wav, vad=True, language=get_config().vad.language, temperature=0.0)
     voice_activity = []
     logger.debug(result.to_dict())
@@ -75,7 +74,7 @@ def process_audio_with_whisper(input_audio, output_audio, game_line):
     if not voice_activity:
         logger.info("No voice activity detected in the audio.")
-        return VADResult(False, 0, 0)
+        return VADResult(False, 0, 0, WHISPER)
     # Trim based on the first and last speech detected
     start_time = voice_activity[0]['start'] if voice_activity else 0
@@ -95,10 +94,12 @@ def process_audio_with_whisper(input_audio, output_audio, game_line):
     # Trim the audio using FFmpeg
     ffmpeg.trim_audio(input_audio, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, output_audio)
-    return VADResult(True, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset)
+    return VADResult(True, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, WHISPER)
 # Load Whisper model initially
 def initialize_whisper_model():
     load_whisper_model()
-    logger.info(f"Using Whisper model '{get_config().vad.whisper_model}' for Japanese voice detection")
+# initialize_whisper_model()
+# process_audio_with_whisper("tmp6x81cy27.opus", "tmp6x81cy27_trimmed.opus", None)

GameSentenceMiner 2.8.54__py3-none-any.whl → 2.9.1__py3-none-any.whl

GameSentenceMiner 2.8.54__py3-none-any.whl → 2.9.1__py3-none-any.whl