PyPI - GameSentenceMiner - Versions diffs - 2.9.4__py3-none-any.whl → 2.9.6__py3-none-any.whl - Mend

GameSentenceMiner 2.9.4__py3-none-any.whl → 2.9.6__py3-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (42) hide show

gamesentenceminer-2.9.6.dist-info/RECORD ADDED Viewed

@@ -0,0 +1,67 @@
+GameSentenceMiner/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/anki.py,sha256=CuzVqzuFtZnbMbU2Zk-sxNGwSgyCpv5RLL7lOOX0Meg,14972
+GameSentenceMiner/config_gui.py,sha256=r-ASCXVNS4Io6Ej3svwC8aJEWc9Rc7u-pzfsAwD4ru8,82079
+GameSentenceMiner/gametext.py,sha256=mM-gw1d7c2EEvMUznaAevTQFLswNZavCuxMXhA9pV4g,6251
+GameSentenceMiner/gsm.py,sha256=SHvT3JZlYpZgKeJnVXrtk8ve4ubiM7YPv-9FDF7rVM4,27724
+GameSentenceMiner/obs.py,sha256=jdAKQFnXlviMupRUKBuK68Q1u8yEZNKBgFnvIq1hhnc,14810
+GameSentenceMiner/vad.py,sha256=Gk_VthD7mDp3-wM_S6bEv8ykGmqzCDbbcRiaEBzAE_o,14835
+GameSentenceMiner/ai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/ai/ai_prompting.py,sha256=tPDiTHlrfZul0hlvEFgZS4V_6oaHkVb-4v79Sd4gtlM,10018
+GameSentenceMiner/assets/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/assets/icon.png,sha256=9GRL8uXUAgkUSlvbm9Pv9o2poFVRGdW6s2ub_DeUD9M,937624
+GameSentenceMiner/assets/icon128.png,sha256=l90j7biwdz5ahwOd5wZ-406ryEV9Pan93dquJQ3e1CI,18395
+GameSentenceMiner/assets/icon256.png,sha256=JEW46wOrG1KR-907rvFaEdNbPtj5gu0HJmG7qUnIHxQ,51874
+GameSentenceMiner/assets/icon32.png,sha256=Kww0hU_qke9_22wBuO_Nq0Dv2SfnOLwMhCyGgbgXdg8,6089
+GameSentenceMiner/assets/icon512.png,sha256=HxUj2GHjyQsk8NV433256UxU9phPhtjCY-YB_7W4sqs,192487
+GameSentenceMiner/assets/icon64.png,sha256=N8xgdZXvhqVQP9QUK3wX5iqxX9LxHljD7c-Bmgim6tM,9301
+GameSentenceMiner/assets/pickaxe.png,sha256=VfIGyXyIZdzEnVcc4PmG3wszPMO1W4KCT7Q_nFK6eSE,1403829
+GameSentenceMiner/ocr/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/ocr/gsm_ocr_config.py,sha256=fEQ2o2NXksGRHpueO8c4TfAp75GEdAtAr1ngTFOsdpg,2257
+GameSentenceMiner/ocr/ocrconfig.py,sha256=_tY8mjnzHMJrLS8E5pHqYXZjMuLoGKYgJwdhYgN-ny4,6466
+GameSentenceMiner/ocr/owocr_area_selector.py,sha256=71trzwz9Isyy-kN9mLS8vIX-giC8Lkin4slLXaxudac,47162
+GameSentenceMiner/ocr/owocr_helper.py,sha256=FQXk5PSCS9gWtcgoIFsPxjVELUwA4Dg1hEX83902K0Q,18114
+GameSentenceMiner/owocr/owocr/__init__.py,sha256=opjBOyGGyEqZCE6YdZPnyt7nVfiwyELHsXA0jAsjm14,25
+GameSentenceMiner/owocr/owocr/__main__.py,sha256=XQaqZY99EKoCpU-gWQjNbTs7Kg17HvBVE7JY8LqIE0o,157
+GameSentenceMiner/owocr/owocr/config.py,sha256=qM7kISHdUhuygGXOxmgU6Ef2nwBShrZtdqu4InDCViE,8103
+GameSentenceMiner/owocr/owocr/lens_betterproto.py,sha256=oNoISsPilVVRBBPVDtb4-roJtAhp8ZAuFTci3TGXtMc,39141
+GameSentenceMiner/owocr/owocr/ocr.py,sha256=y8RHHaJw8M4BG4CbbtIw0DrV8KP9RjbJNJxjM5v91oU,42236
+GameSentenceMiner/owocr/owocr/run.py,sha256=jFN7gYYriHgfqORJiBTz8mPkQsDJ6ZugA0_ATWUxk-U,54750
+GameSentenceMiner/owocr/owocr/screen_coordinate_picker.py,sha256=Na6XStbQBtpQUSdbN3QhEswtKuU1JjReFk_K8t5ezQE,3395
+GameSentenceMiner/util/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/util/configuration.py,sha256=Qk5V4HA2FJbdMTa9jYZfNVQ_4rzvjbUtJgPejwQ3vwk,25856
+GameSentenceMiner/util/electron_config.py,sha256=ZZf54QifdNHbII-JDsMZmdT8nTyrq-7gVvalyLRecfw,9792
+GameSentenceMiner/util/ffmpeg.py,sha256=qaCXkfK2fd-1NRqbm7burrdBYgnGx07kBuyenee8Mtk,18697
+GameSentenceMiner/util/gsm_utils.py,sha256=RoOTvWCVpmfYA7fLDdIPcgH1c6TZK4jDZq98BectPhg,8272
+GameSentenceMiner/util/model.py,sha256=iDtLTfR6D-ZC0gCiDqYno6-gA6Z07PZTM4B5MAA6xZI,5704
+GameSentenceMiner/util/notification.py,sha256=euTnnNDJm0izr0Z5AhZGV2wrrioCASeKUtm5aZFO5zU,3462
+GameSentenceMiner/util/package.py,sha256=u1ym5z869lw5EHvIviC9h9uH97bzUXSXXA8KIn8rUvk,1157
+GameSentenceMiner/util/ss_selector.py,sha256=ATgwDXi4-TLv0hB21NV79FZnXgidiM0z7TgvO7eBnhw,4472
+GameSentenceMiner/util/text_log.py,sha256=XOq8tpJUpNa-mKJPui40P5aUTX2yzMHPnHgJ2obagw0,5201
+GameSentenceMiner/util/communication/__init__.py,sha256=xh__yn2MhzXi9eLi89PeZWlJPn-cbBSjskhi1BRraXg,643
+GameSentenceMiner/util/communication/send.py,sha256=Wki9qIY2CgYnuHbmnyKVIYkcKAN_oYS4up93XMikBaI,222
+GameSentenceMiner/util/communication/websocket.py,sha256=gPgxA2R2U6QZJjPqbUgODC87gtacPhmuC8lCprIkSmA,3287
+GameSentenceMiner/util/downloader/Untitled_json.py,sha256=RUUl2bbbCpUDUUS0fP0tdvf5FngZ7ILdA_J5TFYAXUQ,15272
+GameSentenceMiner/util/downloader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/util/downloader/download_tools.py,sha256=mvnOjDHFlV1AbjHaNI7mdnC5_CH5k3N4n1ezqzzbzGA,8139
+GameSentenceMiner/util/downloader/oneocr_dl.py,sha256=o3ANp5IodEQoQ8GPcJdg9Y8JzA_lictwnebFPwwUZVk,10144
+GameSentenceMiner/web/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/web/texthooking_page.py,sha256=RR70Vgde3wNHarQHbB-LBbEP-z95vRD5rtlW0GgdjmQ,15037
+GameSentenceMiner/web/static/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/web/static/apple-touch-icon.png,sha256=OcMI8af_68DA_tweOsQ5LytTyMwm7-hPW07IfrOVgEs,46132
+GameSentenceMiner/web/static/favicon-96x96.png,sha256=lOePzjiKl1JY2J1kT_PMdyEnrlJmi5GWbmXJunM12B4,16502
+GameSentenceMiner/web/static/favicon.ico,sha256=7d25r_FBqRSNsAoEHpSzNoT7zyVt2DJRLNDNq_HYoX8,15086
+GameSentenceMiner/web/static/favicon.svg,sha256=x305AP6WlXGtrXIZlaQspdLmwteoFYUoe5FyJ9MYlJ8,11517
+GameSentenceMiner/web/static/site.webmanifest,sha256=kaeNT-FjFt-T7JGzOhXH7YSqsrDeiplZ2kDxCN_CFU4,436
+GameSentenceMiner/web/static/style.css,sha256=bPZK0NVMuyRl5NNDuT7ZTzVLKlvSsdmeVHmAW4y5FM0,7001
+GameSentenceMiner/web/static/web-app-manifest-192x192.png,sha256=EfSNnBmsSaLfESbkGfYwbKzcjKOdzuWo18ABADfN974,51117
+GameSentenceMiner/web/static/web-app-manifest-512x512.png,sha256=wyqgCWCrLEUxSRXmaA3iJEESd-vM-ZmlTtZFBY4V8Pk,230819
+GameSentenceMiner/web/templates/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
+GameSentenceMiner/web/templates/index.html,sha256=HZKiIjiGJV8PGQ9T2aLDUNSfJn71qOwbYCjbRuSIjpY,213583
+GameSentenceMiner/web/templates/text_replacements.html,sha256=tV5c8mCaWSt_vKuUpbdbLAzXZ3ATZeDvQ9PnnAfqY0M,8598
+GameSentenceMiner/web/templates/utility.html,sha256=3flZinKNqUJ7pvrZk6xu__v67z44rXnaK7UTZ303R-8,16946
+gamesentenceminer-2.9.6.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
+gamesentenceminer-2.9.6.dist-info/METADATA,sha256=dXyoIXRhD6Qg7iCyRhGgoWjgR9PbS40yCmltnqTJZAA,7250
+gamesentenceminer-2.9.6.dist-info/WHEEL,sha256=zaaOINJESkSfm_4HQVc5ssNzHCPXhJm0kEUakpsEHaU,91
+gamesentenceminer-2.9.6.dist-info/entry_points.txt,sha256=2APEP25DbfjSxGeHtwBstMH8mulVhLkqF_b9bqzU6vQ,65
+gamesentenceminer-2.9.6.dist-info/top_level.txt,sha256=V1hUY6xVSyUEohb0uDoN4UIE6rUZ_JYx8yMyPGX4PgQ,18
+gamesentenceminer-2.9.6.dist-info/RECORD,,

GameSentenceMiner/vad/groq_trim.py DELETED Viewed

@@ -1,82 +0,0 @@
-import os
-import tempfile
-import time
-from groq import Groq
-# Assuming these are available from GameSentenceMiner
-from GameSentenceMiner import configuration, ffmpeg
-from GameSentenceMiner.configuration import get_config, logger, GROQ  # Import specific functions/objects
-from GameSentenceMiner.vad.result import VADResult
-from GameSentenceMiner.vad.vad_utils import get_audio_length
-# Initialize Groq Client
-client = Groq(api_key=get_config().ai.groq_api_key)
-def detect_voice_with_groq(input_audio_path):
-    """
-    Detects voice activity and extracts speech timestamps using the Groq Whisper API.
-    """
-    try:
-        with open(input_audio_path, "rb") as file:
-            transcription = client.audio.transcriptions.create(
-                file=(os.path.basename(input_audio_path), file.read()),
-                model="whisper-large-v3-turbo",
-                response_format="verbose_json",
-                language=get_config().vad.language,
-                temperature=0.0,
-                timestamp_granularities=["segment"],
-                prompt=f"Start detecting speech from the first spoken word. If there is music or background noise, ignore it completely. Be very careful to not hallucinate on silence. If the transcription is anything but language:{get_config().vad.language}, ignore it completely. If the end of the audio seems like the start of a new sentence, ignore it completely.",
-            )
-        logger.debug(transcription)
-        # print(transcription)
-        speech_segments = transcription.segments if hasattr(transcription, 'segments') else []
-        # print(f"Groq speech segments: {speech_segments}")
-        audio_length = get_audio_length(input_audio_path)
-        # print(f"FFPROBE Length of input audio: {audio_length}")
-        return speech_segments, audio_length
-    except Exception as e:
-        logger.error(f"Error detecting voice with Groq: {e}")
-        return [], 0.0
-def process_audio_with_groq(input_audio, output_audio, game_line):
-    """
-    Processes an audio file by detecting voice activity using Groq Whisper API,
-    trimming the audio based on detected speech timestamps, and saving the trimmed audio.
-    """
-    start = time.time()
-    voice_activity, audio_length = detect_voice_with_groq(input_audio)
-    logger.info(f"Processing time for Groq: {time.time() - start:.2f} seconds")
-    if not voice_activity:
-        logger.info(f"No voice activity detected in {input_audio}")
-        return VADResult(False, 0, 0, GROQ)
-    start_time = voice_activity[0]['start']
-    end_time = voice_activity[-1]['end']
-    # Logic to potentially use the second-to-last timestamp if a next game line is expected
-    # and there's a significant pause before the very last segment.
-    if (game_line and hasattr(game_line, 'next') and game_line.next and
-        len(voice_activity) > 1 and
-        (voice_activity[-1]['start'] - voice_activity[-2]['end']) > 3.0):
-        end_time = voice_activity[-2]['end']
-        logger.info("Using the second last timestamp for trimming due to game_line.next and significant pause.")
-    # Apply offsets from configuration, ensuring times are within valid bounds
-    final_start_time = max(0, start_time + get_config().vad.beginning_offset)
-    final_end_time = min(audio_length, end_time + get_config().audio.end_offset)
-    logger.debug(f"Trimming {input_audio} from {final_start_time:.2f}s to {final_end_time:.2f}s into {output_audio}")
-    ffmpeg.trim_audio(input_audio, final_start_time, final_end_time, output_audio)
-    return VADResult(True, final_start_time, final_end_time, GROQ)
-# Example usage (uncomment and modify with your actual file paths for testing)
-# process_audio_with_groq("tmp6x81cy27.opus", "tmp6x81cy27_trimmed_groq.opus", None)

GameSentenceMiner/vad/result.py DELETED Viewed

@@ -1,21 +0,0 @@
-from GameSentenceMiner.configuration import get_config
-class VADResult:
-    def __init__(self, success: bool, start: float, end: float, model: str):
-        self.success = success
-        self.start = start
-        self.end = end
-        self.model = model
-    def __repr__(self):
-        return f"VADResult(success={self.success}, start={self.start}, end={self.end}, model={self.model})"
-    def trim_successful_string(self):
-        if self.success:
-            if get_config().vad.trim_beginning:
-                return f"Trimmed audio from {self.start:.2f} to {self.end:.2f} seconds using {self.model}."
-            else:
-                return f"Trimmed end of audio to {self.end:.2f} seconds using {self.model}."
-        else:
-            return f"Failed to trim audio using {self.model}."

GameSentenceMiner/vad/silero_trim.py DELETED Viewed

@@ -1,52 +0,0 @@
-import tempfile
-from silero_vad import load_silero_vad, read_audio, get_speech_timestamps
-from GameSentenceMiner  import configuration, ffmpeg
-from GameSentenceMiner.configuration import *
-from GameSentenceMiner.vad.result import VADResult
-from GameSentenceMiner.vad.vad_utils import get_audio_length
-# Silero VAD setup
-vad_model = load_silero_vad()
-# Use Silero to detect voice activity with timestamps in the audio
-def detect_voice_with_silero(input_audio):
-    # Convert the audio to 16kHz mono WAV
-    temp_wav = tempfile.NamedTemporaryFile(dir=configuration.get_temporary_directory(), suffix='.wav').name
-    ffmpeg.convert_audio_to_wav(input_audio, temp_wav)
-    # Load the audio and detect speech timestamps
-    wav = read_audio(temp_wav)
-    speech_timestamps = get_speech_timestamps(wav, vad_model, return_seconds=True)
-    logger.debug(speech_timestamps)
-    # Return the speech timestamps (start and end in seconds)
-    return speech_timestamps, len(wav) / 16000
-# Example usage of Silero with trimming
-def process_audio_with_silero(input_audio, output_audio, game_line):
-    voice_activity, audio_length = detect_voice_with_silero(input_audio)
-    if not voice_activity:
-        return VADResult(False, 0, 0, SILERO)
-    # Trim based on the first and last speech detected
-    start_time = voice_activity[0]['start'] if voice_activity else 0
-    if game_line and game_line.next and len(voice_activity) > 1 and 0 > audio_length - voice_activity[-1]['start'] + get_config().audio.beginning_offset:
-    #         and (voice_activity[-1]['start'] - voice_activity[-2]['end']) > 3.0):
-            end_time = voice_activity[-2]['end']
-            logger.info("Using the second last timestamp for trimming")
-    else:
-        end_time = voice_activity[-1]['end'] if voice_activity else 0
-    # Trim the audio using FFmpeg
-    ffmpeg.trim_audio(input_audio, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, output_audio)
-    return VADResult(True, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, SILERO)
-# process_audio_with_silero("tmp6x81cy27.opus", "tmp6x81cy27_trimmed.opus", None)
-# print(detect_voice_with_silero("tmp6x81cy27.opus"))

GameSentenceMiner/vad/vad_utils.py DELETED Viewed

@@ -1,13 +0,0 @@
-import subprocess
-from GameSentenceMiner.ffmpeg import get_ffprobe_path
-def get_audio_length(path):
-    result = subprocess.run(
-        [get_ffprobe_path(), "-v", "error", "-show_entries", "format=duration", "-of", "default=noprint_wrappers=1:nokey=1", path],
-        stdout=subprocess.PIPE,
-        stderr=subprocess.PIPE,
-        text=True
-    )
-    return float(result.stdout.strip())

GameSentenceMiner/vad/vosk_helper.py DELETED Viewed

@@ -1,158 +0,0 @@
-import tarfile
-import tempfile
-import zipfile
-import numpy as np
-import requests
-import soundfile as sf
-import vosk
-from GameSentenceMiner  import configuration, ffmpeg
-from GameSentenceMiner.configuration import *
-from GameSentenceMiner.vad.result import VADResult
-ffmpeg_base_command_list = ["ffmpeg", "-hide_banner", "-loglevel", "error"]
-vosk.SetLogLevel(-1)
-vosk_model_path = ''
-vosk_model = None
-# Function to download and cache the Vosk model
-def download_and_cache_vosk_model(model_dir="vosk_model_cache"):
-    # Ensure the cache directory exists
-    if not os.path.exists(os.path.join(get_app_directory(), model_dir)):
-        os.makedirs(os.path.join(get_app_directory(), model_dir))
-    # Extract the model name from the URL
-    model_filename = get_config().vad.vosk_url.split("/")[-1]
-    model_path = os.path.join(get_app_directory(), model_dir, model_filename)
-    # If the model is already downloaded, skip the download
-    if not os.path.exists(model_path):
-        logger.info(
-            f"Downloading the Vosk model from {get_config().vad.vosk_url}... This will take a while if using large model, ~1G")
-        response = requests.get(get_config().vad.vosk_url, stream=True)
-        with open(model_path, "wb") as file:
-            for chunk in response.iter_content(chunk_size=8192):
-                if chunk:
-                    file.write(chunk)
-        logger.info("Download complete.")
-    # Extract the model if it's a zip or tar file
-    model_extract_path = os.path.join(get_app_directory(), model_dir, "vosk_model")
-    if not os.path.exists(model_extract_path):
-        logger.info("Extracting the Vosk model...")
-        if model_filename.endswith(".zip"):
-            with zipfile.ZipFile(model_path, "r") as zip_ref:
-                zip_ref.extractall(model_extract_path)
-        elif model_filename.endswith(".tar.gz"):
-            with tarfile.open(model_path, "r:gz") as tar_ref:
-                tar_ref.extractall(model_extract_path)
-        else:
-            logger.info("Unknown archive format. Model extraction skipped.")
-        logger.info(f"Model extracted to {model_extract_path}.")
-    else:
-        logger.info(f"Model already extracted at {model_extract_path}.")
-    # Return the path to the actual model folder inside the extraction directory
-    extracted_folders = os.listdir(model_extract_path)
-    if extracted_folders:
-        actual_model_folder = os.path.join(model_extract_path,
-                                           extracted_folders[0])  # Assuming the first folder is the model
-        return actual_model_folder
-    else:
-        return model_extract_path  # In case there's no subfolder, return the extraction path directly
-# Use Vosk to detect voice activity with timestamps in the audio
-def detect_voice_with_vosk(input_audio):
-    global vosk_model_path, vosk_model
-    # Convert the audio to 16kHz mono WAV
-    temp_wav = tempfile.NamedTemporaryFile(dir=configuration.get_temporary_directory(), suffix='.wav').name
-    ffmpeg.convert_audio_to_wav(input_audio, temp_wav)
-    if not vosk_model_path or not vosk_model:
-        vosk_model_path = download_and_cache_vosk_model()
-        vosk_model = vosk.Model(vosk_model_path)
-    # Open the audio file
-    with sf.SoundFile(temp_wav) as audio_file:
-        recognizer = vosk.KaldiRecognizer(vosk_model, audio_file.samplerate)
-        voice_activity = []
-        total_duration = len(audio_file) / audio_file.samplerate  # Get total duration in seconds
-        recognizer.SetWords(True)
-        # recognizer.SetPartialWords(True)
-        # Process audio in chunks
-        while True:
-            data = audio_file.buffer_read(4000, dtype='int16')
-            if len(data) == 0:
-                break
-            # Convert buffer to bytes using NumPy
-            data_bytes = np.frombuffer(data, dtype='int16').tobytes()
-            if recognizer.AcceptWaveform(data_bytes):
-                pass
-        final_result = json.loads(recognizer.FinalResult())
-        if 'result' in final_result:
-            should_use = False
-            unique_words = set()
-            for word in final_result['result']:
-                if word['conf'] >= .90:
-                    logger.debug(word)
-                    should_use = True
-                    unique_words.add(word['word'])
-            if len(unique_words) == 1 or all(item in ['えー', 'ん'] for item in unique_words):
-                should_use = False
-            if not should_use:
-                return None, 0
-            for word in final_result['result']:
-                voice_activity.append({
-                    'text': word['word'],
-                    'start': word['start'],
-                    'end': word['end']
-                })
-    # Return the detected voice activity and the total duration
-    return voice_activity, total_duration
-# Example usage of Vosk with trimming
-def process_audio_with_vosk(input_audio, output_audio, game_line):
-    voice_activity, total_duration = detect_voice_with_vosk(input_audio)
-    if not voice_activity:
-        logger.info("No voice activity detected in the audio.")
-        return VADResult(False, 0, 0, VOSK)
-    # Trim based on the first and last speech detected
-    start_time = voice_activity[0]['start'] if voice_activity else 0
-    # if (game_line.next and len(voice_activity) > 1
-    #         and voice_activity[-1]['start'] - get_config().audio.beginning_offset > len(input_audio) / 16000
-    #         and (voice_activity[-1]['start'] - voice_activity[-2]['end']) > 5.0):
-    #     end_time = voice_activity[-2]['end']
-    #     logger.info("Using the second last timestamp for trimming")
-    # else:
-    end_time = voice_activity[-1]['end'] if voice_activity else 0
-    if get_config().vad.trim_beginning:
-        logger.info(f"VAD Trimmed Beginning of Audio to {start_time}")
-    # Print detected speech details with timestamps
-    logger.info(f"VAD Trimmed End of Audio to {end_time} seconds:")
-    # Trim the audio using FFmpeg
-    ffmpeg.trim_audio(input_audio, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, output_audio)
-    return VADResult(True, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, VOSK)
-def get_vosk_model():
-    global vosk_model_path, vosk_model
-    vosk_model_path = download_and_cache_vosk_model()
-    vosk_model = vosk.Model(vosk_model_path)
-    logger.info(f"Using Vosk model from {vosk_model_path}")

GameSentenceMiner/vad/whisper_helper.py DELETED Viewed

@@ -1,105 +0,0 @@
-import tempfile
-import warnings
-import stable_whisper as whisper
-import torch
-from stable_whisper import WhisperResult
-from GameSentenceMiner  import configuration, ffmpeg
-from GameSentenceMiner.configuration import *
-from GameSentenceMiner.vad.result import VADResult
-ffmpeg_base_command_list = ["ffmpeg", "-hide_banner", "-loglevel", "error"]
-whisper_model = None
-# Function to download and load the Whisper model
-def load_whisper_model():
-    global whisper_model
-    if whisper_model is None:
-        with warnings.catch_warnings(action="ignore"):
-            whisper_model = whisper.load_model(get_config().vad.whisper_model)
-        logger.info(f"Whisper model '{get_config().vad.whisper_model}' loaded.")
-# Use Whisper to detect voice activity with timestamps in the audio
-def detect_voice_with_whisper(input_audio):
-    # Convert the audio to 16kHz mono WAV
-    temp_wav = tempfile.NamedTemporaryFile(dir=configuration.get_temporary_directory(), suffix='.wav').name
-    ffmpeg.convert_audio_to_wav(input_audio, temp_wav)
-    # Make sure Whisper is loaded
-    load_whisper_model()
-    logger.info('transcribing audio...')
-    # Transcribe the audio using Whisper
-    with warnings.catch_warnings(action="ignore"):
-        result: WhisperResult = whisper_model.transcribe(temp_wav, vad=True, language=get_config().vad.language, temperature=0.0)
-    voice_activity = []
-    logger.debug(result.to_dict())
-    # Process the segments to extract tokens, timestamps, and confidence
-    for segment in result.segments:
-        logger.debug(segment.to_dict())
-        for word in segment.words:
-            logger.debug(word.to_dict())
-            confidence = word.probability
-            if confidence > .1:
-                logger.debug(word)
-                voice_activity.append({
-                    'text': word.word,
-                    'start': word.start,
-                    'end': word.end,
-                    'confidence': word.probability
-                })
-    # Analyze the detected words to decide whether to use the audio
-    should_use = False
-    unique_words = set(word['text'] for word in voice_activity)
-    if len(unique_words) > 1 or not all(item in ['えー', 'ん'] for item in unique_words):
-        should_use = True
-    if not should_use:
-        return None
-    # Return the detected voice activity and the total duration
-    return voice_activity
-# Example usage of Whisper with trimming
-def process_audio_with_whisper(input_audio, output_audio, game_line):
-    voice_activity = detect_voice_with_whisper(input_audio)
-    if not voice_activity:
-        logger.info("No voice activity detected in the audio.")
-        return VADResult(False, 0, 0, WHISPER)
-    # Trim based on the first and last speech detected
-    start_time = voice_activity[0]['start'] if voice_activity else 0
-    # if (game_line.next and len(voice_activity) > 1
-    #     and voice_activity[-1]['start'] - get_config().audio.beginning_offset > len(input_audio) / 16000
-    #         and (voice_activity[-1]['start'] - voice_activity[-2]['end']) > 5.0):
-    #             end_time = voice_activity[-2]['end']
-    #             logger.info("Using the second last timestamp for trimming")
-    # else:
-    end_time = voice_activity[-1]['end'] if voice_activity else 0
-    if get_config().vad.trim_beginning:
-        logger.info(f"VAD Trimmed Beginning of Audio to {start_time}")
-    # Print detected speech details with timestamps
-    logger.info(f"VAD Trimmed End of Audio to {end_time} seconds:")
-    # Trim the audio using FFmpeg
-    ffmpeg.trim_audio(input_audio, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, output_audio)
-    return VADResult(True, start_time + get_config().vad.beginning_offset, end_time + get_config().audio.end_offset, WHISPER)
-# Load Whisper model initially
-def initialize_whisper_model():
-    load_whisper_model()
-# initialize_whisper_model()
-# process_audio_with_whisper("tmp6x81cy27.opus", "tmp6x81cy27_trimmed.opus", None)

gamesentenceminer-2.9.4.dist-info/RECORD DELETED Viewed

@@ -1,72 +0,0 @@
-GameSentenceMiner/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/anki.py,sha256=HAYblBjkth5p0tx9Z0LNQn6zuQC8_54RIB2BMzN8-LE,14705
-GameSentenceMiner/config_gui.py,sha256=h4zz85gfhxSphaJ-IZSu9D4jR70mDlKecZ9JRCO5Noc,80927
-GameSentenceMiner/configuration.py,sha256=KKW6fmpxya4dmXx9cERFVrzsKCTw0vmZrF2HAJDURBU,25667
-GameSentenceMiner/electron_config.py,sha256=dGcPYCISPehXubYSzsDuI2Gl092MYK0u3bTnkL9Jh1Y,9787
-GameSentenceMiner/ffmpeg.py,sha256=APa2vNdAgxYdG96_Z3Xdh1WqOiWaK6gTLJqzEvCMMeU,18323
-GameSentenceMiner/gametext.py,sha256=sll-6Pficd4ZXYy8yL8hBrEOSpfa53TOye7vtHHKFN4,6218
-GameSentenceMiner/gsm.py,sha256=olG3BIWjbVHWTsRKmeDVE5X8XrgppWke73Fy1J15dxA,29868
-GameSentenceMiner/model.py,sha256=1lRyJFf_LND_4O16h8CWVqDfosLgr0ZS6ufBZ3qJHpY,5699
-GameSentenceMiner/notification.py,sha256=e6TOzZJD7RTvMgxaY-V01r5OiocHhdqEIVdAnj4MGSw,3437
-GameSentenceMiner/obs.py,sha256=JiydRMpfSpNZ0nDAzH8OOECbYbsxMNSGz46lO8lZbvA,14871
-GameSentenceMiner/package.py,sha256=uu3Yb3pqu8vN5ISzP87YCHlFNR9wxMMf5hPRncTr7ws,1181
-GameSentenceMiner/ss_selector.py,sha256=csey9H3561-guRJcT6gQN6hXxvylP0CBI0dp2-kwo2Q,4446
-GameSentenceMiner/text_log.py,sha256=U2_g8THAYeexRiE2bLk_bCt_2ShiA8SQ9VdJsi4riHs,5181
-GameSentenceMiner/util.py,sha256=ZbK7i1UeOzKyc5WtCcttiGljR_stfu7qpnEpgqFBwro,8976
-GameSentenceMiner/ai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/ai/ai_prompting.py,sha256=xw8et6XNwQiDXOXZnw8iIntVSg8lni4YYZbgWsK7qDE,10013
-GameSentenceMiner/assets/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/assets/icon.png,sha256=9GRL8uXUAgkUSlvbm9Pv9o2poFVRGdW6s2ub_DeUD9M,937624
-GameSentenceMiner/assets/icon128.png,sha256=l90j7biwdz5ahwOd5wZ-406ryEV9Pan93dquJQ3e1CI,18395
-GameSentenceMiner/assets/icon256.png,sha256=JEW46wOrG1KR-907rvFaEdNbPtj5gu0HJmG7qUnIHxQ,51874
-GameSentenceMiner/assets/icon32.png,sha256=Kww0hU_qke9_22wBuO_Nq0Dv2SfnOLwMhCyGgbgXdg8,6089
-GameSentenceMiner/assets/icon512.png,sha256=HxUj2GHjyQsk8NV433256UxU9phPhtjCY-YB_7W4sqs,192487
-GameSentenceMiner/assets/icon64.png,sha256=N8xgdZXvhqVQP9QUK3wX5iqxX9LxHljD7c-Bmgim6tM,9301
-GameSentenceMiner/assets/pickaxe.png,sha256=VfIGyXyIZdzEnVcc4PmG3wszPMO1W4KCT7Q_nFK6eSE,1403829
-GameSentenceMiner/communication/__init__.py,sha256=_jGn9PJxtOAOPtJ2rI-Qu9hEHVZVpIvWlxKvqk91_zI,638
-GameSentenceMiner/communication/send.py,sha256=X0MytGv5hY-uUvkfvdCqQA_ljZFmV6UkJ6in1TA1bUE,217
-GameSentenceMiner/communication/websocket.py,sha256=8eFZaTtoFggEPdqw2Jl4zqHC2I7J3-Gk27CxVX7SyBo,3277
-GameSentenceMiner/downloader/Untitled_json.py,sha256=RUUl2bbbCpUDUUS0fP0tdvf5FngZ7ILdA_J5TFYAXUQ,15272
-GameSentenceMiner/downloader/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/downloader/download_tools.py,sha256=aRfpCqEmKUFRVsGipwY-7PhY6AeWiFJanW4ZCB9e2iE,8124
-GameSentenceMiner/downloader/oneocr_dl.py,sha256=o3ANp5IodEQoQ8GPcJdg9Y8JzA_lictwnebFPwwUZVk,10144
-GameSentenceMiner/ocr/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/ocr/gsm_ocr_config.py,sha256=fEQ2o2NXksGRHpueO8c4TfAp75GEdAtAr1ngTFOsdpg,2257
-GameSentenceMiner/ocr/ocrconfig.py,sha256=_tY8mjnzHMJrLS8E5pHqYXZjMuLoGKYgJwdhYgN-ny4,6466
-GameSentenceMiner/ocr/owocr_area_selector.py,sha256=Q8ETMHL7BKMA1mbtjrntDLyqCQB0lZ5T4RCZsodjH7Y,47186
-GameSentenceMiner/ocr/owocr_helper.py,sha256=M4Is-Ki5O3r4ixYhILibfjrVGD6xDlOcR3YvVGmETQ4,17363
-GameSentenceMiner/owocr/owocr/__init__.py,sha256=opjBOyGGyEqZCE6YdZPnyt7nVfiwyELHsXA0jAsjm14,25
-GameSentenceMiner/owocr/owocr/__main__.py,sha256=XQaqZY99EKoCpU-gWQjNbTs7Kg17HvBVE7JY8LqIE0o,157
-GameSentenceMiner/owocr/owocr/config.py,sha256=qM7kISHdUhuygGXOxmgU6Ef2nwBShrZtdqu4InDCViE,8103
-GameSentenceMiner/owocr/owocr/lens_betterproto.py,sha256=oNoISsPilVVRBBPVDtb4-roJtAhp8ZAuFTci3TGXtMc,39141
-GameSentenceMiner/owocr/owocr/ocr.py,sha256=V0HqVRQlaE1-12IH480IupfSv1BlDdEcwNPejhQZfS0,42292
-GameSentenceMiner/owocr/owocr/run.py,sha256=0UyjOKEP0MqSdCaagCUMGdqO-BMexPxCl7ZabGlic4E,54749
-GameSentenceMiner/owocr/owocr/screen_coordinate_picker.py,sha256=Na6XStbQBtpQUSdbN3QhEswtKuU1JjReFk_K8t5ezQE,3395
-GameSentenceMiner/vad/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/vad/groq_trim.py,sha256=MDYiApduwF7oDx3r0TXL3xQrTkbUC1RinMwNKSbF5gw,3764
-GameSentenceMiner/vad/result.py,sha256=aFlr2px90fn3qXj49dwF9BDXA5m4yXD_HYH01CVvP1U,799
-GameSentenceMiner/vad/silero_trim.py,sha256=u4BC93LieJW0CZ7HToz51FneojqW_SNjSKmJmHMKwUA,2240
-GameSentenceMiner/vad/vad_utils.py,sha256=_YC6rW2eXSBeLnYbVl_F3na1KCRL90VrnOzKYJ9RhUE,391
-GameSentenceMiner/vad/vosk_helper.py,sha256=h7yNHrzrzT-J74UniA0T2ZX8cHqhflCzwyDjoIdKLO4,6479
-GameSentenceMiner/vad/whisper_helper.py,sha256=B64-Eq_ZMCIyQX_A8uvYz-c48hSXJAyz6tSXNRaLjtA,4020
-GameSentenceMiner/web/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/web/texthooking_page.py,sha256=7Z7TGDcnj-94Y9ws7bQph4oIXrqf8Q9qVKowKimHWxM,14749
-GameSentenceMiner/web/static/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/web/static/apple-touch-icon.png,sha256=OcMI8af_68DA_tweOsQ5LytTyMwm7-hPW07IfrOVgEs,46132
-GameSentenceMiner/web/static/favicon-96x96.png,sha256=lOePzjiKl1JY2J1kT_PMdyEnrlJmi5GWbmXJunM12B4,16502
-GameSentenceMiner/web/static/favicon.ico,sha256=7d25r_FBqRSNsAoEHpSzNoT7zyVt2DJRLNDNq_HYoX8,15086
-GameSentenceMiner/web/static/favicon.svg,sha256=x305AP6WlXGtrXIZlaQspdLmwteoFYUoe5FyJ9MYlJ8,11517
-GameSentenceMiner/web/static/site.webmanifest,sha256=kaeNT-FjFt-T7JGzOhXH7YSqsrDeiplZ2kDxCN_CFU4,436
-GameSentenceMiner/web/static/style.css,sha256=bPZK0NVMuyRl5NNDuT7ZTzVLKlvSsdmeVHmAW4y5FM0,7001
-GameSentenceMiner/web/static/web-app-manifest-192x192.png,sha256=EfSNnBmsSaLfESbkGfYwbKzcjKOdzuWo18ABADfN974,51117
-GameSentenceMiner/web/static/web-app-manifest-512x512.png,sha256=wyqgCWCrLEUxSRXmaA3iJEESd-vM-ZmlTtZFBY4V8Pk,230819
-GameSentenceMiner/web/templates/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
-GameSentenceMiner/web/templates/index.html,sha256=HZKiIjiGJV8PGQ9T2aLDUNSfJn71qOwbYCjbRuSIjpY,213583
-GameSentenceMiner/web/templates/text_replacements.html,sha256=tV5c8mCaWSt_vKuUpbdbLAzXZ3ATZeDvQ9PnnAfqY0M,8598
-GameSentenceMiner/web/templates/utility.html,sha256=3flZinKNqUJ7pvrZk6xu__v67z44rXnaK7UTZ303R-8,16946
-gamesentenceminer-2.9.4.dist-info/licenses/LICENSE,sha256=OXLcl0T2SZ8Pmy2_dmlvKuetivmyPd5m1q-Gyd-zaYY,35149
-gamesentenceminer-2.9.4.dist-info/METADATA,sha256=jNhOj4IaiTEJqGlm4-VCtviW5hmN8J5XnvPBGWgcY0Y,7280
-gamesentenceminer-2.9.4.dist-info/WHEEL,sha256=zaaOINJESkSfm_4HQVc5ssNzHCPXhJm0kEUakpsEHaU,91
-gamesentenceminer-2.9.4.dist-info/entry_points.txt,sha256=2APEP25DbfjSxGeHtwBstMH8mulVhLkqF_b9bqzU6vQ,65
-gamesentenceminer-2.9.4.dist-info/top_level.txt,sha256=V1hUY6xVSyUEohb0uDoN4UIE6rUZ_JYx8yMyPGX4PgQ,18
-gamesentenceminer-2.9.4.dist-info/RECORD,,