GameSentenceMiner 2.7.17__py3-none-any.whl → 2.8.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (34) hide show
  1. GameSentenceMiner/anki.py +7 -8
  2. GameSentenceMiner/config_gui.py +19 -3
  3. GameSentenceMiner/configuration.py +8 -1
  4. GameSentenceMiner/downloader/oneocr_dl.py +243 -0
  5. GameSentenceMiner/ffmpeg.py +1 -3
  6. GameSentenceMiner/gametext.py +16 -155
  7. GameSentenceMiner/gsm.py +28 -29
  8. GameSentenceMiner/obs.py +0 -3
  9. GameSentenceMiner/ocr/ocrconfig.py +0 -1
  10. GameSentenceMiner/ocr/owocr_area_selector.py +0 -1
  11. GameSentenceMiner/ocr/owocr_helper.py +25 -26
  12. GameSentenceMiner/text_log.py +186 -0
  13. GameSentenceMiner/util.py +60 -3
  14. GameSentenceMiner/web/__init__.py +0 -0
  15. GameSentenceMiner/web/static/__init__.py +0 -0
  16. GameSentenceMiner/web/static/apple-touch-icon.png +0 -0
  17. GameSentenceMiner/web/static/favicon-96x96.png +0 -0
  18. GameSentenceMiner/web/static/favicon.ico +0 -0
  19. GameSentenceMiner/web/static/favicon.svg +3 -0
  20. GameSentenceMiner/web/static/site.webmanifest +21 -0
  21. GameSentenceMiner/web/static/style.css +292 -0
  22. GameSentenceMiner/web/static/text_replacements.html +238 -0
  23. GameSentenceMiner/web/static/utility.html +313 -0
  24. GameSentenceMiner/web/static/web-app-manifest-192x192.png +0 -0
  25. GameSentenceMiner/web/static/web-app-manifest-512x512.png +0 -0
  26. GameSentenceMiner/web/texthooking_page.py +234 -0
  27. {gamesentenceminer-2.7.17.dist-info → gamesentenceminer-2.8.1.dist-info}/METADATA +2 -1
  28. gamesentenceminer-2.8.1.dist-info/RECORD +58 -0
  29. {gamesentenceminer-2.7.17.dist-info → gamesentenceminer-2.8.1.dist-info}/WHEEL +1 -1
  30. GameSentenceMiner/utility_gui.py +0 -204
  31. gamesentenceminer-2.7.17.dist-info/RECORD +0 -44
  32. {gamesentenceminer-2.7.17.dist-info → gamesentenceminer-2.8.1.dist-info}/entry_points.txt +0 -0
  33. {gamesentenceminer-2.7.17.dist-info → gamesentenceminer-2.8.1.dist-info}/licenses/LICENSE +0 -0
  34. {gamesentenceminer-2.7.17.dist-info → gamesentenceminer-2.8.1.dist-info}/top_level.txt +0 -0
GameSentenceMiner/gsm.py CHANGED
@@ -10,7 +10,6 @@ from pystray import Icon, Menu, MenuItem
10
10
  from watchdog.events import FileSystemEventHandler
11
11
  from watchdog.observers import Observer
12
12
 
13
- import time
14
13
 
15
14
  from GameSentenceMiner import anki
16
15
  from GameSentenceMiner import config_gui
@@ -27,10 +26,11 @@ from GameSentenceMiner.communication.websocket import connect_websocket, registe
27
26
  from GameSentenceMiner.configuration import *
28
27
  from GameSentenceMiner.downloader.download_tools import download_obs_if_needed, download_ffmpeg_if_needed
29
28
  from GameSentenceMiner.ffmpeg import get_audio_and_trim, get_video_timings
30
- from GameSentenceMiner.gametext import get_text_event, get_mined_line, GameLine
31
29
  from GameSentenceMiner.obs import check_obs_folder_is_correct
30
+ from GameSentenceMiner.text_log import GameLine, get_text_event, get_mined_line, get_all_lines
32
31
  from GameSentenceMiner.util import *
33
- from GameSentenceMiner.utility_gui import init_utility_window, get_utility_window
32
+ from GameSentenceMiner.web import texthooking_page
33
+ from GameSentenceMiner.web.texthooking_page import start_web_server
34
34
 
35
35
  if is_windows():
36
36
  import win32api
@@ -57,9 +57,9 @@ class VideoToAudioHandler(FileSystemEventHandler):
57
57
  @staticmethod
58
58
  def convert_to_audio(video_path):
59
59
  try:
60
- if get_utility_window().line_for_audio:
61
- line: GameLine = get_utility_window().line_for_audio
62
- get_utility_window().line_for_audio = None
60
+ if texthooking_page.event_manager.line_for_audio:
61
+ line: GameLine = texthooking_page.event_manager.line_for_audio
62
+ texthooking_page.event_manager.line_for_audio = None
63
63
  if get_config().advanced.audio_player_path:
64
64
  audio = VideoToAudioHandler.get_audio(line, line.next.time if line.next else None, video_path, temporary=True)
65
65
  play_audio_in_external(audio)
@@ -67,9 +67,9 @@ class VideoToAudioHandler(FileSystemEventHandler):
67
67
  elif get_config().advanced.video_player_path:
68
68
  play_video_in_external(line, video_path)
69
69
  return
70
- if get_utility_window().line_for_screenshot:
71
- line: GameLine = get_utility_window().line_for_screenshot
72
- get_utility_window().line_for_screenshot = None
70
+ if texthooking_page.event_manager.line_for_screenshot:
71
+ line: GameLine = texthooking_page.event_manager.line_for_screenshot
72
+ texthooking_page.event_manager.line_for_screenshot = None
73
73
  screenshot = ffmpeg.get_screenshot_for_line(video_path, line)
74
74
  os.startfile(screenshot)
75
75
  os.remove(video_path)
@@ -109,18 +109,18 @@ class VideoToAudioHandler(FileSystemEventHandler):
109
109
  if mined_line.next:
110
110
  line_cutoff = mined_line.next.time
111
111
 
112
- if get_utility_window().lines_selected():
113
- lines = get_utility_window().get_selected_lines()
114
- start_line = lines[0]
115
- mined_line = get_mined_line(last_note, lines)
116
- line_cutoff = get_utility_window().get_next_line_timing()
112
+ selected_lines = []
113
+ if texthooking_page.are_lines_selected():
114
+ selected_lines = texthooking_page.get_selected_lines()
115
+ start_line = selected_lines[0]
116
+ mined_line = get_mined_line(last_note, selected_lines)
117
+ line_cutoff = selected_lines[-1].get_next_time()
117
118
 
118
119
  if last_note:
119
120
  logger.debug(last_note.to_json())
120
- selected_lines = get_utility_window().get_selected_lines()
121
121
  note = anki.get_initial_card_info(last_note, selected_lines)
122
122
  tango = last_note.get_field(get_config().anki.word_field) if last_note else ''
123
- get_utility_window().reset_checkboxes()
123
+ texthooking_page.reset_checked_lines()
124
124
 
125
125
  if get_config().anki.sentence_audio_field and get_config().audio.enabled:
126
126
  logger.debug("Attempting to get audio from video")
@@ -268,10 +268,10 @@ def register_hotkeys():
268
268
  keyboard.add_hotkey(get_config().hotkeys.reset_line, gametext.reset_line_hotkey_pressed)
269
269
  if get_config().hotkeys.take_screenshot:
270
270
  keyboard.add_hotkey(get_config().hotkeys.take_screenshot, get_screenshot)
271
- if get_config().hotkeys.open_utility:
272
- keyboard.add_hotkey(get_config().hotkeys.open_utility, open_multimine)
273
271
  if get_config().hotkeys.play_latest_audio:
274
272
  keyboard.add_hotkey(get_config().hotkeys.play_latest_audio, play_most_recent_audio)
273
+ if get_config().hotkeys.open_utility:
274
+ keyboard.add_hotkey(get_config().hotkeys.open_utility, texthooking_page.open_texthooker)
275
275
 
276
276
 
277
277
  def get_screenshot():
@@ -322,13 +322,10 @@ def open_settings():
322
322
  settings_window.show()
323
323
 
324
324
 
325
- def open_multimine():
326
- obs.update_current_game()
327
- get_utility_window().show()
328
-
329
325
  def play_most_recent_audio():
330
- if get_config().advanced.audio_player_path or get_config().advanced.video_player_path and len(gametext.line_history.values) > 0:
331
- get_utility_window().line_for_audio = gametext.line_history.values[-1]
326
+ if get_config().advanced.audio_player_path or get_config().advanced.video_player_path and len(
327
+ get_all_lines()) > 0:
328
+ texthooking_page.event_manager.line_for_audio = get_all_lines()[-1]
332
329
  obs.save_replay_buffer()
333
330
  else:
334
331
  logger.error("Feature Disabled. No audio or video player path set in config!")
@@ -368,6 +365,10 @@ def play_pause(icon, item):
368
365
  update_icon()
369
366
 
370
367
 
368
+ def open_multimine(icon, item):
369
+ texthooking_page.open_texthooker()
370
+
371
+
371
372
  def update_icon():
372
373
  global menu, icon
373
374
  # Recreate the menu with the updated button text
@@ -416,7 +417,7 @@ def run_tray():
416
417
 
417
418
  menu = Menu(
418
419
  MenuItem("Open Settings", open_settings),
419
- MenuItem("Open Multi-Mine GUI", open_multimine),
420
+ MenuItem("Open Texthooker", texthooking_page.open_texthooker),
420
421
  MenuItem("Open Log", open_log),
421
422
  MenuItem("Toggle Replay Buffer", play_pause),
422
423
  MenuItem("Restart OBS", restart_obs),
@@ -554,6 +555,7 @@ def post_init():
554
555
  whisper_helper.initialize_whisper_model()
555
556
  if get_config().vad.is_silero():
556
557
  from GameSentenceMiner.vad import silero_trim
558
+ start_web_server()
557
559
 
558
560
  util.run_new_thread(do_post_init)
559
561
 
@@ -576,7 +578,6 @@ def main(reloading=False):
576
578
  logger.info("Script started.")
577
579
  root = ttk.Window(themename='darkly')
578
580
  settings_window = config_gui.ConfigApp(root)
579
- init_utility_window(root)
580
581
  initialize(reloading)
581
582
  initialize_async()
582
583
  observer = Observer()
@@ -594,9 +595,7 @@ def main(reloading=False):
594
595
  try:
595
596
  # if get_config().general.open_config_on_startup:
596
597
  # root.after(0, settings_window.show)
597
- if get_config().general.open_multimine_on_startup:
598
- root.after(0, get_utility_window().show)
599
- root.after(0, post_init)
598
+ root.after(50, post_init)
600
599
  settings_window.add_save_hook(update_icon)
601
600
  settings_window.on_exit = exit_program
602
601
  root.mainloop()
GameSentenceMiner/obs.py CHANGED
@@ -1,10 +1,7 @@
1
- import logging
2
1
  import os.path
3
2
  import subprocess
4
- import tempfile
5
3
  import time
6
4
 
7
- import psutil
8
5
  from obswebsocket import obsws, requests
9
6
 
10
7
  from GameSentenceMiner import util, configuration
@@ -1,6 +1,5 @@
1
1
  import configparser
2
2
  import os
3
- import re
4
3
 
5
4
  class OCRConfig:
6
5
  def __init__(self, config_file=os.path.expanduser("~/.config/owocr_config.ini")):
@@ -7,7 +7,6 @@ import mss
7
7
  from PIL import Image, ImageTk, ImageDraw
8
8
 
9
9
  from GameSentenceMiner import obs # Import your actual obs module
10
- from GameSentenceMiner.ocr.owocr_helper import get_ocr_config
11
10
  from GameSentenceMiner.util import sanitize_filename # Import your actual util module
12
11
 
13
12
  try:
@@ -1,9 +1,9 @@
1
1
  import asyncio
2
- import difflib
3
2
  import json
4
3
  import logging
5
4
  import os
6
5
  import queue
6
+ import re
7
7
  import threading
8
8
  import time
9
9
  from datetime import datetime
@@ -14,17 +14,14 @@ from tkinter import messagebox
14
14
  import mss
15
15
  import websockets
16
16
  from rapidfuzz import fuzz
17
- from PIL import Image, ImageDraw
18
17
 
19
18
  from GameSentenceMiner import obs, util
20
- from GameSentenceMiner.configuration import get_config, get_app_directory
19
+ from GameSentenceMiner.configuration import get_config, get_app_directory, get_temporary_directory
21
20
  from GameSentenceMiner.electron_config import get_ocr_scan_rate, get_requires_open_window
22
21
  from GameSentenceMiner.ocr.gsm_ocr_config import OCRConfig, Rectangle
23
22
  from GameSentenceMiner.owocr.owocr import screen_coordinate_picker, run
24
23
  from GameSentenceMiner.owocr.owocr.run import TextFiltering
25
-
26
- from dataclasses import dataclass
27
- from typing import List, Optional
24
+ from GameSentenceMiner.util import do_text_replacements, OCR_REPLACEMENTS_FILE
28
25
 
29
26
  CONFIG_FILE = Path("ocr_config.json")
30
27
  DEFAULT_IMAGE_PATH = r"C:\Users\Beangate\Pictures\msedge_acbl8GL7Ax.jpg" # CHANGE THIS
@@ -80,6 +77,7 @@ def get_ocr_config() -> OCRConfig:
80
77
  """Loads and updates screen capture areas from the corresponding JSON file."""
81
78
  app_dir = Path.home() / "AppData" / "Roaming" / "GameSentenceMiner"
82
79
  ocr_config_dir = app_dir / "ocr_config"
80
+ os.makedirs(ocr_config_dir, exist_ok=True)
83
81
  obs.connect_to_obs()
84
82
  scene = util.sanitize_filename(obs.get_current_scene())
85
83
  config_path = ocr_config_dir / f"{scene}.json"
@@ -217,63 +215,62 @@ def do_second_ocr(ocr1_text, rectangle_index, time, img):
217
215
  if fuzz.ratio(previous_ocr2_text, text) >= 80:
218
216
  logger.info("Seems like the same text from previous ocr2 result, not sending")
219
217
  return
220
- img.save(os.path.join(get_app_directory(), "temp", "last_successful_ocr.png"))
218
+ img.save(os.path.join(get_temporary_directory(), "last_successful_ocr.png"))
221
219
  last_ocr2_results[rectangle_index] = text
222
- if get_config().advanced.ocr_sends_to_clipboard:
223
- import pyperclip
224
- pyperclip.copy(text)
225
- websocket_server_thread.send_text(text, time)
220
+ send_result(text, time)
226
221
  except json.JSONDecodeError:
227
222
  print("Invalid JSON received.")
228
223
  except Exception as e:
229
224
  logger.exception(e)
230
225
  print(f"Error processing message: {e}")
231
226
 
227
+ def send_result(text, time):
228
+ if text:
229
+ text = do_text_replacements(text, OCR_REPLACEMENTS_FILE)
230
+ if get_config().advanced.ocr_sends_to_clipboard:
231
+ import pyperclip
232
+ pyperclip.copy(text)
233
+ websocket_server_thread.send_text(text, time)
234
+
232
235
 
233
236
  last_oneocr_results_to_check = {} # Store last OCR result for each rectangle
234
237
  last_oneocr_times = {} # Store last OCR time for each rectangle
235
238
  text_stable_start_times = {} # Store the start time when text becomes stable for each rectangle
239
+ previous_imgs = {}
236
240
  orig_text_results = {} # Store original text results for each rectangle
237
241
  TEXT_APPEARENCE_DELAY = get_ocr_scan_rate() * 1000 + 500 # Adjust as needed
238
242
 
239
243
  def text_callback(text, orig_text, rectangle_index, time, img=None):
240
244
  global twopassocr, ocr2, last_oneocr_results_to_check, last_oneocr_times, text_stable_start_times, orig_text_results
241
245
  orig_text_string = ''.join([item for item in orig_text if item is not None]) if orig_text else ""
246
+ # logger.debug(orig_text_string)
242
247
 
243
248
  current_time = time if time else datetime.now()
244
249
 
245
- previous_text = last_oneocr_results_to_check.get(rectangle_index, "").strip()
250
+ previous_text = last_oneocr_results_to_check.pop(rectangle_index, "").strip()
246
251
  previous_orig_text = orig_text_results.get(rectangle_index, "").strip()
247
252
 
248
253
  # print(previous_orig_text)
249
254
  # if orig_text:
250
255
  # print(orig_text_string)
251
-
256
+ if not twopassocr:
257
+ img.save(os.path.join(get_temporary_directory(), "last_successful_ocr.png"))
258
+ send_result(text, time)
252
259
  if not text:
253
260
  if previous_text:
254
261
  if rectangle_index in text_stable_start_times:
255
- stable_time = text_stable_start_times[rectangle_index]
262
+ stable_time = text_stable_start_times.pop(rectangle_index)
263
+ previous_img = previous_imgs.pop(rectangle_index)
256
264
  previous_result = last_ocr1_results[rectangle_index]
257
265
  if previous_result and fuzz.ratio(previous_result, previous_text) >= 80:
258
266
  logger.info("Seems like the same text, not " + "doing second OCR" if twopassocr else "sending")
259
- del last_oneocr_results_to_check[rectangle_index]
260
267
  return
261
268
  if previous_orig_text and fuzz.ratio(orig_text_string, previous_orig_text) >= 80:
262
269
  logger.info("Seems like Text we already sent, not doing anything.")
263
- del last_oneocr_results_to_check[rectangle_index]
264
270
  return
265
271
  orig_text_results[rectangle_index] = orig_text_string
266
- if twopassocr:
267
- do_second_ocr(previous_text, rectangle_index, time, img)
268
- else:
269
- if get_config().advanced.ocr_sends_to_clipboard:
270
- import pyperclip
271
- pyperclip.copy(text)
272
- websocket_server_thread.send_text(previous_text, stable_time)
273
- img.save(os.path.join(get_app_directory(), "temp", "last_successful_ocr.png"))
272
+ do_second_ocr(previous_text, rectangle_index, stable_time, previous_img)
274
273
  last_ocr1_results[rectangle_index] = previous_text
275
- del text_stable_start_times[rectangle_index]
276
- del last_oneocr_results_to_check[rectangle_index]
277
274
  return
278
275
  return
279
276
 
@@ -281,6 +278,7 @@ def text_callback(text, orig_text, rectangle_index, time, img=None):
281
278
  last_oneocr_results_to_check[rectangle_index] = text
282
279
  last_oneocr_times[rectangle_index] = current_time
283
280
  text_stable_start_times[rectangle_index] = current_time
281
+ previous_imgs[rectangle_index] = img
284
282
  return
285
283
 
286
284
  stable = text_stable_start_times.get(rectangle_index)
@@ -294,6 +292,7 @@ def text_callback(text, orig_text, rectangle_index, time, img=None):
294
292
  else:
295
293
  last_oneocr_results_to_check[rectangle_index] = text
296
294
  last_oneocr_times[rectangle_index] = current_time
295
+ previous_imgs[rectangle_index] = img
297
296
 
298
297
  done = False
299
298
 
@@ -0,0 +1,186 @@
1
+ import uuid
2
+ from dataclasses import dataclass
3
+ from datetime import datetime
4
+ from difflib import SequenceMatcher
5
+ from typing import Optional
6
+
7
+ from GameSentenceMiner.configuration import logger, get_config
8
+ from GameSentenceMiner.model import AnkiCard
9
+ from GameSentenceMiner.util import remove_html_and_cloze_tags
10
+
11
+ initial_time = datetime.now()
12
+
13
+
14
+ @dataclass
15
+ class GameLine:
16
+ id: str
17
+ text: str
18
+ time: datetime
19
+ prev: 'GameLine | None'
20
+ next: 'GameLine | None'
21
+ index: int = 0
22
+
23
+ def get_previous_time(self):
24
+ if self.prev:
25
+ return self.prev.time
26
+ return initial_time
27
+
28
+ def get_next_time(self):
29
+ if self.next:
30
+ return self.next.time
31
+ return 0
32
+
33
+ def __str__(self):
34
+ return str({"text": self.text, "time": self.time})
35
+
36
+
37
+ @dataclass
38
+ class GameText:
39
+ values: list[GameLine]
40
+ values_dict: dict[str, GameLine]
41
+ game_line_index = 0
42
+
43
+ def __init__(self):
44
+ self.values = []
45
+ self.values_dict = {}
46
+
47
+ def __getitem__(self, key):
48
+ return self.values[key]
49
+
50
+ def get_by_id(self, line_id: str) -> Optional[GameLine]:
51
+ if not self.values_dict:
52
+ return None
53
+ return self.values_dict.get(line_id)
54
+
55
+ def get_time(self, line_text: str, occurrence: int = -1) -> datetime:
56
+ matches = [line for line in self.values if line.text == line_text]
57
+ if matches:
58
+ return matches[occurrence].time # Default to latest
59
+ return initial_time
60
+
61
+ def get_event(self, line_text: str, occurrence: int = -1) -> GameLine | None:
62
+ matches = [line for line in self.values if line.text == line_text]
63
+ if matches:
64
+ return matches[occurrence]
65
+ return None
66
+
67
+ def add_line(self, line_text, line_time=None):
68
+ if not line_text:
69
+ return
70
+ line_id = str(uuid.uuid1())
71
+ new_line = GameLine(
72
+ id=line_id, # Time-based UUID as an integer
73
+ text=line_text,
74
+ time=line_time if line_time else datetime.now(),
75
+ prev=self.values[-1] if self.values else None,
76
+ next=None,
77
+ index=self.game_line_index
78
+ )
79
+ self.values_dict[line_id] = new_line
80
+ logger.debug(f"Adding line: {new_line}")
81
+ self.game_line_index += 1
82
+ if self.values:
83
+ self.values[-1].next = new_line
84
+ self.values.append(new_line)
85
+ # self.remove_old_events(datetime.now() - timedelta(minutes=10))
86
+
87
+ def has_line(self, line_text) -> bool:
88
+ for game_line in self.values:
89
+ if game_line.text == line_text:
90
+ return True
91
+ return False
92
+
93
+
94
+ text_log = GameText()
95
+
96
+
97
+ def similar(a, b):
98
+ return SequenceMatcher(None, a, b).ratio()
99
+
100
+
101
+ def one_contains_the_other(a, b):
102
+ return a in b or b in a
103
+
104
+
105
+ def lines_match(a, b):
106
+ similarity = similar(a, b)
107
+ logger.debug(f"Comparing: {a} with {b} - Similarity: {similarity}, Or One contains the other: {one_contains_the_other(a, b)}")
108
+ return similar(a, b) >= 0.60 or one_contains_the_other(a, b)
109
+
110
+
111
+ def get_text_event(last_note) -> GameLine:
112
+ lines = text_log.values
113
+
114
+ if not lines:
115
+ raise Exception("No lines in history. Text is required from either clipboard or websocket for GSM to work. Please check your setup/config.")
116
+
117
+ if not last_note:
118
+ return lines[-1]
119
+
120
+ sentence = last_note.get_field(get_config().anki.sentence_field)
121
+ if not sentence:
122
+ return lines[-1]
123
+
124
+ for line in reversed(lines):
125
+ if lines_match(line.text, remove_html_and_cloze_tags(sentence)):
126
+ return line
127
+
128
+ logger.debug("Couldn't find a match in history, using last event")
129
+ return lines[-1]
130
+
131
+
132
+ def get_line_and_future_lines(last_note):
133
+ if not last_note:
134
+ return []
135
+
136
+ sentence = last_note.get_field(get_config().anki.sentence_field)
137
+ found_lines = []
138
+ if sentence:
139
+ found = False
140
+ for line in text_log.values:
141
+ if found:
142
+ found_lines.append(line.text)
143
+ if lines_match(line.text, remove_html_and_cloze_tags(sentence)): # 80% similarity threshold
144
+ found = True
145
+ found_lines.append(line.text)
146
+ return found_lines
147
+
148
+
149
+ def get_mined_line(last_note: AnkiCard, lines):
150
+ if not last_note:
151
+ return lines[-1]
152
+ if not lines:
153
+ lines = get_all_lines()
154
+
155
+ sentence = last_note.get_field(get_config().anki.sentence_field)
156
+ for line in lines:
157
+ if lines_match(line.text, remove_html_and_cloze_tags(sentence)):
158
+ return line
159
+ return lines[-1]
160
+
161
+
162
+ def get_time_of_line(line):
163
+ return text_log.get_time(line)
164
+
165
+
166
+ def get_all_lines():
167
+ return text_log.values
168
+
169
+
170
+ def get_text_log() -> GameText:
171
+ return text_log
172
+
173
+ def add_line(current_line_after_regex, line_time):
174
+ text_log.add_line(current_line_after_regex, line_time)
175
+
176
+ def get_line_by_id(line_id: str) -> Optional[GameLine]:
177
+ """
178
+ Retrieve a GameLine by its unique ID.
179
+
180
+ Args:
181
+ line_id (str): The unique identifier of the GameLine.
182
+
183
+ Returns:
184
+ Optional[GameLine]: The GameLine object if found, otherwise None.
185
+ """
186
+ return text_log.get_by_id(line_id)
GameSentenceMiner/util.py CHANGED
@@ -1,10 +1,9 @@
1
- import importlib
1
+ import json
2
2
  import os
3
3
  import random
4
4
  import re
5
5
  import string
6
6
  import subprocess
7
- import sys
8
7
  import threading
9
8
  import time
10
9
  from datetime import datetime
@@ -206,4 +205,62 @@ def import_vad_models():
206
205
  from GameSentenceMiner.vad import whisper_helper
207
206
  if get_config().vad.is_vosk():
208
207
  from GameSentenceMiner.vad import vosk_helper
209
- return silero_trim, whisper_helper, vosk_helper
208
+ return silero_trim, whisper_helper, vosk_helper
209
+
210
+
211
+ def isascii(s: str):
212
+ try:
213
+ return s.isascii()
214
+ except:
215
+ try:
216
+ s.encode("ascii")
217
+ return True
218
+ except:
219
+ return False
220
+
221
+ def do_text_replacements(text, replacements_json):
222
+ if not text:
223
+ return text
224
+
225
+ replacements = {}
226
+ if os.path.exists(replacements_json):
227
+ with open(replacements_json, 'r', encoding='utf-8') as f:
228
+ replacements.update(json.load(f))
229
+
230
+ if replacements.get("enabled", False):
231
+ orig_text = text
232
+ filters = replacements.get("args", {}).get("replacements", {})
233
+ for fil, replacement in filters.items():
234
+ if not fil:
235
+ continue
236
+ if fil.startswith("re:"):
237
+ pattern = fil[3:]
238
+ try:
239
+ text = re.sub(pattern, replacement, text)
240
+ except Exception:
241
+ logger.error(f"Invalid regex pattern: {pattern}")
242
+ continue
243
+ if isascii(fil):
244
+ text = re.sub(r"\b{}\b".format(re.escape(fil)), replacement, text)
245
+ else:
246
+ text = text.replace(fil, replacement)
247
+ if text != orig_text:
248
+ logger.info(f"Text replaced: '{orig_text}' -> '{text}' using replacements.")
249
+ return text
250
+
251
+
252
+ TEXT_REPLACEMENTS_FILE = os.path.join(os.getenv('APPDATA'), 'GameSentenceMiner', 'config', 'text_replacements.json')
253
+ OCR_REPLACEMENTS_FILE = os.path.join(os.getenv('APPDATA'), 'GameSentenceMiner', 'config', 'ocr_replacements.json')
254
+ os.makedirs(os.path.dirname(TEXT_REPLACEMENTS_FILE), exist_ok=True)
255
+
256
+ import urllib.request
257
+
258
+ if not os.path.exists(TEXT_REPLACEMENTS_FILE):
259
+ url = "https://raw.githubusercontent.com/bpwhelan/GameSentenceMiner/refs/heads/main/electron-src/assets/ocr_replacements.json"
260
+ try:
261
+ with urllib.request.urlopen(url) as response:
262
+ data = response.read().decode('utf-8')
263
+ with open(TEXT_REPLACEMENTS_FILE, 'w', encoding='utf-8') as f:
264
+ f.write(data)
265
+ except Exception as e:
266
+ logger.error(f"Failed to fetch JSON from {url}: {e}")
File without changes
File without changes
Binary file
@@ -0,0 +1,3 @@
1
+ <svg xmlns="http://www.w3.org/2000/svg" version="1.1" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:svgjs="http://svgjs.dev/svgjs" width="67" height="64" viewBox="0 0 67 64"><image width="67" height="64" xlink:href=""></image><style>@media (prefers-color-scheme: light) { :root { filter: none; } }
2
+ @media (prefers-color-scheme: dark) { :root { filter: none; } }
3
+ </style></svg>
@@ -0,0 +1,21 @@
1
+ {
2
+ "name": "MyWebSite",
3
+ "short_name": "MySite",
4
+ "icons": [
5
+ {
6
+ "src": "/web-app-manifest-192x192.png",
7
+ "sizes": "192x192",
8
+ "type": "image/png",
9
+ "purpose": "maskable"
10
+ },
11
+ {
12
+ "src": "/web-app-manifest-512x512.png",
13
+ "sizes": "512x512",
14
+ "type": "image/png",
15
+ "purpose": "maskable"
16
+ }
17
+ ],
18
+ "theme_color": "#ffffff",
19
+ "background_color": "#ffffff",
20
+ "display": "standalone"
21
+ }