karaoke-gen 0.75.54__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of karaoke-gen might be problematic. Click here for more details.

Files changed (287) hide show
  1. karaoke_gen/__init__.py +38 -0
  2. karaoke_gen/audio_fetcher.py +1614 -0
  3. karaoke_gen/audio_processor.py +790 -0
  4. karaoke_gen/config.py +83 -0
  5. karaoke_gen/file_handler.py +387 -0
  6. karaoke_gen/instrumental_review/__init__.py +45 -0
  7. karaoke_gen/instrumental_review/analyzer.py +408 -0
  8. karaoke_gen/instrumental_review/editor.py +322 -0
  9. karaoke_gen/instrumental_review/models.py +171 -0
  10. karaoke_gen/instrumental_review/server.py +475 -0
  11. karaoke_gen/instrumental_review/static/index.html +1529 -0
  12. karaoke_gen/instrumental_review/waveform.py +409 -0
  13. karaoke_gen/karaoke_finalise/__init__.py +1 -0
  14. karaoke_gen/karaoke_finalise/karaoke_finalise.py +1833 -0
  15. karaoke_gen/karaoke_gen.py +1026 -0
  16. karaoke_gen/lyrics_processor.py +474 -0
  17. karaoke_gen/metadata.py +160 -0
  18. karaoke_gen/pipeline/__init__.py +87 -0
  19. karaoke_gen/pipeline/base.py +215 -0
  20. karaoke_gen/pipeline/context.py +230 -0
  21. karaoke_gen/pipeline/executors/__init__.py +21 -0
  22. karaoke_gen/pipeline/executors/local.py +159 -0
  23. karaoke_gen/pipeline/executors/remote.py +257 -0
  24. karaoke_gen/pipeline/stages/__init__.py +27 -0
  25. karaoke_gen/pipeline/stages/finalize.py +202 -0
  26. karaoke_gen/pipeline/stages/render.py +165 -0
  27. karaoke_gen/pipeline/stages/screens.py +139 -0
  28. karaoke_gen/pipeline/stages/separation.py +191 -0
  29. karaoke_gen/pipeline/stages/transcription.py +191 -0
  30. karaoke_gen/resources/AvenirNext-Bold.ttf +0 -0
  31. karaoke_gen/resources/Montserrat-Bold.ttf +0 -0
  32. karaoke_gen/resources/Oswald-Bold.ttf +0 -0
  33. karaoke_gen/resources/Oswald-SemiBold.ttf +0 -0
  34. karaoke_gen/resources/Zurich_Cn_BT_Bold.ttf +0 -0
  35. karaoke_gen/style_loader.py +531 -0
  36. karaoke_gen/utils/__init__.py +18 -0
  37. karaoke_gen/utils/bulk_cli.py +492 -0
  38. karaoke_gen/utils/cli_args.py +432 -0
  39. karaoke_gen/utils/gen_cli.py +978 -0
  40. karaoke_gen/utils/remote_cli.py +3268 -0
  41. karaoke_gen/video_background_processor.py +351 -0
  42. karaoke_gen/video_generator.py +424 -0
  43. karaoke_gen-0.75.54.dist-info/METADATA +718 -0
  44. karaoke_gen-0.75.54.dist-info/RECORD +287 -0
  45. karaoke_gen-0.75.54.dist-info/WHEEL +4 -0
  46. karaoke_gen-0.75.54.dist-info/entry_points.txt +5 -0
  47. karaoke_gen-0.75.54.dist-info/licenses/LICENSE +21 -0
  48. lyrics_transcriber/__init__.py +10 -0
  49. lyrics_transcriber/cli/__init__.py +0 -0
  50. lyrics_transcriber/cli/cli_main.py +285 -0
  51. lyrics_transcriber/core/__init__.py +0 -0
  52. lyrics_transcriber/core/config.py +50 -0
  53. lyrics_transcriber/core/controller.py +594 -0
  54. lyrics_transcriber/correction/__init__.py +0 -0
  55. lyrics_transcriber/correction/agentic/__init__.py +9 -0
  56. lyrics_transcriber/correction/agentic/adapter.py +71 -0
  57. lyrics_transcriber/correction/agentic/agent.py +313 -0
  58. lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
  59. lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
  60. lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
  61. lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
  62. lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
  63. lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
  64. lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
  65. lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
  66. lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
  67. lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
  68. lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
  69. lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
  70. lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
  71. lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
  72. lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
  73. lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
  74. lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
  75. lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
  76. lyrics_transcriber/correction/agentic/models/enums.py +38 -0
  77. lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
  78. lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
  79. lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
  80. lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
  81. lyrics_transcriber/correction/agentic/models/utils.py +19 -0
  82. lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
  83. lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
  84. lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
  85. lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
  86. lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
  87. lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
  88. lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
  89. lyrics_transcriber/correction/agentic/providers/base.py +36 -0
  90. lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
  91. lyrics_transcriber/correction/agentic/providers/config.py +73 -0
  92. lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
  93. lyrics_transcriber/correction/agentic/providers/health.py +28 -0
  94. lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
  95. lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
  96. lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
  97. lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
  98. lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
  99. lyrics_transcriber/correction/agentic/router.py +35 -0
  100. lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
  101. lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
  102. lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
  103. lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
  104. lyrics_transcriber/correction/anchor_sequence.py +919 -0
  105. lyrics_transcriber/correction/corrector.py +760 -0
  106. lyrics_transcriber/correction/feedback/__init__.py +2 -0
  107. lyrics_transcriber/correction/feedback/schemas.py +107 -0
  108. lyrics_transcriber/correction/feedback/store.py +236 -0
  109. lyrics_transcriber/correction/handlers/__init__.py +0 -0
  110. lyrics_transcriber/correction/handlers/base.py +52 -0
  111. lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
  112. lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
  113. lyrics_transcriber/correction/handlers/llm.py +293 -0
  114. lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
  115. lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
  116. lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
  117. lyrics_transcriber/correction/handlers/repeat.py +88 -0
  118. lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
  119. lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
  120. lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
  121. lyrics_transcriber/correction/handlers/word_operations.py +187 -0
  122. lyrics_transcriber/correction/operations.py +352 -0
  123. lyrics_transcriber/correction/phrase_analyzer.py +435 -0
  124. lyrics_transcriber/correction/text_utils.py +30 -0
  125. lyrics_transcriber/frontend/.gitignore +23 -0
  126. lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
  127. lyrics_transcriber/frontend/.yarnrc.yml +3 -0
  128. lyrics_transcriber/frontend/README.md +50 -0
  129. lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
  130. lyrics_transcriber/frontend/__init__.py +25 -0
  131. lyrics_transcriber/frontend/eslint.config.js +28 -0
  132. lyrics_transcriber/frontend/index.html +18 -0
  133. lyrics_transcriber/frontend/package.json +42 -0
  134. lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
  135. lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
  136. lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
  137. lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
  138. lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
  139. lyrics_transcriber/frontend/public/favicon.ico +0 -0
  140. lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
  141. lyrics_transcriber/frontend/src/App.tsx +214 -0
  142. lyrics_transcriber/frontend/src/api.ts +254 -0
  143. lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
  144. lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
  145. lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
  146. lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
  147. lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
  148. lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
  149. lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
  150. lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
  151. lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
  152. lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
  153. lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
  154. lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
  155. lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
  156. lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
  157. lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
  158. lyrics_transcriber/frontend/src/components/Header.tsx +413 -0
  159. lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1387 -0
  160. lyrics_transcriber/frontend/src/components/LyricsSynchronizer/SyncControls.tsx +185 -0
  161. lyrics_transcriber/frontend/src/components/LyricsSynchronizer/TimelineCanvas.tsx +704 -0
  162. lyrics_transcriber/frontend/src/components/LyricsSynchronizer/UpcomingWordsBar.tsx +80 -0
  163. lyrics_transcriber/frontend/src/components/LyricsSynchronizer/index.tsx +905 -0
  164. lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
  165. lyrics_transcriber/frontend/src/components/ModeSelectionModal.tsx +127 -0
  166. lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
  167. lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
  168. lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
  169. lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
  170. lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +336 -0
  171. lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
  172. lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
  173. lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
  174. lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
  175. lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
  176. lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
  177. lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
  178. lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
  179. lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
  180. lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
  181. lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
  182. lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
  183. lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
  184. lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
  185. lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
  186. lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
  187. lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
  188. lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
  189. lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
  190. lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
  191. lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
  192. lyrics_transcriber/frontend/src/main.tsx +17 -0
  193. lyrics_transcriber/frontend/src/theme.ts +177 -0
  194. lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
  195. lyrics_transcriber/frontend/src/types.js +2 -0
  196. lyrics_transcriber/frontend/src/types.ts +199 -0
  197. lyrics_transcriber/frontend/src/validation.ts +132 -0
  198. lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
  199. lyrics_transcriber/frontend/tsconfig.app.json +26 -0
  200. lyrics_transcriber/frontend/tsconfig.json +25 -0
  201. lyrics_transcriber/frontend/tsconfig.node.json +23 -0
  202. lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
  203. lyrics_transcriber/frontend/update_version.js +11 -0
  204. lyrics_transcriber/frontend/vite.config.d.ts +2 -0
  205. lyrics_transcriber/frontend/vite.config.js +10 -0
  206. lyrics_transcriber/frontend/vite.config.ts +11 -0
  207. lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
  208. lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
  209. lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
  210. lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js +43288 -0
  211. lyrics_transcriber/frontend/web_assets/assets/index-BECn1o8Q.js.map +1 -0
  212. lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
  213. lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
  214. lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
  215. lyrics_transcriber/frontend/web_assets/index.html +18 -0
  216. lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
  217. lyrics_transcriber/frontend/yarn.lock +3752 -0
  218. lyrics_transcriber/lyrics/__init__.py +0 -0
  219. lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
  220. lyrics_transcriber/lyrics/file_provider.py +95 -0
  221. lyrics_transcriber/lyrics/genius.py +384 -0
  222. lyrics_transcriber/lyrics/lrclib.py +231 -0
  223. lyrics_transcriber/lyrics/musixmatch.py +156 -0
  224. lyrics_transcriber/lyrics/spotify.py +290 -0
  225. lyrics_transcriber/lyrics/user_input_provider.py +44 -0
  226. lyrics_transcriber/output/__init__.py +0 -0
  227. lyrics_transcriber/output/ass/__init__.py +21 -0
  228. lyrics_transcriber/output/ass/ass.py +2088 -0
  229. lyrics_transcriber/output/ass/ass_specs.txt +732 -0
  230. lyrics_transcriber/output/ass/config.py +180 -0
  231. lyrics_transcriber/output/ass/constants.py +23 -0
  232. lyrics_transcriber/output/ass/event.py +94 -0
  233. lyrics_transcriber/output/ass/formatters.py +132 -0
  234. lyrics_transcriber/output/ass/lyrics_line.py +265 -0
  235. lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
  236. lyrics_transcriber/output/ass/section_detector.py +89 -0
  237. lyrics_transcriber/output/ass/section_screen.py +106 -0
  238. lyrics_transcriber/output/ass/style.py +187 -0
  239. lyrics_transcriber/output/cdg.py +619 -0
  240. lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
  241. lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
  242. lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
  243. lyrics_transcriber/output/cdgmaker/config.py +151 -0
  244. lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
  245. lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
  246. lyrics_transcriber/output/cdgmaker/pack.py +507 -0
  247. lyrics_transcriber/output/cdgmaker/render.py +346 -0
  248. lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
  249. lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
  250. lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
  251. lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
  252. lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
  253. lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
  254. lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
  255. lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
  256. lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
  257. lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
  258. lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
  259. lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
  260. lyrics_transcriber/output/cdgmaker/utils.py +132 -0
  261. lyrics_transcriber/output/countdown_processor.py +306 -0
  262. lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
  263. lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
  264. lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
  265. lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
  266. lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
  267. lyrics_transcriber/output/fonts/arial.ttf +0 -0
  268. lyrics_transcriber/output/fonts/georgia.ttf +0 -0
  269. lyrics_transcriber/output/fonts/verdana.ttf +0 -0
  270. lyrics_transcriber/output/generator.py +257 -0
  271. lyrics_transcriber/output/lrc_to_cdg.py +61 -0
  272. lyrics_transcriber/output/lyrics_file.py +102 -0
  273. lyrics_transcriber/output/plain_text.py +96 -0
  274. lyrics_transcriber/output/segment_resizer.py +431 -0
  275. lyrics_transcriber/output/subtitles.py +397 -0
  276. lyrics_transcriber/output/video.py +544 -0
  277. lyrics_transcriber/review/__init__.py +0 -0
  278. lyrics_transcriber/review/server.py +676 -0
  279. lyrics_transcriber/storage/__init__.py +0 -0
  280. lyrics_transcriber/storage/dropbox.py +225 -0
  281. lyrics_transcriber/transcribers/__init__.py +0 -0
  282. lyrics_transcriber/transcribers/audioshake.py +379 -0
  283. lyrics_transcriber/transcribers/base_transcriber.py +157 -0
  284. lyrics_transcriber/transcribers/whisper.py +330 -0
  285. lyrics_transcriber/types.py +650 -0
  286. lyrics_transcriber/utils/__init__.py +0 -0
  287. lyrics_transcriber/utils/word_utils.py +27 -0
@@ -0,0 +1,435 @@
1
+ import { useState, useCallback, useEffect, useRef } from 'react'
2
+ import { LyricsSegment, Word } from '../types'
3
+
4
+ interface UseManualSyncProps {
5
+ editedSegment: LyricsSegment | null
6
+ currentTime: number
7
+ onPlaySegment?: (startTime: number) => void
8
+ updateSegment: (words: Word[]) => void
9
+ }
10
+
11
+ // Constants for tap detection
12
+ const TAP_THRESHOLD_MS = 200 // If spacebar is pressed for less than this time, it's considered a tap
13
+ const DEFAULT_WORD_DURATION = 0.5 // Default duration in seconds when tapping (500ms)
14
+ const OVERLAP_BUFFER = 0.01 // Buffer to prevent word overlap (10ms)
15
+
16
+ export default function useManualSync({
17
+ editedSegment,
18
+ currentTime,
19
+ onPlaySegment,
20
+ updateSegment
21
+ }: UseManualSyncProps) {
22
+ const [isManualSyncing, setIsManualSyncing] = useState(false)
23
+ const [isPaused, setIsPaused] = useState(false)
24
+ const [syncWordIndex, setSyncWordIndex] = useState<number>(-1)
25
+ const currentTimeRef = useRef(currentTime)
26
+ const [isSpacebarPressed, setIsSpacebarPressed] = useState(false)
27
+ const wordStartTimeRef = useRef<number | null>(null)
28
+ const wordsRef = useRef<Word[]>([])
29
+ const spacebarPressTimeRef = useRef<number | null>(null)
30
+
31
+ // Use ref to track if we need to update segment to avoid calling it too frequently
32
+ const needsSegmentUpdateRef = useRef(false)
33
+
34
+ // Keep currentTimeRef up to date
35
+ useEffect(() => {
36
+ currentTimeRef.current = currentTime
37
+ }, [currentTime])
38
+
39
+ // Keep wordsRef up to date
40
+ useEffect(() => {
41
+ if (editedSegment) {
42
+ wordsRef.current = [...editedSegment.words]
43
+ }
44
+ }, [editedSegment])
45
+
46
+ // Debounced segment update to batch multiple word changes
47
+ useEffect(() => {
48
+ if (needsSegmentUpdateRef.current) {
49
+ needsSegmentUpdateRef.current = false
50
+ updateSegment(wordsRef.current)
51
+ }
52
+ }, [updateSegment, syncWordIndex]) // Only update when syncWordIndex changes
53
+
54
+ const cleanupManualSync = useCallback(() => {
55
+ setIsManualSyncing(false)
56
+ setIsPaused(false)
57
+ setSyncWordIndex(-1)
58
+ setIsSpacebarPressed(false)
59
+ wordStartTimeRef.current = null
60
+ spacebarPressTimeRef.current = null
61
+ needsSegmentUpdateRef.current = false
62
+
63
+ // Stop audio playback when cleaning up manual sync
64
+ if (window.toggleAudioPlayback && window.isAudioPlaying) {
65
+ window.toggleAudioPlayback()
66
+ }
67
+ }, [])
68
+
69
+ const pauseManualSync = useCallback(() => {
70
+ if (isManualSyncing && !isPaused) {
71
+ console.log('useManualSync - Pausing manual sync')
72
+ setIsPaused(true)
73
+ // Pause audio playback
74
+ if (window.toggleAudioPlayback && window.isAudioPlaying) {
75
+ window.toggleAudioPlayback()
76
+ }
77
+ }
78
+ }, [isManualSyncing, isPaused])
79
+
80
+ const resumeManualSync = useCallback(() => {
81
+ if (isManualSyncing && isPaused) {
82
+ console.log('useManualSync - Resuming manual sync')
83
+ setIsPaused(false)
84
+
85
+ // Find the first unsynced word and resume from there
86
+ if (editedSegment) {
87
+ const firstUnsyncedIndex = editedSegment.words.findIndex(word =>
88
+ word.start_time === null || word.end_time === null
89
+ )
90
+
91
+ if (firstUnsyncedIndex !== -1 && firstUnsyncedIndex !== syncWordIndex) {
92
+ console.log('useManualSync - Resuming from first unsynced word', {
93
+ previousIndex: syncWordIndex,
94
+ newIndex: firstUnsyncedIndex,
95
+ wordText: editedSegment.words[firstUnsyncedIndex]?.text
96
+ })
97
+ setSyncWordIndex(firstUnsyncedIndex)
98
+ } else {
99
+ console.log('useManualSync - Resuming from current position', { syncWordIndex })
100
+ }
101
+ }
102
+
103
+ // Resume audio playback if we have an onPlaySegment function
104
+ if (onPlaySegment && currentTimeRef.current !== undefined) {
105
+ onPlaySegment(currentTimeRef.current)
106
+ }
107
+ }
108
+ }, [isManualSyncing, isPaused, onPlaySegment, editedSegment, syncWordIndex])
109
+
110
+ const handleKeyDown = useCallback((e: KeyboardEvent) => {
111
+ if (e.code !== 'Space') return
112
+
113
+ console.log('useManualSync - Spacebar pressed down', {
114
+ isManualSyncing,
115
+ hasEditedSegment: !!editedSegment,
116
+ syncWordIndex,
117
+ currentTime: currentTimeRef.current
118
+ })
119
+
120
+ e.preventDefault()
121
+ e.stopPropagation()
122
+
123
+ if (isManualSyncing && editedSegment && !isSpacebarPressed && !isPaused) {
124
+ setIsSpacebarPressed(true)
125
+
126
+ // Record the start time of the current word
127
+ wordStartTimeRef.current = currentTimeRef.current
128
+
129
+ // Record when the spacebar was pressed (for tap detection)
130
+ spacebarPressTimeRef.current = Date.now()
131
+
132
+ // Update the word's start time immediately
133
+ if (syncWordIndex < editedSegment.words.length) {
134
+ const newWords = [...wordsRef.current]
135
+ const currentWord = newWords[syncWordIndex]
136
+ const currentStartTime = currentTimeRef.current
137
+
138
+ // Set the start time for the current word
139
+ currentWord.start_time = currentStartTime
140
+
141
+ // Handle the end time of the previous word (if it exists)
142
+ if (syncWordIndex > 0) {
143
+ const previousWord = newWords[syncWordIndex - 1]
144
+ if (previousWord.start_time !== null) {
145
+ const timeSincePreviousStart = currentStartTime - previousWord.start_time
146
+
147
+ // Only adjust previous word's end time if:
148
+ // 1. It doesn't have an end time set yet (was never released), OR
149
+ // 2. The current start would overlap with existing end time
150
+ const needsAdjustment = previousWord.end_time === null ||
151
+ (previousWord.end_time !== null && previousWord.end_time > currentStartTime)
152
+
153
+ if (needsAdjustment) {
154
+ if (timeSincePreviousStart > 1.0) {
155
+ // Gap of over 1 second - set previous word's end time to 500ms after its start
156
+ previousWord.end_time = previousWord.start_time + 0.5
157
+ console.log('useManualSync - Gap detected, setting previous word end time to +500ms', {
158
+ previousWordIndex: syncWordIndex - 1,
159
+ previousWordText: previousWord.text,
160
+ previousStartTime: previousWord.start_time,
161
+ previousEndTime: previousWord.end_time,
162
+ gap: timeSincePreviousStart.toFixed(2) + 's',
163
+ reason: 'gap > 1s'
164
+ })
165
+ } else {
166
+ // Normal flow - set previous word's end time to current word's start time minus 5ms
167
+ previousWord.end_time = currentStartTime - 0.005
168
+ console.log('useManualSync - Setting previous word end time to current start - 5ms', {
169
+ previousWordIndex: syncWordIndex - 1,
170
+ previousWordText: previousWord.text,
171
+ previousEndTime: previousWord.end_time,
172
+ currentStartTime: currentStartTime,
173
+ gap: timeSincePreviousStart.toFixed(2) + 's',
174
+ reason: 'normal flow'
175
+ })
176
+ }
177
+ } else {
178
+ console.log('useManualSync - Preserving previous word timing (manually set)', {
179
+ previousWordIndex: syncWordIndex - 1,
180
+ previousWordText: previousWord.text,
181
+ previousStartTime: previousWord.start_time,
182
+ previousEndTime: previousWord.end_time,
183
+ preservedDuration: previousWord.end_time !== null ?
184
+ (previousWord.end_time - previousWord.start_time).toFixed(2) + 's' : 'N/A',
185
+ reason: 'already timed correctly'
186
+ })
187
+ }
188
+ }
189
+ }
190
+
191
+ console.log('useManualSync - Recording word start time', {
192
+ wordIndex: syncWordIndex,
193
+ wordText: currentWord?.text,
194
+ time: currentStartTime
195
+ })
196
+
197
+ // Update our ref
198
+ wordsRef.current = newWords
199
+
200
+ // Mark that we need to update the segment
201
+ needsSegmentUpdateRef.current = true
202
+ }
203
+ } else if (!isManualSyncing && editedSegment && onPlaySegment) {
204
+ console.log('useManualSync - Handling segment playback', {
205
+ editedSegmentId: editedSegment.id,
206
+ isGlobalReplacement: editedSegment.id === 'global-replacement'
207
+ })
208
+
209
+ // For global replacement segments, don't handle general playback
210
+ // since we want the user to use Manual Sync instead
211
+ if (editedSegment.id === 'global-replacement') {
212
+ console.log('useManualSync - Ignoring playback for global replacement - please use Manual Sync')
213
+ return
214
+ }
215
+
216
+ // Toggle segment playback when not in manual sync mode
217
+ const startTime = editedSegment.start_time ?? 0
218
+ const endTime = editedSegment.end_time ?? 0
219
+
220
+ if (currentTimeRef.current >= startTime && currentTimeRef.current <= endTime) {
221
+ if (window.toggleAudioPlayback) {
222
+ window.toggleAudioPlayback()
223
+ }
224
+ } else {
225
+ onPlaySegment(startTime)
226
+ }
227
+ }
228
+ }, [isManualSyncing, editedSegment, syncWordIndex, onPlaySegment, isSpacebarPressed, isPaused])
229
+
230
+ const handleKeyUp = useCallback((e: KeyboardEvent) => {
231
+ if (e.code !== 'Space') return
232
+
233
+ console.log('useManualSync - Spacebar released', {
234
+ isManualSyncing,
235
+ hasEditedSegment: !!editedSegment,
236
+ syncWordIndex,
237
+ currentTime: currentTimeRef.current,
238
+ wordStartTime: wordStartTimeRef.current
239
+ })
240
+
241
+ e.preventDefault()
242
+ e.stopPropagation()
243
+
244
+ if (isManualSyncing && editedSegment && isSpacebarPressed && !isPaused) {
245
+ const currentWord = syncWordIndex < editedSegment.words.length ? editedSegment.words[syncWordIndex] : null
246
+ const pressDuration = spacebarPressTimeRef.current ? Date.now() - spacebarPressTimeRef.current : 0
247
+ const isTap = pressDuration < TAP_THRESHOLD_MS
248
+
249
+ console.log('useManualSync - Recording word end time', {
250
+ wordIndex: syncWordIndex,
251
+ wordText: currentWord?.text,
252
+ startTime: wordStartTimeRef.current,
253
+ endTime: currentTimeRef.current,
254
+ pressDuration: `${pressDuration}ms`,
255
+ isTap,
256
+ tapThreshold: TAP_THRESHOLD_MS,
257
+ duration: currentWord ? (currentTimeRef.current - (wordStartTimeRef.current || 0)).toFixed(2) + 's' : 'N/A'
258
+ })
259
+
260
+ setIsSpacebarPressed(false)
261
+
262
+ if (syncWordIndex < editedSegment.words.length) {
263
+ const newWords = [...wordsRef.current]
264
+ const currentWord = newWords[syncWordIndex]
265
+
266
+ // Set the end time for the current word based on whether it was a tap or hold
267
+ if (isTap) {
268
+ // For a tap, set a default duration
269
+ const defaultEndTime = (wordStartTimeRef.current || currentTimeRef.current) + DEFAULT_WORD_DURATION
270
+ currentWord.end_time = defaultEndTime
271
+ console.log('useManualSync - Tap detected, setting default duration', {
272
+ wordText: currentWord.text,
273
+ startTime: wordStartTimeRef.current,
274
+ defaultEndTime,
275
+ duration: DEFAULT_WORD_DURATION
276
+ })
277
+ } else {
278
+ // For a hold, use the current time as the end time
279
+ currentWord.end_time = currentTimeRef.current
280
+ console.log('useManualSync - Hold detected, using actual timing', {
281
+ wordText: currentWord.text,
282
+ startTime: wordStartTimeRef.current,
283
+ endTime: currentTimeRef.current,
284
+ actualDuration: (currentTimeRef.current - (wordStartTimeRef.current || 0)).toFixed(2) + 's'
285
+ })
286
+ }
287
+
288
+ // Update our ref
289
+ wordsRef.current = newWords
290
+
291
+ // Move to the next word
292
+ if (syncWordIndex === editedSegment.words.length - 1) {
293
+ // If this was the last word, finish manual sync
294
+ console.log('useManualSync - Completed manual sync for all words')
295
+ setIsManualSyncing(false)
296
+ setSyncWordIndex(-1)
297
+ wordStartTimeRef.current = null
298
+ spacebarPressTimeRef.current = null
299
+ } else {
300
+ // Otherwise, move to the next word
301
+ const nextWord = editedSegment.words[syncWordIndex + 1]
302
+ console.log('useManualSync - Moving to next word', {
303
+ nextWordIndex: syncWordIndex + 1,
304
+ nextWordText: nextWord?.text
305
+ })
306
+ setSyncWordIndex(syncWordIndex + 1)
307
+ }
308
+
309
+ // Mark that we need to update the segment
310
+ needsSegmentUpdateRef.current = true
311
+ }
312
+ }
313
+ }, [isManualSyncing, editedSegment, syncWordIndex, isSpacebarPressed, isPaused])
314
+
315
+ // Add a handler for when the next word starts to adjust previous word's end time if needed
316
+ useEffect(() => {
317
+ if (isManualSyncing && editedSegment && syncWordIndex > 0) {
318
+ const newWords = [...wordsRef.current]
319
+ const prevWord = newWords[syncWordIndex - 1]
320
+ const currentWord = newWords[syncWordIndex]
321
+
322
+ // If the previous word's end time overlaps with the current word's start time,
323
+ // adjust the previous word's end time
324
+ if (prevWord && currentWord &&
325
+ prevWord.end_time !== null && currentWord.start_time !== null &&
326
+ prevWord.end_time > currentWord.start_time) {
327
+
328
+ console.log('useManualSync - Adjusting previous word end time to prevent overlap', {
329
+ prevWordIndex: syncWordIndex - 1,
330
+ prevWordText: prevWord.text,
331
+ prevWordEndTime: prevWord.end_time,
332
+ currentWordStartTime: currentWord.start_time,
333
+ newEndTime: currentWord.start_time - OVERLAP_BUFFER
334
+ })
335
+
336
+ prevWord.end_time = currentWord.start_time - OVERLAP_BUFFER
337
+
338
+ // Update our ref
339
+ wordsRef.current = newWords
340
+
341
+ // Mark that we need to update the segment
342
+ needsSegmentUpdateRef.current = true
343
+ }
344
+ }
345
+ }, [syncWordIndex, isManualSyncing, editedSegment])
346
+
347
+ // Combine the key handlers into a single function for external use
348
+ const handleSpacebar = useCallback((e: KeyboardEvent) => {
349
+ if (e.type === 'keydown') {
350
+ handleKeyDown(e)
351
+ } else if (e.type === 'keyup') {
352
+ handleKeyUp(e)
353
+ }
354
+ }, [handleKeyDown, handleKeyUp])
355
+
356
+ const startManualSync = useCallback(() => {
357
+ if (isManualSyncing) {
358
+ cleanupManualSync()
359
+ return
360
+ }
361
+
362
+ if (!editedSegment || !onPlaySegment) return
363
+
364
+ // Make sure we have the latest words
365
+ wordsRef.current = [...editedSegment.words]
366
+
367
+ // Find the first unsynced word to start from
368
+ const firstUnsyncedIndex = editedSegment.words.findIndex(word =>
369
+ word.start_time === null || word.end_time === null
370
+ )
371
+
372
+ const startIndex = firstUnsyncedIndex !== -1 ? firstUnsyncedIndex : 0
373
+
374
+ console.log('useManualSync - Starting manual sync', {
375
+ totalWords: editedSegment.words.length,
376
+ startingFromIndex: startIndex,
377
+ startingWord: editedSegment.words[startIndex]?.text
378
+ })
379
+
380
+ setIsManualSyncing(true)
381
+ setSyncWordIndex(startIndex)
382
+ setIsSpacebarPressed(false)
383
+ wordStartTimeRef.current = null
384
+ spacebarPressTimeRef.current = null
385
+ needsSegmentUpdateRef.current = false
386
+ // Start playing 3 seconds before segment start
387
+ onPlaySegment((editedSegment.start_time ?? 0) - 3)
388
+ }, [isManualSyncing, editedSegment, onPlaySegment, cleanupManualSync])
389
+
390
+ // Auto-stop sync if we go past the end time (but not for global replacement segments)
391
+ useEffect(() => {
392
+ if (!editedSegment || !isManualSyncing) return
393
+
394
+ // Don't auto-stop for global replacement segments - let user manually finish
395
+ if (editedSegment.id === 'global-replacement') {
396
+ console.log('useManualSync - Skipping auto-stop for global replacement segment')
397
+ return
398
+ }
399
+
400
+ // Set up an interval to check if we should auto-stop
401
+ const checkAutoStop = () => {
402
+ const endTime = editedSegment.end_time ?? 0
403
+
404
+ if (window.isAudioPlaying && currentTimeRef.current > endTime) {
405
+ console.log('useManualSync - Auto-stopping: current time exceeded end time', {
406
+ currentTime: currentTimeRef.current,
407
+ endTime,
408
+ segmentId: editedSegment.id
409
+ })
410
+ window.toggleAudioPlayback?.()
411
+ cleanupManualSync()
412
+ }
413
+ }
414
+
415
+ // Check immediately and then every 100ms
416
+ checkAutoStop()
417
+ const intervalId = setInterval(checkAutoStop, 100)
418
+
419
+ return () => {
420
+ clearInterval(intervalId)
421
+ }
422
+ }, [isManualSyncing, editedSegment, cleanupManualSync])
423
+
424
+ return {
425
+ isManualSyncing,
426
+ isPaused,
427
+ syncWordIndex,
428
+ startManualSync,
429
+ pauseManualSync,
430
+ resumeManualSync,
431
+ cleanupManualSync,
432
+ handleSpacebar,
433
+ isSpacebarPressed
434
+ }
435
+ }
@@ -0,0 +1,17 @@
1
+ import ReactDOM from 'react-dom/client'
2
+ import { ThemeProvider } from '@mui/material/styles'
3
+ import CssBaseline from '@mui/material/CssBaseline'
4
+ import App from './App'
5
+ import theme from './theme'
6
+ // Import version from package.json
7
+ import packageJson from '../package.json'
8
+
9
+ // Log the frontend version when the app loads
10
+ console.log(`🎵 Lyrics Transcriber Frontend v${packageJson.version}`)
11
+
12
+ ReactDOM.createRoot(document.getElementById('root')!).render(
13
+ <ThemeProvider theme={theme}>
14
+ <CssBaseline />
15
+ <App />
16
+ </ThemeProvider>
17
+ )
@@ -0,0 +1,177 @@
1
+ import { createTheme } from '@mui/material/styles';
2
+
3
+ // Create a theme with smaller typography and spacing
4
+ const theme = createTheme({
5
+ typography: {
6
+ // Scale down all typography by about 20%
7
+ fontSize: 14, // Default is 16
8
+ h1: {
9
+ fontSize: '2.5rem', // Default is ~3rem
10
+ },
11
+ h2: {
12
+ fontSize: '2rem', // Default is ~2.5rem
13
+ },
14
+ h3: {
15
+ fontSize: '1.5rem', // Default is ~1.75rem
16
+ },
17
+ h4: {
18
+ fontSize: '1.2rem', // Default is ~1.5rem
19
+ marginBottom: '0.5rem',
20
+ },
21
+ h5: {
22
+ fontSize: '1rem', // Default is ~1.25rem
23
+ },
24
+ h6: {
25
+ fontSize: '0.9rem', // Default is ~1.1rem
26
+ marginBottom: '0.5rem',
27
+ },
28
+ body1: {
29
+ fontSize: '0.85rem', // Default is ~1rem
30
+ },
31
+ body2: {
32
+ fontSize: '0.75rem', // Default is ~0.875rem
33
+ },
34
+ button: {
35
+ fontSize: '0.8rem', // Default is ~0.875rem
36
+ },
37
+ caption: {
38
+ fontSize: '0.7rem', // Default is ~0.75rem
39
+ },
40
+ },
41
+ components: {
42
+ MuiButton: {
43
+ styleOverrides: {
44
+ root: {
45
+ padding: '3px 10px', // Further reduced from 4px 12px
46
+ minHeight: '30px', // Further reduced from 32px
47
+ },
48
+ sizeSmall: {
49
+ padding: '1px 6px', // Further reduced from 2px 8px
50
+ minHeight: '24px', // Further reduced from 28px
51
+ },
52
+ },
53
+ },
54
+ MuiIconButton: {
55
+ styleOverrides: {
56
+ root: {
57
+ padding: '4px', // Further reduced from 6px
58
+ },
59
+ sizeSmall: {
60
+ padding: '2px', // Further reduced from 4px
61
+ },
62
+ },
63
+ },
64
+ MuiTextField: {
65
+ styleOverrides: {
66
+ root: {
67
+ '& .MuiInputBase-root': {
68
+ minHeight: '32px', // Further reduced from 36px
69
+ },
70
+ },
71
+ },
72
+ },
73
+ MuiDialog: {
74
+ styleOverrides: {
75
+ paper: {
76
+ padding: '8px', // Further reduced from 12px
77
+ },
78
+ },
79
+ },
80
+ MuiDialogTitle: {
81
+ styleOverrides: {
82
+ root: {
83
+ padding: '8px 12px', // Further reduced from 12px 16px
84
+ },
85
+ },
86
+ },
87
+ MuiDialogContent: {
88
+ styleOverrides: {
89
+ root: {
90
+ padding: '6px 12px', // Further reduced from 8px 16px
91
+ },
92
+ },
93
+ },
94
+ MuiDialogActions: {
95
+ styleOverrides: {
96
+ root: {
97
+ padding: '6px 12px', // Further reduced from 8px 16px
98
+ },
99
+ },
100
+ },
101
+ MuiPaper: {
102
+ styleOverrides: {
103
+ root: {
104
+ padding: '8px', // Further reduced from 12px
105
+ },
106
+ },
107
+ },
108
+ MuiList: {
109
+ styleOverrides: {
110
+ root: {
111
+ padding: '2px 0', // Further reduced from 4px 0
112
+ },
113
+ },
114
+ },
115
+ MuiListItem: {
116
+ styleOverrides: {
117
+ root: {
118
+ padding: '2px 8px', // Further reduced from 4px 12px
119
+ },
120
+ },
121
+ },
122
+ MuiTableCell: {
123
+ styleOverrides: {
124
+ root: {
125
+ padding: '4px 8px', // Further reduced from 8px 12px
126
+ },
127
+ },
128
+ },
129
+ MuiCard: {
130
+ styleOverrides: {
131
+ root: {
132
+ padding: '8px',
133
+ },
134
+ },
135
+ },
136
+ MuiCardContent: {
137
+ styleOverrides: {
138
+ root: {
139
+ padding: '8px',
140
+ '&:last-child': {
141
+ paddingBottom: '8px',
142
+ },
143
+ },
144
+ },
145
+ },
146
+ MuiCardHeader: {
147
+ styleOverrides: {
148
+ root: {
149
+ padding: '8px',
150
+ },
151
+ },
152
+ },
153
+ MuiCardActions: {
154
+ styleOverrides: {
155
+ root: {
156
+ padding: '4px 8px',
157
+ },
158
+ },
159
+ },
160
+ MuiGrid: {
161
+ styleOverrides: {
162
+ container: {
163
+ marginTop: '-4px',
164
+ marginLeft: '-4px',
165
+ width: 'calc(100% + 8px)',
166
+ },
167
+ item: {
168
+ paddingTop: '4px',
169
+ paddingLeft: '4px',
170
+ },
171
+ },
172
+ },
173
+ },
174
+ spacing: (factor: number) => `${0.6 * factor}rem`, // Further reduced from 0.8 * factor
175
+ });
176
+
177
+ export default theme;
@@ -0,0 +1,9 @@
1
+ declare global {
2
+ interface Window {
3
+ toggleAudioPlayback?: () => void;
4
+ seekAndPlayAudio?: (startTime: number) => void;
5
+ isAudioPlaying?: boolean;
6
+ }
7
+ }
8
+
9
+ export {}
@@ -0,0 +1,2 @@
1
+ "use strict";
2
+ Object.defineProperty(exports, "__esModule", { value: true });