karaoke-gen 0.57.0__py3-none-any.whl → 0.71.27__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (268) hide show
  1. karaoke_gen/audio_fetcher.py +461 -0
  2. karaoke_gen/audio_processor.py +407 -30
  3. karaoke_gen/config.py +62 -113
  4. karaoke_gen/file_handler.py +32 -59
  5. karaoke_gen/karaoke_finalise/karaoke_finalise.py +148 -67
  6. karaoke_gen/karaoke_gen.py +270 -61
  7. karaoke_gen/lyrics_processor.py +13 -1
  8. karaoke_gen/metadata.py +78 -73
  9. karaoke_gen/pipeline/__init__.py +87 -0
  10. karaoke_gen/pipeline/base.py +215 -0
  11. karaoke_gen/pipeline/context.py +230 -0
  12. karaoke_gen/pipeline/executors/__init__.py +21 -0
  13. karaoke_gen/pipeline/executors/local.py +159 -0
  14. karaoke_gen/pipeline/executors/remote.py +257 -0
  15. karaoke_gen/pipeline/stages/__init__.py +27 -0
  16. karaoke_gen/pipeline/stages/finalize.py +202 -0
  17. karaoke_gen/pipeline/stages/render.py +165 -0
  18. karaoke_gen/pipeline/stages/screens.py +139 -0
  19. karaoke_gen/pipeline/stages/separation.py +191 -0
  20. karaoke_gen/pipeline/stages/transcription.py +191 -0
  21. karaoke_gen/style_loader.py +531 -0
  22. karaoke_gen/utils/bulk_cli.py +6 -0
  23. karaoke_gen/utils/cli_args.py +424 -0
  24. karaoke_gen/utils/gen_cli.py +26 -261
  25. karaoke_gen/utils/remote_cli.py +1965 -0
  26. karaoke_gen/video_background_processor.py +351 -0
  27. karaoke_gen-0.71.27.dist-info/METADATA +610 -0
  28. karaoke_gen-0.71.27.dist-info/RECORD +275 -0
  29. {karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/WHEEL +1 -1
  30. {karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info}/entry_points.txt +1 -0
  31. lyrics_transcriber/__init__.py +10 -0
  32. lyrics_transcriber/cli/__init__.py +0 -0
  33. lyrics_transcriber/cli/cli_main.py +285 -0
  34. lyrics_transcriber/core/__init__.py +0 -0
  35. lyrics_transcriber/core/config.py +50 -0
  36. lyrics_transcriber/core/controller.py +520 -0
  37. lyrics_transcriber/correction/__init__.py +0 -0
  38. lyrics_transcriber/correction/agentic/__init__.py +9 -0
  39. lyrics_transcriber/correction/agentic/adapter.py +71 -0
  40. lyrics_transcriber/correction/agentic/agent.py +313 -0
  41. lyrics_transcriber/correction/agentic/feedback/aggregator.py +12 -0
  42. lyrics_transcriber/correction/agentic/feedback/collector.py +17 -0
  43. lyrics_transcriber/correction/agentic/feedback/retention.py +24 -0
  44. lyrics_transcriber/correction/agentic/feedback/store.py +76 -0
  45. lyrics_transcriber/correction/agentic/handlers/__init__.py +24 -0
  46. lyrics_transcriber/correction/agentic/handlers/ambiguous.py +44 -0
  47. lyrics_transcriber/correction/agentic/handlers/background_vocals.py +68 -0
  48. lyrics_transcriber/correction/agentic/handlers/base.py +51 -0
  49. lyrics_transcriber/correction/agentic/handlers/complex_multi_error.py +46 -0
  50. lyrics_transcriber/correction/agentic/handlers/extra_words.py +74 -0
  51. lyrics_transcriber/correction/agentic/handlers/no_error.py +42 -0
  52. lyrics_transcriber/correction/agentic/handlers/punctuation.py +44 -0
  53. lyrics_transcriber/correction/agentic/handlers/registry.py +60 -0
  54. lyrics_transcriber/correction/agentic/handlers/repeated_section.py +44 -0
  55. lyrics_transcriber/correction/agentic/handlers/sound_alike.py +126 -0
  56. lyrics_transcriber/correction/agentic/models/__init__.py +5 -0
  57. lyrics_transcriber/correction/agentic/models/ai_correction.py +31 -0
  58. lyrics_transcriber/correction/agentic/models/correction_session.py +30 -0
  59. lyrics_transcriber/correction/agentic/models/enums.py +38 -0
  60. lyrics_transcriber/correction/agentic/models/human_feedback.py +30 -0
  61. lyrics_transcriber/correction/agentic/models/learning_data.py +26 -0
  62. lyrics_transcriber/correction/agentic/models/observability_metrics.py +28 -0
  63. lyrics_transcriber/correction/agentic/models/schemas.py +46 -0
  64. lyrics_transcriber/correction/agentic/models/utils.py +19 -0
  65. lyrics_transcriber/correction/agentic/observability/__init__.py +5 -0
  66. lyrics_transcriber/correction/agentic/observability/langfuse_integration.py +35 -0
  67. lyrics_transcriber/correction/agentic/observability/metrics.py +46 -0
  68. lyrics_transcriber/correction/agentic/observability/performance.py +19 -0
  69. lyrics_transcriber/correction/agentic/prompts/__init__.py +2 -0
  70. lyrics_transcriber/correction/agentic/prompts/classifier.py +227 -0
  71. lyrics_transcriber/correction/agentic/providers/__init__.py +6 -0
  72. lyrics_transcriber/correction/agentic/providers/base.py +36 -0
  73. lyrics_transcriber/correction/agentic/providers/circuit_breaker.py +145 -0
  74. lyrics_transcriber/correction/agentic/providers/config.py +73 -0
  75. lyrics_transcriber/correction/agentic/providers/constants.py +24 -0
  76. lyrics_transcriber/correction/agentic/providers/health.py +28 -0
  77. lyrics_transcriber/correction/agentic/providers/langchain_bridge.py +212 -0
  78. lyrics_transcriber/correction/agentic/providers/model_factory.py +209 -0
  79. lyrics_transcriber/correction/agentic/providers/response_cache.py +218 -0
  80. lyrics_transcriber/correction/agentic/providers/response_parser.py +111 -0
  81. lyrics_transcriber/correction/agentic/providers/retry_executor.py +127 -0
  82. lyrics_transcriber/correction/agentic/router.py +35 -0
  83. lyrics_transcriber/correction/agentic/workflows/__init__.py +5 -0
  84. lyrics_transcriber/correction/agentic/workflows/consensus_workflow.py +24 -0
  85. lyrics_transcriber/correction/agentic/workflows/correction_graph.py +59 -0
  86. lyrics_transcriber/correction/agentic/workflows/feedback_workflow.py +24 -0
  87. lyrics_transcriber/correction/anchor_sequence.py +1043 -0
  88. lyrics_transcriber/correction/corrector.py +760 -0
  89. lyrics_transcriber/correction/feedback/__init__.py +2 -0
  90. lyrics_transcriber/correction/feedback/schemas.py +107 -0
  91. lyrics_transcriber/correction/feedback/store.py +236 -0
  92. lyrics_transcriber/correction/handlers/__init__.py +0 -0
  93. lyrics_transcriber/correction/handlers/base.py +52 -0
  94. lyrics_transcriber/correction/handlers/extend_anchor.py +149 -0
  95. lyrics_transcriber/correction/handlers/levenshtein.py +189 -0
  96. lyrics_transcriber/correction/handlers/llm.py +293 -0
  97. lyrics_transcriber/correction/handlers/llm_providers.py +60 -0
  98. lyrics_transcriber/correction/handlers/no_space_punct_match.py +154 -0
  99. lyrics_transcriber/correction/handlers/relaxed_word_count_match.py +85 -0
  100. lyrics_transcriber/correction/handlers/repeat.py +88 -0
  101. lyrics_transcriber/correction/handlers/sound_alike.py +259 -0
  102. lyrics_transcriber/correction/handlers/syllables_match.py +252 -0
  103. lyrics_transcriber/correction/handlers/word_count_match.py +80 -0
  104. lyrics_transcriber/correction/handlers/word_operations.py +187 -0
  105. lyrics_transcriber/correction/operations.py +352 -0
  106. lyrics_transcriber/correction/phrase_analyzer.py +435 -0
  107. lyrics_transcriber/correction/text_utils.py +30 -0
  108. lyrics_transcriber/frontend/.gitignore +23 -0
  109. lyrics_transcriber/frontend/.yarn/releases/yarn-4.7.0.cjs +935 -0
  110. lyrics_transcriber/frontend/.yarnrc.yml +3 -0
  111. lyrics_transcriber/frontend/README.md +50 -0
  112. lyrics_transcriber/frontend/REPLACE_ALL_FUNCTIONALITY.md +210 -0
  113. lyrics_transcriber/frontend/__init__.py +25 -0
  114. lyrics_transcriber/frontend/eslint.config.js +28 -0
  115. lyrics_transcriber/frontend/index.html +18 -0
  116. lyrics_transcriber/frontend/package.json +42 -0
  117. lyrics_transcriber/frontend/public/android-chrome-192x192.png +0 -0
  118. lyrics_transcriber/frontend/public/android-chrome-512x512.png +0 -0
  119. lyrics_transcriber/frontend/public/apple-touch-icon.png +0 -0
  120. lyrics_transcriber/frontend/public/favicon-16x16.png +0 -0
  121. lyrics_transcriber/frontend/public/favicon-32x32.png +0 -0
  122. lyrics_transcriber/frontend/public/favicon.ico +0 -0
  123. lyrics_transcriber/frontend/public/nomad-karaoke-logo.png +0 -0
  124. lyrics_transcriber/frontend/src/App.tsx +212 -0
  125. lyrics_transcriber/frontend/src/api.ts +239 -0
  126. lyrics_transcriber/frontend/src/components/AIFeedbackModal.tsx +77 -0
  127. lyrics_transcriber/frontend/src/components/AddLyricsModal.tsx +114 -0
  128. lyrics_transcriber/frontend/src/components/AgenticCorrectionMetrics.tsx +204 -0
  129. lyrics_transcriber/frontend/src/components/AudioPlayer.tsx +180 -0
  130. lyrics_transcriber/frontend/src/components/CorrectedWordWithActions.tsx +167 -0
  131. lyrics_transcriber/frontend/src/components/CorrectionAnnotationModal.tsx +359 -0
  132. lyrics_transcriber/frontend/src/components/CorrectionDetailCard.tsx +281 -0
  133. lyrics_transcriber/frontend/src/components/CorrectionMetrics.tsx +162 -0
  134. lyrics_transcriber/frontend/src/components/DurationTimelineView.tsx +257 -0
  135. lyrics_transcriber/frontend/src/components/EditActionBar.tsx +68 -0
  136. lyrics_transcriber/frontend/src/components/EditModal.tsx +702 -0
  137. lyrics_transcriber/frontend/src/components/EditTimelineSection.tsx +496 -0
  138. lyrics_transcriber/frontend/src/components/EditWordList.tsx +379 -0
  139. lyrics_transcriber/frontend/src/components/FileUpload.tsx +77 -0
  140. lyrics_transcriber/frontend/src/components/FindReplaceModal.tsx +467 -0
  141. lyrics_transcriber/frontend/src/components/Header.tsx +387 -0
  142. lyrics_transcriber/frontend/src/components/LyricsAnalyzer.tsx +1373 -0
  143. lyrics_transcriber/frontend/src/components/MetricsDashboard.tsx +51 -0
  144. lyrics_transcriber/frontend/src/components/ModeSelector.tsx +67 -0
  145. lyrics_transcriber/frontend/src/components/ModelSelector.tsx +23 -0
  146. lyrics_transcriber/frontend/src/components/PreviewVideoSection.tsx +144 -0
  147. lyrics_transcriber/frontend/src/components/ReferenceView.tsx +268 -0
  148. lyrics_transcriber/frontend/src/components/ReplaceAllLyricsModal.tsx +688 -0
  149. lyrics_transcriber/frontend/src/components/ReviewChangesModal.tsx +354 -0
  150. lyrics_transcriber/frontend/src/components/SegmentDetailsModal.tsx +64 -0
  151. lyrics_transcriber/frontend/src/components/TimelineEditor.tsx +376 -0
  152. lyrics_transcriber/frontend/src/components/TimingOffsetModal.tsx +131 -0
  153. lyrics_transcriber/frontend/src/components/TranscriptionView.tsx +256 -0
  154. lyrics_transcriber/frontend/src/components/WordDivider.tsx +187 -0
  155. lyrics_transcriber/frontend/src/components/shared/components/HighlightedText.tsx +379 -0
  156. lyrics_transcriber/frontend/src/components/shared/components/SourceSelector.tsx +56 -0
  157. lyrics_transcriber/frontend/src/components/shared/components/Word.tsx +87 -0
  158. lyrics_transcriber/frontend/src/components/shared/constants.ts +20 -0
  159. lyrics_transcriber/frontend/src/components/shared/hooks/useWordClick.ts +180 -0
  160. lyrics_transcriber/frontend/src/components/shared/styles.ts +13 -0
  161. lyrics_transcriber/frontend/src/components/shared/types.js +2 -0
  162. lyrics_transcriber/frontend/src/components/shared/types.ts +129 -0
  163. lyrics_transcriber/frontend/src/components/shared/utils/keyboardHandlers.ts +177 -0
  164. lyrics_transcriber/frontend/src/components/shared/utils/localStorage.ts +78 -0
  165. lyrics_transcriber/frontend/src/components/shared/utils/referenceLineCalculator.ts +75 -0
  166. lyrics_transcriber/frontend/src/components/shared/utils/segmentOperations.ts +360 -0
  167. lyrics_transcriber/frontend/src/components/shared/utils/timingUtils.ts +110 -0
  168. lyrics_transcriber/frontend/src/components/shared/utils/wordUtils.ts +22 -0
  169. lyrics_transcriber/frontend/src/hooks/useManualSync.ts +435 -0
  170. lyrics_transcriber/frontend/src/main.tsx +17 -0
  171. lyrics_transcriber/frontend/src/theme.ts +177 -0
  172. lyrics_transcriber/frontend/src/types/global.d.ts +9 -0
  173. lyrics_transcriber/frontend/src/types.js +2 -0
  174. lyrics_transcriber/frontend/src/types.ts +199 -0
  175. lyrics_transcriber/frontend/src/validation.ts +132 -0
  176. lyrics_transcriber/frontend/src/vite-env.d.ts +1 -0
  177. lyrics_transcriber/frontend/tsconfig.app.json +26 -0
  178. lyrics_transcriber/frontend/tsconfig.json +25 -0
  179. lyrics_transcriber/frontend/tsconfig.node.json +23 -0
  180. lyrics_transcriber/frontend/tsconfig.tsbuildinfo +1 -0
  181. lyrics_transcriber/frontend/update_version.js +11 -0
  182. lyrics_transcriber/frontend/vite.config.d.ts +2 -0
  183. lyrics_transcriber/frontend/vite.config.js +10 -0
  184. lyrics_transcriber/frontend/vite.config.ts +11 -0
  185. lyrics_transcriber/frontend/web_assets/android-chrome-192x192.png +0 -0
  186. lyrics_transcriber/frontend/web_assets/android-chrome-512x512.png +0 -0
  187. lyrics_transcriber/frontend/web_assets/apple-touch-icon.png +0 -0
  188. lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js +42039 -0
  189. lyrics_transcriber/frontend/web_assets/assets/index-DdJTDWH3.js.map +1 -0
  190. lyrics_transcriber/frontend/web_assets/favicon-16x16.png +0 -0
  191. lyrics_transcriber/frontend/web_assets/favicon-32x32.png +0 -0
  192. lyrics_transcriber/frontend/web_assets/favicon.ico +0 -0
  193. lyrics_transcriber/frontend/web_assets/index.html +18 -0
  194. lyrics_transcriber/frontend/web_assets/nomad-karaoke-logo.png +0 -0
  195. lyrics_transcriber/frontend/yarn.lock +3752 -0
  196. lyrics_transcriber/lyrics/__init__.py +0 -0
  197. lyrics_transcriber/lyrics/base_lyrics_provider.py +211 -0
  198. lyrics_transcriber/lyrics/file_provider.py +95 -0
  199. lyrics_transcriber/lyrics/genius.py +384 -0
  200. lyrics_transcriber/lyrics/lrclib.py +231 -0
  201. lyrics_transcriber/lyrics/musixmatch.py +156 -0
  202. lyrics_transcriber/lyrics/spotify.py +290 -0
  203. lyrics_transcriber/lyrics/user_input_provider.py +44 -0
  204. lyrics_transcriber/output/__init__.py +0 -0
  205. lyrics_transcriber/output/ass/__init__.py +21 -0
  206. lyrics_transcriber/output/ass/ass.py +2088 -0
  207. lyrics_transcriber/output/ass/ass_specs.txt +732 -0
  208. lyrics_transcriber/output/ass/config.py +180 -0
  209. lyrics_transcriber/output/ass/constants.py +23 -0
  210. lyrics_transcriber/output/ass/event.py +94 -0
  211. lyrics_transcriber/output/ass/formatters.py +132 -0
  212. lyrics_transcriber/output/ass/lyrics_line.py +265 -0
  213. lyrics_transcriber/output/ass/lyrics_screen.py +252 -0
  214. lyrics_transcriber/output/ass/section_detector.py +89 -0
  215. lyrics_transcriber/output/ass/section_screen.py +106 -0
  216. lyrics_transcriber/output/ass/style.py +187 -0
  217. lyrics_transcriber/output/cdg.py +619 -0
  218. lyrics_transcriber/output/cdgmaker/__init__.py +0 -0
  219. lyrics_transcriber/output/cdgmaker/cdg.py +262 -0
  220. lyrics_transcriber/output/cdgmaker/composer.py +2260 -0
  221. lyrics_transcriber/output/cdgmaker/config.py +151 -0
  222. lyrics_transcriber/output/cdgmaker/images/instrumental.png +0 -0
  223. lyrics_transcriber/output/cdgmaker/images/intro.png +0 -0
  224. lyrics_transcriber/output/cdgmaker/pack.py +507 -0
  225. lyrics_transcriber/output/cdgmaker/render.py +346 -0
  226. lyrics_transcriber/output/cdgmaker/transitions/centertexttoplogobottomtext.png +0 -0
  227. lyrics_transcriber/output/cdgmaker/transitions/circlein.png +0 -0
  228. lyrics_transcriber/output/cdgmaker/transitions/circleout.png +0 -0
  229. lyrics_transcriber/output/cdgmaker/transitions/fizzle.png +0 -0
  230. lyrics_transcriber/output/cdgmaker/transitions/largecentertexttoplogo.png +0 -0
  231. lyrics_transcriber/output/cdgmaker/transitions/rectangle.png +0 -0
  232. lyrics_transcriber/output/cdgmaker/transitions/spiral.png +0 -0
  233. lyrics_transcriber/output/cdgmaker/transitions/topleftmusicalnotes.png +0 -0
  234. lyrics_transcriber/output/cdgmaker/transitions/wipein.png +0 -0
  235. lyrics_transcriber/output/cdgmaker/transitions/wipeleft.png +0 -0
  236. lyrics_transcriber/output/cdgmaker/transitions/wipeout.png +0 -0
  237. lyrics_transcriber/output/cdgmaker/transitions/wiperight.png +0 -0
  238. lyrics_transcriber/output/cdgmaker/utils.py +132 -0
  239. lyrics_transcriber/output/countdown_processor.py +267 -0
  240. lyrics_transcriber/output/fonts/AvenirNext-Bold.ttf +0 -0
  241. lyrics_transcriber/output/fonts/DMSans-VariableFont_opsz,wght.ttf +0 -0
  242. lyrics_transcriber/output/fonts/DMSerifDisplay-Regular.ttf +0 -0
  243. lyrics_transcriber/output/fonts/Oswald-SemiBold.ttf +0 -0
  244. lyrics_transcriber/output/fonts/Zurich_Cn_BT_Bold.ttf +0 -0
  245. lyrics_transcriber/output/fonts/arial.ttf +0 -0
  246. lyrics_transcriber/output/fonts/georgia.ttf +0 -0
  247. lyrics_transcriber/output/fonts/verdana.ttf +0 -0
  248. lyrics_transcriber/output/generator.py +257 -0
  249. lyrics_transcriber/output/lrc_to_cdg.py +61 -0
  250. lyrics_transcriber/output/lyrics_file.py +102 -0
  251. lyrics_transcriber/output/plain_text.py +96 -0
  252. lyrics_transcriber/output/segment_resizer.py +431 -0
  253. lyrics_transcriber/output/subtitles.py +397 -0
  254. lyrics_transcriber/output/video.py +544 -0
  255. lyrics_transcriber/review/__init__.py +0 -0
  256. lyrics_transcriber/review/server.py +676 -0
  257. lyrics_transcriber/storage/__init__.py +0 -0
  258. lyrics_transcriber/storage/dropbox.py +225 -0
  259. lyrics_transcriber/transcribers/__init__.py +0 -0
  260. lyrics_transcriber/transcribers/audioshake.py +290 -0
  261. lyrics_transcriber/transcribers/base_transcriber.py +157 -0
  262. lyrics_transcriber/transcribers/whisper.py +330 -0
  263. lyrics_transcriber/types.py +648 -0
  264. lyrics_transcriber/utils/__init__.py +0 -0
  265. lyrics_transcriber/utils/word_utils.py +27 -0
  266. karaoke_gen-0.57.0.dist-info/METADATA +0 -167
  267. karaoke_gen-0.57.0.dist-info/RECORD +0 -23
  268. {karaoke_gen-0.57.0.dist-info → karaoke_gen-0.71.27.dist-info/licenses}/LICENSE +0 -0
@@ -0,0 +1,3 @@
1
+ nodeLinker: node-modules
2
+
3
+ yarnPath: .yarn/releases/yarn-4.7.0.cjs
@@ -0,0 +1,50 @@
1
+ # React + TypeScript + Vite
2
+
3
+ This template provides a minimal setup to get React working in Vite with HMR and some ESLint rules.
4
+
5
+ Currently, two official plugins are available:
6
+
7
+ - [@vitejs/plugin-react](https://github.com/vitejs/vite-plugin-react/blob/main/packages/plugin-react/README.md) uses [Babel](https://babeljs.io/) for Fast Refresh
8
+ - [@vitejs/plugin-react-swc](https://github.com/vitejs/vite-plugin-react-swc) uses [SWC](https://swc.rs/) for Fast Refresh
9
+
10
+ ## Expanding the ESLint configuration
11
+
12
+ If you are developing a production application, we recommend updating the configuration to enable type-aware lint rules:
13
+
14
+ - Configure the top-level `parserOptions` property like this:
15
+
16
+ ```js
17
+ export default tseslint.config({
18
+ languageOptions: {
19
+ // other options...
20
+ parserOptions: {
21
+ project: ['./tsconfig.node.json', './tsconfig.app.json'],
22
+ tsconfigRootDir: import.meta.dirname,
23
+ },
24
+ },
25
+ })
26
+ ```
27
+
28
+ - Replace `tseslint.configs.recommended` with `tseslint.configs.recommendedTypeChecked` or `tseslint.configs.strictTypeChecked`
29
+ - Optionally add `...tseslint.configs.stylisticTypeChecked`
30
+ - Install [eslint-plugin-react](https://github.com/jsx-eslint/eslint-plugin-react) and update the config:
31
+
32
+ ```js
33
+ // eslint.config.js
34
+ import react from 'eslint-plugin-react'
35
+
36
+ export default tseslint.config({
37
+ // Set the react version
38
+ settings: { react: { version: '18.3' } },
39
+ plugins: {
40
+ // Add the react plugin
41
+ react,
42
+ },
43
+ rules: {
44
+ // other rules...
45
+ // Enable its recommended rules
46
+ ...react.configs.recommended.rules,
47
+ ...react.configs['jsx-runtime'].rules,
48
+ },
49
+ })
50
+ ```
@@ -0,0 +1,210 @@
1
+ Please read this doc to understand the "Replace All" modal we implemented in a previous chat: @REPLACE_ALL_FUNCTIONALITY.md
2
+
3
+ The primary code for the new modal is here: @ReplaceAllLyricsModal.tsx
4
+ but the manual sync functionality relies heavily on @EditTimelineSection.tsx, @useManualSync.ts and @EditActionBar.tsx
5
+
6
+ The functionality mostly works but we need to continue refining it and fixing issues until it is good enough for me and other users to use. Please let me know once you've reviewed the above and you're ready for me to explain the first issue.
7
+
8
+ # Replace All Lyrics Functionality
9
+
10
+ ## Overview
11
+
12
+ The "Replace All Lyrics" functionality provides a complete solution for replacing transcribed lyrics when the original transcription quality is too poor to edit word-by-word. This feature allows users to start fresh with clipboard content and manually sync timing for the entire song.
13
+
14
+ ## Key Components
15
+
16
+ ### 1. ReplaceAllLyricsModal.tsx
17
+ - **Location**: `src/components/ReplaceAllLyricsModal.tsx`
18
+ - **Purpose**: Standalone modal for replacing all lyrics with clipboard content
19
+ - **Design**: Separate from EditModal.tsx to maintain clean separation of concerns
20
+
21
+ ### 2. Integration Points
22
+ - **useManualSync Hook**: Reuses existing manual sync functionality
23
+ - **AudioPlayer Integration**: Leverages global audio controls and duration
24
+ - **Types**: Uses existing LyricsSegment and Word types
25
+
26
+ ## User Workflow
27
+
28
+ ### Phase 1: Input
29
+ 1. **Open Modal**: Access via "Replace All Lyrics" button/action
30
+ 2. **Paste Content**: Large textarea for pasting lyrics from clipboard
31
+ 3. **Real-time Feedback**:
32
+ - Line count display
33
+ - Word count display
34
+ - Preview of how content will be parsed
35
+ 4. **Validation**: Ensures content is not empty before proceeding
36
+
37
+ ### Phase 2: Manual Sync
38
+ 1. **Automatic Conversion**: Each line becomes a LyricsSegment, each word becomes a Word object
39
+ 2. **Timeline View**:
40
+ - Fixed 30-second zoom window
41
+ - Shows entire song duration (0 to audio duration)
42
+ - Visual indicators for word positions
43
+ 3. **Manual Timing**:
44
+ - Spacebar to mark word timings during playback
45
+ - Pause/resume functionality for corrections
46
+ - Real-time progress tracking
47
+ 4. **Progress Panel**:
48
+ - Shows all segments with sync status
49
+ - Active segment highlighting (blue)
50
+ - Completed segments (green) with timing display
51
+ - Progress indicators (X/Y words synced)
52
+ - Auto-scroll to follow playback
53
+
54
+ ## Technical Implementation
55
+
56
+ ### Data Structure
57
+ ```typescript
58
+ // Each line becomes a LyricsSegment
59
+ {
60
+ id: string,
61
+ text: string, // Full line text
62
+ start_time: number | null,
63
+ end_time: number | null,
64
+ words: Word[] // Each word in the line
65
+ }
66
+
67
+ // Each word becomes a Word object
68
+ {
69
+ id: string,
70
+ text: string, // Individual word
71
+ start_time: number | null,
72
+ end_time: number | null,
73
+ confidence: number // Set to 1.0 for manual entries
74
+ }
75
+ ```
76
+
77
+ ### Modal Layout
78
+ - **Full Browser Width**: Uses `maxWidth={false}` and viewport-based calculations
79
+ - **Split Layout**:
80
+ - Timeline Section: 2/3 width
81
+ - Progress Panel: 1/3 width
82
+ - **Responsive Design**: Adapts to different screen sizes
83
+
84
+ ### Audio Integration
85
+ - **Duration Detection**: Uses `window.getAudioDuration()` for accurate song length
86
+ - **Playback Control**: Integrates with existing audio controls
87
+ - **Auto-cleanup**: Stops audio when canceling sync
88
+
89
+ ## Key Features Implemented
90
+
91
+ ### 1. Stable Timeline View
92
+ - **Fixed Zoom**: Always shows 30-second window
93
+ - **Full Song Range**: Timeline spans 0 to full audio duration
94
+ - **Prevents Zoom Changes**: Disabled during manual sync to maintain consistency
95
+
96
+ ### 2. Manual Sync Enhancement
97
+ - **Spacebar Timing**: Press spacebar to mark word timings
98
+ - **Pause/Resume**: Alt+P to pause/resume for corrections
99
+ - **Visual Feedback**:
100
+ - Current word highlighting
101
+ - Spacebar press indication
102
+ - Progress tracking
103
+
104
+ ### 3. Progress Tracking
105
+ - **Segment Status**: Visual indicators for sync progress
106
+ - **Real-time Updates**: Timing updates as words are synced
107
+ - **Auto-scroll**: Follows active segment during sync
108
+ - **Completion Status**: Clear visual feedback for completed segments
109
+
110
+ ### 4. Error Prevention
111
+ - **Input Validation**: Ensures content exists before proceeding
112
+ - **Safe Navigation**: Proper cleanup when canceling
113
+ - **State Management**: Prevents conflicts with existing edit modals
114
+
115
+ ## Bug Fixes Implemented
116
+
117
+ ### 1. Manual Sync Issues
118
+ - **Problem**: Sync stopping after first spacebar press
119
+ - **Solution**: Fixed infinite re-renders in useEffect dependencies
120
+ - **Result**: Stable manual sync throughout entire song
121
+
122
+ ### 2. Timeline Zoom Problems
123
+ - **Problem**: Timeline zooming to single word duration after sync
124
+ - **Solution**: Fixed timeRange calculation to always use full song duration
125
+ - **Result**: Consistent 30-second view regardless of sync progress
126
+
127
+ ### 3. Audio Duration
128
+ - **Problem**: Hardcoded duration fallbacks causing inaccurate timelines
129
+ - **Solution**: Integration with real audio duration from AudioPlayer
130
+ - **Result**: Accurate timeline representation of song length
131
+
132
+ ### 4. Keyboard Conflicts
133
+ - **Problem**: Multiple keyboard handlers causing conflicts
134
+ - **Solution**: Proper handler cleanup and event management
135
+ - **Result**: Clean keyboard interaction without conflicts
136
+
137
+ ## User Experience Improvements
138
+
139
+ ### 1. Visual Feedback
140
+ - **Real-time Counts**: Live word/line counting during input
141
+ - **Progress Indicators**: Clear visual feedback on sync progress
142
+ - **Color Coding**: Blue for active, green for completed segments
143
+
144
+ ### 2. Navigation
145
+ - **Auto-scroll**: Automatically follows playback position
146
+ - **Manual Navigation**: Can manually scroll through segments
147
+ - **Status Preservation**: Maintains state during navigation
148
+
149
+ ### 3. Error Recovery
150
+ - **Pause/Resume**: Ability to pause and correct timing
151
+ - **Cancel Support**: Safe cancellation with proper cleanup
152
+ - **State Reset**: Clean state management between sessions
153
+
154
+ ## Integration with Existing Codebase
155
+
156
+ ### 1. Reused Components
157
+ - **useManualSync**: Leverages existing manual sync logic
158
+ - **Timeline Components**: Reuses timeline visualization
159
+ - **Audio Controls**: Integrates with existing audio system
160
+
161
+ ### 2. Type Safety
162
+ - **TypeScript**: Fully typed implementation
163
+ - **Consistent Interfaces**: Uses existing type definitions
164
+ - **Validation**: Runtime validation for data integrity
165
+
166
+ ### 3. State Management
167
+ - **Isolated State**: Doesn't interfere with existing edit functionality
168
+ - **Clean Separation**: Separate modal for replace vs. edit operations
169
+ - **Proper Cleanup**: Ensures no state leakage between modals
170
+
171
+ ## Performance Considerations
172
+
173
+ ### 1. Rendering Optimization
174
+ - **Memoization**: Strategic use of React.memo and useCallback
175
+ - **Efficient Updates**: Minimal re-renders during sync
176
+ - **Progressive Loading**: Handles large lyric sets efficiently
177
+
178
+ ### 2. Memory Management
179
+ - **Cleanup**: Proper cleanup of event listeners and timers
180
+ - **State Reset**: Clean state management between sessions
181
+ - **Audio Integration**: Efficient audio control integration
182
+
183
+ ## Future Enhancement Opportunities
184
+
185
+ ### 1. Batch Operations
186
+ - **Multi-line Selection**: Select and sync multiple segments at once
187
+ - **Timing Adjustment**: Bulk timing adjustments
188
+ - **Smart Defaults**: AI-suggested timing based on audio analysis
189
+
190
+ ### 2. Import/Export
191
+ - **Format Support**: Support for various lyric file formats
192
+ - **Backup/Restore**: Save and restore sync sessions
193
+ - **Templates**: Predefined timing templates
194
+
195
+ ### 3. Advanced Sync
196
+ - **Beat Detection**: Automatic beat-based timing suggestions
197
+ - **Voice Activity**: Audio analysis for timing hints
198
+ - **Collaborative Sync**: Multi-user timing collaboration
199
+
200
+ ## Summary
201
+
202
+ The "Replace All Lyrics" functionality provides a comprehensive solution for handling poor-quality transcriptions by:
203
+
204
+ 1. **Complete Replacement**: Replaces all existing lyrics with fresh clipboard content
205
+ 2. **Manual Control**: Gives users full control over timing through manual sync
206
+ 3. **Visual Feedback**: Provides clear progress tracking and status indicators
207
+ 4. **Stable Interface**: Maintains consistent timeline view throughout the process
208
+ 5. **Clean Integration**: Works seamlessly with existing audio and editing systems
209
+
210
+ This implementation significantly improves the user experience for cases where starting fresh is more efficient than editing individual words, while maintaining the high-quality timing precision needed for karaoke applications.
@@ -0,0 +1,25 @@
1
+ """Frontend module for lyrics transcriber web interface."""
2
+
3
+ import os
4
+
5
# Absolute path of the directory containing this file; the asset
# directories below are looked up relative to it.
__frontend_dir__ = os.path.dirname(os.path.abspath(__file__))


def get_frontend_assets_dir():
    """Return the path to the frontend assets directory.

    The ``web_assets`` directory (packaged version) is preferred; the
    ``dist`` directory (development version) is used as a fallback.

    Returns:
        The path of the first candidate that exists as a directory.

    Raises:
        FileNotFoundError: If neither candidate directory exists.
    """
    # Candidates in priority order: packaged assets first, dev build second.
    for dirname in ("web_assets", "dist"):
        candidate = os.path.join(__frontend_dir__, dirname)
        # isdir rather than exists: a stray regular file that happens to be
        # named like one of the candidates must not be returned as a
        # directory of assets.
        if os.path.isdir(candidate):
            return candidate

    raise FileNotFoundError(
        "Frontend assets not found. Please build the frontend first with: "
        "./scripts/build_frontend.sh"
    )
@@ -0,0 +1,28 @@
1
+ import js from '@eslint/js'
2
+ import globals from 'globals'
3
+ import reactHooks from 'eslint-plugin-react-hooks'
4
+ import reactRefresh from 'eslint-plugin-react-refresh'
5
+ import tseslint from 'typescript-eslint'
6
+
7
// Paths ESLint should skip entirely.
const ignoredPaths = { ignores: ['dist'] }

// Rules applied to every TypeScript / TSX file.
const typescriptSources = {
  extends: [js.configs.recommended, ...tseslint.configs.recommended],
  files: ['**/*.{ts,tsx}'],
  languageOptions: {
    ecmaVersion: 2020,
    globals: globals.browser,
  },
  plugins: {
    'react-hooks': reactHooks,
    'react-refresh': reactRefresh,
  },
  rules: {
    // Start from the react-hooks recommended rule set...
    ...reactHooks.configs.recommended.rules,
    // ...and warn on non-component exports, while still allowing constants.
    'react-refresh/only-export-components': ['warn', { allowConstantExport: true }],
  },
}

// Config objects are passed in the same order as before: ignores first.
export default tseslint.config(ignoredPaths, typescriptSources)
@@ -0,0 +1,18 @@
1
+ <!doctype html>
2
+ <html lang="en">
3
+ <head>
4
+ <meta charset="UTF-8" />
5
+ <link rel="icon" type="image/x-icon" href="/favicon.ico" />
6
+ <link rel="icon" type="image/png" sizes="16x16" href="/favicon-16x16.png" />
7
+ <link rel="icon" type="image/png" sizes="32x32" href="/favicon-32x32.png" />
8
+ <link rel="apple-touch-icon" sizes="180x180" href="/apple-touch-icon.png" />
9
+ <link rel="icon" type="image/png" sizes="192x192" href="/android-chrome-192x192.png" />
10
+ <link rel="icon" type="image/png" sizes="512x512" href="/android-chrome-512x512.png" />
11
+ <meta name="viewport" content="width=device-width, initial-scale=1.0" />
12
+ <title>Nomad Karaoke: Lyrics Review</title>
13
+ </head>
14
+ <body>
15
+ <div id="root"></div>
16
+ <script type="module" src="/src/main.tsx"></script>
17
+ </body>
18
+ </html>
@@ -0,0 +1,42 @@
1
+ {
2
+ "name": "lyrics-transcriber-frontend",
3
+ "private": true,
4
+ "homepage": "https://nomadkaraoke.github.io/lyrics-transcriber-frontend",
5
+ "version": "0.80.0",
6
+ "type": "module",
7
+ "scripts": {
8
+ "dev": "vite",
9
+ "build": "tsc -b && vite build --mode development",
10
+ "build-prod": "tsc -b && vite build",
11
+ "lint": "eslint .",
12
+ "preview": "vite preview",
13
+ "predeploy": "npm run build-prod",
14
+ "deploy": "gh-pages -d dist"
15
+ },
16
+ "dependencies": {
17
+ "@emotion/react": "^11.14.0",
18
+ "@emotion/styled": "^11.14.0",
19
+ "@mui/icons-material": "^6.3.0",
20
+ "@mui/material": "^6.3.0",
21
+ "@mui/system": "^6.4.3",
22
+ "nanoid": "^5.0.9",
23
+ "react": "^18.3.1",
24
+ "react-dom": "^18.3.1",
25
+ "zod": "^3.24.1"
26
+ },
27
+ "devDependencies": {
28
+ "@eslint/js": "^9.17.0",
29
+ "@types/react": "^18.3.18",
30
+ "@types/react-dom": "^18.3.5",
31
+ "@vitejs/plugin-react": "^4.3.4",
32
+ "eslint": "^9.17.0",
33
+ "eslint-plugin-react-hooks": "^5.0.0",
34
+ "eslint-plugin-react-refresh": "^0.4.16",
35
+ "gh-pages": "^6.3.0",
36
+ "globals": "^15.14.0",
37
+ "typescript": "~5.6.2",
38
+ "typescript-eslint": "^8.18.2",
39
+ "vite": "^6.0.5"
40
+ },
41
+ "packageManager": "yarn@4.7.0"
42
+ }
@@ -0,0 +1,212 @@
1
+ import UploadFileIcon from '@mui/icons-material/UploadFile'
2
+ import { Alert, Box, Button, Modal, Typography } from '@mui/material'
3
+ import { useEffect, useState } from 'react'
4
+ import { ApiClient, FileOnlyClient, LiveApiClient } from './api'
5
+ import CorrectionMetrics from './components/CorrectionMetrics'
6
+ import LyricsAnalyzer from './components/LyricsAnalyzer'
7
+ import { CorrectionData } from './types'
8
+
9
/** Convert any thrown value into a printable message (not everything thrown is an `Error`). */
function describeError(err: unknown): string {
    return err instanceof Error ? err.message : String(err)
}

/**
 * Root component of the lyrics review UI.
 *
 * Mode is selected from the page's query string:
 *  - `baseApiUrl` present: a `LiveApiClient` is created for that URL, the
 *    component leaves read-only mode and requests the correction data from it.
 *  - `baseApiUrl` absent: a `FileOnlyClient` is used and the component stays
 *    read-only; data can then only be supplied through the "Load File" button.
 *
 * The optional `audioHash` query parameter is forwarded to `LyricsAnalyzer`
 * (only read when `baseApiUrl` is present).
 */
export default function App() {
    const [data, setData] = useState<CorrectionData | null>(null)
    const [showMetadata, setShowMetadata] = useState(false)
    const [error, setError] = useState<string | null>(null)
    const [apiClient, setApiClient] = useState<ApiClient | null>(null)
    const [isReadOnly, setIsReadOnly] = useState(true)
    const [audioHash, setAudioHash] = useState<string>('')

    useEffect(() => {
        // Flipped by the cleanup below so that a response arriving after the
        // effect was torn down (unmount, or React StrictMode's mount/unmount/
        // mount cycle in development) does not write into state.
        let cancelled = false

        const params = new URLSearchParams(window.location.search)
        const encodedApiUrl = params.get('baseApiUrl')
        const audioHashParam = params.get('audioHash')

        if (encodedApiUrl) {
            // URLSearchParams.get() already percent-decodes the value. The
            // second decode is kept for compatibility with existing links, but
            // it throws URIError when the decoded URL contains a literal '%',
            // so fall back to the value as returned by get().
            let baseApiUrl = encodedApiUrl
            try {
                baseApiUrl = decodeURIComponent(encodedApiUrl)
            } catch {
                // Not decodable a second time: use encodedApiUrl unchanged.
            }

            // One client instance serves both the initial fetch and later use
            // by child components.
            const client = new LiveApiClient(baseApiUrl)
            setApiClient(client)
            setIsReadOnly(false)
            if (audioHashParam) {
                setAudioHash(audioHashParam)
            }

            // Fetch initial data
            const loadInitialData = async () => {
                try {
                    const correctionData = await client.getCorrectionData()
                    if (!cancelled) {
                        setData(correctionData)
                    }
                } catch (err) {
                    if (!cancelled) {
                        setError(`Failed to fetch data: ${describeError(err)}`)
                    }
                }
            }
            void loadInitialData()
        } else {
            setApiClient(new FileOnlyClient())
            setIsReadOnly(true)
        }

        return () => {
            cancelled = true
        }
    }, [])

    /**
     * Open a file picker for a `.json` file, parse it and use it as the
     * correction data. Parse or validation failures are shown in the error
     * banner; a successful load clears any previous error.
     */
    const handleFileLoad = async () => {
        const input = document.createElement('input')
        input.type = 'file'
        input.accept = '.json'

        input.onchange = async (e) => {
            const file = (e.target as HTMLInputElement).files?.[0]
            if (!file) return

            try {
                const text = await file.text()
                // JSON.parse may legitimately return null (file content "null").
                const parsedData = JSON.parse(text) as CorrectionData | null
                console.log('File data loaded:', {
                    sampleGap: parsedData?.gap_sequences?.[0],
                    sampleWord: parsedData?.corrected_segments?.[0]?.words?.[0],
                    sampleCorrection: parsedData?.corrections?.[0]
                })

                // Validate the structure
                if (!parsedData || !parsedData.corrected_segments || !parsedData.gap_sequences) {
                    throw new Error('Invalid file format: missing required fields')
                }

                // Drop a stale error banner left over from an earlier failure.
                setError(null)
                setData(parsedData)
            } catch (err) {
                setError(`Error loading file: ${describeError(err)}. Please make sure it is a valid JSON file.`)
            }
        }

        input.click()
    }

    /**
     * Build the "Correction Process Details" modal, or return null while no
     * data is loaded.
     *
     * This runs on every render with data (the modal is merely hidden while
     * `showMetadata` is false), so field access is defensive: file validation
     * does not check `metadata`, and an unguarded `data.metadata.x` would throw
     * during render for a file that lacks it.
     */
    const renderMetadataModal = () => {
        if (!data) return null

        const metadata = data.metadata
        const ratio = metadata?.correction_ratio
        const rows = [
            { label: 'Total Words', value: metadata?.total_words ?? 'N/A' },
            { label: 'Gap Sequences', value: metadata?.gap_sequences_count ?? 'N/A' },
            { label: 'Corrections Made', value: data.corrections_made ?? 'N/A' },
            {
                label: 'Correction Ratio',
                value: typeof ratio === 'number' ? `${(ratio * 100).toFixed(1)}%` : 'N/A',
            },
        ]

        return (
            <Modal
                open={showMetadata}
                onClose={() => setShowMetadata(false)}
                aria-labelledby="metadata-modal-title"
            >
                <Box sx={{
                    position: 'absolute',
                    top: '50%',
                    left: '50%',
                    transform: 'translate(-50%, -50%)',
                    width: 400,
                    bgcolor: 'background.paper',
                    boxShadow: 24,
                    p: 4,
                    borderRadius: 1,
                }}>
                    {/* The id is the target of the Modal's aria-labelledby. */}
                    <Typography id="metadata-modal-title" variant="h6" gutterBottom>
                        Correction Process Details
                    </Typography>
                    {rows.map(({ label, value }) => (
                        <Box key={label} sx={{ mb: 2 }}>
                            <Typography variant="subtitle2" color="text.secondary">
                                {label}
                            </Typography>
                            <Typography>
                                {value}
                            </Typography>
                        </Box>
                    ))}
                    {/* Add any other metadata fields that are available */}
                </Box>
            </Modal>
        )
    }

    // Nothing loaded yet: show either the file-loading landing page
    // (read-only mode) or a loading placeholder (API mode).
    if (!data) {
        return (
            <Box sx={{ p: 3 }}>
                {error && (
                    <Alert severity="error" sx={{ mb: 2 }} onClose={() => setError(null)}>
                        {error}
                    </Alert>
                )}
                {isReadOnly ? (
                    <>
                        <Alert severity="info" sx={{ mb: 2 }}>
                            Running in read-only mode. Connect to an API to enable editing.
                        </Alert>
                        <Box sx={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center', mb: 3 }}>
                            <Typography variant="h4">
                                Lyrics Correction Review
                            </Typography>
                            <Button
                                variant="outlined"
                                startIcon={<UploadFileIcon />}
                                onClick={handleFileLoad}
                            >
                                Load File
                            </Button>
                        </Box>
                        <Box sx={{ mb: 3 }}>
                            <CorrectionMetrics />
                        </Box>
                    </>
                ) : (
                    <Box sx={{ display: 'flex', justifyContent: 'center', alignItems: 'center', height: '50vh' }}>
                        <Typography variant="h6" color="text.secondary">
                            Loading Lyrics Correction Review...
                        </Typography>
                    </Box>
                )}
            </Box>
        )
    }

    return (
        <Box sx={{
            p: 1.5,
            pb: 3,
            maxWidth: '100%',
            overflowX: 'hidden'
        }}>
            {error && (
                <Alert severity="error" sx={{ mb: 1 }} onClose={() => setError(null)}>
                    {error}
                </Alert>
            )}
            {isReadOnly && (
                <Alert severity="info" sx={{ mb: 1 }}>
                    Running in read-only mode. Connect to an API to enable editing.
                </Alert>
            )}
            <LyricsAnalyzer
                data={data}
                onFileLoad={handleFileLoad}
                onShowMetadata={() => setShowMetadata(true)}
                apiClient={apiClient}
                isReadOnly={isReadOnly}
                audioHash={audioHash}
            />
            {renderMetadataModal()}
        </Box>
    )
}